Qwen3 KV cache (#688)

2026-04-10 12:33:42 +00:00 · 2025-06-21 17:34:39 -05:00
parent 2a530b49fe
commit 0b15a00574
8 changed files with 370 additions and 11 deletions
--- a/pkg/llms_from_scratch/tests/test_llama3.py
+++ b/pkg/llms_from_scratch/tests/test_llama3.py
@@ -189,7 +189,7 @@ def llama3_weights_path(tmp_path_factory):
 )
@pytest.mark.parametrize("ModelClass", [Llama3Model, Llama3ModelKV])
@pytest.mark.parametrize("generate_fn", [generate_text_simple, generate_text_simple_cached])
-def test_gpt_model_variants(ModelClass, generate_fn, llama3_weights_path):
+def test_model_variants(ModelClass, generate_fn, llama3_weights_path):

    # Skip incompatible combinations
    if generate_fn is generate_text_simple and getattr(ModelClass, "reset_kv_cache", False):