Improve KV cache code for torch.compile (#705)

* Improve KV cache code for torch.compile
* cleanup
* cleanup
2026-04-10 12:33:42 +00:00 · 2025-06-23 18:08:49 -05:00
parent 6522be94be
commit 81eda38d3b
8 changed files with 593 additions and 315 deletions
--- a/ch04/03_kv-cache/gpt_ch04.py
+++ b/ch04/03_kv-cache/gpt_ch04.py
@@ -27,7 +27,7 @@ class MultiHeadAttention(nn.Module):
        self.dropout = nn.Dropout(dropout)
        self.register_buffer(
            "mask",
-            torch.triu(torch.ones(context_length, context_length),diagonal=1),
+            torch.triu(torch.ones(context_length, context_length), diagonal=1),
            persistent=False
        )