Reduce Llama 3 RoPE memory requirements (#658)

* Llama3 from scratch improvements

* Fix Llama 3 expensive RoPE memory issue

* updates

* update package

* benchmark

* remove unused rescale_theta
This commit is contained in:
Sebastian Raschka
2025-06-12 11:08:02 -05:00
committed by GitHub
parent c278745aff
commit c4cde1c21b
9 changed files with 405 additions and 2577 deletions

View File

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
[project]
name = "llms-from-scratch"
-version = "1.0.6"
+version = "1.0.7"
description = "Implement a ChatGPT-like LLM in PyTorch from scratch, step by step"
readme = "README.md"
requires-python = ">=3.10"