Qwen3 From Scratch (#678)

* Qwen3 From Scratch * rev other file * upd * upd * upd * url fixes
2026-04-10 12:33:42 +00:00 · 2025-06-19 18:44:38 -05:00
parent 58b8672452
commit e719bd86ad
10 changed files with 2640 additions and 6 deletions
--- a/.gitignore
+++ b/.gitignore
@@ -48,12 +48,13 @@ ch05/07_gpt_to_llama/Llama-3.2-1B
 ch05/07_gpt_to_llama/Llama-3.2-1B-Instruct
 ch05/07_gpt_to_llama/Llama-3.2-3B
 ch05/07_gpt_to_llama/Llama-3.2-3B-Instruct
+ch05/07_gpt_to_llama/llama3.2-1B-instruct.pth
+ch05/07_gpt_to_llama/tokenizer.model
 ch05/10_llm-training-speed/middlemarch.txt
 ch05/10_llm-training-speed/loss.pdf
 ch05/10_llm-training-speed/model.pth
-ch05/07_gpt_to_llama/Untitled.ipynb
-ch05/07_gpt_to_llama/llama3.2-1B-instruct.pth
-ch05/07_gpt_to_llama/tokenizer.model
+ch05/11_qwen3/Qwen3-0.6B
+ch05/11_qwen3/Qwen3-0.6B-Base

 ch06/01_main-chapter-code/gpt2
 ch06/02_bonus_additional-experiments/gpt2