mirror of
https://github.com/rasbt/LLMs-from-scratch.git
synced 2026-04-10 12:33:42 +00:00
Qwen3 From Scratch (#678)
* Qwen3 From Scratch * rev other file * upd * upd * upd * url fixes
This commit is contained in:
committed by
GitHub
parent
58b8672452
commit
e719bd86ad
7
.gitignore
vendored
7
.gitignore
vendored
@@ -48,12 +48,13 @@ ch05/07_gpt_to_llama/Llama-3.2-1B
|
||||
ch05/07_gpt_to_llama/Llama-3.2-1B-Instruct
|
||||
ch05/07_gpt_to_llama/Llama-3.2-3B
|
||||
ch05/07_gpt_to_llama/Llama-3.2-3B-Instruct
|
||||
ch05/07_gpt_to_llama/llama3.2-1B-instruct.pth
|
||||
ch05/07_gpt_to_llama/tokenizer.model
|
||||
ch05/10_llm-training-speed/middlemarch.txt
|
||||
ch05/10_llm-training-speed/loss.pdf
|
||||
ch05/10_llm-training-speed/model.pth
|
||||
ch05/07_gpt_to_llama/Untitled.ipynb
|
||||
ch05/07_gpt_to_llama/llama3.2-1B-instruct.pth
|
||||
ch05/07_gpt_to_llama/tokenizer.model
|
||||
ch05/11_qwen3/Qwen3-0.6B
|
||||
ch05/11_qwen3/Qwen3-0.6B-Base
|
||||
|
||||
ch06/01_main-chapter-code/gpt2
|
||||
ch06/02_bonus_additional-experiments/gpt2
|
||||
|
||||
Reference in New Issue
Block a user