mirror of
https://github.com/rasbt/LLMs-from-scratch.git
synced 2026-04-10 12:33:42 +00:00
Fix code comment
This commit is contained in:
committed by
GitHub
parent
623dc65d5d
commit
5ae41c402e
@@ -64,8 +64,8 @@ QWEN3_CONFIG_8B = {
|
||||
"context_length": 40_960,
|
||||
"emb_dim": 4096, # 60% larger than above
|
||||
"n_heads": 32,
|
||||
"n_layers": 36, # 26% larger than above
|
||||
"hidden_dim": 12288,
|
||||
"n_layers": 36,
|
||||
"hidden_dim": 12288, # 26% larger than above
|
||||
"head_dim": 128,
|
||||
"qk_norm": True,
|
||||
"n_kv_groups": 8,
|
||||
|
||||
Reference in New Issue
Block a user