Mixture-of-Experts intro (#888)

This commit is contained in:
Sebastian Raschka
2025-10-19 22:17:59 -05:00
committed by GitHub
parent 27b6dfab9e
commit 218221ab62
13 changed files with 1333 additions and 228 deletions

5
.gitignore vendored
View File

@@ -12,8 +12,9 @@ appendix-D/01_main-chapter-code/3.pdf
appendix-E/01_main-chapter-code/loss-plot.pdf
ch04/04_gqa/kv_bytes_vs_context_length.pdf
-ch05/05_mla/kv_bytes_vs_context_length.pdf
-ch06/06_swa/kv_bytes_vs_context_length.pdf
+ch04/05_mla/kv_bytes_vs_context_length.pdf
+ch04/06_swa/kv_bytes_vs_context_length.pdf
+ch04/07_moe/ffn_vs_moe.pdf
ch05/01_main-chapter-code/loss-plot.pdf
ch05/01_main-chapter-code/temperature-plot.pdf