use attn_scores from sec 3.4 instead of 3.3

This commit is contained in:
rasbt
2024-02-14 20:23:59 -06:00
parent 231a854ae7
commit 250e6306e2
4 changed files with 45 additions and 33 deletions

View File

@@ -836,7 +836,7 @@
" x = self.drop_resid(x)\n",
" x = x + shortcut # Add the original input back\n",
"\n",
-" # Shortcut connection for feed-forward block\n",
+" # Shortcut connection for feed forward block\n",
" shortcut = x\n",
" x = self.norm2(x)\n",
" x = self.ff(x)\n",