some typo fixes (#858)

* fix(typo): correct scaling

* fix(typo): correct comment for `instruct`
This commit is contained in:
casinca
2025-09-30 18:18:02 +02:00
committed by GitHub
parent 458f2d9b67
commit 00c240ff87
4 changed files with 5 additions and 5 deletions

View File

@@ -334,7 +334,7 @@
},
{
"cell_type": "code",
"execution_count": 5,
"execution_count": null,
"id": "9a6bd0a2-f27c-4602-afa0-c96cd295c1a6",
"metadata": {
"colab": {
@@ -395,7 +395,7 @@
" self.mask.bool()[:num_tokens, :num_tokens], -torch.inf\n",
" )\n",
"\n",
" attn_weights = torch.softmax(attn_scores / keys.shape[-1]**-0.5, dim=-1)\n",
" attn_weights = torch.softmax(attn_scores / keys.shape[-1]**0.5, dim=-1)\n",
" attn_weights = self.dropout(attn_weights)\n",
"\n",
" # (b, num_heads, num_tokens, num_tokens) --> (b, num_heads, num_tokens, head_dim)\n",

View File

@@ -51,7 +51,7 @@ USE_REASONING_MODEL = True
USE_INSTRUCT_MODEL = False
# Uses the instruct mode (without reasoning) if
# USE_REASONING_MODEL = True
# USE_INSTRUCT_MODEL = False
# USE_INSTRUCT_MODEL = True
# This setting has no effect if USE_REASONING_MODEL = False

View File

@@ -121,7 +121,7 @@
"USE_INSTRUCT_MODEL = False\n",
"# Uses the instruct mode (without reasoning) if \n",
"# USE_REASONING_MODEL = True\n",
"# USE_INSTRUCT_MODEL = False\n",
"# USE_INSTRUCT_MODEL = True\n",
"# This setting has no effect if USE_REASONING_MODEL = False"
]
},

View File

@@ -119,7 +119,7 @@
"USE_INSTRUCT_MODEL = False\n",
"# Uses the instruct mode (without reasoning) if \n",
"# USE_REASONING_MODEL = True\n",
"# USE_INSTRUCT_MODEL = False\n",
"# USE_INSTRUCT_MODEL = True\n",
"# This setting has no effect if USE_REASONING_MODEL = False"
]
},