mirror of
https://github.com/rasbt/LLMs-from-scratch.git
synced 2026-04-10 12:33:42 +00:00
formatting fix
This commit is contained in:
@@ -2,6 +2,10 @@
|
|||||||
|
|
||||||
Tiny Aya is a new, "small" LLM by Cohere that is said to be the "most capable multi-lingual open-weight model" at the 3B parameter size class. (Tiny Aya outperforms Qwen3-4B, Gemma 3 4B, and Ministral 3 3B according to the [announcement post](https://cohere.com/blog/cohere-labs-tiny-aya)).
|
Tiny Aya is a new, "small" LLM by Cohere that is said to be the "most capable multi-lingual open-weight model" at the 3B parameter size class. (Tiny Aya outperforms Qwen3-4B, Gemma 3 4B, and Ministral 3 3B according to the [announcement post](https://cohere.com/blog/cohere-labs-tiny-aya)).
|
||||||
|
|
||||||
|
<img src="https://sebastianraschka.com/images/LLMs-from-scratch-images/bonus/tiny-aya/01.webp">
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
This is a great model to run and experiment with locally. The only caveat is that while it's an open-weight model, its licensing terms are relatively restrictive and only allow non-commercial use.
|
This is a great model to run and experiment with locally. The only caveat is that while it's an open-weight model, its licensing terms are relatively restrictive and only allow non-commercial use.
|
||||||
|
|
||||||
That aside, Tiny Aya is a 3.35B parameter model that comes in several flavors that are useful for
|
That aside, Tiny Aya is a 3.35B parameter model that comes in several flavors that are useful for
|
||||||
|
|||||||
@@ -1291,6 +1291,7 @@
|
|||||||
},
|
},
|
||||||
"widgets": {
|
"widgets": {
|
||||||
"application/vnd.jupyter.widget-state+json": {
|
"application/vnd.jupyter.widget-state+json": {
|
||||||
|
"state": {
|
||||||
"0dccd57dcc5c43a588157cef957c07e8": {
|
"0dccd57dcc5c43a588157cef957c07e8": {
|
||||||
"model_module": "@jupyter-widgets/controls",
|
"model_module": "@jupyter-widgets/controls",
|
||||||
"model_module_version": "2.0.0",
|
"model_module_version": "2.0.0",
|
||||||
@@ -2011,6 +2012,9 @@
|
|||||||
"value": " 2.18M/2.18M [00:00<00:00, 9.47MB/s]"
|
"value": " 2.18M/2.18M [00:00<00:00, 9.47MB/s]"
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
},
|
||||||
|
"version_major": 2,
|
||||||
|
"version_minor": 0
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
|
|||||||
@@ -1210,6 +1210,7 @@
|
|||||||
},
|
},
|
||||||
"widgets": {
|
"widgets": {
|
||||||
"application/vnd.jupyter.widget-state+json": {
|
"application/vnd.jupyter.widget-state+json": {
|
||||||
|
"state": {
|
||||||
"0dccd57dcc5c43a588157cef957c07e8": {
|
"0dccd57dcc5c43a588157cef957c07e8": {
|
||||||
"model_module": "@jupyter-widgets/controls",
|
"model_module": "@jupyter-widgets/controls",
|
||||||
"model_module_version": "2.0.0",
|
"model_module_version": "2.0.0",
|
||||||
@@ -1930,6 +1931,9 @@
|
|||||||
"value": " 2.18M/2.18M [00:00<00:00, 9.47MB/s]"
|
"value": " 2.18M/2.18M [00:00<00:00, 9.47MB/s]"
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
},
|
||||||
|
"version_major": 2,
|
||||||
|
"version_minor": 0
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
|
|||||||
Reference in New Issue
Block a user