|
@@ -822,7 +822,7 @@
|
|
|
},
|
|
},
|
|
|
{
|
|
{
|
|
|
"cell_type": "code",
|
|
"cell_type": "code",
|
|
|
- "execution_count": 37,
|
|
|
|
|
|
|
+ "execution_count": null,
|
|
|
"id": "699cb1b8-a67d-49fb-80a6-0dad9d81f392",
|
|
"id": "699cb1b8-a67d-49fb-80a6-0dad9d81f392",
|
|
|
"metadata": {
|
|
"metadata": {
|
|
|
"colab": {
|
|
"colab": {
|
|
@@ -936,7 +936,8 @@
|
|
|
" weights_dict.update(shard)\n",
|
|
" weights_dict.update(shard)\n",
|
|
|
"\n",
|
|
"\n",
|
|
|
"load_weights_into_qwen(model, QWEN3_CONFIG, weights_dict)\n",
|
|
"load_weights_into_qwen(model, QWEN3_CONFIG, weights_dict)\n",
|
|
|
- "model.to(device);"
|
|
|
|
|
|
|
+ "model.to(device)\n",
|
|
|
|
|
+ "del weights_dict"
|
|
|
]
|
|
]
|
|
|
},
|
|
},
|
|
|
{
|
|
{
|
|
@@ -1187,7 +1188,7 @@
|
|
|
"provenance": []
|
|
"provenance": []
|
|
|
},
|
|
},
|
|
|
"kernelspec": {
|
|
"kernelspec": {
|
|
|
- "display_name": "Python 3 (ipykernel)",
|
|
|
|
|
|
|
+ "display_name": ".venv",
|
|
|
"language": "python",
|
|
"language": "python",
|
|
|
"name": "python3"
|
|
"name": "python3"
|
|
|
},
|
|
},
|
|
@@ -1201,7 +1202,7 @@
|
|
|
"name": "python",
|
|
"name": "python",
|
|
|
"nbconvert_exporter": "python",
|
|
"nbconvert_exporter": "python",
|
|
|
"pygments_lexer": "ipython3",
|
|
"pygments_lexer": "ipython3",
|
|
|
- "version": "3.11.9"
|
|
|
|
|
|
|
+ "version": "3.12.6"
|
|
|
}
|
|
}
|
|
|
},
|
|
},
|
|
|
"nbformat": 4,
|
|
"nbformat": 4,
|