Update weights from disk (#2265)
This commit is contained in:
@@ -82,7 +82,8 @@
|
||||
"Get the information of the model.\n",
|
||||
"\n",
|
||||
"- `model_path`: The path/name of the model.\n",
|
||||
"- `is_generation`: Whether the model is used as generation model or embedding model."
|
||||
"- `is_generation`: Whether the model is used as generation model or embedding model.\n",
|
||||
"- `tokenizer_path`: The path/name of the tokenizer."
|
||||
]
|
||||
},
|
||||
{
|
||||
@@ -98,7 +99,8 @@
|
||||
"print_highlight(response_json)\n",
|
||||
"assert response_json[\"model_path\"] == \"meta-llama/Llama-3.2-1B-Instruct\"\n",
|
||||
"assert response_json[\"is_generation\"] is True\n",
|
||||
"assert response_json.keys() == {\"model_path\", \"is_generation\"}"
|
||||
"assert response_json[\"tokenizer_path\"] == \"meta-llama/Llama-3.2-1B-Instruct\"\n",
|
||||
"assert response_json.keys() == {\"model_path\", \"is_generation\", \"tokenizer_path\"}"
|
||||
]
|
||||
},
|
||||
{
|
||||
@@ -187,9 +189,11 @@
|
||||
"cell_type": "markdown",
|
||||
"metadata": {},
|
||||
"source": [
|
||||
"## Update Weights\n",
|
||||
"## Update Weights From Disk\n",
|
||||
"\n",
|
||||
"Update model weights without restarting the server. Use for continuous evaluation during training. Only applicable for models with the same architecture and parameter size."
|
||||
"Update model weights from disk without restarting the server. Only applicable for models with the same architecture and parameter size.\n",
|
||||
"\n",
|
||||
"SGLang supports the `update_weights_from_disk` API for continuous evaluation during training (save a checkpoint to disk, then update the weights from disk).\n"
|
||||
]
|
||||
},
|
||||
{
|
||||
@@ -200,7 +204,7 @@
|
||||
"source": [
|
||||
"# successful update with same architecture and size\n",
|
||||
"\n",
|
||||
"url = \"http://localhost:30010/update_weights\"\n",
|
||||
"url = \"http://localhost:30010/update_weights_from_disk\"\n",
|
||||
"data = {\"model_path\": \"meta-llama/Llama-3.2-1B\"}\n",
|
||||
"\n",
|
||||
"response = requests.post(url, json=data)\n",
|
||||
@@ -218,7 +222,7 @@
|
||||
"source": [
|
||||
"# failed update with different parameter size\n",
|
||||
"\n",
|
||||
"url = \"http://localhost:30010/update_weights\"\n",
|
||||
"url = \"http://localhost:30010/update_weights_from_disk\"\n",
|
||||
"data = {\"model_path\": \"meta-llama/Llama-3.2-3B\"}\n",
|
||||
"\n",
|
||||
"response = requests.post(url, json=data)\n",
|
||||
|
||||
Reference in New Issue
Block a user