Expert distribution recording without overhead for EPLB (#4957)
This commit is contained in:
@@ -390,7 +390,7 @@
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"expert_record_server_process, port = launch_server_cmd(\n",
|
||||
" \"python3 -m sglang.launch_server --model-path Qwen/Qwen1.5-MoE-A2.7B --host 0.0.0.0\"\n",
|
||||
" \"python3 -m sglang.launch_server --model-path Qwen/Qwen1.5-MoE-A2.7B --host 0.0.0.0 --expert-distribution-recorder-mode stat\"\n",
|
||||
")\n",
|
||||
"\n",
|
||||
"wait_for_server(f\"http://localhost:{port}\")"
|
||||
@@ -415,19 +415,7 @@
|
||||
"print_highlight(response)\n",
|
||||
"\n",
|
||||
"response = requests.post(f\"http://localhost:{port}/dump_expert_distribution_record\")\n",
|
||||
"print_highlight(response)\n",
|
||||
"\n",
|
||||
"import glob\n",
|
||||
"\n",
|
||||
"output_file = glob.glob(\"expert_distribution_*.csv\")[0]\n",
|
||||
"with open(output_file, \"r\") as f:\n",
|
||||
" print_highlight(\"\\n| Layer ID | Expert ID | Count |\")\n",
|
||||
" print_highlight(\"|----------|-----------|--------|\")\n",
|
||||
" next(f)\n",
|
||||
" for i, line in enumerate(f):\n",
|
||||
" if i < 9:\n",
|
||||
" layer_id, expert_id, count = line.strip().split(\",\")\n",
|
||||
" print_highlight(f\"| {layer_id:8} | {expert_id:9} | {count:6} |\")"
|
||||
"print_highlight(response)"
|
||||
]
|
||||
},
|
||||
{
|
||||
|
||||
Reference in New Issue
Block a user