From 31eec35ba81cd41313807e693ecf1c872b60103b Mon Sep 17 00:00:00 2001 From: Yineng Zhang Date: Fri, 14 Feb 2025 10:11:31 +0800 Subject: [PATCH] fix doc (#3558) --- docs/backend/speculative_decoding.ipynb | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/backend/speculative_decoding.ipynb b/docs/backend/speculative_decoding.ipynb index 7103469fc..fb748901b 100644 --- a/docs/backend/speculative_decoding.ipynb +++ b/docs/backend/speculative_decoding.ipynb @@ -47,7 +47,7 @@ " \"\"\"\n", "python3 -m sglang.launch_server --model meta-llama/Llama-2-7b-chat-hf --speculative-algo EAGLE \\\n", " --speculative-draft lmzheng/sglang-EAGLE-llama2-chat-7B --speculative-num-steps 5 \\\n", - " --speculative-eagle-topk 8 --speculative-num-draft-tokens 64 --mem-fraction 0.7 --port=30020\n", + " --speculative-eagle-topk 8 --speculative-num-draft-tokens 64 --mem-fraction 0.7 --port=30020 --cuda-graph-max-bs 32\n", "\"\"\"\n", ")\n", "\n",