From 07e58a2dcbfe3ad4c4f3d13e955fe0a00b37c74c Mon Sep 17 00:00:00 2001 From: Yineng Zhang Date: Thu, 6 Feb 2025 07:13:05 +0800 Subject: [PATCH] update README (#3324) --- benchmark/deepseek_v3/README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/benchmark/deepseek_v3/README.md b/benchmark/deepseek_v3/README.md index ea972831a..387a6629f 100644 --- a/benchmark/deepseek_v3/README.md +++ b/benchmark/deepseek_v3/README.md @@ -31,7 +31,7 @@ For high QPS scenarios, add the `--enable-dp-attention` argument to boost throug ### Using pip ```bash # Installation -pip install "sglang[all]>=0.4.1.post5" --find-links https://flashinfer.ai/whl/cu124/torch2.4/flashinfer +pip install "sglang[all]>=0.4.2.post2" --find-links https://flashinfer.ai/whl/cu124/torch2.5/flashinfer # Launch python3 -m sglang.launch_server --model deepseek-ai/DeepSeek-V3 --tp 8 --trust-remote-code