From 45f75b4178f2e4e73b73d3323f6492defe6670ca Mon Sep 17 00:00:00 2001 From: aipaes <82140963+aipaes@users.noreply.github.com> Date: Thu, 23 Apr 2026 22:56:24 +0800 Subject: [PATCH] [Doc][v0.18.0]Fix minimax2.5 readme (#8638) ### What this PR does / why we need it? Correct the descriptive errors in the document. ### Does this PR introduce _any_ user-facing change? no ### How was this patch tested? doc test --------- Signed-off-by: zjks98 Co-authored-by: zjks98 --- docs/source/tutorials/models/MiniMax-M2.md | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/docs/source/tutorials/models/MiniMax-M2.md b/docs/source/tutorials/models/MiniMax-M2.md index 0b8f4238..2236a4d5 100644 --- a/docs/source/tutorials/models/MiniMax-M2.md +++ b/docs/source/tutorials/models/MiniMax-M2.md @@ -104,7 +104,7 @@ docker run -itd -u 0 --ipc=host --privileged \ --device /dev/davinci_manager \ --device /dev/devmm_svm \ --device /dev/hisi_hdc \ - --shm-size=1200g \ + --shm-size=1g \ -v /usr/local/dcmi:/usr/local/dcmi \ -v /usr/local/Ascend/driver/tools/hccn_tool:/usr/local/Ascend/driver/tools/hccn_tool \ -v /usr/local/bin/npu-smi:/usr/local/bin/npu-smi \ @@ -112,7 +112,7 @@ docker run -itd -u 0 --ipc=host --privileged \ -v /usr/local/Ascend/driver/version.info:/usr/local/Ascend/driver/version.info \ -v /etc/ascend_install.info:/etc/ascend_install.info \ -v /home/:/home/ \ - -v /opt/data/verification/:/opt/data/verification/ \ # Map the model weights here + -v /opt/data/verification/:/opt/data/verification/ \ -v /root/.cache:/root/.cache \ -v /mnt/performance/:/mnt/performance/ \ -it $IMAGE bash @@ -426,9 +426,9 @@ Use vLLM bench for the **190k/1k, concurrency=4, 16 prompts** scenario: ```{code-block} bash vllm bench serve --backend vllm \ --dataset-name prefix_repetition \ - --prefix-repetition-prefix-len 175104 \ # Input: 190×1024 tokens with 90% prefix repetition - --prefix-repetition-suffix-len 19440 \ # Input: 190×1024 tokens minus the prefix length above - --prefix-repetition-output-len 1024 \ # Output: 1024 tokens + --prefix-repetition-prefix-len 175104 \ + --prefix-repetition-suffix-len 19440 \ + --prefix-repetition-output-len 1024 \ --prefix-repetition-num-prefixes 1 \ --num-prompts 16 \ --max-concurrency 4 \