diff --git a/docs/source/tutorials/Qwen3-235B-A22B.md b/docs/source/tutorials/Qwen3-235B-A22B.md index 64ff19b8..85181437 100644 --- a/docs/source/tutorials/Qwen3-235B-A22B.md +++ b/docs/source/tutorials/Qwen3-235B-A22B.md @@ -112,7 +112,7 @@ vllm serve vllm-ascend/Qwen3-235B-A22B-w8a8 \ --seed 1024 \ --quantization ascend \ --served-model-name qwen3 \ ---max-num-seqs 4 \ +--max-num-seqs 32 \ --max-model-len 133000 \ --max-num-batched-tokens 8096 \ --enable-expert-parallel \