diff --git a/tests/e2e/nightly/multi_node/config/DeepSeek-V3_2-W8A8-A3-dual-nodes.yaml b/tests/e2e/nightly/multi_node/config/DeepSeek-V3_2-W8A8-A3-dual-nodes.yaml index a7851471..771b70a0 100644 --- a/tests/e2e/nightly/multi_node/config/DeepSeek-V3_2-W8A8-A3-dual-nodes.yaml +++ b/tests/e2e/nightly/multi_node/config/DeepSeek-V3_2-W8A8-A3-dual-nodes.yaml @@ -39,7 +39,6 @@ deployment: --trust-remote-code --speculative-config '{"num_speculative_tokens": 3, "method":"deepseek_mtp"}' --compilation-config '{"cudagraph_capture_sizes": [8, 16, 24, 32, 40, 48], "cudagraph_mode": "FULL_DECODE_ONLY"}' - --additional-config '{"layer_sharding": ["q_b_proj", "o_proj"]}' --tokenizer-mode deepseek_v32 --reasoning-parser deepseek_v3 @@ -64,7 +63,6 @@ deployment: --trust-remote-code --speculative-config '{"num_speculative_tokens": 3, "method":"deepseek_mtp"}' --compilation-config '{"cudagraph_capture_sizes": [8, 16, 24, 32, 40, 48], "cudagraph_mode": "FULL_DECODE_ONLY"}' - --additional-config '{"layer_sharding": ["q_b_proj", "o_proj"]}' --tokenizer-mode deepseek_v32 --reasoning-parser deepseek_v3 benchmarks: diff --git a/tests/e2e/nightly/single_node/models/configs/DeepSeek-V3.2-W8A8.yaml b/tests/e2e/nightly/single_node/models/configs/DeepSeek-V3.2-W8A8.yaml index 1ab0b3ea..7931c974 100644 --- a/tests/e2e/nightly/single_node/models/configs/DeepSeek-V3.2-W8A8.yaml +++ b/tests/e2e/nightly/single_node/models/configs/DeepSeek-V3.2-W8A8.yaml @@ -38,8 +38,6 @@ test_cases: - '{"cudagraph_capture_sizes":[4, 8, 16, 20, 24, 28, 32], "cudagraph_mode":"FULL_DECODE_ONLY"}' - "--speculative-config" - '{"num_speculative_tokens": 3, "method":"deepseek_mtp"}' - - "--additional-config" - - '{"layer_sharding": ["q_b_proj", "o_proj"]}' - "--reasoning-parser" - "deepseek_v3" - "--tokenizer_mode"