[Fusion] normalize fusion naming and enable e2e test (#4693)

### What this PR does / why we need it?
This PR standardizes the fusion naming by renaming `enable_quantization_fusion` to `fuse_norm_quant`, and enables e2e testing.

### Does this PR introduce _any_ user-facing change?
N/A

### How was this patch tested?
CI passed with newly added and existing tests.

- vLLM version: v0.12.0
- vLLM main: ad32e3e19c

---------

Signed-off-by: wxsIcey <1790571317@qq.com>
2025-12-11 17:53:43 +08:00
parent 07c7131104
commit 18221c0e1d
8 changed files with 136 additions and 113 deletions
--- a/tests/ut/test_ascend_config.py
+++ b/tests/ut/test_ascend_config.py
@@ -41,14 +41,14 @@ class TestAscendConfig(TestBase):
        self.assertFalse(ascend_config.multistream_overlap_shared_expert)

        ascend_compilation_config = ascend_config.ascend_compilation_config
-        self.assertTrue(ascend_compilation_config.enable_quantization_fusion)
+        self.assertTrue(ascend_compilation_config.fuse_norm_quant)

    @_clean_up_ascend_config
    def test_init_ascend_config_with_additional_config(self):
        test_vllm_config = VllmConfig()
        test_vllm_config.additional_config = {
            "ascend_compilation_config": {
-                "enable_quantization_fusion": False,
+                "fuse_norm_quant": False,
            },
            "multistream_overlap_shared_expert": True,
            "expert_map_path": "test_expert_map_path",
@@ -60,7 +60,7 @@ class TestAscendConfig(TestBase):
        self.assertFalse(ascend_config.enable_npugraph_ex)

        ascend_compilation_config = ascend_config.ascend_compilation_config
-        self.assertFalse(ascend_compilation_config.enable_quantization_fusion)
+        self.assertFalse(ascend_compilation_config.fuse_norm_quant)

    @_clean_up_ascend_config
    def test_init_ascend_config_enable_npugraph_ex(self):