[BugFix]Fix incorrect get_current_vllm_config (#5121)

### What this PR does / why we need it? This PR fixes some incorrect `get_current_vllm_config` calling, which creates empty vllm_config instead. ### Does this PR introduce _any_ user-facing change? No. ### How was this patch tested? - vLLM version: v0.12.0 - vLLM main: ad32e3e19c --------- Signed-off-by: Angazenn <supperccell@163.com>
2025-12-18 22:21:36 +08:00
parent fd9a47c04d
commit 632eab28b7
6 changed files with 12 additions and 15 deletions
--- a/vllm_ascend/ascend_config.py
+++ b/vllm_ascend/ascend_config.py
@@ -154,8 +154,7 @@ class AscendConfig:
        # npu_fused_infer_attention_score in some cases. We allow to execute
        # _npu_paged_attention in this cases. This should be removed once
        # npu_fused_infer_attention_score performs better on all scenarios.
-        self.pa_shape_list = additional_config.get("pa_shape_list",
-                                                   [1, 2, 3, 4])
+        self.pa_shape_list = additional_config.get("pa_shape_list", [])

        kv_cfg = vllm_config.kv_transfer_config
        if kv_cfg is not None and not getattr(kv_cfg, "_engine_id_patched",