Revert "[feat] enable hierarchical mc2 ops on A2 by default (#5300)" (#5434)

We'll release 0.13.0 soon. The main branch is frozen. Let's revert the newest change and redo it once 0.13.0 is released. - vLLM version: release/v0.13.0 - vLLM main: 81786c8774 Signed-off-by: realliujiaxu <realliujiaxu@163.com>
2025-12-27 17:06:58 +08:00
parent 2add3dc3e0
commit 09f71c14a6
2 changed files with 20 additions and 10 deletions
--- a/vllm_ascend/utils.py
+++ b/vllm_ascend/utils.py
@@ -958,6 +958,14 @@ def calculate_dp_buffer_size() -> int:
    return max(dp_buffer_size, _MIN_DP_BUFFER_SIZE)


+# On A2, setting HCCL_INTRA_PCIE_ENABLE=1 and HCCL_INTRA_ROCE_ENABLE=0 can reduce
+# cross-machine traffic and significantly improve MC2 dispatch/combine performance.
+# Returns True only when both variables are set to exactly those string values.
+def is_hierarchical_communication_enabled():
+    return (os.getenv("HCCL_INTRA_ROCE_ENABLE", "") == "0"
+            and os.getenv("HCCL_INTRA_PCIE_ENABLE", "") == "1")
+
+
 def has_layer_idx(model_instance: torch.nn.Module) -> bool:
    if model_instance is None:
        return False