Hint users that DeepEP normal mode is incompatible with CUDA Graph (#5014)

This commit is contained in:
fzyzcjy
2025-05-07 22:40:59 +08:00
committed by GitHub
parent 38053c3372
commit 4c7b42424c

View File

@@ -323,6 +323,9 @@ class ServerArgs:
assert (
not self.enable_dp_attention
), "DeepEP MoE `auto` mode is not supported with DP Attention."
if self.deepep_mode == "normal":
logger.warning("Cuda graph is disabled because deepep_mode=`normal`")
self.disable_cuda_graph = True
self.ep_size = self.tp_size
self.enable_sp_layernorm = (
self.dp_size < self.tp_size if self.enable_dp_attention else True