Hint users DeepEP normal mode is incompatible with CUDA Graph (#5014)
This commit is contained in:
@@ -323,6 +323,9 @@ class ServerArgs:
|
||||
assert (
|
||||
not self.enable_dp_attention
|
||||
), "DeepEP MoE `auto` mode is not supported with DP Attention."
|
||||
if self.deepep_mode == "normal":
|
||||
logger.warning("Cuda graph is disabled because deepep_mode=`normal`")
|
||||
self.disable_cuda_graph = True
|
||||
self.ep_size = self.tp_size
|
||||
self.enable_sp_layernorm = (
|
||||
self.dp_size < self.tp_size if self.enable_dp_attention else True
|
||||
|
||||
Reference in New Issue
Block a user