Hint users DeepEP normal mode is incompatible with CUDA Graph (#5014)
This commit is contained in:
@@ -323,6 +323,9 @@ class ServerArgs:
|
|||||||
assert (
|
assert (
|
||||||
not self.enable_dp_attention
|
not self.enable_dp_attention
|
||||||
), "DeepEP MoE `auto` mode is not supported with DP Attention."
|
), "DeepEP MoE `auto` mode is not supported with DP Attention."
|
||||||
|
if self.deepep_mode == "normal":
|
||||||
|
logger.warning("Cuda graph is disabled because deepep_mode=`normal`")
|
||||||
|
self.disable_cuda_graph = True
|
||||||
self.ep_size = self.tp_size
|
self.ep_size = self.tp_size
|
||||||
self.enable_sp_layernorm = (
|
self.enable_sp_layernorm = (
|
||||||
self.dp_size < self.tp_size if self.enable_dp_attention else True
|
self.dp_size < self.tp_size if self.enable_dp_attention else True
|
||||||
|
|||||||
Reference in New Issue
Block a user