DP Attention with Auto DeepEP Dispatch (#7222)
This commit is contained in:
@@ -418,10 +418,6 @@ class ServerArgs:
|
||||
|
||||
# DeepEP MoE
|
||||
if self.enable_deepep_moe:
|
||||
if self.deepep_mode == "auto":
|
||||
assert (
|
||||
not self.enable_dp_attention
|
||||
), "DeepEP MoE `auto` mode is not supported with DP Attention."
|
||||
if self.deepep_mode == "normal":
|
||||
logger.warning("Cuda graph is disabled because deepep_mode=`normal`")
|
||||
self.disable_cuda_graph = True
|
||||
|
||||
Reference in New Issue
Block a user