[sgl-kernel] update deepgemm (#6942)

This commit is contained in:
JieXin Liang
2025-06-07 14:24:41 +08:00
committed by GitHub
parent c4ffbeca19
commit 22fe787852
2 changed files with 5 additions and 2 deletions

View File

@@ -1719,7 +1719,10 @@ class DeepseekV2ForCausalLM(nn.Module):
 logger,
 "Only Deepseek V3/R1 on NV-platform can use shared experts fusion optimization. Shared experts fusion optimization is disabled.",
 )
-elif (global_server_args_dict["enable_deepep_moe"] or global_server_args_dict["enable_ep_moe"]):
+elif (
+global_server_args_dict["enable_deepep_moe"]
+or global_server_args_dict["enable_ep_moe"]
+):
 self.num_fused_shared_experts = 0
 global_server_args_dict["disable_shared_experts_fusion"] = True
 log_info_on_rank0(

View File

@@ -53,7 +53,7 @@ FetchContent_Populate(repo-cutlass)
 FetchContent_Declare(
 repo-deepgemm
 GIT_REPOSITORY https://github.com/deepseek-ai/DeepGEMM
-GIT_TAG d75b218b7b8f4a5dd5406ac87905039ead3ae42f
+GIT_TAG 8dfa3298274bfe6b242f6f8a3e6f3eff2707dd9f
 GIT_SHALLOW OFF
 )
 FetchContent_Populate(repo-deepgemm)