diff --git a/python/sglang/srt/layers/moe/ep_moe/layer.py b/python/sglang/srt/layers/moe/ep_moe/layer.py index a4c78c589..d2539edbf 100644 --- a/python/sglang/srt/layers/moe/ep_moe/layer.py +++ b/python/sglang/srt/layers/moe/ep_moe/layer.py @@ -229,7 +229,7 @@ class EPMoE(FusedMoE): ( _cast_to_e8m0_with_rounding_up(gateup_input_scale) if deep_gemm_wrapper.DEEPGEMM_SCALE_UE8M0 - else deep_gemm_wrapper.get_col_major_tma_aligned_tensor( + else deep_gemm_wrapper.get_mn_major_tma_aligned_tensor( gateup_input_scale ) ), @@ -286,9 +286,7 @@ class EPMoE(FusedMoE): ( down_input_scale if deep_gemm_wrapper.DEEPGEMM_SCALE_UE8M0 - else deep_gemm_wrapper.get_col_major_tma_aligned_tensor( - down_input_scale - ) + else deep_gemm_wrapper.get_mn_major_tma_aligned_tensor(down_input_scale) ), ) down_output = torch.empty(