Fix: DeepGEMM masked cannot be run when the number of groups is not a multiple of 4 (#5340)

This commit is contained in:
fzyzcjy
2025-04-19 13:38:07 +08:00
committed by GitHub
parent 2c11f9c2eb
commit 1e0806f30b

View File

@@ -972,9 +972,6 @@ class DeepEPMoE(EPMoE):
):
assert self.quant_method is not None
assert self.activation == "silu"
assert (
hidden_states_fp8[0].size(0) % 4 == 0
), f"TMA alignment error: {hidden_states_fp8[0].size(0)}"
# GroupGemm-0
num_groups, m, k = hidden_states_fp8[0].size()