Fix DeepGEMM masked cannot be run on groups not being multiple or 4 (#5340)
This commit is contained in:
@@ -972,9 +972,6 @@ class DeepEPMoE(EPMoE):
|
|||||||
):
|
):
|
||||||
assert self.quant_method is not None
|
assert self.quant_method is not None
|
||||||
assert self.activation == "silu"
|
assert self.activation == "silu"
|
||||||
assert (
|
|
||||||
hidden_states_fp8[0].size(0) % 4 == 0
|
|
||||||
), f"TMA alignment error: {hidden_states_fp8[0].size(0)}"
|
|
||||||
|
|
||||||
# GroupGemm-0
|
# GroupGemm-0
|
||||||
num_groups, m, k = hidden_states_fp8[0].size()
|
num_groups, m, k = hidden_states_fp8[0].size()
|
||||||
|
|||||||
Reference in New Issue
Block a user