Tiny fix missing expert location dispatch info (#6620)
This commit is contained in:
@@ -360,6 +360,9 @@ class DeepseekV2MoE(nn.Module):
|
||||
correction_bias=self.correction_bias,
|
||||
routed_scaling_factor=self.routed_scaling_factor,
|
||||
num_token_non_padded=forward_batch.num_token_non_padded,
|
||||
expert_location_dispatch_info=ExpertLocationDispatchInfo.init_new(
|
||||
layer_id=self.layer_id,
|
||||
),
|
||||
)
|
||||
else:
|
||||
topk_idx = torch.full(
|
||||
|
||||
Reference in New Issue
Block a user