Revert "[1/2] sgl-kernel: Fuse routed scaling factor into select_experts" (#8706)
This commit is contained in:
@@ -243,8 +243,7 @@ std::vector<at::Tensor> moe_fused_gate(
     int64_t topk_group,
     int64_t topk,
     int64_t num_fused_shared_experts,
-    double routed_scaling_factor,
-    bool apply_routed_scaling_factor_on_output);
+    double routed_scaling_factor);
 
 void fp8_blockwise_scaled_grouped_mm(
     torch::Tensor& output,
Reference in New Issue
Block a user