[sgl-kernel][3/N] Support Expert Specialization Grouped GEMM (#11674)

This commit is contained in:
Qi Yuhang
2025-10-16 04:39:31 +08:00
committed by GitHub
parent f226d3da2a
commit 6c01844f45
7 changed files with 22 additions and 8 deletions

View File

@@ -12,6 +12,7 @@ def es_fp8_blockwise_scaled_grouped_mm(
stride_d,
problem_sizes,
expert_offsets,
workspace,
):
torch.ops.sgl_kernel.es_fp8_blockwise_scaled_grouped_mm.default(
output,
@@ -24,4 +25,5 @@ def es_fp8_blockwise_scaled_grouped_mm(
stride_d,
problem_sizes,
expert_offsets,
workspace,
)