[sgl-kernel][2/N]Support Expert Specialization Grouped GEMM (#11534)

This commit is contained in:
Qi Yuhang
2025-10-14 07:24:48 +08:00
committed by GitHub
parent 6dc9ca8c85
commit dc48c4c0e3
4 changed files with 112 additions and 106 deletions

View File

@@ -244,7 +244,7 @@ from sgl_kernel.elementwise import (
rmsnorm,
silu_and_mul,
)
-from sgl_kernel.expert_specilization import es_fp8_blockwise_scaled_grouped_mm
+from sgl_kernel.expert_specialization import es_fp8_blockwise_scaled_grouped_mm
from sgl_kernel.fused_moe import fused_marlin_moe
from sgl_kernel.gemm import (
awq_dequantize,