support blockwise fp8 matmul kernel (#3267)
This commit is contained in:
@@ -96,6 +96,7 @@ sources = [
|
||||
"src/sgl-kernel/csrc/moe_align_kernel.cu",
|
||||
"src/sgl-kernel/csrc/int8_gemm_kernel.cu",
|
||||
"src/sgl-kernel/csrc/fp8_gemm_kernel.cu",
|
||||
"src/sgl-kernel/csrc/fp8_blockwise_gemm_kernel.cu",
|
||||
"src/sgl-kernel/csrc/lightning_attention_decode_kernel.cu",
|
||||
"src/sgl-kernel/csrc/fused_add_rms_norm_kernel.cu",
|
||||
"src/sgl-kernel/csrc/eagle_utils.cu",
|
||||
|
||||
Reference in New Issue
Block a user