[kernel] port rope cuda kernel to sgl-kernel (#2993)

Co-authored-by: Yineng Zhang <me@zhyncs.com>
This commit is contained in:
Byron Hsu
2025-01-20 04:58:51 -08:00
committed by GitHub
parent 73401fd016
commit b5caa22dfb
8 changed files with 255 additions and 1 deletions

View File

@@ -53,6 +53,7 @@ ext_modules = [
"src/sgl-kernel/csrc/int8_gemm_kernel.cu",
"src/sgl-kernel/csrc/sampling_scaling_penalties.cu",
"src/sgl-kernel/csrc/sgl_kernel_ops.cu",
"src/sgl-kernel/csrc/rotary_embedding.cu",
],
include_dirs=include_dirs,
extra_compile_args={