From 02431b9ad21ca779000ed49f1fe60eb3498f7520 Mon Sep 17 00:00:00 2001 From: Yineng Zhang Date: Sun, 26 Jan 2025 21:30:00 +0800 Subject: [PATCH] fix link in README (#3153) --- sgl-kernel/developer_guide.md | 2 +- sgl-kernel/setup.py | 3 --- 2 files changed, 1 insertion(+), 4 deletions(-) diff --git a/sgl-kernel/developer_guide.md b/sgl-kernel/developer_guide.md index 26426d90d..2b9859d94 100644 --- a/sgl-kernel/developer_guide.md +++ b/sgl-kernel/developer_guide.md @@ -26,7 +26,7 @@ Third-party libraries: Steps to add a new kernel: 1. Implement in [src/sgl-kernel/csrc/](https://github.com/sgl-project/sglang/tree/main/sgl-kernel/src/sgl-kernel/csrc) -2. Expose interface in [src/sgl-kernel/include/sgl_kernel_ops.h](https://github.com/sgl-project/sglang/blob/main/sgl-kernel/src/sgl-kernel/include/sgl_kernel_ops.h) +2. Expose interface in [src/sgl-kernel/include/sgl_kernels_ops.h](https://github.com/sgl-project/sglang/blob/main/sgl-kernel/src/sgl-kernel/include/sgl_kernels_ops.h) 3. Create torch extension in [src/sgl-kernel/torch_extension.cc](https://github.com/sgl-project/sglang/blob/main/sgl-kernel/src/sgl-kernel/torch_extension.cc) 4. Create Python wrapper in [src/sgl-kernel/ops/\_\_init\_\_.py](https://github.com/sgl-project/sglang/blob/main/sgl-kernel/src/sgl-kernel/ops/__init__.py) 5. Expose Python interface in [src/sgl-kernel/\_\_init\_\_.py](https://github.com/sgl-project/sglang/blob/main/sgl-kernel/src/sgl-kernel/__init__.py) diff --git a/sgl-kernel/setup.py b/sgl-kernel/setup.py index c8469dc1c..b982f2b1c 100644 --- a/sgl-kernel/setup.py +++ b/sgl-kernel/setup.py @@ -88,7 +88,6 @@ sources = [ "src/sgl-kernel/csrc/rotary_embedding.cu", "3rdparty/flashinfer/csrc/activation.cu", "3rdparty/flashinfer/csrc/bmm_fp8.cu", - "3rdparty/flashinfer/csrc/group_gemm.cu", "3rdparty/flashinfer/csrc/norm.cu", "3rdparty/flashinfer/csrc/sampling.cu", "3rdparty/flashinfer/csrc/renorm.cu", @@ -103,7 +102,6 @@ sm_version = _get_device_sm() if torch.cuda.is_available(): if cuda_version >= (12, 0) and sm_version >= 90: nvcc_flags.append("-gencode=arch=compute_90a,code=sm_90a") - sources.append("3rdparty/flashinfer/csrc/group_gemm_sm90.cu") if sm_version >= 90: nvcc_flags.extend(nvcc_flags_fp8) if sm_version >= 80: @@ -112,7 +110,6 @@ else: # compilation environment without GPU if enable_sm90a: nvcc_flags.append("-gencode=arch=compute_90a,code=sm_90a") - sources.append("3rdparty/flashinfer/csrc/group_gemm_sm90.cu") if enable_fp8: nvcc_flags.extend(nvcc_flags_fp8) if enable_bf16: