Move cached kernel to srt.utils (#10776)

This commit is contained in:
Lifu Huang
2025-09-22 23:00:36 -07:00
committed by GitHub
parent 063c3791fe
commit 9241f4fd20
4 changed files with 120 additions and 122 deletions

View File

@@ -5,7 +5,7 @@ import triton
import triton.language as tl
from sglang.srt.lora.utils import LoRABatchInfo
-from sglang.utils import cached_triton_kernel
+from sglang.srt.utils import cached_triton_kernel
@cached_triton_kernel(lambda _, kwargs: (kwargs["NUM_SLICES"], kwargs["BLOCK_M"]))

View File

@@ -3,7 +3,7 @@ import triton
import triton.language as tl
from sglang.srt.lora.utils import LoRABatchInfo
-from sglang.utils import cached_triton_kernel
+from sglang.srt.utils import cached_triton_kernel
@cached_triton_kernel(lambda _, kwargs: (kwargs["NUM_SLICES"], kwargs["BLOCK_M"]))