chore: upgrade sgl-kernel 0.0.8.post3 (#5342)
This commit is contained in:
@@ -47,7 +47,7 @@ runtime_common = [
 
 srt = [
     "sglang[runtime_common]",
-    "sgl-kernel==0.0.8",
+    "sgl-kernel==0.0.8.post3",
     "flashinfer_python==0.2.3",
     "torch==2.5.1",
     "torchvision==0.20.1",
@@ -41,7 +41,7 @@ fp8_type_ = torch.float8_e4m3fnuz if _is_hip else torch.float8_e4m3fn
 
 _is_cuda = is_cuda()
 if _is_cuda:
-    import deep_gemm  # `pip install "sgl-kernel>=0.0.4.post3"`
+    import deep_gemm
     from sgl_kernel import sgl_per_token_group_quant_fp8, sgl_per_token_quant_fp8
 
     sm_version = get_device_sm()
@@ -20,7 +20,7 @@ pip install --upgrade pip
 
 # Install flashinfer and sgl-kernel
 pip install flashinfer_python==0.2.3 --find-links ${FLASHINFER_REPO} --no-cache-dir
-pip install sgl-kernel==0.0.8 --no-cache-dir
+pip install sgl-kernel==0.0.8.post3 --no-cache-dir
 
 # Install the main package
 pip install -e "python[all]" --find-links ${FLASHINFER_REPO}
Reference in New Issue
Block a user