Bump Flashinfer to 0.2.5 (#5870)

Co-authored-by: Yuhao Chen <yxckeis8@gmail.com>
This commit is contained in:
Baizhou Zhang
2025-04-29 19:50:57 -07:00
committed by GitHub
parent cc4a80caf6
commit 799789afed
6 changed files with 135 additions and 101 deletions

View File

@@ -37,7 +37,7 @@ runtime_common = [
"python-multipart",
"pyzmq>=25.1.2",
"soundfile==0.13.1",
-"torchao>=0.7.0",
+"torchao>=0.9.0",
"transformers==4.51.1",
"uvicorn",
"uvloop",
@@ -47,7 +47,7 @@ runtime_common = [
srt = [
"sglang[runtime_common]",
"sgl-kernel==0.1.0",
-"flashinfer_python==0.2.3",
+"flashinfer_python==0.2.5",
"torch==2.6.0",
"torchvision==0.21.0",
"cuda-python",