integrate blockwise fp8 kernel (#3529)
This commit is contained in:
@@ -25,7 +25,7 @@ runtime_common = [
|
||||
]
|
||||
srt = [
|
||||
"sglang[runtime_common]", "cuda-python",
|
||||
"sgl-kernel>=0.0.3.post4", "torch", "vllm>=0.6.4.post1,<=0.7.2",
|
||||
"sgl-kernel>=0.0.3.post5", "torch", "vllm>=0.6.4.post1,<=0.7.2",
|
||||
"flashinfer_python>=0.2.0.post2", "outlines>=0.0.44,<=0.1.11"
|
||||
]
|
||||
|
||||
|
||||
Reference in New Issue
Block a user