Revert "Integration of TurboMind AWQ" (#2866)

This commit is contained in:
Lianmin Zheng
2025-01-13 04:44:39 -08:00
committed by GitHub
parent f3516c2894
commit 6249e4a19e
8 changed files with 2 additions and 411 deletions

View File

@@ -28,7 +28,7 @@ runtime_common = [
srt = [
"sglang[runtime_common]", "cuda-python",
"sgl-kernel>=0.0.2.post11", "torch", "vllm>=0.6.3.post1,<=0.6.4.post1",
-"flashinfer==0.1.6", "turbomind"
+"flashinfer==0.1.6"
]
# HIP (Heterogeneous-computing Interface for Portability) for AMD