ROCm: update aiter and its usage to fused moe (bfloat16, fp8, fp8 block-quant) (#4053)
This commit is contained in:
@@ -51,7 +51,7 @@ srt = [
|
||||
]
|
||||
|
||||
# HIP (Heterogeneous-computing Interface for Portability) for AMD
|
||||
# => base docker rocm/vllm-dev:20241022, not from public vllm whl
|
||||
# => base docker rocm/vllm-dev:20250114, not from public vllm whl
|
||||
srt_hip = ["sglang[runtime_common]", "sgl-kernel==0.0.3.post6", "torch", "vllm==0.6.7.dev2", "outlines==0.1.11"]
|
||||
|
||||
# xpu is not enabled in public vllm and torch whl,
|
||||
|
||||
Reference in New Issue
Block a user