ROCm: update aiter and its usage to fused moe (bfloat16, fp8, fp8 block-quant) (#4053)

This commit is contained in:
HAI
2025-03-04 03:00:46 -08:00
committed by GitHub
parent e0a2c96308
commit 51d25405a7
4 changed files with 82 additions and 40 deletions

View File

@@ -51,7 +51,7 @@ srt = [
]
# HIP (Heterogeneous-computing Interface for Portability) for AMD
# => base docker rocm/vllm-dev:20241022, not from public vllm whl
# => base docker rocm/vllm-dev:20250114, not from public vllm whl
srt_hip = ["sglang[runtime_common]", "sgl-kernel==0.0.3.post6", "torch", "vllm==0.6.7.dev2", "outlines==0.1.11"]
# xpu is not enabled in public vllm and torch whl,