aiter attention-backend (default enabled on AMD/ROCm) (#6381)

This commit is contained in:
HAI
2025-05-20 22:52:41 -07:00
committed by GitHub
parent 30ca18f423
commit 5c0b38f369
9 changed files with 552 additions and 23 deletions

View File

@@ -957,6 +957,7 @@ class ServerArgs:
"--attention-backend",
type=str,
choices=[
"aiter",
"flashinfer",
"triton",
"torch_native",