Integration of TurboMind AWQ (#2828)

Co-authored-by: root <bjmsong@126.com>
This commit is contained in:
bjmsong
2025-01-13 20:14:16 +08:00
committed by GitHub
parent 51ab3ccf47
commit 17de02f98d
8 changed files with 411 additions and 2 deletions

View File

@@ -375,6 +375,7 @@ class ServerArgs:
"marlin",
"gptq_marlin",
"awq_marlin",
"awq_turbomind",
"bitsandbytes",
"gguf",
"modelopt",