Apply sgl w8a8 fp8 kernel (#3148)

This commit is contained in:
HandH1998
2025-03-09 16:03:32 +08:00
committed by GitHub
parent 9fb48f951f
commit 0dd6cda288
13 changed files with 523 additions and 37 deletions

View File

@@ -405,6 +405,7 @@ class ServerArgs:
"gguf",
"modelopt",
"w8a8_int8",
"w8a8_fp8",
],
help="The quantization method.",
)