Revert "enable auto-round quantization model (#6226)" (#10148)

This commit is contained in:
Yineng Zhang
2025-09-07 22:31:11 -07:00
committed by GitHub
parent c8295d2353
commit b7d1f17b8d
8 changed files with 0 additions and 528 deletions

View File

@@ -450,7 +450,6 @@ class ModelConfig:
"petit_nvfp4",
"quark",
"mxfp4",
"auto-round",
]
optimized_quantization_methods = [
"fp8",