enable auto-round quantization model (#6226)
Signed-off-by: Zhang, Weiwei1 <weiwei1.zhang@intel.com>
This commit is contained in:
@@ -80,6 +80,7 @@ QUANTIZATION_CHOICES = [
|
||||
"qoq",
|
||||
"w4afp8",
|
||||
"mxfp4",
|
||||
"auto-round",
|
||||
]
|
||||
|
||||
ATTENTION_BACKEND_CHOICES = [
|
||||
|
||||
Reference in New Issue
Block a user