Amd test fp8 (#4261)
This commit is contained in:
@@ -237,6 +237,7 @@ class ModelConfig:
|
||||
"compressed_tensors",
|
||||
"compressed-tensors",
|
||||
"fbgemm_fp8",
|
||||
"w8a8_fp8",
|
||||
]
|
||||
optimized_quantization_methods = [
|
||||
"fp8",
|
||||
|
||||
Reference in New Issue
Block a user