[2/3] fix dsv3 awq issue (#4625)

Co-authored-by: 晟海 <huangtingwei.htw@antgroup.com>
Co-authored-by: laixinn <xielx@shanghaitech.edu.cn>
This commit is contained in:
AniZpZ
2025-04-04 08:36:39 +08:00
committed by GitHub
parent e53bf190bc
commit d95269f9b3
8 changed files with 1139 additions and 42 deletions

View File

@@ -258,6 +258,7 @@ class ModelConfig:
"experts_int8",
"w8a8_int8",
"w8a8_fp8",
"moe_wna16",
]
compatible_quantization_methods = {
"w8a8_int8": ["compressed-tensors", "compressed_tensors"],