[feature] Ascend quantization support (#7791)

Co-authored-by: ichernob <ichernobnn@gmail.com>
Co-authored-by: liupeng <liupeng374@huawei.com>
2025-07-10 19:17:37 +03:00
parent 4a0d19198b
commit 766392c6bd
13 changed files with 889 additions and 34 deletions
--- a/python/sglang/srt/configs/model_config.py
+++ b/python/sglang/srt/configs/model_config.py
@@ -413,7 +413,9 @@ class ModelConfig:
        quant_cfg = self._parse_quant_hf_config()

        if quant_cfg is not None:
-            quant_method = quant_cfg.get("quant_method", "").lower()
+            quant_method = quant_cfg.get(
+                "quant_method", "" if not self.quantization else self.quantization
+            ).lower()

            # Detect which checkpoint is it
            for _, method in QUANTIZATION_METHODS.items():