Revert "[Feature][Quant] Auto-detect quantization format from model f… (#6873)

This reverts commit 3953dcf784. to keep the basic functions available --------- Signed-off-by: wangli <wangli858794774@gmail.com>
2026-03-10 11:27:32 +08:00
parent 40f7d93f1a
commit 33234aa0c5
7 changed files with 12 additions and 584 deletions
--- a/tests/ut/quantization/test_modelslim_config.py
+++ b/tests/ut/quantization/test_modelslim_config.py
@@ -1,6 +1,3 @@
-import json
-import os
-import tempfile
 from unittest.mock import MagicMock, patch

 from vllm.model_executor.layers.fused_moe import FusedMoE
@@ -10,7 +7,6 @@ from vllm.model_executor.layers.linear import LinearBase
 from tests.ut.base import TestBase
 from vllm_ascend.ops.linear import AscendUnquantizedLinearMethod
 from vllm_ascend.quantization.modelslim_config import (
-    MODELSLIM_CONFIG_FILENAME,
    AscendModelSlimConfig,
 )
 from vllm_ascend.utils import ASCEND_QUANTIZATION_METHOD
@@ -57,7 +53,7 @@ class TestAscendModelSlimConfig(TestBase):

    def test_get_config_filenames(self):
        filenames = AscendModelSlimConfig.get_config_filenames()
-        self.assertEqual(filenames, [])
+        self.assertEqual(filenames, ["quant_model_description.json"])

    def test_from_config(self):
        config = AscendModelSlimConfig.from_config(self.sample_config)
@@ -165,90 +161,5 @@ class TestAscendModelSlimConfig(TestBase):
        with self.assertRaises(ValueError):
            config.is_layer_skipped_ascend("fused_layer", fused_mapping)

-    def test_init_with_none_config(self):
-        config = AscendModelSlimConfig(None)
-        self.assertEqual(config.quant_description, {})
-
-    def test_init_with_default_config(self):
-        config = AscendModelSlimConfig()
-        self.assertEqual(config.quant_description, {})
-
-    def test_maybe_update_config_already_populated(self):
-        # When quant_description is already populated, should be a no-op
-        self.assertTrue(len(self.ascend_config.quant_description) > 0)
-        self.ascend_config.maybe_update_config("/some/model/path")
-        # quant_description should remain unchanged
-        self.assertEqual(self.ascend_config.quant_description,
-                         self.sample_config)
-
-    def test_maybe_update_config_loads_from_file(self):
-        config = AscendModelSlimConfig()
-        self.assertEqual(config.quant_description, {})
-
-        quant_data = {"layer1.weight": "INT8", "layer2.weight": "FLOAT"}
-        with tempfile.TemporaryDirectory() as tmpdir:
-            config_path = os.path.join(tmpdir, MODELSLIM_CONFIG_FILENAME)
-            with open(config_path, "w") as f:
-                json.dump(quant_data, f)
-
-            config.maybe_update_config(tmpdir)
-
-        self.assertEqual(config.quant_description, quant_data)
-
-    def test_maybe_update_config_raises_when_file_missing(self):
-        config = AscendModelSlimConfig()
-
-        with tempfile.TemporaryDirectory() as tmpdir:
-            with self.assertRaises(ValueError) as ctx:
-                config.maybe_update_config(tmpdir)
-
-            error_msg = str(ctx.exception)
-            self.assertIn("ModelSlim Quantization Config Not Found", error_msg)
-            self.assertIn(MODELSLIM_CONFIG_FILENAME, error_msg)
-
-    def test_maybe_update_config_raises_with_json_files_listed(self):
-        config = AscendModelSlimConfig()
-
-        with tempfile.TemporaryDirectory() as tmpdir:
-            # Create a dummy json file that is NOT the config file
-            dummy_path = os.path.join(tmpdir, "config.json")
-            with open(dummy_path, "w") as f:
-                json.dump({"dummy": True}, f)
-
-            with self.assertRaises(ValueError) as ctx:
-                config.maybe_update_config(tmpdir)
-
-            error_msg = str(ctx.exception)
-            self.assertIn("config.json", error_msg)
-
-    def test_maybe_update_config_non_directory_raises(self):
-        config = AscendModelSlimConfig()
-
-        with self.assertRaises(ValueError) as ctx:
-            config.maybe_update_config("not_a_real_directory_path")
-
-        error_msg = str(ctx.exception)
-        self.assertIn("ModelSlim Quantization Config Not Found", error_msg)
-
-    def test_apply_extra_quant_adaptations_shared_head(self):
-        config = AscendModelSlimConfig()
-        config.quant_description = {
-            "model.layers.0.shared_head.weight": "INT8",
-        }
-        config._apply_extra_quant_adaptations()
-        self.assertIn("model.layers.0.weight", config.quant_description)
-        self.assertEqual(config.quant_description["model.layers.0.weight"],
-                         "INT8")
-
-    def test_apply_extra_quant_adaptations_weight_packed(self):
-        config = AscendModelSlimConfig()
-        config.quant_description = {
-            "model.layers.0.weight_packed": "INT8",
-        }
-        config._apply_extra_quant_adaptations()
-        self.assertIn("model.layers.0.weight", config.quant_description)
-        self.assertEqual(config.quant_description["model.layers.0.weight"],
-                         "INT8")
-
    def test_get_scaled_act_names(self):
        self.assertEqual(self.ascend_config.get_scaled_act_names(), [])