初始化项目，由ModelHub XC社区提供模型

Model: RedHatAI/Qwen3-30B-A3B-Instruct-2507-quantized.w8a8 Source: Original Platform
2026-04-10 20:20:07 +08:00
commit 8a656e620a
20 changed files with 189727 additions and 0 deletions
--- a/recipe.yaml
+++ b/recipe.yaml
@@ -0,0 +1,46 @@
+quant_stage:  # only stage in this recipe; W8A8 setup: 8-bit weights and 8-bit input activations (see group_0)
+  quant_modifiers:  # two modifiers: SmoothQuantModifier, then GPTQModifier
+    SmoothQuantModifier:  # listed first; presumably applied before GPTQModifier -- TODO confirm ordering semantics
+      smoothing_strength: 0.7  # presumably the SmoothQuant alpha (migration strength) -- confirm against tool docs
+      mappings:  # one entry, written as a pair: [list of layer patterns, single layer pattern]
+      - - ['re:.*q_proj', 're:.*k_proj', 're:.*v_proj']  # 're:' looks like a regex-match prefix; names ending in q/k/v_proj
+        - re:.*input_layernorm  # presumably the norm layer paired with the projections above -- verify
+      ignore: []  # empty: no names excluded for this modifier
+    GPTQModifier:
+      config_groups:
+        group_0:  # the only group defined
+          targets: [Linear]
+          weights:  # int, 8 bits, symmetric, channel strategy, non-dynamic
+            num_bits: 8
+            type: int
+            symmetric: true
+            group_size: null  # unset; strategy below is channel, not group
+            strategy: channel
+            block_structure: null
+            dynamic: false
+            actorder: null  # NOTE(review): modifier-level actorder below is "static" -- confirm which value takes effect
+            scale_dtype: null
+            zp_dtype: null
+            observer: mse
+            observer_kwargs: {}  # empty: no extra observer arguments given
+          input_activations:  # int, 8 bits, symmetric, token strategy, dynamic
+            num_bits: 8
+            type: int
+            symmetric: true
+            group_size: null
+            strategy: token
+            block_structure: null
+            dynamic: true
+            actorder: null
+            scale_dtype: null
+            zp_dtype: null
+            observer: null  # NOTE(review): presumably unset because dynamic is true -- confirm
+            observer_kwargs: {}
+          output_activations: null  # no output-activation scheme set for this group
+          format: null
+      targets: [Linear]  # same target list as group_0 above
+      ignore: [lm_head, 're:.*mlp.gate$', 're:.*mlp.shared_expert_gate$']  # excluded: lm_head and names matching the two gate patterns (presumably MoE router gates -- verify); NOTE(review): '.' in 'mlp.gate' is unescaped
+      block_size: 128
+      dampening_frac: 0.1  # presumably the GPTQ Hessian dampening fraction -- confirm against tool docs
+      actorder: static
+      offload_hessians: false