初始化项目,由ModelHub XC社区提供模型
Model: cyankiwi/Qwen3-VL-8B-Instruct-AWQ-4bit Source: Original Platform
This commit is contained in:
33
recipe.yaml
Normal file
33
recipe.yaml
Normal file
@@ -0,0 +1,33 @@
# Quantization recipe: one stage containing a single AWQModifier.
# NOTE(review): the indentation below was reconstructed from a flattened diff
# rendering; the nesting follows the llm-compressor recipe schema — confirm
# against the upstream recipe.yaml before relying on it.
default_stage:
  default_modifiers:
    AWQModifier:
      config_groups:
        group_0:
          targets: [Linear]
          # Weight-only scheme: 4-bit symmetric integers in groups of 32.
          weights:
            num_bits: 4
            type: int
            symmetric: true
            group_size: 32
            strategy: group
            block_structure: null
            dynamic: false
            actorder: null
            observer: mse
            observer_kwargs: {}
          # No activation quantization is configured for this group.
          input_activations: null
          output_activations: null
          format: null
      targets: [Linear]
      # Modules excluded from the modifier. Entries prefixed with `re:` are
      # presumably interpreted as regular expressions by the consumer —
      # TODO confirm.
      ignore:
        - 're:.*embed_tokens'
        - 're:.*input_layernorm$'
        - 're:.*mlp[.]gate$'
        - 're:.*post_attention_layernorm$'
        - 're:.*norm$'
        - 're:model[.]visual.*'
        - lm_head
      # Each mapping pairs one smooth_layer pattern with its balance_layers.
      mappings:
        - smooth_layer: 're:.*input_layernorm$'
          balance_layers: ['re:.*q_proj$', 're:.*k_proj$', 're:.*v_proj$']
        - smooth_layer: 're:.*v_proj$'
          balance_layers: ['re:.*o_proj$']
        - smooth_layer: 're:.*post_attention_layernorm$'
          balance_layers: ['re:.*gate_proj$', 're:.*up_proj$']
        - smooth_layer: 're:.*up_proj$'
          balance_layers: ['re:.*down_proj$']
      duo_scaling: true
Reference in New Issue
Block a user