# Quantization recipe: a single stage (default_stage) containing one
# AWQModifier.
# NOTE(review): nesting was reconstructed from a flattened copy of this file
# (indentation had been lost); confirm it against the original recipe before
# relying on it.
default_stage:
  default_modifiers:
    AWQModifier:
      config_groups:
        group_0:
          # Module types this quantization scheme is applied to.
          targets: [Linear]
          # Weights: 4-bit symmetric integers, non-dynamic, group strategy
          # with group_size 32, using the "mse" observer.
          weights:
            num_bits: 4
            type: int
            symmetric: true
            group_size: 32
            strategy: group
            block_structure: null
            dynamic: false
            actorder: null
            observer: mse
            observer_kwargs: {}
          # No activation quantization is configured (both are null).
          input_activations: null
          output_activations: null
          format: null
      targets: [Linear]
      # Module-name patterns left out of the modifier. Entries prefixed with
      # "re:" are presumably regular expressions - confirm with the consumer.
      ignore:
        - 're:.*embed_tokens'
        - 're:.*input_layernorm$'
        - 're:.*mlp[.]gate$'
        - 're:.*post_attention_layernorm$'
        - 're:.*norm$'
        - 're:model[.]visual.*'
        - lm_head
      # Each mapping pairs one smooth_layer pattern with the balance_layers
      # patterns associated with it.
      mappings:
        - smooth_layer: 're:.*input_layernorm$'
          balance_layers: ['re:.*q_proj$', 're:.*k_proj$', 're:.*v_proj$']
        - smooth_layer: 're:.*v_proj$'
          balance_layers: ['re:.*o_proj$']
        - smooth_layer: 're:.*post_attention_layernorm$'
          balance_layers: ['re:.*gate_proj$', 're:.*up_proj$']
        - smooth_layer: 're:.*up_proj$'
          balance_layers: ['re:.*down_proj$']
      duo_scaling: true