Files
LLMC_SmoothQuant88/recipe.yaml

12 lines
254 B
YAML
Raw Permalink Normal View History

# Compression recipe: a single stage (`default_stage`) whose
# `default_modifiers` mapping configures two modifiers,
# SmoothQuantModifier and GPTQModifier. Both list `lm_head` under `ignore`.
#
# NOTE(review): the nesting here was reconstructed. With every key at
# column 0 the stage and modifier keys parse as null and `ignore` appears
# twice in the same mapping (a duplicate key; most parsers silently keep the
# last one). Arguments are attached to the modifier name they follow —
# confirm against the upstream recipe.
default_stage:
  default_modifiers:
    SmoothQuantModifier:
      smoothing_strength: 0.8
      ignore: [lm_head]
      num_calibration_steps: 2048
    GPTQModifier:
      block_size: 128
      # Plain string scheme name; presumably 8-bit weights and 8-bit
      # activations — verify against the consumer's preset list.
      scheme: W8A8
      targets: Linear
      ignore: [lm_head]