File size: 215 Bytes
05ccd2f
 
 
 
f9580de
05ccd2f
 
 
1
2
3
4
5
6
7
8
9
# Recipe with a single stage, `default_stage`, whose `default_modifiers`
# group configures two modifiers: SmoothQuantModifier and GPTQModifier.
default_stage:
  default_modifiers:
    # NOTE(review): listed before GPTQModifier; whether the consumer applies
    # modifiers in this order is not visible here -- confirm before reordering.
    SmoothQuantModifier:
      smoothing_strength: 0.7
    GPTQModifier:
      dampening_frac: 0.05
      # NOTE(review): presumably selects 8-bit weights and 8-bit activations;
      # verify the scheme name against the consuming library's presets.
      scheme: W8A8
      targets: Linear
      # Entries excluded from this modifier. The second entry carries an `re:`
      # prefix -- presumably marking it as a regular expression matched
      # against module names (TODO confirm). It stays quoted so the pattern
      # reaches the consumer as one literal string.
      ignore:
        - lm_head
        - 're:.*mlp.gate$'