# Quantization recipe: a single config group applied to Linear modules.
#   - weights: 8-bit float, symmetric, per-channel strategy, "mse" observer
#   - input activations: 8-bit float, symmetric, per-token strategy,
#     dynamic (observer explicitly null)
#   - output activations: not quantized (null)
#
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been lost. `ignore` and the second `targets` are placed on
# the modifier itself (not inside group_0), because a second `targets` key in
# group_0 would be a duplicate key. Confirm against the consuming tool's
# recipe schema.
default_stage:
  default_modifiers:
    QuantizationModifier:
      config_groups:
        group_0:
          targets: [Linear]
          weights:
            num_bits: 8
            type: float
            symmetric: true
            strategy: channel
            observer: mse
          input_activations:
            num_bits: 8
            type: float
            symmetric: true
            strategy: token
            dynamic: true
            observer: null
          output_activations: null
      # Entries prefixed with `re:` carry a pattern after the prefix
      # (presumably a regular expression matched against module names;
      # verify against the consumer).
      ignore:
        - 're:.*lm_head'
        - 're:.*self_attn'
        - 're:.*router'
        - 're:.*vision_model'
        - 're:.*multi_modal_projector'
        - 're:.*shared_expert'
        - 're:.*feed_forward.gate_proj'
        - 're:.*feed_forward.up_proj'
        - 're:.*feed_forward.down_proj'
      targets: [Linear]
|