# Quantization recipe: one stage (`default_stage`) whose modifier list holds a
# single `QuantizationModifier`.
#
# NOTE(review): the nesting below was reconstructed from a flattened copy whose
# lines also carried trailing `| |` artifacts. `ignore` and the second `targets`
# are placed on the modifier (siblings of `config_groups`) because `group_0`
# already defines its own `targets` key -- confirm against the original recipe.
default_stage:
  default_modifiers:
    QuantizationModifier:
      config_groups:
        group_0:
          # This group applies to modules matched by `Linear`.
          targets: [Linear]
          # Weights: 8-bit float, symmetric, `channel` strategy, `mse` observer.
          weights: {num_bits: 8, type: float, symmetric: true, strategy: channel, observer: mse}
          # Input activations: 8-bit float, symmetric, `token` strategy.
          # `dynamic: true` with `observer: null` -- presumably scales are
          # computed at runtime rather than calibrated; confirm.
          input_activations: {num_bits: 8, type: float, symmetric: true, strategy: token,
            dynamic: true, observer: null}
          # No quantization settings are given for output activations.
          output_activations: null
      # Module-name patterns listed under `ignore`; the `re:` prefix presumably
      # marks each entry as a regular expression -- confirm.
      ignore: ['re:.*lm_head', 're:.*self_attn', 're:.*router', 're:.*vision_model', 're:.*multi_modal_projector']
      targets: [Linear]