# Quantization recipe: a single stage (`default_stage`) whose
# `default_modifiers` holds one modifier entry, `AWQModifier`.
# NOTE(review): field semantics are defined by the consuming library
# (this looks like an llm-compressor recipe) — confirm against its docs.
default_stage:
  default_modifiers:
    AWQModifier:
      targets: [Linear]
      # Module-name patterns listed under `ignore`. The `re:` prefix
      # presumably marks the remainder as a regular expression — confirm.
      # NOTE(review): the per-layer `fc2` entries (encoder layers 0-26)
      # look machine-generated; they are kept verbatim.
      ignore:
        - 're:.*lm_head.*'
        - 're:.*embed_tokens.*'
        - 're:vision_tower.*'
        - 're:multi_modal_projector.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.0.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.1.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.2.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.3.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.4.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.5.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.6.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.7.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.8.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.9.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.10.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.11.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.12.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.13.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.14.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.15.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.16.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.17.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.18.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.19.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.20.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.21.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.22.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.23.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.24.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.25.mlp.fc2.*'
        - 're:.*model.vision_tower.vision_model.encoder.layers.26.mlp.fc2.*'
      scheme: W4A16
      sequential_targets: [Gemma3DecoderLayer]
      # Each entry pairs one `smooth_layer` pattern with the list of
      # `balance_layers` patterns associated with it.
      mappings:
        - smooth_layer: 're:.*input_layernorm$'
          balance_layers:
            - 're:.*q_proj$'
            - 're:.*k_proj$'
            - 're:.*v_proj$'
        - smooth_layer: 're:.*v_proj$'
          balance_layers:
            - 're:.*o_proj$'
        - smooth_layer: 're:.*pre_feedforward_layernorm$'
          balance_layers:
            - 're:.*gate_proj$'
            - 're:.*up_proj$'
        - smooth_layer: 're:.*up_proj$'
          balance_layers:
            - 're:.*down_proj$'
      # NOTE(review): placed as a modifier-level option (sibling of
      # `mappings`), not as a field of the last mapping entry — confirm.
      duo_scaling: true