# Quantization recipe: one stage (`default_stage`) containing one modifier
# group (`default_modifiers`) with a single `QuantizationModifier` entry.
# NOTE(review): the key layout looks like an llm-compressor recipe; confirm
# against the tool that consumes this file.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # Module type(s) the modifier is applied to.
      targets: [Linear]

      # Modules left out of quantization. Entries starting with `re:` are
      # presumably regular expressions matched against module names, and the
      # bare entry an exact name -- verify against the consumer.
      # Single quotes keep the backslashes in the patterns literal.
      ignore:
        - lm_head
        - 're:.*embed_tokens$'
        - 're:.*linear_attn\.conv1d$'
        - 're:.*linear_attn\.in_proj_a$'
        - 're:.*linear_attn\.in_proj_b$'
        - 're:.*mlp\.gate$'
        - 're:.*mlp\.shared_expert_gate$'
        - 're:.*visual\..*'
        - 're:^mtp\..*'

      # Named quantization scheme applied to the targeted modules.
      scheme: FP8_DYNAMIC

      # NOTE(review): presumably keeps the consumer's shape-divisibility
      # validation enabled -- confirm the exact meaning in its documentation.
      bypass_divisibility_checks: false