# Quantization recipe: one stage (`default_stage`) containing one modifier
# group (`default_modifiers`) with a single `QuantizationModifier` entry.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # NOTE(review): presumably the module class names the scheme is
      # applied to - confirm against the consumer's schema.
      targets: [Linear]
      # Entries excluded from quantization. Patterns are single-quoted so
      # the backslashes reach the consumer literally (no YAML escape
      # processing). NOTE(review): the `re:` prefix presumably marks an
      # entry as a regular expression rather than an exact name - confirm.
      ignore:
        - lm_head
        - 're:.*mlp\.gate$'
        - 're:.*mlp\.shared_expert_gate$'
        - 're:.*linear_attn.*'
        - 're:visual.*'
        - 're:model\.visual.*'
        - 're:.*mtp.*'
      # NOTE(review): looks like a preset scheme name resolved by the
      # consuming library - verify the exact spelling it expects.
      scheme: FP8_DYNAMIC
      bypass_divisibility_checks: false