# Quantization recipe with a single stage, `quant_stage`, that applies one
# QuantizationModifier.
#
# NOTE(review): this hierarchy was reconstructed from a single collapsed line
# (chained `key: key: ...` is not parseable YAML). Confirm the nesting below,
# in particular that `targets` belongs to the `fp8_linear` group.
quant_stage:
  quant_modifiers:
    QuantizationModifier:
      # Modules listed here are excluded from quantization.
      ignore: [lm_head]
      config_groups:
        # 8-bit float scheme applied to the module types listed in `targets`.
        fp8_linear:
          # NOTE(review): only input activations are configured (no `weights`
          # entry), and `strategy: channel` with `dynamic: false` is an unusual
          # pairing for activations; verify the consuming library accepts it.
          input_activations:
            num_bits: 8
            type: float
            strategy: channel
            dynamic: false
            symmetric: true
          targets: [Linear]