# Quantization recipe: one stage containing a single QuantizationModifier.
# NOTE(review): key names look like an llm-compressor / SparseML style
# recipe - confirm against the consuming tool's schema.
quant_stage:
  quant_modifiers:
    QuantizationModifier:
      # Entries the modifier should skip (here: lm_head).
      ignore: [lm_head]
      # Entries the modifier applies to (here: Linear).
      targets: [Linear]
      # Name of the quantization scheme to use.
      scheme: FP8