# Quantization recipe: one stage (`quant_stage`) whose only modifier is
# GPTQModifier, configured with a single config group (`group_0`).
#
# NOTE(review): the nesting below was reconstructed from a copy of this file
# that had been collapsed onto one line (which is not parseable YAML). The
# placement of `config_groups` under GPTQModifier and of `targets` under
# `group_0` follows the usual layout for this kind of recipe -- confirm
# against the consuming tool's schema.
quant_stage:
  quant_modifiers:
    GPTQModifier:
      # Entries listed here are excluded from the modifier; presumably these
      # are module names (the model's output head) -- verify against consumer.
      ignore: [lm_head]
      config_groups:
        group_0:
          # 8-bit weights using the `tensor` strategy.
          weights:
            num_bits: 8
            strategy: tensor
          # 8-bit input activations using the `tensor` strategy.
          input_activations:
            num_bits: 8
            strategy: tensor
          # What this group applies to; presumably a layer/module class
          # name -- TODO confirm.
          targets: [Linear]