# Single stage named `default_stage` holding one modifier group.
# NOTE(review): looks like a model-quantization recipe; confirm the
# consuming tool and its schema before changing key names.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # Layer types the modifier is applied to.
      targets: [Linear]
      # Names excluded from the modifier. The `re:` prefix presumably marks
      # the rest of the string as a regular expression; verify with the
      # consumer. Single quotes keep the patterns literal (no escapes).
      ignore:
        - 're:.*embed_tokens.*'
        - 're:.*lm_head.*'
      # Preset scheme name. Presumably 8-bit weights with 16-bit
      # activations; TODO confirm against the consumer's scheme list.
      scheme: W8A16