# Recipe with one stage (`default_stage`) whose `default_modifiers` group
# holds a single `QuantizationModifier` entry.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # NOTE(review): presumably the module class names to quantize;
      # confirm against the consuming tool's schema.
      targets: [Linear]
      # NOTE(review): presumably names/patterns exempted from `targets`;
      # confirm against the consuming tool's schema.
      ignore:
        - model.embed_tokens
        - lm_head
        # Single-quoted so the backslashes stay literal (no YAML escapes).
        # The `re:` prefix presumably marks the rest as a regex; verify.
        # The pattern accepts `model.layers.1` or `model.layers.2`,
        # optionally followed by `.` and anything up to end of string.
        # `model.layers.10` etc. do not fit: `[12]` must be followed by
        # `.` or the end of the string.
        - 're:model\.layers\.[12](\..*)?$'
      # NOTE(review): looks like a preset scheme name (4-bit weights,
      # 16-bit activations?); confirm the exact meaning with the consumer.
      scheme: W4A16