# File size: 280 Bytes
# 86c65cb
# Quantization recipe: one stage (`default_stage`) containing one modifier
# group (`default_modifiers`) with a single `QuantizationModifier` entry.
# NOTE(review): layout looks like an llm-compressor recipe — confirm against
# the consuming tool before relying on key semantics.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # What the modifier is applied to.
      # NOTE(review): presumably a module class name — confirm.
      targets:
        - Linear
      # Entries excluded from the modifier. Items prefixed with `re:` appear
      # to be regular expressions and the unprefixed item a literal name —
      # verify the matching rules with the consumer.
      ignore:
        - lm_head
        - 're:.*visual.*'
        - 're:.*mlp.gate$'
        - 're:.*mlp.shared_expert_gate$'
        - 're:.*linear_attn.*'
        - 're:^mtp.*'
      # Name of the quantization scheme to apply.
      scheme: NVFP4
      # Divisibility checks are not bypassed.
      bypass_divisibility_checks: false