```yaml
default_stage:
  default_modifiers:
    QuantizationModifier:
      targets: [Linear]
      ignore: ['re:.*lm_head', 're:.*self_attn', 're:.*attn', 're:.*attention.*', 're:.*router']
      scheme: FP8_DYNAMIC
```
```yaml
default_stage:
  default_modifiers:
    QuantizationModifier:
      targets: [Linear]
      ignore: ['re:.*lm_head', 're:.*self_attn', 're:.*attn', 're:.*attention.*', 're:.*router']
      scheme: FP8_DYNAMIC
```