# Quantization recipe: one stage (`default_stage`) containing one modifier
# group (`default_modifiers`) with a single `QuantizationModifier` entry.
# NOTE(review): key layout looks like an llm-compressor style recipe —
# confirm against the tool that consumes this file.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # Presumably the module/layer types the modifier applies to — TODO confirm.
      targets: [Linear]
      # Presumably modules to leave untouched. Each entry carries a `re:`
      # prefix, which looks like a "treat as regular expression" marker for
      # matching module names — verify against the consumer's documentation.
      ignore:
        - 're:.*lm_head'
        - 're:.*self_attn'
        - 're:.*attn'
        - 're:.*attention.*'
        - 're:.*router'
      # Name of the quantization scheme preset to apply; exact semantics are
      # defined by the consuming tool, not by this file.
      scheme: FP8_DYNAMIC