RelaxingSnorlax's picture
Upload folder using huggingface_hub
a4e6d8d verified
# Compression recipe: one stage ("default_stage") holding a group of
# modifiers ("default_modifiers"). Nesting is required so that each
# modifier's arguments belong to that modifier rather than to the top level.
default_stage:
  default_modifiers:
    # NOTE(review): presumably applied before quantization to smooth
    # activation outliers — confirm ordering semantics with the consumer.
    SmoothQuantModifier:
      smoothing_strength: 0.8
    QuantizationModifier:
      # Module types to quantize.
      targets: [Linear]
      # Modules excluded from quantization. The 're:' prefix appears to mark
      # a regular expression (here: names ending in "mlp.gate") — confirm
      # against the consuming library's matching rules.
      ignore: [lm_head, 're:.*mlp.gate$']
      # Preset scheme name; presumably 8-bit weights / 8-bit activations.
      scheme: W8A8