R15-quantized / recipe.yaml
andrew-wang's picture
Upload folder using huggingface_hub
f4b29af verified
# Quantization recipe: one stage ("DEFAULT_stage") holding one modifier group
# ("DEFAULT_modifiers") with two modifiers, listed SmoothQuant first, then GPTQ.
# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# confirm it matches the recipe schema expected by the tool that consumes it.
DEFAULT_stage:
  DEFAULT_modifiers:
    # NOTE(review): presumably rebalances activation/weight scales before
    # quantization; verify the meaning of smoothing_strength against the
    # modifier's documentation.
    SmoothQuantModifier: {smoothing_strength: 0.8}
    GPTQModifier:
      # NOTE(review): assumed to be the Hessian dampening fraction used by
      # GPTQ -- confirm against the library default before changing it.
      dampening_frac: 0.1
      # NOTE(review): presumably 8-bit weights and 8-bit activations -- confirm.
      scheme: W8A8
      # Modifier is applied to modules matching "Linear"...
      targets: Linear
      # ...except the entries listed here.
      ignore: [lm_head]