# R200-q / recipe.yaml
# andrew-wang's picture
# Upload folder using huggingface_hub
# c6d4526 verified
# Quantization recipe: one stage holding two modifiers.
# NOTE(review): the nesting below was reconstructed. In the flattened original
# every key sat at column 0, which parses as eight unrelated top-level keys
# (with DEFAULT_stage, DEFAULT_modifiers and GPTQModifier all null). Confirm
# against the consuming tool's recipe schema.
DEFAULT_stage:
  DEFAULT_modifiers:
    # Listed first in the original; presumably applied before GPTQ -- verify,
    # since YAML mappings carry no ordering guarantee of their own.
    SmoothQuantModifier:
      smoothing_strength: 0.8
    GPTQModifier:
      dampening_frac: 0.15
      # Scheme name; presumably 8-bit weights / 8-bit activations -- confirm.
      scheme: W8A8
      # Module type to quantize.
      targets: Linear
      # Modules excluded from quantization.
      ignore: [lm_head]