# NuExtract3-W8A8 / recipe.yaml
# SorenDreano's picture
# Upload folder using huggingface_hub
# a302bff verified
# Quantization recipe: one stage (default_stage) whose modifier list holds a
# single GPTQModifier.
# NOTE(review): nesting is reconstructed as stage -> modifiers -> modifier ->
# arguments; confirm against the consuming tool's recipe schema.
default_stage:
  default_modifiers:
    GPTQModifier:
      # Module types the modifier is applied to.
      targets: [Linear]
      # Modules left out of quantization. Entries prefixed with 're:' are
      # presumably regular expressions matched against module names - TODO
      # confirm.
      ignore: [lm_head, 're:.*visual.*', 're:.*linear_attn.*']
      # Preset scheme name; presumably 8-bit weights and 8-bit activations -
      # verify against the quantization library's preset list.
      scheme: W8A8
      bypass_divisibility_checks: false
      block_size: 128
      dampening_frac: 0.01
      actorder: static
      offload_hessians: false