# NuExtract3-W4A16 / recipe.yaml
# Uploaded by SorenDreano ("Upload folder using huggingface_hub"),
# commit d992f4d (verified), 303 bytes.
# Quantization recipe with a single stage that applies one GPTQModifier.
# Structure: stage -> modifier group -> modifier -> modifier arguments.
default_stage:
  default_modifiers:
    GPTQModifier:
      # Module types selected for quantization.
      targets: [Linear]
      # Modules left unquantized. Entries prefixed with `re:` appear to be
      # regular expressions matched against module names -- confirm against
      # the consuming tool's documentation.
      ignore:
        - lm_head
        - 're:.*visual.*'
        - 're:.*linear_attn.*'
      # Preset scheme name; presumably 4-bit weights with 16-bit
      # activations -- TODO confirm.
      scheme: W4A16
      bypass_divisibility_checks: false
      # GPTQ tuning parameters (semantics defined by the modifier itself).
      block_size: 128
      dampening_frac: 0.01
      actorder: static
      offload_hessians: false