# drawais's picture
# Initial upload of Qwen2.5-Coder-32B-Instruct-NVFP4
# 9db2d96 verified
# Quantization recipe: one stage holding one modifier.
# The nesting below restores the hierarchy implied by the three bare `key:`
# lines; with every key at column 0 those parents parse as null and the
# settings become unrelated top-level keys.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # Module selector for what gets quantized.
      # NOTE(review): presumably matches by module class name — confirm.
      targets: [Linear]
      # Modules excluded from quantization. Entries starting with `re:` look
      # like regular-expression patterns (kept single-quoted so `*` and `.`
      # stay literal text for the consumer) — confirm against the tool docs.
      ignore: [lm_head, 're:.*embed.*', 're:.*router.*']
      # Name of the preset quantization scheme to apply.
      scheme: NVFP4
      # NOTE(review): presumably keeps shape/divisibility validation enabled
      # when false — confirm against the consuming library.
      bypass_divisibility_checks: false