{
  "quantization": "4bit_nf4",
  "base_model": "Content/MLModels/quant_fp16_spectrostream_decoder.onnx",
  "block_size": 64,
  "double_quant": true,
  "note": "4-bit quantization requires runtime dequantization"
}
{
  "quantization": "4bit_nf4",
  "base_model": "Content/MLModels/quant_fp16_spectrostream_decoder.onnx",
  "block_size": 64,
  "double_quant": true,
  "note": "4-bit quantization requires runtime dequantization"
}