{ "quantization": "4bit_nf4", "base_model": "Content/MLModels/quant_fp16_spectrostream_decoder.onnx", "block_size": 64, "double_quant": true, "note": "4-bit quantization requires runtime dequantization" }