File size: 1,140 Bytes
{
"version": 2,
"weight_format": "mxtq",
"profile": "JANGTQ",
"cache_subtype": "kv",
"source_model": {
"name": "Hy3-preview",
"org": "tencent",
"architecture": "hy_v3"
},
"expert_layout": "per_expert",
"mxtq_seed": 42,
"mxtq_bits": {
"routed_expert": 2,
"attention": 8,
"shared_expert": 8,
"dense_ffn": 8,
"mtp": 8,
"embed_tokens": 8,
"lm_head": 8,
"norms_router_biases": 16
},
"quantization": {
"method": "affine+mxtq",
"group_size": 64,
"bits_default": 2
},
"runtime": {
"bundle_has_mtp": true,
"mtp_layers": 1,
"mtp_mode": "preserved_disabled",
"mtp_status": "MTP tensors are preserved in the bundle, but the first JANG runtime path must use normal autoregressive decode until an accept/reject speculative loop is implemented and tested."
},
"bundle_has_mtp": true,
"mtp_layers": 1,
"capabilities": {
"reasoning_parser": "qwen3",
"tool_parser": "hunyuan",
"think_in_template": false,
"supports_tools": true,
"supports_thinking": true,
"family": "hy_v3",
"modality": "text",
"cache_type": "kv"
}
}