| { |
| "model_id": "moonshotai/Kimi-K2-Instruct", |
| "moe_config": { |
| "model_type": "kimi_k2", |
| "num_layers": 61, |
| "hidden_size": 7168, |
| "intermediate_size": 18432, |
| "moe_intermediate_size": 2048, |
| "n_routed_experts": 384, |
| "n_shared_experts": 1, |
| "num_experts_per_tok": 8, |
| "first_k_dense_replace": 1, |
| "torch_dtype": "bfloat16", |
| "quant_method": "fp8" |
| }, |
| "num_feats": 64, |
| "provenance": { |
| "aggregator_type": "moe", |
| "quant_format": "fp8", |
| "probe_mode": "weight_svd_per_expert", |
| "fp8_handling": "cast_to_bfloat16_for_svd" |
| } |
| } |