| { |
| "base_model": "Qwen/Qwen3-Coder-Next", |
| "prune_mask": "/nfs/scistore19/alistgrp/mhelcig/repos/rco/llm/results/coder_next/mask_perexpert_reap_50pct.pt", |
| "original_num_experts": 512, |
| "num_hidden_layers": 48, |
| "num_experts_per_tok": 10, |
| "per_layer_num_experts": [ |
| 359, |
| 279, |
| 365, |
| 194, |
| 214, |
| 270, |
| 287, |
| 272, |
| 245, |
| 212, |
| 218, |
| 231, |
| 188, |
| 213, |
| 236, |
| 272, |
| 208, |
| 281, |
| 278, |
| 265, |
| 236, |
| 227, |
| 223, |
| 250, |
| 205, |
| 230, |
| 253, |
| 288, |
| 217, |
| 289, |
| 289, |
| 281, |
| 226, |
| 213, |
| 215, |
| 238, |
| 217, |
| 226, |
| 267, |
| 303, |
| 304, |
| 297, |
| 290, |
| 285, |
| 296, |
| 269, |
| 267, |
| 300 |
| ], |
| "total_pruned": 12288, |
| "sparsity": 0.5, |
| "allocation": "nonuniform" |
| } |