kimi-k2-instruct-vindex / gate_vectors_index.json
mikeumus-divincian's picture
Add gate_vectors_index.json
c77991d verified
{
"version": 2,
"model_id": "moonshotai/Kimi-K2-Instruct",
"model_config": {
"moe": {
"model_type": "kimi_k2",
"num_layers": 61,
"hidden_size": 7168,
"intermediate_size": 18432,
"moe_intermediate_size": 2048,
"n_routed_experts": 384,
"n_shared_experts": 1,
"num_experts_per_tok": 8,
"first_k_dense_replace": 1,
"torch_dtype": "bfloat16",
"quant_method": "fp8"
}
},
"num_feats": 64,
"dtype": "float32",
"gate_vector_semantics": "right_singular_vectors_of_gate_proj",
"layers": {
"1": {
"shape": [
384,
64,
7168
],
"file_offset": 0
},
"2": {
"shape": [
384,
64,
7168
],
"file_offset": 704643072
},
"3": {
"shape": [
384,
64,
7168
],
"file_offset": 1409286144
},
"4": {
"shape": [
384,
64,
7168
],
"file_offset": 2113929216
},
"5": {
"shape": [
384,
64,
7168
],
"file_offset": 2818572288
},
"6": {
"shape": [
384,
64,
7168
],
"file_offset": 3523215360
},
"7": {
"shape": [
384,
64,
7168
],
"file_offset": 4227858432
},
"8": {
"shape": [
384,
64,
7168
],
"file_offset": 4932501504
},
"9": {
"shape": [
384,
64,
7168
],
"file_offset": 5637144576
},
"10": {
"shape": [
384,
64,
7168
],
"file_offset": 6341787648
},
"11": {
"shape": [
384,
64,
7168
],
"file_offset": 7046430720
},
"12": {
"shape": [
384,
64,
7168
],
"file_offset": 7751073792
},
"13": {
"shape": [
384,
64,
7168
],
"file_offset": 8455716864
},
"14": {
"shape": [
384,
64,
7168
],
"file_offset": 9160359936
},
"15": {
"shape": [
384,
64,
7168
],
"file_offset": 9865003008
},
"16": {
"shape": [
384,
64,
7168
],
"file_offset": 10569646080
},
"17": {
"shape": [
384,
64,
7168
],
"file_offset": 11274289152
},
"18": {
"shape": [
384,
64,
7168
],
"file_offset": 11978932224
},
"19": {
"shape": [
384,
64,
7168
],
"file_offset": 12683575296
},
"20": {
"shape": [
384,
64,
7168
],
"file_offset": 13388218368
},
"21": {
"shape": [
384,
64,
7168
],
"file_offset": 14092861440
},
"22": {
"shape": [
384,
64,
7168
],
"file_offset": 14797504512
},
"23": {
"shape": [
384,
64,
7168
],
"file_offset": 15502147584
},
"24": {
"shape": [
384,
64,
7168
],
"file_offset": 16206790656
},
"25": {
"shape": [
384,
64,
7168
],
"file_offset": 16911433728
},
"26": {
"shape": [
384,
64,
7168
],
"file_offset": 17616076800
},
"27": {
"shape": [
384,
64,
7168
],
"file_offset": 18320719872
},
"28": {
"shape": [
384,
64,
7168
],
"file_offset": 19025362944
},
"29": {
"shape": [
384,
64,
7168
],
"file_offset": 19730006016
},
"30": {
"shape": [
384,
64,
7168
],
"file_offset": 20434649088
},
"31": {
"shape": [
384,
64,
7168
],
"file_offset": 21139292160
},
"32": {
"shape": [
384,
64,
7168
],
"file_offset": 21843935232
},
"33": {
"shape": [
384,
64,
7168
],
"file_offset": 22548578304
},
"34": {
"shape": [
384,
64,
7168
],
"file_offset": 23253221376
},
"35": {
"shape": [
384,
64,
7168
],
"file_offset": 23957864448
},
"36": {
"shape": [
384,
64,
7168
],
"file_offset": 24662507520
},
"37": {
"shape": [
384,
64,
7168
],
"file_offset": 25367150592
},
"38": {
"shape": [
384,
64,
7168
],
"file_offset": 26071793664
},
"39": {
"shape": [
384,
64,
7168
],
"file_offset": 26776436736
},
"40": {
"shape": [
384,
64,
7168
],
"file_offset": 27481079808
},
"41": {
"shape": [
384,
64,
7168
],
"file_offset": 28185722880
},
"42": {
"shape": [
384,
64,
7168
],
"file_offset": 28890365952
},
"43": {
"shape": [
384,
64,
7168
],
"file_offset": 29595009024
},
"44": {
"shape": [
384,
64,
7168
],
"file_offset": 30299652096
},
"45": {
"shape": [
384,
64,
7168
],
"file_offset": 31004295168
},
"46": {
"shape": [
384,
64,
7168
],
"file_offset": 31708938240
},
"47": {
"shape": [
384,
64,
7168
],
"file_offset": 32413581312
},
"48": {
"shape": [
384,
64,
7168
],
"file_offset": 33118224384
},
"49": {
"shape": [
384,
64,
7168
],
"file_offset": 33822867456
},
"50": {
"shape": [
384,
64,
7168
],
"file_offset": 34527510528
},
"51": {
"shape": [
384,
64,
7168
],
"file_offset": 35232153600
},
"52": {
"shape": [
384,
64,
7168
],
"file_offset": 35936796672
},
"53": {
"shape": [
384,
64,
7168
],
"file_offset": 36641439744
},
"54": {
"shape": [
384,
64,
7168
],
"file_offset": 37346082816
},
"55": {
"shape": [
384,
64,
7168
],
"file_offset": 38050725888
},
"56": {
"shape": [
384,
64,
7168
],
"file_offset": 38755368960
},
"57": {
"shape": [
384,
64,
7168
],
"file_offset": 39460012032
},
"58": {
"shape": [
384,
64,
7168
],
"file_offset": 40164655104
},
"59": {
"shape": [
384,
64,
7168
],
"file_offset": 40869298176
},
"60": {
"shape": [
384,
64,
7168
],
"file_offset": 41573941248
}
},
"layer_stats": {
"1": {
"median_var64": 0.0946,
"q25_var64": 0.0858,
"q75_var64": 0.1024,
"n_experts": 384
},
"2": {
"median_var64": 0.0968,
"q25_var64": 0.0927,
"q75_var64": 0.1005,
"n_experts": 384
},
"3": {
"median_var64": 0.0954,
"q25_var64": 0.0927,
"q75_var64": 0.0991,
"n_experts": 384
},
"4": {
"median_var64": 0.0963,
"q25_var64": 0.0928,
"q75_var64": 0.1008,
"n_experts": 384
},
"5": {
"median_var64": 0.098,
"q25_var64": 0.0944,
"q75_var64": 0.1022,
"n_experts": 384
},
"6": {
"median_var64": 0.0944,
"q25_var64": 0.0913,
"q75_var64": 0.0975,
"n_experts": 384
},
"7": {
"median_var64": 0.0925,
"q25_var64": 0.0895,
"q75_var64": 0.0965,
"n_experts": 384
},
"8": {
"median_var64": 0.0925,
"q25_var64": 0.0889,
"q75_var64": 0.0971,
"n_experts": 384
},
"9": {
"median_var64": 0.091,
"q25_var64": 0.0869,
"q75_var64": 0.096,
"n_experts": 384
},
"10": {
"median_var64": 0.0926,
"q25_var64": 0.0876,
"q75_var64": 0.0984,
"n_experts": 384
},
"11": {
"median_var64": 0.0927,
"q25_var64": 0.0874,
"q75_var64": 0.0996,
"n_experts": 384
},
"12": {
"median_var64": 0.0961,
"q25_var64": 0.089,
"q75_var64": 0.1033,
"n_experts": 384
},
"13": {
"median_var64": 0.1009,
"q25_var64": 0.0925,
"q75_var64": 0.1102,
"n_experts": 384
},
"14": {
"median_var64": 0.1015,
"q25_var64": 0.0919,
"q75_var64": 0.1102,
"n_experts": 384
},
"15": {
"median_var64": 0.1003,
"q25_var64": 0.0913,
"q75_var64": 0.1137,
"n_experts": 384
},
"16": {
"median_var64": 0.1007,
"q25_var64": 0.0912,
"q75_var64": 0.1146,
"n_experts": 384
},
"17": {
"median_var64": 0.1047,
"q25_var64": 0.0924,
"q75_var64": 0.1171,
"n_experts": 384
},
"18": {
"median_var64": 0.1034,
"q25_var64": 0.0902,
"q75_var64": 0.1158,
"n_experts": 384
},
"19": {
"median_var64": 0.1018,
"q25_var64": 0.0888,
"q75_var64": 0.1168,
"n_experts": 384
},
"20": {
"median_var64": 0.1023,
"q25_var64": 0.0882,
"q75_var64": 0.1181,
"n_experts": 384
},
"21": {
"median_var64": 0.1061,
"q25_var64": 0.09,
"q75_var64": 0.1209,
"n_experts": 384
},
"22": {
"median_var64": 0.106,
"q25_var64": 0.09,
"q75_var64": 0.1248,
"n_experts": 384
},
"23": {
"median_var64": 0.1065,
"q25_var64": 0.0882,
"q75_var64": 0.1258,
"n_experts": 384
},
"24": {
"median_var64": 0.1079,
"q25_var64": 0.0916,
"q75_var64": 0.1298,
"n_experts": 384
},
"25": {
"median_var64": 0.106,
"q25_var64": 0.0895,
"q75_var64": 0.1251,
"n_experts": 384
},
"26": {
"median_var64": 0.1042,
"q25_var64": 0.09,
"q75_var64": 0.1263,
"n_experts": 384
},
"27": {
"median_var64": 0.1013,
"q25_var64": 0.089,
"q75_var64": 0.1229,
"n_experts": 384
},
"28": {
"median_var64": 0.0995,
"q25_var64": 0.0875,
"q75_var64": 0.1186,
"n_experts": 384
},
"29": {
"median_var64": 0.1005,
"q25_var64": 0.0873,
"q75_var64": 0.1157,
"n_experts": 384
},
"30": {
"median_var64": 0.0955,
"q25_var64": 0.0864,
"q75_var64": 0.1129,
"n_experts": 384
},
"31": {
"median_var64": 0.0927,
"q25_var64": 0.0856,
"q75_var64": 0.1083,
"n_experts": 384
},
"32": {
"median_var64": 0.09,
"q25_var64": 0.0843,
"q75_var64": 0.1049,
"n_experts": 384
},
"33": {
"median_var64": 0.0903,
"q25_var64": 0.0833,
"q75_var64": 0.1028,
"n_experts": 384
},
"34": {
"median_var64": 0.0893,
"q25_var64": 0.0844,
"q75_var64": 0.0996,
"n_experts": 384
},
"35": {
"median_var64": 0.0874,
"q25_var64": 0.0829,
"q75_var64": 0.0984,
"n_experts": 384
},
"36": {
"median_var64": 0.0879,
"q25_var64": 0.083,
"q75_var64": 0.0988,
"n_experts": 384
},
"37": {
"median_var64": 0.0866,
"q25_var64": 0.0821,
"q75_var64": 0.0966,
"n_experts": 384
},
"38": {
"median_var64": 0.0867,
"q25_var64": 0.0824,
"q75_var64": 0.0939,
"n_experts": 384
},
"39": {
"median_var64": 0.0848,
"q25_var64": 0.0812,
"q75_var64": 0.0916,
"n_experts": 384
},
"40": {
"median_var64": 0.0835,
"q25_var64": 0.0806,
"q75_var64": 0.0903,
"n_experts": 384
},
"41": {
"median_var64": 0.0832,
"q25_var64": 0.0802,
"q75_var64": 0.0892,
"n_experts": 384
},
"42": {
"median_var64": 0.0832,
"q25_var64": 0.0804,
"q75_var64": 0.0898,
"n_experts": 384
},
"43": {
"median_var64": 0.083,
"q25_var64": 0.0804,
"q75_var64": 0.0892,
"n_experts": 384
},
"44": {
"median_var64": 0.0832,
"q25_var64": 0.0805,
"q75_var64": 0.0905,
"n_experts": 384
},
"45": {
"median_var64": 0.0831,
"q25_var64": 0.0802,
"q75_var64": 0.0889,
"n_experts": 384
},
"46": {
"median_var64": 0.0834,
"q25_var64": 0.0802,
"q75_var64": 0.0907,
"n_experts": 384
},
"47": {
"median_var64": 0.0833,
"q25_var64": 0.0799,
"q75_var64": 0.0901,
"n_experts": 384
},
"48": {
"median_var64": 0.0834,
"q25_var64": 0.0798,
"q75_var64": 0.0901,
"n_experts": 384
},
"49": {
"median_var64": 0.0835,
"q25_var64": 0.0799,
"q75_var64": 0.0921,
"n_experts": 384
},
"50": {
"median_var64": 0.0848,
"q25_var64": 0.0806,
"q75_var64": 0.0921,
"n_experts": 384
},
"51": {
"median_var64": 0.0856,
"q25_var64": 0.0808,
"q75_var64": 0.0951,
"n_experts": 384
},
"52": {
"median_var64": 0.0872,
"q25_var64": 0.081,
"q75_var64": 0.097,
"n_experts": 384
},
"53": {
"median_var64": 0.0872,
"q25_var64": 0.0817,
"q75_var64": 0.1009,
"n_experts": 384
},
"54": {
"median_var64": 0.0911,
"q25_var64": 0.0827,
"q75_var64": 0.1038,
"n_experts": 384
},
"55": {
"median_var64": 0.0932,
"q25_var64": 0.0845,
"q75_var64": 0.1058,
"n_experts": 384
},
"56": {
"median_var64": 0.0944,
"q25_var64": 0.0844,
"q75_var64": 0.109,
"n_experts": 384
},
"57": {
"median_var64": 0.096,
"q25_var64": 0.0873,
"q75_var64": 0.1137,
"n_experts": 384
},
"58": {
"median_var64": 0.0959,
"q25_var64": 0.0863,
"q75_var64": 0.1112,
"n_experts": 384
},
"59": {
"median_var64": 0.0955,
"q25_var64": 0.0866,
"q75_var64": 0.1091,
"n_experts": 384
},
"60": {
"median_var64": 0.0975,
"q25_var64": 0.0884,
"q75_var64": 0.1075,
"n_experts": 384
}
}
}