DeepSeek-V4-Flash-INT2-G64 / quant_stats.json
Infatoshi's picture
Add files using upload-large-folder tool
15d1fc7 verified
[
{
"layer": 0,
"n_experts": 256,
"n_rtn_fallback": 20,
"visit_min": 0,
"visit_max": 104701,
"visit_median": 1554,
"rec_err_mean": {
"w1": 0.012415080978826154,
"w2": 0.01343309399089776,
"w3": 0.01253566544255591
}
},
{
"layer": 1,
"n_experts": 256,
"n_rtn_fallback": 13,
"visit_min": 0,
"visit_max": 90933,
"visit_median": 2058,
"rec_err_mean": {
"w1": 0.012326016072620405,
"w2": 0.013364352460484952,
"w3": 0.012376106271403842
}
},
{
"layer": 2,
"n_experts": 256,
"n_rtn_fallback": 14,
"visit_min": 0,
"visit_max": 89672,
"visit_median": 1993,
"rec_err_mean": {
"w1": 0.012438499546988169,
"w2": 0.013484358845744282,
"w3": 0.012577164387039375
}
},
{
"layer": 3,
"n_experts": 256,
"n_rtn_fallback": 28,
"visit_min": 0,
"visit_max": 87656,
"visit_median": 1593,
"rec_err_mean": {
"w1": 0.012284352793358266,
"w2": 0.013022524533880642,
"w3": 0.01228655110753607
}
},
{
"layer": 4,
"n_experts": 256,
"n_rtn_fallback": 22,
"visit_min": 0,
"visit_max": 91759,
"visit_median": 2509,
"rec_err_mean": {
"w1": 0.012322144266363466,
"w2": 0.013148894046025816,
"w3": 0.012335499126493232
}
},
{
"layer": 5,
"n_experts": 256,
"n_rtn_fallback": 22,
"visit_min": 0,
"visit_max": 53067,
"visit_median": 2692,
"rec_err_mean": {
"w1": 0.012205896578961983,
"w2": 0.013076323386485456,
"w3": 0.012235811740538338
}
},
{
"layer": 6,
"n_experts": 256,
"n_rtn_fallback": 13,
"visit_min": 0,
"visit_max": 105315,
"visit_median": 2462,
"rec_err_mean": {
"w1": 0.012188850159873255,
"w2": 0.013173459687095601,
"w3": 0.012253230812348193
}
},
{
"layer": 7,
"n_experts": 256,
"n_rtn_fallback": 10,
"visit_min": 0,
"visit_max": 89430,
"visit_median": 2105,
"rec_err_mean": {
"w1": 0.0121999701623281,
"w2": 0.013163029976567486,
"w3": 0.012289142563531641
}
},
{
"layer": 8,
"n_experts": 256,
"n_rtn_fallback": 21,
"visit_min": 0,
"visit_max": 69468,
"visit_median": 2146,
"rec_err_mean": {
"w1": 0.012145253331254935,
"w2": 0.013199328950577183,
"w3": 0.012249131043063244
}
},
{
"layer": 9,
"n_experts": 256,
"n_rtn_fallback": 20,
"visit_min": 0,
"visit_max": 74772,
"visit_median": 1885,
"rec_err_mean": {
"w1": 0.012222615572682116,
"w2": 0.013086030532576842,
"w3": 0.012252453707333189
}
},
{
"layer": 10,
"n_experts": 256,
"n_rtn_fallback": 28,
"visit_min": 0,
"visit_max": 78211,
"visit_median": 2122,
"rec_err_mean": {
"w1": 0.012135391662013717,
"w2": 0.01296397465193877,
"w3": 0.012168045926955529
}
},
{
"layer": 11,
"n_experts": 256,
"n_rtn_fallback": 24,
"visit_min": 0,
"visit_max": 59807,
"visit_median": 2105,
"rec_err_mean": {
"w1": 0.012127576275815954,
"w2": 0.012990429178898921,
"w3": 0.012161536022176733
}
},
{
"layer": 12,
"n_experts": 256,
"n_rtn_fallback": 23,
"visit_min": 0,
"visit_max": 120073,
"visit_median": 1352,
"rec_err_mean": {
"w1": 0.012006504137389129,
"w2": 0.012896691245259717,
"w3": 0.012060902728990186
}
},
{
"layer": 13,
"n_experts": 256,
"n_rtn_fallback": 33,
"visit_min": 0,
"visit_max": 86203,
"visit_median": 1580,
"rec_err_mean": {
"w1": 0.011981866897258442,
"w2": 0.012806476159312297,
"w3": 0.012059378317644587
}
},
{
"layer": 14,
"n_experts": 256,
"n_rtn_fallback": 18,
"visit_min": 0,
"visit_max": 84296,
"visit_median": 2398,
"rec_err_mean": {
"w1": 0.012034156163281295,
"w2": 0.01298547148326179,
"w3": 0.012165923355496489
}
},
{
"layer": 15,
"n_experts": 256,
"n_rtn_fallback": 17,
"visit_min": 0,
"visit_max": 90098,
"visit_median": 1650,
"rec_err_mean": {
"w1": 0.012026469823467778,
"w2": 0.012949477848451352,
"w3": 0.012168781540822238
}
},
{
"layer": 16,
"n_experts": 256,
"n_rtn_fallback": 16,
"visit_min": 0,
"visit_max": 138818,
"visit_median": 2080,
"rec_err_mean": {
"w1": 0.0119970367049973,
"w2": 0.013099638956191484,
"w3": 0.012215566694067093
}
},
{
"layer": 17,
"n_experts": 256,
"n_rtn_fallback": 22,
"visit_min": 0,
"visit_max": 81805,
"visit_median": 1463,
"rec_err_mean": {
"w1": 0.011958844468608731,
"w2": 0.013121607535140356,
"w3": 0.01224544375872938
}
},
{
"layer": 18,
"n_experts": 256,
"n_rtn_fallback": 17,
"visit_min": 0,
"visit_max": 118432,
"visit_median": 1752,
"rec_err_mean": {
"w1": 0.011972683361818781,
"w2": 0.013337772059458075,
"w3": 0.01234140323867905
}
},
{
"layer": 19,
"n_experts": 256,
"n_rtn_fallback": 16,
"visit_min": 0,
"visit_max": 62625,
"visit_median": 2217,
"rec_err_mean": {
"w1": 0.01252702346755541,
"w2": 0.01334010675054742,
"w3": 0.012576570428791456
}
},
{
"layer": 20,
"n_experts": 256,
"n_rtn_fallback": 29,
"visit_min": 0,
"visit_max": 98240,
"visit_median": 1558,
"rec_err_mean": {
"w1": 0.012045820782077499,
"w2": 0.013375726299273083,
"w3": 0.01248381885670824
}
},
{
"layer": 21,
"n_experts": 256,
"n_rtn_fallback": 23,
"visit_min": 0,
"visit_max": 95130,
"visit_median": 1399,
"rec_err_mean": {
"w1": 0.012071445104083978,
"w2": 0.013229186693934025,
"w3": 0.012358925163425738
}
},
{
"layer": 22,
"n_experts": 256,
"n_rtn_fallback": 22,
"visit_min": 0,
"visit_max": 112438,
"visit_median": 1997,
"rec_err_mean": {
"w1": 0.012246504975337302,
"w2": 0.013522858513169922,
"w3": 0.01259598697288311
}
},
{
"layer": 23,
"n_experts": 256,
"n_rtn_fallback": 18,
"visit_min": 0,
"visit_max": 92691,
"visit_median": 2472,
"rec_err_mean": {
"w1": 0.012362111072434345,
"w2": 0.013373729965678649,
"w3": 0.012536489943158813
}
},
{
"layer": 24,
"n_experts": 256,
"n_rtn_fallback": 14,
"visit_min": 0,
"visit_max": 80941,
"visit_median": 1817,
"rec_err_mean": {
"w1": 0.012180447134596761,
"w2": 0.013405652913206723,
"w3": 0.012389732190058567
}
},
{
"layer": 25,
"n_experts": 256,
"n_rtn_fallback": 9,
"visit_min": 0,
"visit_max": 58896,
"visit_median": 2313,
"rec_err_mean": {
"w1": 0.01233544500428252,
"w2": 0.013383177894866094,
"w3": 0.01257531678857049
}
},
{
"layer": 26,
"n_experts": 256,
"n_rtn_fallback": 10,
"visit_min": 8,
"visit_max": 100000,
"visit_median": 2916,
"rec_err_mean": {
"w1": 0.012328778535447782,
"w2": 0.013479596622346435,
"w3": 0.012599166751897428
}
},
{
"layer": 27,
"n_experts": 256,
"n_rtn_fallback": 10,
"visit_min": 0,
"visit_max": 69160,
"visit_median": 1757,
"rec_err_mean": {
"w1": 0.012426368215528782,
"w2": 0.013210742919909535,
"w3": 0.012652500234253239
}
},
{
"layer": 28,
"n_experts": 256,
"n_rtn_fallback": 8,
"visit_min": 8,
"visit_max": 102322,
"visit_median": 2247,
"rec_err_mean": {
"w1": 0.012327002572419588,
"w2": 0.013446205142827239,
"w3": 0.012607248230779078
}
},
{
"layer": 29,
"n_experts": 256,
"n_rtn_fallback": 16,
"visit_min": 0,
"visit_max": 105865,
"visit_median": 1893,
"rec_err_mean": {
"w1": 0.012322824510192731,
"w2": 0.01330637131104595,
"w3": 0.012568867361551384
}
},
{
"layer": 30,
"n_experts": 256,
"n_rtn_fallback": 12,
"visit_min": 0,
"visit_max": 91393,
"visit_median": 2442,
"rec_err_mean": {
"w1": 0.012352064775768667,
"w2": 0.013372166551562259,
"w3": 0.012607292326720199
}
},
{
"layer": 31,
"n_experts": 256,
"n_rtn_fallback": 11,
"visit_min": 0,
"visit_max": 129256,
"visit_median": 2164,
"rec_err_mean": {
"w1": 0.012379363139189081,
"w2": 0.01339083846687572,
"w3": 0.012637160616577603
}
},
{
"layer": 32,
"n_experts": 256,
"n_rtn_fallback": 14,
"visit_min": 0,
"visit_max": 117053,
"visit_median": 1704,
"rec_err_mean": {
"w1": 0.012300585967750521,
"w2": 0.013404446373897372,
"w3": 0.01260461766651133
}
},
{
"layer": 33,
"n_experts": 256,
"n_rtn_fallback": 14,
"visit_min": 0,
"visit_max": 86566,
"visit_median": 1884,
"rec_err_mean": {
"w1": 0.012293105512071634,
"w2": 0.013338803430087864,
"w3": 0.012589504429342924
}
},
{
"layer": 34,
"n_experts": 256,
"n_rtn_fallback": 27,
"visit_min": 0,
"visit_max": 104265,
"visit_median": 1972,
"rec_err_mean": {
"w1": 0.01226013481937116,
"w2": 0.013365076509217033,
"w3": 0.012629955643205903
}
},
{
"layer": 35,
"n_experts": 256,
"n_rtn_fallback": 19,
"visit_min": 0,
"visit_max": 81482,
"visit_median": 1441,
"rec_err_mean": {
"w1": 0.012239336298080161,
"w2": 0.013319830293767154,
"w3": 0.012585276490426622
}
},
{
"layer": 36,
"n_experts": 256,
"n_rtn_fallback": 31,
"visit_min": 0,
"visit_max": 76229,
"visit_median": 1601,
"rec_err_mean": {
"w1": 0.012273650947463466,
"w2": 0.01333218400759506,
"w3": 0.012649128948396537
}
},
{
"layer": 37,
"n_experts": 256,
"n_rtn_fallback": 29,
"visit_min": 0,
"visit_max": 140116,
"visit_median": 2095,
"rec_err_mean": {
"w1": 0.012312455397477606,
"w2": 0.01347610967059154,
"w3": 0.012669756655668607
}
},
{
"layer": 38,
"n_experts": 256,
"n_rtn_fallback": 29,
"visit_min": 0,
"visit_max": 85568,
"visit_median": 1999,
"rec_err_mean": {
"w1": 0.012275624583708122,
"w2": 0.013469703590089921,
"w3": 0.012665822468989063
}
},
{
"layer": 39,
"n_experts": 256,
"n_rtn_fallback": 35,
"visit_min": 0,
"visit_max": 116615,
"visit_median": 1707,
"rec_err_mean": {
"w1": 0.012040700054058107,
"w2": 0.01377619295817567,
"w3": 0.01264991252537584
}
},
{
"layer": 40,
"n_experts": 256,
"n_rtn_fallback": 40,
"visit_min": 0,
"visit_max": 112269,
"visit_median": 1404,
"rec_err_mean": {
"w1": 0.012377002352877753,
"w2": 0.013884072603104869,
"w3": 0.012798941337678116
}
},
{
"layer": 41,
"n_experts": 256,
"n_rtn_fallback": 35,
"visit_min": 0,
"visit_max": 164712,
"visit_median": 2210,
"rec_err_mean": {
"w1": 0.01262030862926622,
"w2": 0.014570762788935099,
"w3": 0.012976833964785328
}
},
{
"layer": 42,
"n_experts": 256,
"n_rtn_fallback": 24,
"visit_min": 0,
"visit_max": 82726,
"visit_median": 1562,
"rec_err_mean": {
"w1": 0.01345529514219379,
"w2": 0.015836902584851487,
"w3": 0.013570939121564152
}
}
]