taf-agent / data /exp_t2 /icl_spatial_gpt2-medium.json
karlexmarin's picture
feat: ship paper artefacts + CLI diagnostic alongside browser tool
535348a
{
"model": "gpt2-medium",
"n_layers": 24,
"L_crit_known": 23,
"L_jump_detected": 22,
"dist_easy": 50,
"dist_hard": 500,
"n_prompts": 50,
"icl_score": {
"0": 0.01107959747314453,
"1": 0.9006196594238282,
"2": 1.6509499740600586,
"3": 1.849005813598633,
"4": 0.75073974609375,
"5": 0.1664865493774414,
"6": 1.3327793884277344,
"7": 2.555304012298584,
"8": 4.202056732177734,
"9": 4.950149993896485,
"10": 4.938382263183594,
"11": 7.841646461486817,
"12": 7.6333463096618654,
"13": 9.802567367553712,
"14": 14.741650924682617,
"15": 17.086366357803346,
"16": 17.862788043022157,
"17": 23.91103755950928,
"18": 25.81832295894623,
"19": 32.52337613683194,
"20": 38.87951512813569,
"21": 44.101259082196194,
"22": 52.011237938553094,
"23": 58.23494463443756,
"24": 2.0833090686798097
},
"mean_delta": {
"0": -0.01107959747314453,
"1": -0.9006196594238282,
"2": -1.6509499740600586,
"3": -1.849005813598633,
"4": -0.75073974609375,
"5": -0.1664865493774414,
"6": -1.3327793884277344,
"7": -2.555304012298584,
"8": -4.202056732177734,
"9": -4.950149993896485,
"10": -4.938382263183594,
"11": -7.841646461486817,
"12": -7.6333463096618654,
"13": -9.802567367553712,
"14": -14.741650924682617,
"15": -17.086366357803346,
"16": -17.862788043022157,
"17": -23.91103755950928,
"18": -25.81832295894623,
"19": -32.52337613683194,
"20": -38.87951512813569,
"21": -44.101259082196194,
"22": -52.011237938553094,
"23": -58.23494463443756,
"24": -2.0833090686798097
},
"mean_easy": {
"0": -15.701723613739013,
"1": -60.01761688232422,
"2": -60.68398200988769,
"3": -60.7508895111084,
"4": -63.70591766357422,
"5": -66.5406484222412,
"6": -67.88113548278808,
"7": -69.42489345550537,
"8": -71.10670009613037,
"9": -76.11728954315186,
"10": -75.0453564453125,
"11": -75.19998359680176,
"12": -76.44891380310058,
"13": -77.41143787384033,
"14": -79.31632915496826,
"15": -85.85235014915466,
"16": -91.33954855442047,
"17": -94.16897157669068,
"18": -96.06297297000884,
"19": -94.72350374598057,
"20": -96.96555620670318,
"21": -92.7302533499022,
"22": -86.60161088943481,
"23": -83.87639896392822,
"24": -7.816802892684937
},
"mean_hard": {
"0": -15.712803211212158,
"1": -60.918236541748044,
"2": -62.334931983947754,
"3": -62.599895324707035,
"4": -64.45665740966797,
"5": -66.70713497161866,
"6": -69.21391487121582,
"7": -71.98019746780396,
"8": -75.3087568283081,
"9": -81.06743953704834,
"10": -79.98373870849609,
"11": -83.04163005828858,
"12": -84.08226011276246,
"13": -87.21400524139405,
"14": -94.05798007965087,
"15": -102.938716506958,
"16": -109.20233659744262,
"17": -118.08000913619995,
"18": -121.88129592895508,
"19": -127.2468798828125,
"20": -135.84507133483888,
"21": -136.83151243209838,
"22": -138.6128488279879,
"23": -142.11134359836578,
"24": -9.900111961364747
}
}