anshdadhich commited on
Commit
3a13752
·
verified ·
1 Parent(s): e94b874

Add v7 results

Browse files
Files changed (1) hide show
  1. results_v7.json +408 -0
results_v7.json ADDED
@@ -0,0 +1,408 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "tasks": {
3
+ "Complex Fn (4D)": {
4
+ "Vanilla": {
5
+ "mean": 0.0574857605000337,
6
+ "std": 0.008335319220438129,
7
+ "scores": [
8
+ 0.0631193146109581,
9
+ 0.06363634765148163,
10
+ 0.04570161923766136
11
+ ],
12
+ "params": 4993,
13
+ "hidden": 48
14
+ },
15
+ "SinGLU": {
16
+ "mean": 0.014336802531033754,
17
+ "std": 0.011309525106379352,
18
+ "scores": [
19
+ 0.03023100085556507,
20
+ 0.007935304194688797,
21
+ 0.004844102542847395
22
+ ],
23
+ "params": 4811,
24
+ "hidden": 31
25
+ },
26
+ "Hybrid": {
27
+ "mean": 0.07689925034840901,
28
+ "std": 0.02610708296796532,
29
+ "scores": [
30
+ 0.06204311549663544,
31
+ 0.11359916627407074,
32
+ 0.055055469274520874
33
+ ],
34
+ "params": 4959,
35
+ "hidden": 34
36
+ },
37
+ "LearnFreq": {
38
+ "mean": 0.02943541668355465,
39
+ "std": 0.0034757515195282824,
40
+ "scores": [
41
+ 0.026053782552480698,
42
+ 0.02803678624331951,
43
+ 0.03421568125486374
44
+ ],
45
+ "params": 5055,
46
+ "hidden": 29
47
+ }
48
+ },
49
+ "Nested Fn (2D)": {
50
+ "Vanilla": {
51
+ "mean": 0.0486922413110733,
52
+ "std": 0.0030859308547071134,
53
+ "scores": [
54
+ 0.0464077852666378,
55
+ 0.05305477976799011,
56
+ 0.046614158898591995
57
+ ],
58
+ "params": 2961,
59
+ "hidden": 37
60
+ },
61
+ "SinGLU": {
62
+ "mean": 0.00021879897879747054,
63
+ "std": 9.755789869089583e-05,
64
+ "scores": [
65
+ 8.296288433484733e-05,
66
+ 0.00030763907125219703,
67
+ 0.00026579498080536723
68
+ ],
69
+ "params": 2993,
70
+ "hidden": 24
71
+ },
72
+ "Hybrid": {
73
+ "mean": 0.001271639756547908,
74
+ "std": 0.000170726739254775,
75
+ "scores": [
76
+ 0.0013282388681545854,
77
+ 0.0010400698520243168,
78
+ 0.0014466105494648218
79
+ ],
80
+ "params": 2959,
81
+ "hidden": 26
82
+ },
83
+ "LearnFreq": {
84
+ "mean": 0.0011319405166432261,
85
+ "std": 0.000570320048877411,
86
+ "scores": [
87
+ 0.0006881068693473935,
88
+ 0.0007706282194703817,
89
+ 0.0019370864611119032
90
+ ],
91
+ "params": 3041,
92
+ "hidden": 22
93
+ }
94
+ },
95
+ "Spiral": {
96
+ "Vanilla": {
97
+ "mean": 0.851111114025116,
98
+ "std": 0.12812993960807575,
99
+ "scores": [
100
+ 0.9366666674613953,
101
+ 0.6700000166893005,
102
+ 0.9466666579246521
103
+ ],
104
+ "params": 2999,
105
+ "hidden": 37
106
+ },
107
+ "SinGLU": {
108
+ "mean": 0.4422222177187602,
109
+ "std": 0.020427534068557608,
110
+ "scores": [
111
+ 0.46666666865348816,
112
+ 0.4166666567325592,
113
+ 0.44333332777023315
114
+ ],
115
+ "params": 3018,
116
+ "hidden": 24
117
+ },
118
+ "Hybrid": {
119
+ "mean": 1.0,
120
+ "std": 0.0,
121
+ "scores": [
122
+ 1.0,
123
+ 1.0,
124
+ 1.0
125
+ ],
126
+ "params": 2986,
127
+ "hidden": 26
128
+ },
129
+ "LearnFreq": {
130
+ "mean": 0.9977777798970541,
131
+ "std": 0.0015713469040821585,
132
+ "scores": [
133
+ 1.0,
134
+ 0.996666669845581,
135
+ 0.996666669845581
136
+ ],
137
+ "params": 3064,
138
+ "hidden": 22
139
+ }
140
+ },
141
+ "Checkerboard": {
142
+ "Vanilla": {
143
+ "mean": 0.5788888931274414,
144
+ "std": 0.022825147689377753,
145
+ "scores": [
146
+ 0.596666693687439,
147
+ 0.54666668176651,
148
+ 0.5933333039283752
149
+ ],
150
+ "params": 2999,
151
+ "hidden": 37
152
+ },
153
+ "SinGLU": {
154
+ "mean": 0.9377777775128683,
155
+ "std": 0.014989694108291244,
156
+ "scores": [
157
+ 0.9166666865348816,
158
+ 0.9466666579246521,
159
+ 0.949999988079071
160
+ ],
161
+ "params": 3018,
162
+ "hidden": 24
163
+ },
164
+ "Hybrid": {
165
+ "mean": 0.9022222359975179,
166
+ "std": 0.02060804929952367,
167
+ "scores": [
168
+ 0.9133333563804626,
169
+ 0.8733333349227905,
170
+ 0.9200000166893005
171
+ ],
172
+ "params": 2986,
173
+ "hidden": 26
174
+ },
175
+ "LearnFreq": {
176
+ "mean": 0.8911110957463583,
177
+ "std": 0.0068493423601396295,
178
+ "scores": [
179
+ 0.8833333253860474,
180
+ 0.8899999856948853,
181
+ 0.8999999761581421
182
+ ],
183
+ "params": 3064,
184
+ "hidden": 22
185
+ }
186
+ },
187
+ "High-Freq": {
188
+ "Vanilla": {
189
+ "mean": 1.099808136622111,
190
+ "std": 0.01846947085143113,
191
+ "scores": [
192
+ 1.0741740465164185,
193
+ 1.108283281326294,
194
+ 1.1169670820236206
195
+ ],
196
+ "params": 7999,
197
+ "hidden": 62
198
+ },
199
+ "SinGLU": {
200
+ "mean": 1.0171122153600056,
201
+ "std": 0.06186627648533991,
202
+ "scores": [
203
+ 1.0643826723098755,
204
+ 0.9297174215316772,
205
+ 1.0572365522384644
206
+ ],
207
+ "params": 8214,
208
+ "hidden": 41
209
+ },
210
+ "Hybrid": {
211
+ "mean": 1.1086766123771667,
212
+ "std": 0.2812712331673168,
213
+ "scores": [
214
+ 0.8738470673561096,
215
+ 1.5041409730911255,
216
+ 0.9480417966842651
217
+ ],
218
+ "params": 7997,
219
+ "hidden": 44
220
+ },
221
+ "LearnFreq": {
222
+ "mean": 1.1098253726959229,
223
+ "std": 0.18937521791609951,
224
+ "scores": [
225
+ 1.1677247285842896,
226
+ 0.8544243574142456,
227
+ 1.3073270320892334
228
+ ],
229
+ "params": 8115,
230
+ "hidden": 39
231
+ }
232
+ },
233
+ "Memorization": {
234
+ "Vanilla": {
235
+ "mean": 0.15677066644032797,
236
+ "std": 0.010408440580230162,
237
+ "scores": [
238
+ 0.1653069108724594,
239
+ 0.14211732149124146,
240
+ 0.16288776695728302
241
+ ],
242
+ "params": 4926,
243
+ "hidden": 46
244
+ },
245
+ "SinGLU": {
246
+ "mean": 9.313488410119438e-07,
247
+ "std": 1.0663730164468857e-06,
248
+ "scores": [
249
+ 1.7445064770527097e-07,
250
+ 1.801714688554057e-07,
251
+ 2.4394244064751547e-06
252
+ ],
253
+ "params": 5067,
254
+ "hidden": 31
255
+ },
256
+ "Hybrid": {
257
+ "mean": 4.9525905675788335e-06,
258
+ "std": 4.7364751238755085e-06,
259
+ "scores": [
260
+ 2.1999953787599225e-06,
261
+ 1.1617433301580604e-05,
262
+ 1.040343022395973e-06
263
+ ],
264
+ "params": 4807,
265
+ "hidden": 32
266
+ },
267
+ "LearnFreq": {
268
+ "mean": 2.6240666746465042e-05,
269
+ "std": 3.307782608500158e-05,
270
+ "scores": [
271
+ 5.2258528739912435e-06,
272
+ 5.541920700125047e-07,
273
+ 7.294195529539138e-05
274
+ ],
275
+ "params": 5088,
276
+ "hidden": 28
277
+ }
278
+ },
279
+ "OOD": {
280
+ "Vanilla": {
281
+ "mean": 1.5319531361262004,
282
+ "std": 0.2293290940636717,
283
+ "scores": [
284
+ 1.5319531361262004
285
+ ],
286
+ "params": 0,
287
+ "hidden": 0
288
+ },
289
+ "SinGLU": {
290
+ "mean": 5.897943178812663,
291
+ "std": 0.8500770525046415,
292
+ "scores": [
293
+ 5.897943178812663
294
+ ],
295
+ "params": 0,
296
+ "hidden": 0
297
+ },
298
+ "Hybrid": {
299
+ "mean": 4.738887468973796,
300
+ "std": 1.5966265517441278,
301
+ "scores": [
302
+ 4.738887468973796
303
+ ],
304
+ "params": 0,
305
+ "hidden": 0
306
+ },
307
+ "LearnFreq": {
308
+ "mean": 4.607403993606567,
309
+ "std": 0.8245368317971109,
310
+ "scores": [
311
+ 4.607403993606567
312
+ ],
313
+ "params": 0,
314
+ "hidden": 0
315
+ }
316
+ }
317
+ },
318
+ "ood": {
319
+ "Vanilla": {
320
+ "id_mean": 0.21685118973255157,
321
+ "ood_mean": 1.5319531361262004,
322
+ "id_std": 0.011753120779597635,
323
+ "ood_std": 0.2293290940636717,
324
+ "params": 5097,
325
+ "degradation": 7.064536459383043
326
+ },
327
+ "SinGLU": {
328
+ "id_mean": 0.24567786852518717,
329
+ "ood_mean": 5.897943178812663,
330
+ "id_std": 0.013796241102558409,
331
+ "ood_std": 0.8500770525046415,
332
+ "params": 5109,
333
+ "degradation": 24.006815160918734
334
+ },
335
+ "Hybrid": {
336
+ "id_mean": 0.0039149638420591755,
337
+ "ood_mean": 4.738887468973796,
338
+ "id_std": 0.0004443769118260595,
339
+ "ood_std": 1.5966265517441278,
340
+ "params": 4819,
341
+ "degradation": 1210.4549774031263
342
+ },
343
+ "LearnFreq": {
344
+ "id_mean": 0.001126814594802757,
345
+ "ood_mean": 4.607403993606567,
346
+ "id_std": 0.00014240349487589104,
347
+ "ood_std": 0.8245368317971109,
348
+ "params": 4935,
349
+ "degradation": 4088.8749709645617
350
+ }
351
+ },
352
+ "omega_analysis": {
353
+ "Complex Fn (4D)": {
354
+ "mean": 29.90054702758789,
355
+ "std": 0.11681375652551651,
356
+ "min": 29.346439361572266,
357
+ "max": 30.322891235351562,
358
+ "pct_low": 0.0,
359
+ "pct_high": 1.0
360
+ },
361
+ "Nested Fn (2D)": {
362
+ "mean": 20.020727157592773,
363
+ "std": 0.08033245801925659,
364
+ "min": 19.81328582763672,
365
+ "max": 20.469907760620117,
366
+ "pct_low": 0.0,
367
+ "pct_high": 0.564393937587738
368
+ },
369
+ "Spiral": {
370
+ "mean": 15.019983291625977,
371
+ "std": 0.2329777479171753,
372
+ "min": 14.042118072509766,
373
+ "max": 15.971786499023438,
374
+ "pct_low": 0.0,
375
+ "pct_high": 0.0
376
+ },
377
+ "Checkerboard": {
378
+ "mean": 20.046358108520508,
379
+ "std": 0.22777396440505981,
380
+ "min": 18.44003677368164,
381
+ "max": 21.628402709960938,
382
+ "pct_low": 0.0,
383
+ "pct_high": 0.6133333444595337
384
+ },
385
+ "High-Freq": {
386
+ "mean": 59.986297607421875,
387
+ "std": 0.04323225095868111,
388
+ "min": 59.84984588623047,
389
+ "max": 60.28833770751953,
390
+ "pct_low": 0.0,
391
+ "pct_high": 1.0
392
+ },
393
+ "Memorization": {
394
+ "mean": 10.043514251708984,
395
+ "std": 0.21410533785820007,
396
+ "min": 8.955178260803223,
397
+ "max": 11.059739112854004,
398
+ "pct_low": 0.0,
399
+ "pct_high": 0.0
400
+ }
401
+ },
402
+ "ood_omega": {
403
+ "id_mean": 19.987701416015625,
404
+ "id_std": 0.08571236580610275,
405
+ "ood_mean": 20.00179100036621,
406
+ "ood_std": 0.07179910689592361
407
+ }
408
+ }