Spaces:
Running
Running
| { | |
| "config": { | |
| "N_full": 2048, | |
| "f_target": 0.9, | |
| "eval_len": 64, | |
| "n_samples": 120 | |
| }, | |
| "results": [ | |
| { | |
| "model": "EleutherAI/pythia-1b", | |
| "tag": "pythia-1b", | |
| "gamma": 0.931, | |
| "phase": "A", | |
| "N_full": 2048, | |
| "D_f": 445, | |
| "f_target": 0.9, | |
| "ppl_full": 11.79557674849907, | |
| "sweep": [ | |
| { | |
| "window": 64, | |
| "ppl": 19.77381769411898, | |
| "delta_ppl": 7.978240945619909, | |
| "ratio": 0.03125 | |
| }, | |
| { | |
| "window": 128, | |
| "ppl": 16.397073349119978, | |
| "delta_ppl": 4.601496600620909, | |
| "ratio": 0.0625 | |
| }, | |
| { | |
| "window": 256, | |
| "ppl": 14.005542232108976, | |
| "delta_ppl": 2.2099654836099063, | |
| "ratio": 0.125 | |
| }, | |
| { | |
| "window": 384, | |
| "ppl": 12.949847142073574, | |
| "delta_ppl": 1.154270393574505, | |
| "ratio": 0.1875 | |
| }, | |
| { | |
| "window": 445, | |
| "ppl": 13.23990899615875, | |
| "delta_ppl": 1.4443322476596805, | |
| "ratio": 0.21728515625 | |
| }, | |
| { | |
| "window": 512, | |
| "ppl": 13.265685506123768, | |
| "delta_ppl": 1.4701087576246987, | |
| "ratio": 0.25 | |
| }, | |
| { | |
| "window": 640, | |
| "ppl": 12.585584646558791, | |
| "delta_ppl": 0.7900078980597218, | |
| "ratio": 0.3125 | |
| }, | |
| { | |
| "window": 768, | |
| "ppl": 12.062434404070897, | |
| "delta_ppl": 0.26685765557182783, | |
| "ratio": 0.375 | |
| }, | |
| { | |
| "window": 1024, | |
| "ppl": 11.65227339392187, | |
| "delta_ppl": -0.14330335457719912, | |
| "ratio": 0.5 | |
| }, | |
| { | |
| "window": 1280, | |
| "ppl": 11.561641727306759, | |
| "delta_ppl": -0.2339350211923108, | |
| "ratio": 0.625 | |
| }, | |
| { | |
| "window": 1536, | |
| "ppl": 11.190116400723584, | |
| "delta_ppl": -0.6054603477754856, | |
| "ratio": 0.75 | |
| }, | |
| { | |
| "window": 1792, | |
| "ppl": 11.750546375872558, | |
| "delta_ppl": -0.04503037262651155, | |
| "ratio": 0.875 | |
| }, | |
| { | |
| "window": 2048, | |
| "ppl": 11.79557674849907, | |
| "delta_ppl": 0.0, | |
| "ratio": 1.0 | |
| } | |
| ] | |
| }, | |
| { | |
| "model": "EleutherAI/pythia-2.8b", | |
| "tag": "pythia-2.8b", | |
| "gamma": 0.674, | |
| "phase": "A", | |
| "N_full": 2048, | |
| "D_f": 1482, | |
| "f_target": 0.9, | |
| "ppl_full": 9.242118727247712, | |
| "sweep": [ | |
| { | |
| "window": 64, | |
| "ppl": 15.474991362569368, | |
| "delta_ppl": 6.232872635321655, | |
| "ratio": 0.03125 | |
| }, | |
| { | |
| "window": 128, | |
| "ppl": 12.784194911370733, | |
| "delta_ppl": 3.5420761841230206, | |
| "ratio": 0.0625 | |
| }, | |
| { | |
| "window": 256, | |
| "ppl": 10.839832447967765, | |
| "delta_ppl": 1.5977137207200531, | |
| "ratio": 0.125 | |
| }, | |
| { | |
| "window": 384, | |
| "ppl": 10.115023661805676, | |
| "delta_ppl": 0.8729049345579636, | |
| "ratio": 0.1875 | |
| }, | |
| { | |
| "window": 512, | |
| "ppl": 10.232507490949049, | |
| "delta_ppl": 0.9903887637013362, | |
| "ratio": 0.25 | |
| }, | |
| { | |
| "window": 640, | |
| "ppl": 9.754356736249541, | |
| "delta_ppl": 0.5122380090018286, | |
| "ratio": 0.3125 | |
| }, | |
| { | |
| "window": 768, | |
| "ppl": 9.403105800965589, | |
| "delta_ppl": 0.16098707371787668, | |
| "ratio": 0.375 | |
| }, | |
| { | |
| "window": 1024, | |
| "ppl": 9.22952920678111, | |
| "delta_ppl": -0.012589520466601556, | |
| "ratio": 0.5 | |
| }, | |
| { | |
| "window": 1280, | |
| "ppl": 9.028686534058226, | |
| "delta_ppl": -0.2134321931894867, | |
| "ratio": 0.625 | |
| }, | |
| { | |
| "window": 1482, | |
| "ppl": 8.728037345559589, | |
| "delta_ppl": -0.5140813816881238, | |
| "ratio": 0.7236328125 | |
| }, | |
| { | |
| "window": 1536, | |
| "ppl": 8.6772931886815, | |
| "delta_ppl": -0.5648255385662129, | |
| "ratio": 0.75 | |
| }, | |
| { | |
| "window": 1792, | |
| "ppl": 9.120183357326662, | |
| "delta_ppl": -0.1219353699210508, | |
| "ratio": 0.875 | |
| }, | |
| { | |
| "window": 2048, | |
| "ppl": 9.242118727247712, | |
| "delta_ppl": 0.0, | |
| "ratio": 1.0 | |
| } | |
| ] | |
| } | |
| ] | |
| } |