r2egym-nl2bashseq / trainer_state.json
penfever
Reset repository without checkpoint dirs
1e548d4
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 5026,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.006963788300835654,
"grad_norm": 16.70025919180339,
"learning_rate": 3.180914512922465e-07,
"loss": 0.6604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31003373861312866,
"step": 5,
"valid_targets_mean": 7389.0,
"valid_targets_min": 5627
},
{
"epoch": 0.013927576601671309,
"grad_norm": 15.950547440699722,
"learning_rate": 7.157057654075547e-07,
"loss": 0.6983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23548319935798645,
"step": 10,
"valid_targets_mean": 1294.8,
"valid_targets_min": 422
},
{
"epoch": 0.020891364902506964,
"grad_norm": 13.622952098366161,
"learning_rate": 1.113320079522863e-06,
"loss": 0.6693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31765997409820557,
"step": 15,
"valid_targets_mean": 8539.9,
"valid_targets_min": 6761
},
{
"epoch": 0.027855153203342618,
"grad_norm": 9.836072650243178,
"learning_rate": 1.5109343936381709e-06,
"loss": 0.5881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27282822132110596,
"step": 20,
"valid_targets_mean": 7579.0,
"valid_targets_min": 6174
},
{
"epoch": 0.034818941504178275,
"grad_norm": 6.354639801298961,
"learning_rate": 1.9085487077534792e-06,
"loss": 0.5734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2713155746459961,
"step": 25,
"valid_targets_mean": 7328.2,
"valid_targets_min": 4839
},
{
"epoch": 0.04178272980501393,
"grad_norm": 5.430407653710302,
"learning_rate": 2.3061630218687873e-06,
"loss": 0.559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29282844066619873,
"step": 30,
"valid_targets_mean": 6838.2,
"valid_targets_min": 5034
},
{
"epoch": 0.04874651810584958,
"grad_norm": 4.877388127505224,
"learning_rate": 2.703777335984096e-06,
"loss": 0.5283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25860846042633057,
"step": 35,
"valid_targets_mean": 7248.2,
"valid_targets_min": 5567
},
{
"epoch": 0.055710306406685235,
"grad_norm": 2.846484730228359,
"learning_rate": 3.101391650099404e-06,
"loss": 0.4665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21636009216308594,
"step": 40,
"valid_targets_mean": 6234.0,
"valid_targets_min": 5603
},
{
"epoch": 0.06267409470752089,
"grad_norm": 2.963648252530947,
"learning_rate": 3.499005964214712e-06,
"loss": 0.4547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10212111473083496,
"step": 45,
"valid_targets_mean": 602.0,
"valid_targets_min": 152
},
{
"epoch": 0.06963788300835655,
"grad_norm": 1.0973687974221902,
"learning_rate": 3.89662027833002e-06,
"loss": 0.4081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20101504027843475,
"step": 50,
"valid_targets_mean": 7299.9,
"valid_targets_min": 6158
},
{
"epoch": 0.0766016713091922,
"grad_norm": 0.8984488229396836,
"learning_rate": 4.294234592445328e-06,
"loss": 0.4052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1902889907360077,
"step": 55,
"valid_targets_mean": 6140.0,
"valid_targets_min": 4648
},
{
"epoch": 0.08356545961002786,
"grad_norm": 0.78646128561226,
"learning_rate": 4.6918489065606366e-06,
"loss": 0.3897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1944657266139984,
"step": 60,
"valid_targets_mean": 6603.0,
"valid_targets_min": 4882
},
{
"epoch": 0.0905292479108635,
"grad_norm": 0.6308887930432894,
"learning_rate": 5.089463220675944e-06,
"loss": 0.371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1896740198135376,
"step": 65,
"valid_targets_mean": 8015.0,
"valid_targets_min": 6344
},
{
"epoch": 0.09749303621169916,
"grad_norm": 0.7528753110445529,
"learning_rate": 5.487077534791253e-06,
"loss": 0.3587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17312809824943542,
"step": 70,
"valid_targets_mean": 6305.2,
"valid_targets_min": 4622
},
{
"epoch": 0.10445682451253482,
"grad_norm": 0.5487849390115586,
"learning_rate": 5.8846918489065606e-06,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18349185585975647,
"step": 75,
"valid_targets_mean": 7890.8,
"valid_targets_min": 5485
},
{
"epoch": 0.11142061281337047,
"grad_norm": 0.5189028061387841,
"learning_rate": 6.28230616302187e-06,
"loss": 0.3552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1606183648109436,
"step": 80,
"valid_targets_mean": 7016.6,
"valid_targets_min": 4960
},
{
"epoch": 0.11838440111420613,
"grad_norm": 0.5214627334126402,
"learning_rate": 6.679920477137178e-06,
"loss": 0.3415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.160720095038414,
"step": 85,
"valid_targets_mean": 6527.1,
"valid_targets_min": 5399
},
{
"epoch": 0.12534818941504178,
"grad_norm": 0.6006447673375296,
"learning_rate": 7.077534791252486e-06,
"loss": 0.3419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17021866142749786,
"step": 90,
"valid_targets_mean": 4995.0,
"valid_targets_min": 618
},
{
"epoch": 0.13231197771587744,
"grad_norm": 0.49819624129860873,
"learning_rate": 7.475149105367794e-06,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1750391721725464,
"step": 95,
"valid_targets_mean": 7219.4,
"valid_targets_min": 5764
},
{
"epoch": 0.1392757660167131,
"grad_norm": 0.49092772422498776,
"learning_rate": 7.872763419483102e-06,
"loss": 0.3305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17389681935310364,
"step": 100,
"valid_targets_mean": 7998.5,
"valid_targets_min": 5902
},
{
"epoch": 0.14623955431754876,
"grad_norm": 0.5105786705340714,
"learning_rate": 8.27037773359841e-06,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13476799428462982,
"step": 105,
"valid_targets_mean": 7377.4,
"valid_targets_min": 5015
},
{
"epoch": 0.1532033426183844,
"grad_norm": 0.4395069780745515,
"learning_rate": 8.667992047713719e-06,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.134280264377594,
"step": 110,
"valid_targets_mean": 6794.0,
"valid_targets_min": 5283
},
{
"epoch": 0.16016713091922005,
"grad_norm": 0.5344731312163281,
"learning_rate": 9.065606361829027e-06,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17999088764190674,
"step": 115,
"valid_targets_mean": 6656.4,
"valid_targets_min": 4364
},
{
"epoch": 0.1671309192200557,
"grad_norm": 0.46349547442614725,
"learning_rate": 9.463220675944334e-06,
"loss": 0.3083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1460513472557068,
"step": 120,
"valid_targets_mean": 7178.4,
"valid_targets_min": 4448
},
{
"epoch": 0.17409470752089137,
"grad_norm": 0.49695390233410575,
"learning_rate": 9.860834990059643e-06,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17316694557666779,
"step": 125,
"valid_targets_mean": 7619.8,
"valid_targets_min": 5737
},
{
"epoch": 0.181058495821727,
"grad_norm": 0.4131284400571314,
"learning_rate": 1.0258449304174951e-05,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13033336400985718,
"step": 130,
"valid_targets_mean": 8754.4,
"valid_targets_min": 5752
},
{
"epoch": 0.18802228412256267,
"grad_norm": 0.46954213145258955,
"learning_rate": 1.065606361829026e-05,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14443400502204895,
"step": 135,
"valid_targets_mean": 6341.0,
"valid_targets_min": 4543
},
{
"epoch": 0.19498607242339833,
"grad_norm": 0.5305150388984193,
"learning_rate": 1.1053677932405567e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14701451361179352,
"step": 140,
"valid_targets_mean": 7181.9,
"valid_targets_min": 4563
},
{
"epoch": 0.201949860724234,
"grad_norm": 1.1100672340753313,
"learning_rate": 1.1451292246520875e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11581391841173172,
"step": 145,
"valid_targets_mean": 1104.4,
"valid_targets_min": 161
},
{
"epoch": 0.20891364902506965,
"grad_norm": 0.42654296534182173,
"learning_rate": 1.1848906560636184e-05,
"loss": 0.2978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13008113205432892,
"step": 150,
"valid_targets_mean": 7018.2,
"valid_targets_min": 5424
},
{
"epoch": 0.21587743732590528,
"grad_norm": 0.4847320156022274,
"learning_rate": 1.2246520874751492e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15399551391601562,
"step": 155,
"valid_targets_mean": 7738.4,
"valid_targets_min": 5329
},
{
"epoch": 0.22284122562674094,
"grad_norm": 0.5316398632314259,
"learning_rate": 1.26441351888668e-05,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14879417419433594,
"step": 160,
"valid_targets_mean": 6426.6,
"valid_targets_min": 5560
},
{
"epoch": 0.2298050139275766,
"grad_norm": 0.64130569981037,
"learning_rate": 1.3041749502982108e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15116575360298157,
"step": 165,
"valid_targets_mean": 6169.9,
"valid_targets_min": 3446
},
{
"epoch": 0.23676880222841226,
"grad_norm": 0.4742255633480007,
"learning_rate": 1.3439363817097418e-05,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14647752046585083,
"step": 170,
"valid_targets_mean": 7204.6,
"valid_targets_min": 5381
},
{
"epoch": 0.24373259052924792,
"grad_norm": 0.47419429273153524,
"learning_rate": 1.3836978131212723e-05,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14805693924427032,
"step": 175,
"valid_targets_mean": 7600.4,
"valid_targets_min": 5241
},
{
"epoch": 0.25069637883008355,
"grad_norm": 0.4888837565186023,
"learning_rate": 1.4234592445328033e-05,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15302909910678864,
"step": 180,
"valid_targets_mean": 7098.5,
"valid_targets_min": 5607
},
{
"epoch": 0.2576601671309192,
"grad_norm": 0.5085230199199996,
"learning_rate": 1.4632206759443342e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14871110022068024,
"step": 185,
"valid_targets_mean": 6955.1,
"valid_targets_min": 5530
},
{
"epoch": 0.2646239554317549,
"grad_norm": 0.47969863426103976,
"learning_rate": 1.502982107355865e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14307832717895508,
"step": 190,
"valid_targets_mean": 6748.1,
"valid_targets_min": 5364
},
{
"epoch": 0.27158774373259054,
"grad_norm": 0.5300381897608597,
"learning_rate": 1.5427435387673956e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13810153305530548,
"step": 195,
"valid_targets_mean": 6273.9,
"valid_targets_min": 5438
},
{
"epoch": 0.2785515320334262,
"grad_norm": 0.4680707912423161,
"learning_rate": 1.5825049701789266e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13786497712135315,
"step": 200,
"valid_targets_mean": 6419.5,
"valid_targets_min": 4879
},
{
"epoch": 0.28551532033426186,
"grad_norm": 0.4720452212866539,
"learning_rate": 1.6222664015904573e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13714374601840973,
"step": 205,
"valid_targets_mean": 6483.4,
"valid_targets_min": 4309
},
{
"epoch": 0.2924791086350975,
"grad_norm": 0.5255652733594837,
"learning_rate": 1.662027833001988e-05,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1564159393310547,
"step": 210,
"valid_targets_mean": 6825.0,
"valid_targets_min": 5205
},
{
"epoch": 0.2994428969359331,
"grad_norm": 0.49603459688272655,
"learning_rate": 1.701789264413519e-05,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12593704462051392,
"step": 215,
"valid_targets_mean": 6729.4,
"valid_targets_min": 5200
},
{
"epoch": 0.3064066852367688,
"grad_norm": 0.509332149215568,
"learning_rate": 1.74155069582505e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13264459371566772,
"step": 220,
"valid_targets_mean": 6094.0,
"valid_targets_min": 5302
},
{
"epoch": 0.31337047353760444,
"grad_norm": 0.5608083132142618,
"learning_rate": 1.7813121272365807e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14229202270507812,
"step": 225,
"valid_targets_mean": 7140.0,
"valid_targets_min": 5270
},
{
"epoch": 0.3203342618384401,
"grad_norm": 0.4518894667306929,
"learning_rate": 1.8210735586481114e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12612324953079224,
"step": 230,
"valid_targets_mean": 7425.0,
"valid_targets_min": 5281
},
{
"epoch": 0.32729805013927576,
"grad_norm": 0.5269894067130169,
"learning_rate": 1.8608349900596424e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16548216342926025,
"step": 235,
"valid_targets_mean": 7063.4,
"valid_targets_min": 5386
},
{
"epoch": 0.3342618384401114,
"grad_norm": 0.5088318301963545,
"learning_rate": 1.900596421471173e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1421387791633606,
"step": 240,
"valid_targets_mean": 6827.0,
"valid_targets_min": 4547
},
{
"epoch": 0.3412256267409471,
"grad_norm": 0.8073008646600404,
"learning_rate": 1.9403578528827038e-05,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08542703092098236,
"step": 245,
"valid_targets_mean": 2047.0,
"valid_targets_min": 165
},
{
"epoch": 0.34818941504178275,
"grad_norm": 0.4927784128489709,
"learning_rate": 1.9801192842942348e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13067278265953064,
"step": 250,
"valid_targets_mean": 6754.1,
"valid_targets_min": 5196
},
{
"epoch": 0.3551532033426184,
"grad_norm": 0.5689943591952936,
"learning_rate": 2.0198807157057655e-05,
"loss": 0.2606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13194392621517181,
"step": 255,
"valid_targets_mean": 5985.6,
"valid_targets_min": 5028
},
{
"epoch": 0.362116991643454,
"grad_norm": 0.6584472361090068,
"learning_rate": 2.0596421471172965e-05,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12018608301877975,
"step": 260,
"valid_targets_mean": 5963.9,
"valid_targets_min": 5237
},
{
"epoch": 0.36908077994428967,
"grad_norm": 0.507426793822691,
"learning_rate": 2.0994035785288272e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1359572857618332,
"step": 265,
"valid_targets_mean": 6319.0,
"valid_targets_min": 5412
},
{
"epoch": 0.37604456824512533,
"grad_norm": 0.4533447276132855,
"learning_rate": 2.139165009940358e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10632900148630142,
"step": 270,
"valid_targets_mean": 7125.8,
"valid_targets_min": 5080
},
{
"epoch": 0.383008356545961,
"grad_norm": 0.5072627844159278,
"learning_rate": 2.1789264413518886e-05,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12942767143249512,
"step": 275,
"valid_targets_mean": 6123.5,
"valid_targets_min": 4521
},
{
"epoch": 0.38997214484679665,
"grad_norm": 2.3716958270807,
"learning_rate": 2.2186878727634196e-05,
"loss": 0.3214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23617935180664062,
"step": 280,
"valid_targets_mean": 1886.0,
"valid_targets_min": 1111
},
{
"epoch": 0.3969359331476323,
"grad_norm": 1.5308735634592507,
"learning_rate": 2.2584493041749503e-05,
"loss": 0.3968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19828379154205322,
"step": 285,
"valid_targets_mean": 1497.6,
"valid_targets_min": 893
},
{
"epoch": 0.403899721448468,
"grad_norm": 1.1543013502299828,
"learning_rate": 2.2982107355864813e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1195836067199707,
"step": 290,
"valid_targets_mean": 1356.0,
"valid_targets_min": 914
},
{
"epoch": 0.41086350974930363,
"grad_norm": 1.094348041750749,
"learning_rate": 2.3379721669980124e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13568729162216187,
"step": 295,
"valid_targets_mean": 1324.5,
"valid_targets_min": 680
},
{
"epoch": 0.4178272980501393,
"grad_norm": 0.9321428551455399,
"learning_rate": 2.377733598409543e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14562851190567017,
"step": 300,
"valid_targets_mean": 1931.8,
"valid_targets_min": 876
},
{
"epoch": 0.42479108635097496,
"grad_norm": 1.2058603525575806,
"learning_rate": 2.4174950298210734e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1342366337776184,
"step": 305,
"valid_targets_mean": 1292.2,
"valid_targets_min": 734
},
{
"epoch": 0.43175487465181056,
"grad_norm": 1.2425037495378959,
"learning_rate": 2.4572564612326044e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1206846684217453,
"step": 310,
"valid_targets_mean": 1469.6,
"valid_targets_min": 655
},
{
"epoch": 0.4387186629526462,
"grad_norm": 0.970667265555978,
"learning_rate": 2.4970178926441354e-05,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1465504765510559,
"step": 315,
"valid_targets_mean": 1548.4,
"valid_targets_min": 737
},
{
"epoch": 0.4456824512534819,
"grad_norm": 1.0165307573128308,
"learning_rate": 2.536779324055666e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1261579394340515,
"step": 320,
"valid_targets_mean": 1316.5,
"valid_targets_min": 759
},
{
"epoch": 0.45264623955431754,
"grad_norm": 0.9803325403945289,
"learning_rate": 2.576540755467197e-05,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10474079847335815,
"step": 325,
"valid_targets_mean": 1249.6,
"valid_targets_min": 753
},
{
"epoch": 0.4596100278551532,
"grad_norm": 0.9660896867872805,
"learning_rate": 2.616302186878728e-05,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17885830998420715,
"step": 330,
"valid_targets_mean": 1833.0,
"valid_targets_min": 927
},
{
"epoch": 0.46657381615598886,
"grad_norm": 0.9889163176342366,
"learning_rate": 2.656063618290259e-05,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1363910287618637,
"step": 335,
"valid_targets_mean": 1338.4,
"valid_targets_min": 679
},
{
"epoch": 0.4735376044568245,
"grad_norm": 1.061457665973345,
"learning_rate": 2.6958250497017892e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12158133089542389,
"step": 340,
"valid_targets_mean": 1244.6,
"valid_targets_min": 771
},
{
"epoch": 0.4805013927576602,
"grad_norm": 1.0563598410355024,
"learning_rate": 2.7355864811133202e-05,
"loss": 0.2559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12138071656227112,
"step": 345,
"valid_targets_mean": 1732.5,
"valid_targets_min": 986
},
{
"epoch": 0.48746518105849584,
"grad_norm": 1.1235998467468378,
"learning_rate": 2.775347912524851e-05,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11856169253587723,
"step": 350,
"valid_targets_mean": 1389.9,
"valid_targets_min": 1103
},
{
"epoch": 0.49442896935933145,
"grad_norm": 0.942754195687271,
"learning_rate": 2.815109343936382e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14676061272621155,
"step": 355,
"valid_targets_mean": 1593.2,
"valid_targets_min": 675
},
{
"epoch": 0.5013927576601671,
"grad_norm": 0.927084600615998,
"learning_rate": 2.8548707753479126e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16312474012374878,
"step": 360,
"valid_targets_mean": 1926.6,
"valid_targets_min": 974
},
{
"epoch": 0.5083565459610028,
"grad_norm": 1.0089719119822702,
"learning_rate": 2.8946322067594437e-05,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16004151105880737,
"step": 365,
"valid_targets_mean": 1953.1,
"valid_targets_min": 869
},
{
"epoch": 0.5153203342618384,
"grad_norm": 1.0547290812174692,
"learning_rate": 2.9343936381709747e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11815130710601807,
"step": 370,
"valid_targets_mean": 1327.2,
"valid_targets_min": 1023
},
{
"epoch": 0.5222841225626741,
"grad_norm": 1.091197129252169,
"learning_rate": 2.974155069582505e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14482921361923218,
"step": 375,
"valid_targets_mean": 1717.9,
"valid_targets_min": 709
},
{
"epoch": 0.5292479108635098,
"grad_norm": 1.041832550945947,
"learning_rate": 3.0139165009940357e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.111148402094841,
"step": 380,
"valid_targets_mean": 1139.9,
"valid_targets_min": 658
},
{
"epoch": 0.5362116991643454,
"grad_norm": 1.0373743215959594,
"learning_rate": 3.053677932405567e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12807971239089966,
"step": 385,
"valid_targets_mean": 1444.8,
"valid_targets_min": 662
},
{
"epoch": 0.5431754874651811,
"grad_norm": 0.9362737502243705,
"learning_rate": 3.0934393638170974e-05,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0938352644443512,
"step": 390,
"valid_targets_mean": 1242.2,
"valid_targets_min": 859
},
{
"epoch": 0.5501392757660167,
"grad_norm": 0.9658781825606017,
"learning_rate": 3.133200795228629e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.149136483669281,
"step": 395,
"valid_targets_mean": 1569.2,
"valid_targets_min": 950
},
{
"epoch": 0.5571030640668524,
"grad_norm": 1.1094086785951527,
"learning_rate": 3.1729622266401595e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12185294181108475,
"step": 400,
"valid_targets_mean": 1539.8,
"valid_targets_min": 686
},
{
"epoch": 0.564066852367688,
"grad_norm": 0.8987556090799284,
"learning_rate": 3.21272365805169e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13875404000282288,
"step": 405,
"valid_targets_mean": 1610.6,
"valid_targets_min": 702
},
{
"epoch": 0.5710306406685237,
"grad_norm": 0.9570507306238789,
"learning_rate": 3.252485089463221e-05,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09257258474826813,
"step": 410,
"valid_targets_mean": 1190.4,
"valid_targets_min": 779
},
{
"epoch": 0.5779944289693594,
"grad_norm": 1.041172830465715,
"learning_rate": 3.2922465208747515e-05,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13315311074256897,
"step": 415,
"valid_targets_mean": 1467.1,
"valid_targets_min": 822
},
{
"epoch": 0.584958217270195,
"grad_norm": 0.986140542035632,
"learning_rate": 3.332007952286282e-05,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10449384897947311,
"step": 420,
"valid_targets_mean": 1350.5,
"valid_targets_min": 868
},
{
"epoch": 0.5919220055710307,
"grad_norm": 1.065472844147368,
"learning_rate": 3.3717693836978136e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10323739796876907,
"step": 425,
"valid_targets_mean": 1283.5,
"valid_targets_min": 781
},
{
"epoch": 0.5988857938718662,
"grad_norm": 0.9665463285582397,
"learning_rate": 3.411530815109344e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10586751997470856,
"step": 430,
"valid_targets_mean": 1303.2,
"valid_targets_min": 793
},
{
"epoch": 0.6058495821727019,
"grad_norm": 1.2852362210237431,
"learning_rate": 3.451292246520875e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10657232999801636,
"step": 435,
"valid_targets_mean": 1309.1,
"valid_targets_min": 806
},
{
"epoch": 0.6128133704735376,
"grad_norm": 0.8736026107192932,
"learning_rate": 3.491053677932406e-05,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1021880954504013,
"step": 440,
"valid_targets_mean": 1397.6,
"valid_targets_min": 803
},
{
"epoch": 0.6197771587743732,
"grad_norm": 1.0411104476153328,
"learning_rate": 3.530815109343936e-05,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0923558846116066,
"step": 445,
"valid_targets_mean": 1187.8,
"valid_targets_min": 660
},
{
"epoch": 0.6267409470752089,
"grad_norm": 0.9460837866342159,
"learning_rate": 3.570576540755467e-05,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10013886541128159,
"step": 450,
"valid_targets_mean": 1547.0,
"valid_targets_min": 853
},
{
"epoch": 0.6337047353760445,
"grad_norm": 0.9098298102835145,
"learning_rate": 3.6103379721669984e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1290132701396942,
"step": 455,
"valid_targets_mean": 1704.2,
"valid_targets_min": 719
},
{
"epoch": 0.6406685236768802,
"grad_norm": 0.9535602596956675,
"learning_rate": 3.650099403578529e-05,
"loss": 0.2486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08892850577831268,
"step": 460,
"valid_targets_mean": 1255.0,
"valid_targets_min": 765
},
{
"epoch": 0.6476323119777159,
"grad_norm": 0.9327456495578426,
"learning_rate": 3.68986083499006e-05,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11986593157052994,
"step": 465,
"valid_targets_mean": 1550.8,
"valid_targets_min": 875
},
{
"epoch": 0.6545961002785515,
"grad_norm": 1.0928873361476414,
"learning_rate": 3.729622266401591e-05,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12141738831996918,
"step": 470,
"valid_targets_mean": 1362.0,
"valid_targets_min": 739
},
{
"epoch": 0.6615598885793872,
"grad_norm": 0.9405266158146244,
"learning_rate": 3.769383697813122e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13972696661949158,
"step": 475,
"valid_targets_mean": 1666.8,
"valid_targets_min": 760
},
{
"epoch": 0.6685236768802229,
"grad_norm": 0.9803157445663641,
"learning_rate": 3.8091451292246525e-05,
"loss": 0.2348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10272186994552612,
"step": 480,
"valid_targets_mean": 1319.6,
"valid_targets_min": 1046
},
{
"epoch": 0.6754874651810585,
"grad_norm": 0.8300161576779523,
"learning_rate": 3.848906560636183e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13779720664024353,
"step": 485,
"valid_targets_mean": 1727.9,
"valid_targets_min": 851
},
{
"epoch": 0.6824512534818942,
"grad_norm": 0.958305960647266,
"learning_rate": 3.888667992047714e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.129207044839859,
"step": 490,
"valid_targets_mean": 1643.2,
"valid_targets_min": 907
},
{
"epoch": 0.6894150417827298,
"grad_norm": 0.9358380856267636,
"learning_rate": 3.9284294234592445e-05,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11121398210525513,
"step": 495,
"valid_targets_mean": 1478.5,
"valid_targets_min": 764
},
{
"epoch": 0.6963788300835655,
"grad_norm": 0.8280865710705787,
"learning_rate": 3.968190854870776e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1098678931593895,
"step": 500,
"valid_targets_mean": 1522.6,
"valid_targets_min": 822
},
{
"epoch": 0.7033426183844012,
"grad_norm": 0.8854144055119295,
"learning_rate": 3.999999517556397e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11844191700220108,
"step": 505,
"valid_targets_mean": 1589.0,
"valid_targets_min": 982
},
{
"epoch": 0.7103064066852368,
"grad_norm": 0.889147230178005,
"learning_rate": 3.9999826320547226e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12125623971223831,
"step": 510,
"valid_targets_mean": 1574.8,
"valid_targets_min": 816
},
{
"epoch": 0.7172701949860725,
"grad_norm": 1.0297104353022954,
"learning_rate": 3.999941624605637e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12160146236419678,
"step": 515,
"valid_targets_mean": 1422.0,
"valid_targets_min": 721
},
{
"epoch": 0.724233983286908,
"grad_norm": 0.9715916674508144,
"learning_rate": 3.999876495703734e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08852733671665192,
"step": 520,
"valid_targets_mean": 1150.6,
"valid_targets_min": 741
},
{
"epoch": 0.7311977715877437,
"grad_norm": 0.9348675328466968,
"learning_rate": 3.999787246134539e-05,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1302892565727234,
"step": 525,
"valid_targets_mean": 1684.2,
"valid_targets_min": 734
},
{
"epoch": 0.7381615598885793,
"grad_norm": 0.9829460553497974,
"learning_rate": 3.999673876974498e-05,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14294780790805817,
"step": 530,
"valid_targets_mean": 1937.1,
"valid_targets_min": 744
},
{
"epoch": 0.745125348189415,
"grad_norm": 1.00886311547871,
"learning_rate": 3.9995363895909654e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1358570158481598,
"step": 535,
"valid_targets_mean": 1842.2,
"valid_targets_min": 620
},
{
"epoch": 0.7520891364902507,
"grad_norm": 0.9029995225438505,
"learning_rate": 3.9993747856421865e-05,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13714322447776794,
"step": 540,
"valid_targets_mean": 1637.6,
"valid_targets_min": 785
},
{
"epoch": 0.7590529247910863,
"grad_norm": 0.8367188043813011,
"learning_rate": 3.99918906707728e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11780621111392975,
"step": 545,
"valid_targets_mean": 1969.9,
"valid_targets_min": 740
},
{
"epoch": 0.766016713091922,
"grad_norm": 0.9884389058338642,
"learning_rate": 3.9989792361362124e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1071939691901207,
"step": 550,
"valid_targets_mean": 1432.1,
"valid_targets_min": 711
},
{
"epoch": 0.7729805013927576,
"grad_norm": 0.9502178485105263,
"learning_rate": 3.99874529534977e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12912839651107788,
"step": 555,
"valid_targets_mean": 1695.6,
"valid_targets_min": 1122
},
{
"epoch": 0.7799442896935933,
"grad_norm": 0.9668592085821732,
"learning_rate": 3.9984872475395325e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12528224289417267,
"step": 560,
"valid_targets_mean": 1524.5,
"valid_targets_min": 722
},
{
"epoch": 0.786908077994429,
"grad_norm": 0.8799325389323717,
"learning_rate": 3.998205095817833e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10128602385520935,
"step": 565,
"valid_targets_mean": 1289.2,
"valid_targets_min": 661
},
{
"epoch": 0.7938718662952646,
"grad_norm": 0.9446705425289179,
"learning_rate": 3.997898843587727e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1078827977180481,
"step": 570,
"valid_targets_mean": 1519.5,
"valid_targets_min": 1011
},
{
"epoch": 0.8008356545961003,
"grad_norm": 0.8325950401643598,
"learning_rate": 3.997568494542946e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12279678881168365,
"step": 575,
"valid_targets_mean": 1731.4,
"valid_targets_min": 1277
},
{
"epoch": 0.807799442896936,
"grad_norm": 0.898136637442764,
"learning_rate": 3.997214052667856e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11773974448442459,
"step": 580,
"valid_targets_mean": 1486.1,
"valid_targets_min": 807
},
{
"epoch": 0.8147632311977716,
"grad_norm": 0.8718990576135462,
"learning_rate": 3.996835522237408e-05,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13190338015556335,
"step": 585,
"valid_targets_mean": 1549.9,
"valid_targets_min": 679
},
{
"epoch": 0.8217270194986073,
"grad_norm": 0.9293519703318798,
"learning_rate": 3.9964329078170874e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11136806011199951,
"step": 590,
"valid_targets_mean": 1656.0,
"valid_targets_min": 1294
},
{
"epoch": 0.8286908077994429,
"grad_norm": 0.9027962521886033,
"learning_rate": 3.996006214262858e-05,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10627582669258118,
"step": 595,
"valid_targets_mean": 1368.8,
"valid_targets_min": 790
},
{
"epoch": 0.8356545961002786,
"grad_norm": 0.9202444501195384,
"learning_rate": 3.995555446721104e-05,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12929676473140717,
"step": 600,
"valid_targets_mean": 1765.8,
"valid_targets_min": 592
},
{
"epoch": 0.8426183844011143,
"grad_norm": 0.8667866984685644,
"learning_rate": 3.9950806106285694e-05,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12393373250961304,
"step": 605,
"valid_targets_mean": 1586.8,
"valid_targets_min": 662
},
{
"epoch": 0.8495821727019499,
"grad_norm": 0.9721183405017587,
"learning_rate": 3.9945817117122884e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1137949600815773,
"step": 610,
"valid_targets_mean": 1336.9,
"valid_targets_min": 622
},
{
"epoch": 0.8565459610027855,
"grad_norm": 0.9071022828100963,
"learning_rate": 3.994058755989521e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07271943986415863,
"step": 615,
"valid_targets_mean": 1097.1,
"valid_targets_min": 625
},
{
"epoch": 0.8635097493036211,
"grad_norm": 0.9327235573302172,
"learning_rate": 3.993511749767676e-05,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09269745647907257,
"step": 620,
"valid_targets_mean": 1484.9,
"valid_targets_min": 888
},
{
"epoch": 0.8704735376044568,
"grad_norm": 0.8523136084427271,
"learning_rate": 3.992940699644238e-05,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12552563846111298,
"step": 625,
"valid_targets_mean": 1757.0,
"valid_targets_min": 635
},
{
"epoch": 0.8774373259052924,
"grad_norm": 0.9675785553764196,
"learning_rate": 3.9923456125066886e-05,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1370333880186081,
"step": 630,
"valid_targets_mean": 1476.1,
"valid_targets_min": 522
},
{
"epoch": 0.8844011142061281,
"grad_norm": 0.9240372392580922,
"learning_rate": 3.9917264955324205e-05,
"loss": 0.2281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10322962701320648,
"step": 635,
"valid_targets_mean": 1230.9,
"valid_targets_min": 697
},
{
"epoch": 0.8913649025069638,
"grad_norm": 0.8039407980641069,
"learning_rate": 3.991083356188651e-05,
"loss": 0.2261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12441124022006989,
"step": 640,
"valid_targets_mean": 1671.0,
"valid_targets_min": 1010
},
{
"epoch": 0.8983286908077994,
"grad_norm": 0.901298627076697,
"learning_rate": 3.9904162022323356e-05,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11574780941009521,
"step": 645,
"valid_targets_mean": 1411.0,
"valid_targets_min": 769
},
{
"epoch": 0.9052924791086351,
"grad_norm": 0.8076274204627811,
"learning_rate": 3.9897250417100685e-05,
"loss": 0.2334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.097521111369133,
"step": 650,
"valid_targets_mean": 1298.6,
"valid_targets_min": 745
},
{
"epoch": 0.9122562674094707,
"grad_norm": 0.8790050634268944,
"learning_rate": 3.9890098829579936e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09707553684711456,
"step": 655,
"valid_targets_mean": 1118.9,
"valid_targets_min": 680
},
{
"epoch": 0.9192200557103064,
"grad_norm": 0.8222830712195175,
"learning_rate": 3.988270734601694e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13638588786125183,
"step": 660,
"valid_targets_mean": 1905.9,
"valid_targets_min": 1347
},
{
"epoch": 0.9261838440111421,
"grad_norm": 0.9010068300752175,
"learning_rate": 3.987507605556098e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16486553847789764,
"step": 665,
"valid_targets_mean": 1636.0,
"valid_targets_min": 851
},
{
"epoch": 0.9331476323119777,
"grad_norm": 0.8103801455626374,
"learning_rate": 3.9867205050253635e-05,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09920711815357208,
"step": 670,
"valid_targets_mean": 1457.2,
"valid_targets_min": 903
},
{
"epoch": 0.9401114206128134,
"grad_norm": 0.8043472181124449,
"learning_rate": 3.9859094425027726e-05,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12532712519168854,
"step": 675,
"valid_targets_mean": 1674.4,
"valid_targets_min": 1240
},
{
"epoch": 0.947075208913649,
"grad_norm": 0.8118897965994559,
"learning_rate": 3.985074427770614e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09223470091819763,
"step": 680,
"valid_targets_mean": 1697.1,
"valid_targets_min": 917
},
{
"epoch": 0.9540389972144847,
"grad_norm": 0.9472041237654983,
"learning_rate": 3.9842154709000665e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09532526135444641,
"step": 685,
"valid_targets_mean": 1580.9,
"valid_targets_min": 930
},
{
"epoch": 0.9610027855153204,
"grad_norm": 0.8083428002058612,
"learning_rate": 3.983332582251074e-05,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11902359873056412,
"step": 690,
"valid_targets_mean": 1655.1,
"valid_targets_min": 1227
},
{
"epoch": 0.967966573816156,
"grad_norm": 0.8148921698054701,
"learning_rate": 3.982425772472228e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11095002293586731,
"step": 695,
"valid_targets_mean": 1565.8,
"valid_targets_min": 870
},
{
"epoch": 0.9749303621169917,
"grad_norm": 2.1396789291672396,
"learning_rate": 3.9814950525006315e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10898259282112122,
"step": 700,
"valid_targets_mean": 1564.6,
"valid_targets_min": 822
},
{
"epoch": 0.9818941504178273,
"grad_norm": 0.8780065601127116,
"learning_rate": 3.980540433561771e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10233960300683975,
"step": 705,
"valid_targets_mean": 1540.5,
"valid_targets_min": 1214
},
{
"epoch": 0.9888579387186629,
"grad_norm": 0.8908774625256577,
"learning_rate": 3.979561927169381e-05,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10410676151514053,
"step": 710,
"valid_targets_mean": 1268.6,
"valid_targets_min": 591
},
{
"epoch": 0.9958217270194986,
"grad_norm": 0.8377782810822102,
"learning_rate": 3.978559545125303e-05,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08468751609325409,
"step": 715,
"valid_targets_mean": 1232.5,
"valid_targets_min": 646
},
{
"epoch": 1.0027855153203342,
"grad_norm": 0.5045448459523831,
"learning_rate": 3.977533299519347e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12714359164237976,
"step": 720,
"valid_targets_mean": 8514.0,
"valid_targets_min": 6788
},
{
"epoch": 1.00974930362117,
"grad_norm": 0.5387200781137093,
"learning_rate": 3.97648320272914e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13830497860908508,
"step": 725,
"valid_targets_mean": 6668.0,
"valid_targets_min": 5933
},
{
"epoch": 1.0167130919220055,
"grad_norm": 0.6200314371011584,
"learning_rate": 3.9754092674199816e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12560366094112396,
"step": 730,
"valid_targets_mean": 4107.0,
"valid_targets_min": 161
},
{
"epoch": 1.0236768802228413,
"grad_norm": 0.41903186731709363,
"learning_rate": 3.974311506544692e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11801932752132416,
"step": 735,
"valid_targets_mean": 7946.0,
"valid_targets_min": 5596
},
{
"epoch": 1.0306406685236769,
"grad_norm": 0.43595924603479874,
"learning_rate": 3.973189933343449e-05,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13217604160308838,
"step": 740,
"valid_targets_mean": 7392.8,
"valid_targets_min": 5629
},
{
"epoch": 1.0376044568245126,
"grad_norm": 0.5245267930858062,
"learning_rate": 3.972044561343636e-05,
"loss": 0.2511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12668457627296448,
"step": 745,
"valid_targets_mean": 6879.6,
"valid_targets_min": 5113
},
{
"epoch": 1.0445682451253482,
"grad_norm": 0.4794835613989842,
"learning_rate": 3.970875404359675e-05,
"loss": 0.27,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1310746967792511,
"step": 750,
"valid_targets_mean": 6919.5,
"valid_targets_min": 5080
},
{
"epoch": 1.051532033426184,
"grad_norm": 0.47039907099593237,
"learning_rate": 3.969682476492858e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1175151839852333,
"step": 755,
"valid_targets_mean": 6377.0,
"valid_targets_min": 3939
},
{
"epoch": 1.0584958217270195,
"grad_norm": 0.4472868406904229,
"learning_rate": 3.968465792131184e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12472754716873169,
"step": 760,
"valid_targets_mean": 6392.2,
"valid_targets_min": 4355
},
{
"epoch": 1.065459610027855,
"grad_norm": 0.5109948443641175,
"learning_rate": 3.9672253659491776e-05,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14166294038295746,
"step": 765,
"valid_targets_mean": 5196.5,
"valid_targets_min": 137
},
{
"epoch": 1.0724233983286908,
"grad_norm": 0.3950884119973961,
"learning_rate": 3.965961212907716e-05,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10841463506221771,
"step": 770,
"valid_targets_mean": 7344.4,
"valid_targets_min": 5244
},
{
"epoch": 1.0793871866295264,
"grad_norm": 0.39325931847169565,
"learning_rate": 3.9646733482538486e-05,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10372970998287201,
"step": 775,
"valid_targets_mean": 7921.0,
"valid_targets_min": 5311
},
{
"epoch": 1.0863509749303621,
"grad_norm": 0.39685130314701833,
"learning_rate": 3.963361787520612e-05,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12329264730215073,
"step": 780,
"valid_targets_mean": 7931.2,
"valid_targets_min": 6015
},
{
"epoch": 1.0933147632311977,
"grad_norm": 0.36954967114170856,
"learning_rate": 3.9620265465268423e-05,
"loss": 0.2338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11054964363574982,
"step": 785,
"valid_targets_mean": 7640.8,
"valid_targets_min": 5248
},
{
"epoch": 1.1002785515320335,
"grad_norm": 0.39689900322648536,
"learning_rate": 3.960667641376987e-05,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11496052145957947,
"step": 790,
"valid_targets_mean": 7249.6,
"valid_targets_min": 5217
},
{
"epoch": 1.107242339832869,
"grad_norm": 0.433531433289986,
"learning_rate": 3.959285088460908e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13216888904571533,
"step": 795,
"valid_targets_mean": 7619.9,
"valid_targets_min": 5094
},
{
"epoch": 1.1142061281337048,
"grad_norm": 0.39505484410680386,
"learning_rate": 3.957878904453683e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11113603413105011,
"step": 800,
"valid_targets_mean": 7732.8,
"valid_targets_min": 5842
},
{
"epoch": 1.1211699164345403,
"grad_norm": 0.4052047229981209,
"learning_rate": 3.9564491063154084e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12098728865385056,
"step": 805,
"valid_targets_mean": 7952.9,
"valid_targets_min": 5494
},
{
"epoch": 1.128133704735376,
"grad_norm": 0.417279220495771,
"learning_rate": 3.9549957112909914e-05,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12448830902576447,
"step": 810,
"valid_targets_mean": 8001.0,
"valid_targets_min": 5454
},
{
"epoch": 1.1350974930362117,
"grad_norm": 0.5319248244035725,
"learning_rate": 3.9535187369099437e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09340626001358032,
"step": 815,
"valid_targets_mean": 2985.1,
"valid_targets_min": 1896
},
{
"epoch": 1.1420612813370474,
"grad_norm": 0.39891658368515515,
"learning_rate": 3.952018200986169e-05,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10278548300266266,
"step": 820,
"valid_targets_mean": 6714.6,
"valid_targets_min": 4917
},
{
"epoch": 1.149025069637883,
"grad_norm": 0.4249036845709375,
"learning_rate": 3.950494121617749e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1260872483253479,
"step": 825,
"valid_targets_mean": 7595.2,
"valid_targets_min": 5488
},
{
"epoch": 1.1559888579387188,
"grad_norm": 0.45070868901900607,
"learning_rate": 3.9489465171867254e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1257646679878235,
"step": 830,
"valid_targets_mean": 7046.1,
"valid_targets_min": 5579
},
{
"epoch": 1.1629526462395543,
"grad_norm": 0.4439435807963078,
"learning_rate": 3.947375406358874e-05,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1169155091047287,
"step": 835,
"valid_targets_mean": 7108.0,
"valid_targets_min": 4963
},
{
"epoch": 1.16991643454039,
"grad_norm": 0.44221583815751264,
"learning_rate": 3.9457808080834884e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11854035407304764,
"step": 840,
"valid_targets_mean": 6810.1,
"valid_targets_min": 5666
},
{
"epoch": 1.1768802228412256,
"grad_norm": 0.4316908401901056,
"learning_rate": 3.944162741593142e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11046448349952698,
"step": 845,
"valid_targets_mean": 8068.5,
"valid_targets_min": 5524
},
{
"epoch": 1.1838440111420612,
"grad_norm": 0.4180604360052473,
"learning_rate": 3.9425212264034626e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09698522835969925,
"step": 850,
"valid_targets_mean": 6553.8,
"valid_targets_min": 3621
},
{
"epoch": 1.190807799442897,
"grad_norm": 0.4189841877717661,
"learning_rate": 3.940856282312893e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10995703935623169,
"step": 855,
"valid_targets_mean": 6762.5,
"valid_targets_min": 4968
},
{
"epoch": 1.1977715877437327,
"grad_norm": 0.45595104424848715,
"learning_rate": 3.9391679294024543e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11162762343883514,
"step": 860,
"valid_targets_mean": 6143.9,
"valid_targets_min": 4917
},
{
"epoch": 1.2047353760445683,
"grad_norm": 0.5851346783403598,
"learning_rate": 3.937456188035504e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16354359686374664,
"step": 865,
"valid_targets_mean": 4583.8,
"valid_targets_min": 215
},
{
"epoch": 1.2116991643454038,
"grad_norm": 0.4055676263805544,
"learning_rate": 3.935721078857489e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11995077133178711,
"step": 870,
"valid_targets_mean": 7317.1,
"valid_targets_min": 4948
},
{
"epoch": 1.2186629526462396,
"grad_norm": 0.42172517542326765,
"learning_rate": 3.9339626227956966e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12088988721370697,
"step": 875,
"valid_targets_mean": 6437.6,
"valid_targets_min": 4510
},
{
"epoch": 1.2256267409470751,
"grad_norm": 0.4535203146647295,
"learning_rate": 3.932180841059004e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13094569742679596,
"step": 880,
"valid_targets_mean": 7707.9,
"valid_targets_min": 5796
},
{
"epoch": 1.232590529247911,
"grad_norm": 0.418577272093497,
"learning_rate": 3.93037575513762e-05,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11241194605827332,
"step": 885,
"valid_targets_mean": 7900.9,
"valid_targets_min": 5643
},
{
"epoch": 1.2395543175487465,
"grad_norm": 0.4344807498847784,
"learning_rate": 3.9285473868028287e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12634864449501038,
"step": 890,
"valid_targets_mean": 7627.2,
"valid_targets_min": 5742
},
{
"epoch": 1.2465181058495822,
"grad_norm": 0.40801176738421346,
"learning_rate": 3.9266957581067215e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13307298719882965,
"step": 895,
"valid_targets_mean": 8725.6,
"valid_targets_min": 5141
},
{
"epoch": 1.2534818941504178,
"grad_norm": 0.4451588968606175,
"learning_rate": 3.924820891381939e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12867535650730133,
"step": 900,
"valid_targets_mean": 6967.8,
"valid_targets_min": 6088
},
{
"epoch": 1.2604456824512535,
"grad_norm": 0.4207887725907819,
"learning_rate": 3.922922809241397e-05,
"loss": 0.2333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10731957852840424,
"step": 905,
"valid_targets_mean": 7140.1,
"valid_targets_min": 4834
},
{
"epoch": 1.267409470752089,
"grad_norm": 0.43935252315939416,
"learning_rate": 3.92100153457801e-05,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10727177560329437,
"step": 910,
"valid_targets_mean": 6706.9,
"valid_targets_min": 5108
},
{
"epoch": 1.2743732590529249,
"grad_norm": 0.4987156443279082,
"learning_rate": 3.9190570905644254e-05,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11678919196128845,
"step": 915,
"valid_targets_mean": 5931.4,
"valid_targets_min": 4708
},
{
"epoch": 1.2813370473537604,
"grad_norm": 0.4407354572740225,
"learning_rate": 3.917089500652733e-05,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10812367498874664,
"step": 920,
"valid_targets_mean": 7145.6,
"valid_targets_min": 5280
},
{
"epoch": 1.2883008356545962,
"grad_norm": 0.7644739613411758,
"learning_rate": 3.915098788574191e-05,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0803007185459137,
"step": 925,
"valid_targets_mean": 1554.9,
"valid_targets_min": 592
},
{
"epoch": 1.2952646239554317,
"grad_norm": 0.45530435313643286,
"learning_rate": 3.913084978338931e-05,
"loss": 0.2281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12958484888076782,
"step": 930,
"valid_targets_mean": 7069.5,
"valid_targets_min": 4765
},
{
"epoch": 1.3022284122562673,
"grad_norm": 0.4187104102266161,
"learning_rate": 3.911048094235679e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11318781226873398,
"step": 935,
"valid_targets_mean": 6193.4,
"valid_targets_min": 5587
},
{
"epoch": 1.309192200557103,
"grad_norm": 0.4642694802664071,
"learning_rate": 3.9089881608314534e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11810522526502609,
"step": 940,
"valid_targets_mean": 6612.2,
"valid_targets_min": 4894
},
{
"epoch": 1.3161559888579388,
"grad_norm": 0.40454438050769786,
"learning_rate": 3.9069052029712713e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10395780950784683,
"step": 945,
"valid_targets_mean": 6605.9,
"valid_targets_min": 3795
},
{
"epoch": 1.3231197771587744,
"grad_norm": 0.4215605431440107,
"learning_rate": 3.9047992457778524e-05,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11420217156410217,
"step": 950,
"valid_targets_mean": 7186.8,
"valid_targets_min": 4890
},
{
"epoch": 1.33008356545961,
"grad_norm": 0.620429539040831,
"learning_rate": 3.90267031465131e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1147976964712143,
"step": 955,
"valid_targets_mean": 6544.4,
"valid_targets_min": 4615
},
{
"epoch": 1.3370473537604457,
"grad_norm": 0.47863602052631893,
"learning_rate": 3.9005184352688514e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1220189705491066,
"step": 960,
"valid_targets_mean": 6339.2,
"valid_targets_min": 4798
},
{
"epoch": 1.3440111420612815,
"grad_norm": 0.6133989682966983,
"learning_rate": 3.89834363358446e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1313786804676056,
"step": 965,
"valid_targets_mean": 4558.8,
"valid_targets_min": 148
},
{
"epoch": 1.350974930362117,
"grad_norm": 0.45702297334659797,
"learning_rate": 3.896145935828592e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.124158576130867,
"step": 970,
"valid_targets_mean": 6807.9,
"valid_targets_min": 5164
},
{
"epoch": 1.3579387186629526,
"grad_norm": 0.4313724233091901,
"learning_rate": 3.893925368507852e-05,
"loss": 0.2178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11191289126873016,
"step": 975,
"valid_targets_mean": 7011.8,
"valid_targets_min": 4974
},
{
"epoch": 1.3649025069637883,
"grad_norm": 0.46720364315569657,
"learning_rate": 3.891681958404675e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10171587765216827,
"step": 980,
"valid_targets_mean": 5794.2,
"valid_targets_min": 4809
},
{
"epoch": 1.371866295264624,
"grad_norm": 0.43110533517562993,
"learning_rate": 3.8894157325770085e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10188580304384232,
"step": 985,
"valid_targets_mean": 6401.8,
"valid_targets_min": 4842
},
{
"epoch": 1.3788300835654597,
"grad_norm": 0.44932522936305014,
"learning_rate": 3.887126718357978e-05,
"loss": 0.2193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1125284880399704,
"step": 990,
"valid_targets_mean": 6182.1,
"valid_targets_min": 5116
},
{
"epoch": 1.3857938718662952,
"grad_norm": 0.42140650517718253,
"learning_rate": 3.884814943355565e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10108678042888641,
"step": 995,
"valid_targets_mean": 6165.1,
"valid_targets_min": 5764
},
{
"epoch": 1.392757660167131,
"grad_norm": 0.9460709949341402,
"learning_rate": 3.882480435452268e-05,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09195755422115326,
"step": 1000,
"valid_targets_mean": 1428.2,
"valid_targets_min": 1062
},
{
"epoch": 1.3997214484679665,
"grad_norm": 1.0910007125977519,
"learning_rate": 3.88012322280477e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10902673006057739,
"step": 1005,
"valid_targets_mean": 1663.0,
"valid_targets_min": 960
},
{
"epoch": 1.4066852367688023,
"grad_norm": 0.8694966611159818,
"learning_rate": 3.877743333843599e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10752002894878387,
"step": 1010,
"valid_targets_mean": 1476.5,
"valid_targets_min": 933
},
{
"epoch": 1.4136490250696379,
"grad_norm": 0.8363762394596167,
"learning_rate": 3.875340797272781e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10708215087652206,
"step": 1015,
"valid_targets_mean": 1478.1,
"valid_targets_min": 881
},
{
"epoch": 1.4206128133704734,
"grad_norm": 0.9058452941123465,
"learning_rate": 3.872915642069499e-05,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1283268928527832,
"step": 1020,
"valid_targets_mean": 1640.6,
"valid_targets_min": 869
},
{
"epoch": 1.4275766016713092,
"grad_norm": 1.1890706352537899,
"learning_rate": 3.87046789748374e-05,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11645996570587158,
"step": 1025,
"valid_targets_mean": 1709.0,
"valid_targets_min": 1090
},
{
"epoch": 1.434540389972145,
"grad_norm": 0.8343148724615661,
"learning_rate": 3.867997593037943e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08550204336643219,
"step": 1030,
"valid_targets_mean": 1157.9,
"valid_targets_min": 761
},
{
"epoch": 1.4415041782729805,
"grad_norm": 0.7596563407523057,
"learning_rate": 3.865504758526644e-05,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1036420613527298,
"step": 1035,
"valid_targets_mean": 1553.6,
"valid_targets_min": 1241
},
{
"epoch": 1.448467966573816,
"grad_norm": 0.8589106034441814,
"learning_rate": 3.8629894240161153e-05,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09890624135732651,
"step": 1040,
"valid_targets_mean": 1538.1,
"valid_targets_min": 733
},
{
"epoch": 1.4554317548746518,
"grad_norm": 0.7911151876930106,
"learning_rate": 3.8604516198440036e-05,
"loss": 0.217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06528353691101074,
"step": 1045,
"valid_targets_mean": 1250.6,
"valid_targets_min": 835
},
{
"epoch": 1.4623955431754876,
"grad_norm": 0.787767064205962,
"learning_rate": 3.857891376618965e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12352828681468964,
"step": 1050,
"valid_targets_mean": 1596.2,
"valid_targets_min": 1046
},
{
"epoch": 1.4693593314763231,
"grad_norm": 0.8571652833546958,
"learning_rate": 3.855308725220293e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10267695039510727,
"step": 1055,
"valid_targets_mean": 1646.5,
"valid_targets_min": 797
},
{
"epoch": 1.4763231197771587,
"grad_norm": 0.9386572516522071,
"learning_rate": 3.85270369679755e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1088155061006546,
"step": 1060,
"valid_targets_mean": 1448.9,
"valid_targets_min": 570
},
{
"epoch": 1.4832869080779945,
"grad_norm": 0.8090527333348528,
"learning_rate": 3.850076322770186e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07706055045127869,
"step": 1065,
"valid_targets_mean": 1164.1,
"valid_targets_min": 548
},
{
"epoch": 1.49025069637883,
"grad_norm": 0.888098593113638,
"learning_rate": 3.847426634827167e-05,
"loss": 0.2002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1056225374341011,
"step": 1070,
"valid_targets_mean": 1338.0,
"valid_targets_min": 682
},
{
"epoch": 1.4972144846796658,
"grad_norm": 0.7475892854829238,
"learning_rate": 3.844754664926586e-05,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10795626044273376,
"step": 1075,
"valid_targets_mean": 1632.8,
"valid_targets_min": 896
},
{
"epoch": 1.5041782729805013,
"grad_norm": 0.7767225037367806,
"learning_rate": 3.842060445295283e-05,
"loss": 0.2178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13912582397460938,
"step": 1080,
"valid_targets_mean": 1806.5,
"valid_targets_min": 597
},
{
"epoch": 1.511142061281337,
"grad_norm": 0.8482626365324997,
"learning_rate": 3.839344008428451e-05,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09307943284511566,
"step": 1085,
"valid_targets_mean": 1289.9,
"valid_targets_min": 706
},
{
"epoch": 1.5181058495821727,
"grad_norm": 0.7497328533096577,
"learning_rate": 3.836605387089248e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06710005551576614,
"step": 1090,
"valid_targets_mean": 1354.1,
"valid_targets_min": 754
},
{
"epoch": 1.5250696378830084,
"grad_norm": 0.7897926297952617,
"learning_rate": 3.8338446143084015e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0963955968618393,
"step": 1095,
"valid_targets_mean": 1461.9,
"valid_targets_min": 819
},
{
"epoch": 1.532033426183844,
"grad_norm": 0.8054353338785877,
"learning_rate": 3.8310617233838094e-05,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08029267191886902,
"step": 1100,
"valid_targets_mean": 1225.5,
"valid_targets_min": 684
},
{
"epoch": 1.5389972144846795,
"grad_norm": 0.9118859088683984,
"learning_rate": 3.828256747880137e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10978655517101288,
"step": 1105,
"valid_targets_mean": 1282.2,
"valid_targets_min": 711
},
{
"epoch": 1.5459610027855153,
"grad_norm": 0.7673580373354333,
"learning_rate": 3.825429721628411e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11380324512720108,
"step": 1110,
"valid_targets_mean": 1634.8,
"valid_targets_min": 1190
},
{
"epoch": 1.552924791086351,
"grad_norm": 0.8522675201936903,
"learning_rate": 3.822580678725621e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10675722360610962,
"step": 1115,
"valid_targets_mean": 1615.9,
"valid_targets_min": 774
},
{
"epoch": 1.5598885793871866,
"grad_norm": 0.7180000643578018,
"learning_rate": 3.819709653534295e-05,
"loss": 0.2055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10761082917451859,
"step": 1120,
"valid_targets_mean": 1848.4,
"valid_targets_min": 734
},
{
"epoch": 1.5668523676880222,
"grad_norm": 0.8256061679097826,
"learning_rate": 3.8168166806820924e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10491684079170227,
"step": 1125,
"valid_targets_mean": 1570.6,
"valid_targets_min": 1011
},
{
"epoch": 1.573816155988858,
"grad_norm": 0.800219846734056,
"learning_rate": 3.813901795061387e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1188449040055275,
"step": 1130,
"valid_targets_mean": 1697.0,
"valid_targets_min": 803
},
{
"epoch": 1.5807799442896937,
"grad_norm": 0.7849874656744029,
"learning_rate": 3.810965031828843e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08988340198993683,
"step": 1135,
"valid_targets_mean": 1307.1,
"valid_targets_min": 782
},
{
"epoch": 1.5877437325905293,
"grad_norm": 0.7519337668408274,
"learning_rate": 3.808006426404991e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10832203924655914,
"step": 1140,
"valid_targets_mean": 1596.6,
"valid_targets_min": 646
},
{
"epoch": 1.5947075208913648,
"grad_norm": 0.7913090801912336,
"learning_rate": 3.805026014473803e-05,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14530369639396667,
"step": 1145,
"valid_targets_mean": 1817.5,
"valid_targets_min": 922
},
{
"epoch": 1.6016713091922006,
"grad_norm": 0.8006210281974334,
"learning_rate": 3.802023831982262e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11583166569471359,
"step": 1150,
"valid_targets_mean": 1822.2,
"valid_targets_min": 796
},
{
"epoch": 1.6086350974930363,
"grad_norm": 0.8429365694331502,
"learning_rate": 3.798999915139926e-05,
"loss": 0.2013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10505574196577072,
"step": 1155,
"valid_targets_mean": 1542.4,
"valid_targets_min": 903
},
{
"epoch": 1.615598885793872,
"grad_norm": 0.9071692515157804,
"learning_rate": 3.795954300418494e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11454838514328003,
"step": 1160,
"valid_targets_mean": 1459.5,
"valid_targets_min": 780
},
{
"epoch": 1.6225626740947074,
"grad_norm": 0.7700813936036295,
"learning_rate": 3.792887024551363e-05,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10751248896121979,
"step": 1165,
"valid_targets_mean": 1581.1,
"valid_targets_min": 783
},
{
"epoch": 1.6295264623955432,
"grad_norm": 0.7587182482455052,
"learning_rate": 3.7897981245331895e-05,
"loss": 0.1996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07905155420303345,
"step": 1170,
"valid_targets_mean": 1342.1,
"valid_targets_min": 662
},
{
"epoch": 1.636490250696379,
"grad_norm": 0.8016804160384552,
"learning_rate": 3.786687637619437e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08902774751186371,
"step": 1175,
"valid_targets_mean": 1269.1,
"valid_targets_min": 724
},
{
"epoch": 1.6434540389972145,
"grad_norm": 0.8762625648078411,
"learning_rate": 3.783555601325933e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11289331316947937,
"step": 1180,
"valid_targets_mean": 1510.1,
"valid_targets_min": 966
},
{
"epoch": 1.65041782729805,
"grad_norm": 0.8362696841731547,
"learning_rate": 3.7804020534284125e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08795975148677826,
"step": 1185,
"valid_targets_mean": 1327.8,
"valid_targets_min": 773
},
{
"epoch": 1.6573816155988856,
"grad_norm": 0.8217589431615828,
"learning_rate": 3.7772270319620655e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08339729905128479,
"step": 1190,
"valid_targets_mean": 1353.2,
"valid_targets_min": 807
},
{
"epoch": 1.6643454038997214,
"grad_norm": 0.8481129752613321,
"learning_rate": 3.774030575221073e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07550103962421417,
"step": 1195,
"valid_targets_mean": 1142.5,
"valid_targets_min": 782
},
{
"epoch": 1.6713091922005572,
"grad_norm": 0.7883067686921773,
"learning_rate": 3.770812721758151e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.112126424908638,
"step": 1200,
"valid_targets_mean": 1849.9,
"valid_targets_min": 634
},
{
"epoch": 1.6782729805013927,
"grad_norm": 0.7411457071163579,
"learning_rate": 3.7675735103840844e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10241081565618515,
"step": 1205,
"valid_targets_mean": 1599.6,
"valid_targets_min": 573
},
{
"epoch": 1.6852367688022283,
"grad_norm": 0.7086572852054175,
"learning_rate": 3.7643129801672535e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11208580434322357,
"step": 1210,
"valid_targets_mean": 1994.9,
"valid_targets_min": 1102
},
{
"epoch": 1.692200557103064,
"grad_norm": 0.8779677269614039,
"learning_rate": 3.76103117043317e-05,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07884174585342407,
"step": 1215,
"valid_targets_mean": 1239.2,
"valid_targets_min": 841
},
{
"epoch": 1.6991643454038998,
"grad_norm": 0.7715841944120366,
"learning_rate": 3.757728120763998e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09706147015094757,
"step": 1220,
"valid_targets_mean": 1467.5,
"valid_targets_min": 956
},
{
"epoch": 1.7061281337047354,
"grad_norm": 0.8840496408494232,
"learning_rate": 3.754403870998079e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10566884279251099,
"step": 1225,
"valid_targets_mean": 1300.9,
"valid_targets_min": 857
},
{
"epoch": 1.713091922005571,
"grad_norm": 0.9178621719926586,
"learning_rate": 3.7510584612294506e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10823386162519455,
"step": 1230,
"valid_targets_mean": 1389.8,
"valid_targets_min": 808
},
{
"epoch": 1.7200557103064067,
"grad_norm": 0.938154160967897,
"learning_rate": 3.747691931807362e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08545945584774017,
"step": 1235,
"valid_targets_mean": 1303.8,
"valid_targets_min": 677
},
{
"epoch": 1.7270194986072425,
"grad_norm": 0.8217723401413547,
"learning_rate": 3.744304323335787e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0866972804069519,
"step": 1240,
"valid_targets_mean": 1220.1,
"valid_targets_min": 727
},
{
"epoch": 1.733983286908078,
"grad_norm": 0.7965558518328687,
"learning_rate": 3.7408956766729406e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0839056596159935,
"step": 1245,
"valid_targets_mean": 1262.0,
"valid_targets_min": 726
},
{
"epoch": 1.7409470752089136,
"grad_norm": 0.7985361430147639,
"learning_rate": 3.737466032930775e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11801943182945251,
"step": 1250,
"valid_targets_mean": 1615.0,
"valid_targets_min": 669
},
{
"epoch": 1.7479108635097493,
"grad_norm": 0.7163362819024491,
"learning_rate": 3.7340154334744933e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11403729021549225,
"step": 1255,
"valid_targets_mean": 1806.5,
"valid_targets_min": 792
},
{
"epoch": 1.754874651810585,
"grad_norm": 0.76114767590763,
"learning_rate": 3.7305439199220466e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09969079494476318,
"step": 1260,
"valid_targets_mean": 1627.6,
"valid_targets_min": 736
},
{
"epoch": 1.7618384401114207,
"grad_norm": 0.7967512334914618,
"learning_rate": 3.727051534143631e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14327603578567505,
"step": 1265,
"valid_targets_mean": 1822.9,
"valid_targets_min": 694
},
{
"epoch": 1.7688022284122562,
"grad_norm": 0.7047699568272487,
"learning_rate": 3.723538318261186e-05,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1259545087814331,
"step": 1270,
"valid_targets_mean": 1848.9,
"valid_targets_min": 1437
},
{
"epoch": 1.775766016713092,
"grad_norm": 0.7684434862741877,
"learning_rate": 3.720004314647884e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12424354255199432,
"step": 1275,
"valid_targets_mean": 1852.4,
"valid_targets_min": 809
},
{
"epoch": 1.7827298050139275,
"grad_norm": 0.7865791196195834,
"learning_rate": 3.7164495659276195e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09065093100070953,
"step": 1280,
"valid_targets_mean": 1375.5,
"valid_targets_min": 790
},
{
"epoch": 1.7896935933147633,
"grad_norm": 0.8290020685682563,
"learning_rate": 3.712874114974496e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0918719470500946,
"step": 1285,
"valid_targets_mean": 1338.8,
"valid_targets_min": 750
},
{
"epoch": 1.7966573816155988,
"grad_norm": 0.7994498344708911,
"learning_rate": 3.7092780049123076e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12238575518131256,
"step": 1290,
"valid_targets_mean": 1778.8,
"valid_targets_min": 826
},
{
"epoch": 1.8036211699164344,
"grad_norm": 0.7645358833299734,
"learning_rate": 3.7056612791140204e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08983242511749268,
"step": 1295,
"valid_targets_mean": 1600.8,
"valid_targets_min": 907
},
{
"epoch": 1.8105849582172702,
"grad_norm": 0.7839077663753583,
"learning_rate": 3.7020239812012473e-05,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1056416928768158,
"step": 1300,
"valid_targets_mean": 1474.5,
"valid_targets_min": 1093
},
{
"epoch": 1.817548746518106,
"grad_norm": 0.76163948748665,
"learning_rate": 3.698366155043724e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10014639794826508,
"step": 1305,
"valid_targets_mean": 1577.2,
"valid_targets_min": 1119
},
{
"epoch": 1.8245125348189415,
"grad_norm": 1.7707818510491133,
"learning_rate": 3.694687844758779e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11413945257663727,
"step": 1310,
"valid_targets_mean": 1512.1,
"valid_targets_min": 700
},
{
"epoch": 1.831476323119777,
"grad_norm": 0.7668240309562283,
"learning_rate": 3.6909890947108016e-05,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07934726029634476,
"step": 1315,
"valid_targets_mean": 1288.2,
"valid_targets_min": 810
},
{
"epoch": 1.8384401114206128,
"grad_norm": 0.8996028117422565,
"learning_rate": 3.687269949510705e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09808281809091568,
"step": 1320,
"valid_targets_mean": 1328.9,
"valid_targets_min": 635
},
{
"epoch": 1.8454038997214486,
"grad_norm": 0.8176602096459092,
"learning_rate": 3.6835304540153914e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11697147786617279,
"step": 1325,
"valid_targets_mean": 1542.5,
"valid_targets_min": 673
},
{
"epoch": 1.8523676880222841,
"grad_norm": 1.1979420435140948,
"learning_rate": 3.67977065332721e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1085534319281578,
"step": 1330,
"valid_targets_mean": 1215.6,
"valid_targets_min": 641
},
{
"epoch": 1.8593314763231197,
"grad_norm": 0.8466439137236119,
"learning_rate": 3.6759905927934115e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08859957754611969,
"step": 1335,
"valid_targets_mean": 1222.6,
"valid_targets_min": 701
},
{
"epoch": 1.8662952646239555,
"grad_norm": 0.7520419595750739,
"learning_rate": 3.672190318005603e-05,
"loss": 0.211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10533758252859116,
"step": 1340,
"valid_targets_mean": 1850.6,
"valid_targets_min": 1202
},
{
"epoch": 1.8732590529247912,
"grad_norm": 0.7954441568911064,
"learning_rate": 3.6683698747991963e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07728315144777298,
"step": 1345,
"valid_targets_mean": 1265.5,
"valid_targets_min": 657
},
{
"epoch": 1.8802228412256268,
"grad_norm": 0.8167699792397287,
"learning_rate": 3.6645293092528565e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09353001415729523,
"step": 1350,
"valid_targets_mean": 1388.0,
"valid_targets_min": 672
},
{
"epoch": 1.8871866295264623,
"grad_norm": 0.7414620593948343,
"learning_rate": 3.660668667687946e-05,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.119552381336689,
"step": 1355,
"valid_targets_mean": 1813.6,
"valid_targets_min": 1019
},
{
"epoch": 1.894150417827298,
"grad_norm": 0.8151102750049719,
"learning_rate": 3.6567879966679667e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07849185168743134,
"step": 1360,
"valid_targets_mean": 1114.6,
"valid_targets_min": 732
},
{
"epoch": 1.9011142061281339,
"grad_norm": 0.8226820998476463,
"learning_rate": 3.6528873429979946e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07085934281349182,
"step": 1365,
"valid_targets_mean": 1194.5,
"valid_targets_min": 634
},
{
"epoch": 1.9080779944289694,
"grad_norm": 0.6954859825201096,
"learning_rate": 3.64896675372412e-05,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10201038420200348,
"step": 1370,
"valid_targets_mean": 1756.5,
"valid_targets_min": 905
},
{
"epoch": 1.915041782729805,
"grad_norm": 0.7713340565719015,
"learning_rate": 3.645026276132877e-05,
"loss": 0.1925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1128055602312088,
"step": 1375,
"valid_targets_mean": 1554.9,
"valid_targets_min": 596
},
{
"epoch": 1.9220055710306405,
"grad_norm": 0.7927271064032854,
"learning_rate": 3.6410659577506773e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07899089902639389,
"step": 1380,
"valid_targets_mean": 1214.6,
"valid_targets_min": 687
},
{
"epoch": 1.9289693593314763,
"grad_norm": 0.7718601693739504,
"learning_rate": 3.63708584634323e-05,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11290781199932098,
"step": 1385,
"valid_targets_mean": 1955.1,
"valid_targets_min": 1199
},
{
"epoch": 1.935933147632312,
"grad_norm": 0.7193801549469071,
"learning_rate": 3.6330859899149694e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10013289004564285,
"step": 1390,
"valid_targets_mean": 1758.6,
"valid_targets_min": 1214
},
{
"epoch": 1.9428969359331476,
"grad_norm": 0.726016091373521,
"learning_rate": 3.629066436708481e-05,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09914419054985046,
"step": 1395,
"valid_targets_mean": 1711.5,
"valid_targets_min": 1122
},
{
"epoch": 1.9498607242339832,
"grad_norm": 0.8210382354675453,
"learning_rate": 3.625027235203909e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09899426996707916,
"step": 1400,
"valid_targets_mean": 1489.6,
"valid_targets_min": 850
},
{
"epoch": 1.956824512534819,
"grad_norm": 0.7429817246292151,
"learning_rate": 3.6209684341183803e-05,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08339495956897736,
"step": 1405,
"valid_targets_mean": 1572.4,
"valid_targets_min": 1318
},
{
"epoch": 1.9637883008356547,
"grad_norm": 0.7739403851396445,
"learning_rate": 3.6168900824054135e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1083778664469719,
"step": 1410,
"valid_targets_mean": 1500.0,
"valid_targets_min": 1043
},
{
"epoch": 1.9707520891364902,
"grad_norm": 0.7568148924154536,
"learning_rate": 3.612792229254327e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11948154121637344,
"step": 1415,
"valid_targets_mean": 1774.9,
"valid_targets_min": 920
},
{
"epoch": 1.9777158774373258,
"grad_norm": 0.6992261616231107,
"learning_rate": 3.608674924089651e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10174979269504547,
"step": 1420,
"valid_targets_mean": 1547.1,
"valid_targets_min": 847
},
{
"epoch": 1.9846796657381616,
"grad_norm": 0.7035138286444061,
"learning_rate": 3.6045382165705255e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10589592158794403,
"step": 1425,
"valid_targets_mean": 1769.4,
"valid_targets_min": 738
},
{
"epoch": 1.9916434540389973,
"grad_norm": 0.8155181230292006,
"learning_rate": 3.600382156590104e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10955852270126343,
"step": 1430,
"valid_targets_mean": 1540.1,
"valid_targets_min": 594
},
{
"epoch": 1.998607242339833,
"grad_norm": 0.6347666367578908,
"learning_rate": 3.5962067942749516e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10341192036867142,
"step": 1435,
"valid_targets_mean": 2228.6,
"valid_targets_min": 1393
},
{
"epoch": 2.0055710306406684,
"grad_norm": 0.5577761958239622,
"learning_rate": 3.592012179984442e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18662209808826447,
"step": 1440,
"valid_targets_mean": 8029.9,
"valid_targets_min": 6142
},
{
"epoch": 2.012534818941504,
"grad_norm": 0.483618877635035,
"learning_rate": 3.587798364310146e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11201878637075424,
"step": 1445,
"valid_targets_mean": 6664.0,
"valid_targets_min": 5470
},
{
"epoch": 2.01949860724234,
"grad_norm": 0.5185691459202105,
"learning_rate": 3.583565398075226e-05,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11615484952926636,
"step": 1450,
"valid_targets_mean": 7126.9,
"valid_targets_min": 5368
},
{
"epoch": 2.0264623955431755,
"grad_norm": 0.438228030552986,
"learning_rate": 3.579313332333819e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10276132822036743,
"step": 1455,
"valid_targets_mean": 7634.9,
"valid_targets_min": 5614
},
{
"epoch": 2.033426183844011,
"grad_norm": 0.3948344228513168,
"learning_rate": 3.575042218370423e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1019166111946106,
"step": 1460,
"valid_targets_mean": 8630.8,
"valid_targets_min": 6362
},
{
"epoch": 2.0403899721448466,
"grad_norm": 0.4535316383686147,
"learning_rate": 3.570752107699281e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10765604674816132,
"step": 1465,
"valid_targets_mean": 7383.6,
"valid_targets_min": 5844
},
{
"epoch": 2.0473537604456826,
"grad_norm": 0.4216201437635594,
"learning_rate": 3.566443052063751e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12464028596878052,
"step": 1470,
"valid_targets_mean": 8017.0,
"valid_targets_min": 5283
},
{
"epoch": 2.054317548746518,
"grad_norm": 0.3816491538208156,
"learning_rate": 3.5621151034356927e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09279941767454147,
"step": 1475,
"valid_targets_mean": 7051.1,
"valid_targets_min": 4135
},
{
"epoch": 2.0612813370473537,
"grad_norm": 0.41992932447893627,
"learning_rate": 3.557768314014834e-05,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09113673865795135,
"step": 1480,
"valid_targets_mean": 5370.4,
"valid_targets_min": 3919
},
{
"epoch": 2.0682451253481893,
"grad_norm": 0.3912975995428693,
"learning_rate": 3.5534027362281436e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0919366329908371,
"step": 1485,
"valid_targets_mean": 6063.6,
"valid_targets_min": 4863
},
{
"epoch": 2.0752089136490253,
"grad_norm": 0.4107622241608645,
"learning_rate": 3.549018422729197e-05,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10401890426874161,
"step": 1490,
"valid_targets_mean": 7001.2,
"valid_targets_min": 6020
},
{
"epoch": 2.082172701949861,
"grad_norm": 0.39061276611048656,
"learning_rate": 3.544615426397543e-05,
"loss": 0.2031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.101812943816185,
"step": 1495,
"valid_targets_mean": 6181.9,
"valid_targets_min": 4669
},
{
"epoch": 2.0891364902506964,
"grad_norm": 0.38035206361099594,
"learning_rate": 3.5401938003380666e-05,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09549552947282791,
"step": 1500,
"valid_targets_mean": 6250.2,
"valid_targets_min": 4900
},
{
"epoch": 2.096100278551532,
"grad_norm": 0.43005142535025387,
"learning_rate": 3.5357535978803455e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09210428595542908,
"step": 1505,
"valid_targets_mean": 7156.4,
"valid_targets_min": 5323
},
{
"epoch": 2.103064066852368,
"grad_norm": 0.40901081252647176,
"learning_rate": 3.53129487257801e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10530374944210052,
"step": 1510,
"valid_targets_mean": 7215.8,
"valid_targets_min": 4720
},
{
"epoch": 2.1100278551532035,
"grad_norm": 0.412691959227041,
"learning_rate": 3.5268176782080967e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10234518349170685,
"step": 1515,
"valid_targets_mean": 6550.8,
"valid_targets_min": 5739
},
{
"epoch": 2.116991643454039,
"grad_norm": 0.3904193639606634,
"learning_rate": 3.522322068770397e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10454997420310974,
"step": 1520,
"valid_targets_mean": 6726.8,
"valid_targets_min": 4540
},
{
"epoch": 2.1239554317548746,
"grad_norm": 0.5086857986092044,
"learning_rate": 3.51780809848681e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11639285087585449,
"step": 1525,
"valid_targets_mean": 4573.4,
"valid_targets_min": 1039
},
{
"epoch": 2.13091922005571,
"grad_norm": 0.4916720484004185,
"learning_rate": 3.513275821800684e-05,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10517747700214386,
"step": 1530,
"valid_targets_mean": 6430.0,
"valid_targets_min": 5412
},
{
"epoch": 2.137883008356546,
"grad_norm": 0.7279504673107768,
"learning_rate": 3.5087252933761654e-05,
"loss": 0.2099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03320852294564247,
"step": 1535,
"valid_targets_mean": 583.1,
"valid_targets_min": 158
},
{
"epoch": 2.1448467966573816,
"grad_norm": 0.38537163974446353,
"learning_rate": 3.504156568097533e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10623390972614288,
"step": 1540,
"valid_targets_mean": 8230.9,
"valid_targets_min": 5061
},
{
"epoch": 2.151810584958217,
"grad_norm": 0.41759228803004284,
"learning_rate": 3.4995697010685415e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11333325505256653,
"step": 1545,
"valid_targets_mean": 7238.9,
"valid_targets_min": 5112
},
{
"epoch": 2.1587743732590527,
"grad_norm": 0.4142412953268547,
"learning_rate": 3.4949647476117535e-05,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09155681729316711,
"step": 1550,
"valid_targets_mean": 6322.8,
"valid_targets_min": 4867
},
{
"epoch": 2.1657381615598887,
"grad_norm": 0.38370921033703687,
"learning_rate": 3.4903417632678746e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10269880294799805,
"step": 1555,
"valid_targets_mean": 7887.0,
"valid_targets_min": 6004
},
{
"epoch": 2.1727019498607243,
"grad_norm": 0.3711170733226334,
"learning_rate": 3.4857008037950814e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09217008948326111,
"step": 1560,
"valid_targets_mean": 7090.2,
"valid_targets_min": 4917
},
{
"epoch": 2.17966573816156,
"grad_norm": 0.3940923954443781,
"learning_rate": 3.481041925168349e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09533364325761795,
"step": 1565,
"valid_targets_mean": 7441.9,
"valid_targets_min": 4202
},
{
"epoch": 2.1866295264623954,
"grad_norm": 0.38589644774474163,
"learning_rate": 3.476365183578779e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09489143639802933,
"step": 1570,
"valid_targets_mean": 7901.8,
"valid_targets_min": 5060
},
{
"epoch": 2.1935933147632314,
"grad_norm": 0.32887624393579473,
"learning_rate": 3.471670635432919e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08562236279249191,
"step": 1575,
"valid_targets_mean": 8557.6,
"valid_targets_min": 6331
},
{
"epoch": 2.200557103064067,
"grad_norm": 0.45867578912244944,
"learning_rate": 3.466958337352082e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09923288971185684,
"step": 1580,
"valid_targets_mean": 4976.4,
"valid_targets_min": 2847
},
{
"epoch": 2.2075208913649025,
"grad_norm": 0.4238519335072428,
"learning_rate": 3.462228346171664e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11293122917413712,
"step": 1585,
"valid_targets_mean": 7129.1,
"valid_targets_min": 5331
},
{
"epoch": 2.214484679665738,
"grad_norm": 0.4164534419411376,
"learning_rate": 3.457480718940461e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1091599240899086,
"step": 1590,
"valid_targets_mean": 6864.0,
"valid_targets_min": 4697
},
{
"epoch": 2.2214484679665736,
"grad_norm": 0.42010359781278844,
"learning_rate": 3.4527155129199766e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10069143772125244,
"step": 1595,
"valid_targets_mean": 6631.9,
"valid_targets_min": 4623
},
{
"epoch": 2.2284122562674096,
"grad_norm": 0.43617878030396867,
"learning_rate": 3.447932785583735e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09616230428218842,
"step": 1600,
"valid_targets_mean": 6330.4,
"valid_targets_min": 5424
},
{
"epoch": 2.235376044568245,
"grad_norm": 0.41414881589071445,
"learning_rate": 3.4431325946165847e-05,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09712429344654083,
"step": 1605,
"valid_targets_mean": 6814.8,
"valid_targets_min": 4964
},
{
"epoch": 2.2423398328690807,
"grad_norm": 0.4444215191301066,
"learning_rate": 3.438314997914006e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11258673667907715,
"step": 1610,
"valid_targets_mean": 6915.8,
"valid_targets_min": 5321
},
{
"epoch": 2.2493036211699167,
"grad_norm": 0.41522878354353365,
"learning_rate": 3.433480053581412e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10380226373672485,
"step": 1615,
"valid_targets_mean": 6464.5,
"valid_targets_min": 5185
},
{
"epoch": 2.256267409470752,
"grad_norm": 0.4467050398625796,
"learning_rate": 3.4286278199334436e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10517797619104385,
"step": 1620,
"valid_targets_mean": 7048.6,
"valid_targets_min": 4913
},
{
"epoch": 2.2632311977715878,
"grad_norm": 0.4232921124371884,
"learning_rate": 3.4237583554932726e-05,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11401194334030151,
"step": 1625,
"valid_targets_mean": 7469.2,
"valid_targets_min": 5426
},
{
"epoch": 2.2701949860724233,
"grad_norm": 0.4259278689375421,
"learning_rate": 3.4188717189918915e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10883718729019165,
"step": 1630,
"valid_targets_mean": 6819.4,
"valid_targets_min": 5286
},
{
"epoch": 2.277158774373259,
"grad_norm": 0.412251669431946,
"learning_rate": 3.413967969367406e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10999740660190582,
"step": 1635,
"valid_targets_mean": 7107.5,
"valid_targets_min": 5201
},
{
"epoch": 2.284122562674095,
"grad_norm": 0.42374140207835653,
"learning_rate": 3.4090471657643254e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09911487251520157,
"step": 1640,
"valid_targets_mean": 5642.6,
"valid_targets_min": 4838
},
{
"epoch": 2.2910863509749304,
"grad_norm": 0.9807420220774704,
"learning_rate": 3.404109367532847e-05,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19164110720157623,
"step": 1645,
"valid_targets_mean": 2054.1,
"valid_targets_min": 134
},
{
"epoch": 2.298050139275766,
"grad_norm": 0.5566049180562685,
"learning_rate": 3.399154634228144e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0960545465350151,
"step": 1650,
"valid_targets_mean": 6686.4,
"valid_targets_min": 5256
},
{
"epoch": 2.3050139275766015,
"grad_norm": 0.4253696878618078,
"learning_rate": 3.394183025609644e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1074969694018364,
"step": 1655,
"valid_targets_mean": 6216.6,
"valid_targets_min": 5542
},
{
"epoch": 2.3119777158774375,
"grad_norm": 0.4131104336589319,
"learning_rate": 3.3891946016403056e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10091003775596619,
"step": 1660,
"valid_targets_mean": 6486.1,
"valid_targets_min": 5531
},
{
"epoch": 2.318941504178273,
"grad_norm": 0.45874934809459283,
"learning_rate": 3.384189422485904e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09876036643981934,
"step": 1665,
"valid_targets_mean": 5797.4,
"valid_targets_min": 3911
},
{
"epoch": 2.3259052924791086,
"grad_norm": 0.4246615076495944,
"learning_rate": 3.3791675485142974e-05,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10160474479198456,
"step": 1670,
"valid_targets_mean": 6357.5,
"valid_targets_min": 5195
},
{
"epoch": 2.332869080779944,
"grad_norm": 0.43609990408164573,
"learning_rate": 3.374129040294701e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10332215577363968,
"step": 1675,
"valid_targets_mean": 5808.9,
"valid_targets_min": 4959
},
{
"epoch": 2.33983286908078,
"grad_norm": 0.5400090427254614,
"learning_rate": 3.369073958596958e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06865261495113373,
"step": 1680,
"valid_targets_mean": 2591.5,
"valid_targets_min": 842
},
{
"epoch": 2.3467966573816157,
"grad_norm": 0.457933957702517,
"learning_rate": 3.364002364390805e-05,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09762382507324219,
"step": 1685,
"valid_targets_mean": 6006.9,
"valid_targets_min": 4769
},
{
"epoch": 2.3537604456824512,
"grad_norm": 0.4088785055658562,
"learning_rate": 3.358914318845138e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09737879037857056,
"step": 1690,
"valid_targets_mean": 6764.2,
"valid_targets_min": 5046
},
{
"epoch": 2.360724233983287,
"grad_norm": 0.47400359842514794,
"learning_rate": 3.353809883327273e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10614047944545746,
"step": 1695,
"valid_targets_mean": 6055.8,
"valid_targets_min": 5182
},
{
"epoch": 2.3676880222841223,
"grad_norm": 0.44156250020466503,
"learning_rate": 3.348689119402209e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10033164173364639,
"step": 1700,
"valid_targets_mean": 7101.6,
"valid_targets_min": 5366
},
{
"epoch": 2.3746518105849583,
"grad_norm": 0.41213498850675423,
"learning_rate": 3.343552088831878e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1027466282248497,
"step": 1705,
"valid_targets_mean": 7111.9,
"valid_targets_min": 5192
},
{
"epoch": 2.381615598885794,
"grad_norm": 0.5040432860111047,
"learning_rate": 3.338398853574411e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09895579516887665,
"step": 1710,
"valid_targets_mean": 5509.9,
"valid_targets_min": 4790
},
{
"epoch": 2.3885793871866294,
"grad_norm": 1.1363379165814331,
"learning_rate": 3.333229475783383e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11968301236629486,
"step": 1715,
"valid_targets_mean": 1581.9,
"valid_targets_min": 864
},
{
"epoch": 2.3955431754874654,
"grad_norm": 0.8698074566188687,
"learning_rate": 3.3280440178070635e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09715799242258072,
"step": 1720,
"valid_targets_mean": 1333.2,
"valid_targets_min": 632
},
{
"epoch": 2.402506963788301,
"grad_norm": 0.8444689746099655,
"learning_rate": 3.322842542187669e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10113231092691422,
"step": 1725,
"valid_targets_mean": 1602.9,
"valid_targets_min": 875
},
{
"epoch": 2.4094707520891365,
"grad_norm": 1.1270431114328114,
"learning_rate": 3.317625111660605e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1020176112651825,
"step": 1730,
"valid_targets_mean": 1340.4,
"valid_targets_min": 701
},
{
"epoch": 2.416434540389972,
"grad_norm": 0.7839393431669954,
"learning_rate": 3.3123917891537085e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11173247545957565,
"step": 1735,
"valid_targets_mean": 1792.9,
"valid_targets_min": 898
},
{
"epoch": 2.4233983286908076,
"grad_norm": 0.7608101315047425,
"learning_rate": 3.307142637786496e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09726438671350479,
"step": 1740,
"valid_targets_mean": 1433.1,
"valid_targets_min": 1070
},
{
"epoch": 2.4303621169916436,
"grad_norm": 0.851244310222369,
"learning_rate": 3.3018777208693916e-05,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10597909986972809,
"step": 1745,
"valid_targets_mean": 1589.5,
"valid_targets_min": 970
},
{
"epoch": 2.437325905292479,
"grad_norm": 0.7562891748345674,
"learning_rate": 3.2965971019029716e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08589346706867218,
"step": 1750,
"valid_targets_mean": 1270.5,
"valid_targets_min": 648
},
{
"epoch": 2.4442896935933147,
"grad_norm": 0.8072271025740217,
"learning_rate": 3.291300844577196e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1143551915884018,
"step": 1755,
"valid_targets_mean": 1674.5,
"valid_targets_min": 727
},
{
"epoch": 2.4512534818941503,
"grad_norm": 0.8040766542030429,
"learning_rate": 3.28598901277064e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07331328094005585,
"step": 1760,
"valid_targets_mean": 1406.0,
"valid_targets_min": 770
},
{
"epoch": 2.4582172701949863,
"grad_norm": 0.7600004146401925,
"learning_rate": 3.280661670549723e-05,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08032012730836868,
"step": 1765,
"valid_targets_mean": 1381.2,
"valid_targets_min": 572
},
{
"epoch": 2.465181058495822,
"grad_norm": 0.8186128164361567,
"learning_rate": 3.275318882167938e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11326928436756134,
"step": 1770,
"valid_targets_mean": 1580.4,
"valid_targets_min": 633
},
{
"epoch": 2.4721448467966574,
"grad_norm": 0.7878473077583293,
"learning_rate": 3.269960712065074e-05,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09199025481939316,
"step": 1775,
"valid_targets_mean": 1478.8,
"valid_targets_min": 923
},
{
"epoch": 2.479108635097493,
"grad_norm": 0.7408103486539382,
"learning_rate": 3.264587224866442e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08334987610578537,
"step": 1780,
"valid_targets_mean": 1401.0,
"valid_targets_min": 740
},
{
"epoch": 2.486072423398329,
"grad_norm": 0.7785323575154897,
"learning_rate": 3.2591984853820926e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08059869706630707,
"step": 1785,
"valid_targets_mean": 1588.9,
"valid_targets_min": 870
},
{
"epoch": 2.4930362116991645,
"grad_norm": 0.7501213652690097,
"learning_rate": 3.2537945586060336e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12979084253311157,
"step": 1790,
"valid_targets_mean": 2008.4,
"valid_targets_min": 1042
},
{
"epoch": 2.5,
"grad_norm": 0.769300550573875,
"learning_rate": 3.248375509715452e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07505079358816147,
"step": 1795,
"valid_targets_mean": 1209.0,
"valid_targets_min": 870
},
{
"epoch": 2.5069637883008355,
"grad_norm": 0.8297708977009772,
"learning_rate": 3.242941404069921e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09335260093212128,
"step": 1800,
"valid_targets_mean": 1535.5,
"valid_targets_min": 740
},
{
"epoch": 2.513927576601671,
"grad_norm": 0.731844058605371,
"learning_rate": 3.237492307210614e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09308585524559021,
"step": 1805,
"valid_targets_mean": 1642.9,
"valid_targets_min": 906
},
{
"epoch": 2.520891364902507,
"grad_norm": 0.8193149089522122,
"learning_rate": 3.2320282848595174e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09537345170974731,
"step": 1810,
"valid_targets_mean": 1570.5,
"valid_targets_min": 814
},
{
"epoch": 2.5278551532033426,
"grad_norm": 0.8371651941131215,
"learning_rate": 3.226549402918631e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08008214086294174,
"step": 1815,
"valid_targets_mean": 1722.1,
"valid_targets_min": 832
},
{
"epoch": 2.534818941504178,
"grad_norm": 0.7018441413273226,
"learning_rate": 3.221055727469182e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06970568746328354,
"step": 1820,
"valid_targets_mean": 1453.5,
"valid_targets_min": 891
},
{
"epoch": 2.541782729805014,
"grad_norm": 0.7963146448093934,
"learning_rate": 3.21554732477082e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11181323230266571,
"step": 1825,
"valid_targets_mean": 1584.4,
"valid_targets_min": 734
},
{
"epoch": 2.5487465181058497,
"grad_norm": 0.7592311759031534,
"learning_rate": 3.2100242612608213e-05,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08187158405780792,
"step": 1830,
"valid_targets_mean": 1495.2,
"valid_targets_min": 737
},
{
"epoch": 2.5557103064066853,
"grad_norm": 0.773359400074154,
"learning_rate": 3.204486603553289e-05,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0989374965429306,
"step": 1835,
"valid_targets_mean": 1737.0,
"valid_targets_min": 872
},
{
"epoch": 2.562674094707521,
"grad_norm": 0.7743236506768809,
"learning_rate": 3.1989344184383476e-05,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09391649067401886,
"step": 1840,
"valid_targets_mean": 1431.6,
"valid_targets_min": 805
},
{
"epoch": 2.5696378830083564,
"grad_norm": 0.7358590006225955,
"learning_rate": 3.1933677728813364e-05,
"loss": 0.1816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10584774613380432,
"step": 1845,
"valid_targets_mean": 2060.2,
"valid_targets_min": 1253
},
{
"epoch": 2.5766016713091924,
"grad_norm": 0.7193105312572781,
"learning_rate": 3.1877867340220045e-05,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10305032879114151,
"step": 1850,
"valid_targets_mean": 2063.9,
"valid_targets_min": 1264
},
{
"epoch": 2.583565459610028,
"grad_norm": 0.7695266994780475,
"learning_rate": 3.1821913691736995e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0683041363954544,
"step": 1855,
"valid_targets_mean": 1036.5,
"valid_targets_min": 613
},
{
"epoch": 2.5905292479108635,
"grad_norm": 0.7101389867132969,
"learning_rate": 3.1765817458225546e-05,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08477064967155457,
"step": 1860,
"valid_targets_mean": 1674.4,
"valid_targets_min": 768
},
{
"epoch": 2.597493036211699,
"grad_norm": 0.8599774854634431,
"learning_rate": 3.170957931626679e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.080399289727211,
"step": 1865,
"valid_targets_mean": 1249.8,
"valid_targets_min": 714
},
{
"epoch": 2.6044568245125346,
"grad_norm": 0.7993028212492834,
"learning_rate": 3.165319994415336e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06606724113225937,
"step": 1870,
"valid_targets_mean": 1114.8,
"valid_targets_min": 800
},
{
"epoch": 2.6114206128133706,
"grad_norm": 0.7781447333017487,
"learning_rate": 3.159668002188128e-05,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10036128759384155,
"step": 1875,
"valid_targets_mean": 1780.9,
"valid_targets_min": 933
},
{
"epoch": 2.618384401114206,
"grad_norm": 0.8858832068872401,
"learning_rate": 3.1540020231141774e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07642105966806412,
"step": 1880,
"valid_targets_mean": 1113.6,
"valid_targets_min": 746
},
{
"epoch": 2.6253481894150417,
"grad_norm": 0.8236948964912306,
"learning_rate": 3.148322125531302e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09135651588439941,
"step": 1885,
"valid_targets_mean": 1265.0,
"valid_targets_min": 814
},
{
"epoch": 2.6323119777158777,
"grad_norm": 0.7402380099739323,
"learning_rate": 3.142628377945191e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10815448313951492,
"step": 1890,
"valid_targets_mean": 1652.1,
"valid_targets_min": 635
},
{
"epoch": 2.639275766016713,
"grad_norm": 0.7766341389183821,
"learning_rate": 3.1369208490285824e-05,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06988343596458435,
"step": 1895,
"valid_targets_mean": 1231.2,
"valid_targets_min": 739
},
{
"epoch": 2.6462395543175488,
"grad_norm": 0.790490819348294,
"learning_rate": 3.13119960762043e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10846837610006332,
"step": 1900,
"valid_targets_mean": 1682.4,
"valid_targets_min": 831
},
{
"epoch": 2.6532033426183843,
"grad_norm": 0.8701861923326255,
"learning_rate": 3.125464722725074e-05,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08927632868289948,
"step": 1905,
"valid_targets_mean": 1571.6,
"valid_targets_min": 1015
},
{
"epoch": 2.66016713091922,
"grad_norm": 0.7672559496303158,
"learning_rate": 3.119716263511412e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07645729184150696,
"step": 1910,
"valid_targets_mean": 1276.8,
"valid_targets_min": 711
},
{
"epoch": 2.667130919220056,
"grad_norm": 0.7633251851517129,
"learning_rate": 3.1139542993120615e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05591302365064621,
"step": 1915,
"valid_targets_mean": 1147.5,
"valid_targets_min": 733
},
{
"epoch": 2.6740947075208914,
"grad_norm": 0.8548710751284283,
"learning_rate": 3.108178899622524e-05,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11267301440238953,
"step": 1920,
"valid_targets_mean": 1604.0,
"valid_targets_min": 953
},
{
"epoch": 2.681058495821727,
"grad_norm": 0.7154752716285275,
"learning_rate": 3.102390134100349e-05,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08892469853162766,
"step": 1925,
"valid_targets_mean": 1784.0,
"valid_targets_min": 1011
},
{
"epoch": 2.688022284122563,
"grad_norm": 0.7886303529310777,
"learning_rate": 3.096588072564291e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10861388593912125,
"step": 1930,
"valid_targets_mean": 1729.0,
"valid_targets_min": 1143
},
{
"epoch": 2.6949860724233985,
"grad_norm": 0.7782781896814367,
"learning_rate": 3.09077278499347e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0805855244398117,
"step": 1935,
"valid_targets_mean": 1483.9,
"valid_targets_min": 699
},
{
"epoch": 2.701949860724234,
"grad_norm": 0.7716708466878998,
"learning_rate": 3.084944341526524e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07467707991600037,
"step": 1940,
"valid_targets_mean": 1198.4,
"valid_targets_min": 680
},
{
"epoch": 2.7089136490250696,
"grad_norm": 0.7956657891036718,
"learning_rate": 3.079102812460769e-05,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08717083930969238,
"step": 1945,
"valid_targets_mean": 1365.2,
"valid_targets_min": 687
},
{
"epoch": 2.715877437325905,
"grad_norm": 0.8040752534275205,
"learning_rate": 3.0732482682513435e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06229158490896225,
"step": 1950,
"valid_targets_mean": 1142.9,
"valid_targets_min": 835
},
{
"epoch": 2.722841225626741,
"grad_norm": 0.7747436174550746,
"learning_rate": 3.067380779510365e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07470732927322388,
"step": 1955,
"valid_targets_mean": 1316.9,
"valid_targets_min": 829
},
{
"epoch": 2.7298050139275767,
"grad_norm": 0.7825972178164834,
"learning_rate": 3.061500417006076e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09210141003131866,
"step": 1960,
"valid_targets_mean": 1739.2,
"valid_targets_min": 1138
},
{
"epoch": 2.7367688022284122,
"grad_norm": 0.696392311199642,
"learning_rate": 3.0556072516619896e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07831001281738281,
"step": 1965,
"valid_targets_mean": 1592.2,
"valid_targets_min": 1174
},
{
"epoch": 2.743732590529248,
"grad_norm": 0.7770652602858239,
"learning_rate": 3.0497013545560354e-05,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08863939344882965,
"step": 1970,
"valid_targets_mean": 1543.1,
"valid_targets_min": 554
},
{
"epoch": 2.7506963788300833,
"grad_norm": 0.7372103268972405,
"learning_rate": 3.043782796919701e-05,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08466736972332001,
"step": 1975,
"valid_targets_mean": 1430.0,
"valid_targets_min": 843
},
{
"epoch": 2.7576601671309193,
"grad_norm": 0.7288721894678064,
"learning_rate": 3.0378516501371752e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08267127722501755,
"step": 1980,
"valid_targets_mean": 1622.9,
"valid_targets_min": 849
},
{
"epoch": 2.764623955431755,
"grad_norm": 0.819855661582502,
"learning_rate": 3.0319079857444844e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08106249570846558,
"step": 1985,
"valid_targets_mean": 1429.0,
"valid_targets_min": 612
},
{
"epoch": 2.7715877437325904,
"grad_norm": 0.7552847804482032,
"learning_rate": 3.0259518754286302e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07017084956169128,
"step": 1990,
"valid_targets_mean": 1283.0,
"valid_targets_min": 782
},
{
"epoch": 2.7785515320334264,
"grad_norm": 0.8464332743776155,
"learning_rate": 3.0199833910267286e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09966123104095459,
"step": 1995,
"valid_targets_mean": 1457.0,
"valid_targets_min": 926
},
{
"epoch": 2.785515320334262,
"grad_norm": 0.7123507198714567,
"learning_rate": 3.0140026045251357e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0700862854719162,
"step": 2000,
"valid_targets_mean": 1399.6,
"valid_targets_min": 822
},
{
"epoch": 2.7924791086350975,
"grad_norm": 0.7070416875399016,
"learning_rate": 3.0080095880585884e-05,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07886691391468048,
"step": 2005,
"valid_targets_mean": 1464.6,
"valid_targets_min": 670
},
{
"epoch": 2.799442896935933,
"grad_norm": 0.7839739267460378,
"learning_rate": 3.002004413909326e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08037430047988892,
"step": 2010,
"valid_targets_mean": 1504.8,
"valid_targets_min": 647
},
{
"epoch": 2.8064066852367686,
"grad_norm": 0.7325386392599472,
"learning_rate": 2.995987154506228e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06354961544275284,
"step": 2015,
"valid_targets_mean": 1276.9,
"valid_targets_min": 791
},
{
"epoch": 2.8133704735376046,
"grad_norm": 0.7963527637303378,
"learning_rate": 2.98995788242393e-05,
"loss": 0.1682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07502847909927368,
"step": 2020,
"valid_targets_mean": 1291.4,
"valid_targets_min": 746
},
{
"epoch": 2.82033426183844,
"grad_norm": 0.7325341255976993,
"learning_rate": 2.9839166703819572e-05,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06790463626384735,
"step": 2025,
"valid_targets_mean": 1409.1,
"valid_targets_min": 892
},
{
"epoch": 2.8272980501392757,
"grad_norm": 1.0267772645703437,
"learning_rate": 2.97786359124384e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10208472609519958,
"step": 2030,
"valid_targets_mean": 1581.9,
"valid_targets_min": 914
},
{
"epoch": 2.8342618384401113,
"grad_norm": 0.7487266217807981,
"learning_rate": 2.971798718016242e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07919836044311523,
"step": 2035,
"valid_targets_mean": 1647.6,
"valid_targets_min": 636
},
{
"epoch": 2.841225626740947,
"grad_norm": 0.9158258240874332,
"learning_rate": 2.9657221238480746e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0867113322019577,
"step": 2040,
"valid_targets_mean": 1523.5,
"valid_targets_min": 641
},
{
"epoch": 2.848189415041783,
"grad_norm": 0.8495953544791401,
"learning_rate": 2.9596338820296163e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09921315312385559,
"step": 2045,
"valid_targets_mean": 1629.4,
"valid_targets_min": 1020
},
{
"epoch": 2.8551532033426184,
"grad_norm": 1.1190071551544958,
"learning_rate": 2.953534065991631e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08030430972576141,
"step": 2050,
"valid_targets_mean": 1163.4,
"valid_targets_min": 729
},
{
"epoch": 2.862116991643454,
"grad_norm": 0.7607775978376603,
"learning_rate": 2.947422749304476e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10393047332763672,
"step": 2055,
"valid_targets_mean": 1613.2,
"valid_targets_min": 1001
},
{
"epoch": 2.86908077994429,
"grad_norm": 0.783991662666305,
"learning_rate": 2.9413000056772225e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0888073593378067,
"step": 2060,
"valid_targets_mean": 1567.0,
"valid_targets_min": 1175
},
{
"epoch": 2.8760445682451254,
"grad_norm": 0.7826353186492123,
"learning_rate": 2.9351659089567622e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10893246531486511,
"step": 2065,
"valid_targets_mean": 1609.0,
"valid_targets_min": 892
},
{
"epoch": 2.883008356545961,
"grad_norm": 0.7934696501334912,
"learning_rate": 2.9290205331269158e-05,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08275732398033142,
"step": 2070,
"valid_targets_mean": 1425.2,
"valid_targets_min": 801
},
{
"epoch": 2.8899721448467965,
"grad_norm": 0.7172842896059596,
"learning_rate": 2.9228639523075432e-05,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08390860259532928,
"step": 2075,
"valid_targets_mean": 1462.4,
"valid_targets_min": 564
},
{
"epoch": 2.896935933147632,
"grad_norm": 0.8356533188243083,
"learning_rate": 2.9166962407536496e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08387964218854904,
"step": 2080,
"valid_targets_mean": 1749.1,
"valid_targets_min": 651
},
{
"epoch": 2.903899721448468,
"grad_norm": 0.780853509813084,
"learning_rate": 2.910517472854487e-05,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07162684202194214,
"step": 2085,
"valid_targets_mean": 1161.0,
"valid_targets_min": 716
},
{
"epoch": 2.9108635097493036,
"grad_norm": 0.7403317269239412,
"learning_rate": 2.9043277231326606e-05,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08211035281419754,
"step": 2090,
"valid_targets_mean": 1425.6,
"valid_targets_min": 744
},
{
"epoch": 2.917827298050139,
"grad_norm": 0.7512823712045082,
"learning_rate": 2.8981270662432258e-05,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0736178457736969,
"step": 2095,
"valid_targets_mean": 1391.1,
"valid_targets_min": 1218
},
{
"epoch": 2.924791086350975,
"grad_norm": 0.8217643276597543,
"learning_rate": 2.8919155769727932e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09656500816345215,
"step": 2100,
"valid_targets_mean": 1724.5,
"valid_targets_min": 793
},
{
"epoch": 2.9317548746518107,
"grad_norm": 0.7855411813191986,
"learning_rate": 2.8856933302386224e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07395291328430176,
"step": 2105,
"valid_targets_mean": 1366.8,
"valid_targets_min": 846
},
{
"epoch": 2.9387186629526463,
"grad_norm": 0.9080574970183085,
"learning_rate": 2.879460401087718e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09661687910556793,
"step": 2110,
"valid_targets_mean": 1772.1,
"valid_targets_min": 979
},
{
"epoch": 2.945682451253482,
"grad_norm": 0.7185745540261005,
"learning_rate": 2.873216864695928e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09203220903873444,
"step": 2115,
"valid_targets_mean": 1778.9,
"valid_targets_min": 1093
},
{
"epoch": 2.9526462395543174,
"grad_norm": 0.8058469860251909,
"learning_rate": 2.8669627963670348e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0805043950676918,
"step": 2120,
"valid_targets_mean": 1510.8,
"valid_targets_min": 595
},
{
"epoch": 2.9596100278551534,
"grad_norm": 0.8161844468728507,
"learning_rate": 2.8606982715318467e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08108193427324295,
"step": 2125,
"valid_targets_mean": 1330.4,
"valid_targets_min": 868
},
{
"epoch": 2.966573816155989,
"grad_norm": 0.8048088395167377,
"learning_rate": 2.8544233657472893e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10407143086194992,
"step": 2130,
"valid_targets_mean": 1504.2,
"valid_targets_min": 914
},
{
"epoch": 2.9735376044568245,
"grad_norm": 0.7696287813690902,
"learning_rate": 2.8481381546954944e-05,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10349928587675095,
"step": 2135,
"valid_targets_mean": 1972.9,
"valid_targets_min": 1080
},
{
"epoch": 2.98050139275766,
"grad_norm": 0.7248553330646451,
"learning_rate": 2.8418427141828836e-05,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08698803186416626,
"step": 2140,
"valid_targets_mean": 1519.6,
"valid_targets_min": 658
},
{
"epoch": 2.9874651810584956,
"grad_norm": 0.8081002064785113,
"learning_rate": 2.835537120139261e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07442046701908112,
"step": 2145,
"valid_targets_mean": 1362.0,
"valid_targets_min": 1018
},
{
"epoch": 2.9944289693593316,
"grad_norm": 0.7441884200422766,
"learning_rate": 2.8292214486168887e-05,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1013420969247818,
"step": 2150,
"valid_targets_mean": 1623.0,
"valid_targets_min": 1041
},
{
"epoch": 3.001392757660167,
"grad_norm": 0.582670213892772,
"learning_rate": 2.8228957757895787e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10588406026363373,
"step": 2155,
"valid_targets_mean": 8215.2,
"valid_targets_min": 6163
},
{
"epoch": 3.0083565459610027,
"grad_norm": 0.45807589528981335,
"learning_rate": 2.816560177951765e-05,
"loss": 0.214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10979750752449036,
"step": 2160,
"valid_targets_mean": 8594.4,
"valid_targets_min": 6006
},
{
"epoch": 3.0153203342618387,
"grad_norm": 0.5425898684830011,
"learning_rate": 2.810214731517592e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0921827107667923,
"step": 2165,
"valid_targets_mean": 3578.4,
"valid_targets_min": 289
},
{
"epoch": 3.022284122562674,
"grad_norm": 0.41010535238599494,
"learning_rate": 2.8038595130199846e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10162421315908432,
"step": 2170,
"valid_targets_mean": 7019.9,
"valid_targets_min": 4985
},
{
"epoch": 3.0292479108635098,
"grad_norm": 0.408252787870625,
"learning_rate": 2.7974945991097343e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09866312146186829,
"step": 2175,
"valid_targets_mean": 6956.6,
"valid_targets_min": 1457
},
{
"epoch": 3.0362116991643453,
"grad_norm": 0.376422224239574,
"learning_rate": 2.791120066554565e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09282627701759338,
"step": 2180,
"valid_targets_mean": 7361.6,
"valid_targets_min": 4961
},
{
"epoch": 3.043175487465181,
"grad_norm": 0.4174310411579024,
"learning_rate": 2.7847359922382154e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12435085326433182,
"step": 2185,
"valid_targets_mean": 7058.5,
"valid_targets_min": 5985
},
{
"epoch": 3.050139275766017,
"grad_norm": 0.40649864588422974,
"learning_rate": 2.7783424531595057e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11022967100143433,
"step": 2190,
"valid_targets_mean": 7664.2,
"valid_targets_min": 5169
},
{
"epoch": 3.0571030640668524,
"grad_norm": 0.3894067905652123,
"learning_rate": 2.7719395264314125e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09706021845340729,
"step": 2195,
"valid_targets_mean": 7111.8,
"valid_targets_min": 5348
},
{
"epoch": 3.064066852367688,
"grad_norm": 0.4571915199208844,
"learning_rate": 2.7655272892801376e-05,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0859590619802475,
"step": 2200,
"valid_targets_mean": 4238.9,
"valid_targets_min": 152
},
{
"epoch": 3.0710306406685235,
"grad_norm": 0.442146850622646,
"learning_rate": 2.7591058190441754e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0988345593214035,
"step": 2205,
"valid_targets_mean": 7199.4,
"valid_targets_min": 4258
},
{
"epoch": 3.0779944289693595,
"grad_norm": 0.3888970877948061,
"learning_rate": 2.7526751931733824e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09356151521205902,
"step": 2210,
"valid_targets_mean": 7243.4,
"valid_targets_min": 5831
},
{
"epoch": 3.084958217270195,
"grad_norm": 0.3880326891417797,
"learning_rate": 2.7462354892280428e-05,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09559017419815063,
"step": 2215,
"valid_targets_mean": 6950.6,
"valid_targets_min": 3862
},
{
"epoch": 3.0919220055710306,
"grad_norm": 0.38716280782428913,
"learning_rate": 2.7397867848779296e-05,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10002546012401581,
"step": 2220,
"valid_targets_mean": 6991.9,
"valid_targets_min": 5696
},
{
"epoch": 3.098885793871866,
"grad_norm": 0.3892772405020075,
"learning_rate": 2.733329157901373e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1018202155828476,
"step": 2225,
"valid_targets_mean": 6963.5,
"valid_targets_min": 4947
},
{
"epoch": 3.105849582172702,
"grad_norm": 0.3954300382500997,
"learning_rate": 2.7268626861843176e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08901640772819519,
"step": 2230,
"valid_targets_mean": 6436.9,
"valid_targets_min": 4988
},
{
"epoch": 3.1128133704735377,
"grad_norm": 0.38253440455307475,
"learning_rate": 2.7203874477193867e-05,
"loss": 0.1905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09357216954231262,
"step": 2235,
"valid_targets_mean": 7518.0,
"valid_targets_min": 5476
},
{
"epoch": 3.1197771587743732,
"grad_norm": 0.37760495023063456,
"learning_rate": 2.7139035206049392e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0883115828037262,
"step": 2240,
"valid_targets_mean": 7422.6,
"valid_targets_min": 5226
},
{
"epoch": 3.1267409470752088,
"grad_norm": 0.4492359216101069,
"learning_rate": 2.707410983044128e-05,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12339232116937637,
"step": 2245,
"valid_targets_mean": 7080.0,
"valid_targets_min": 3753
},
{
"epoch": 3.1337047353760448,
"grad_norm": 0.478752949833473,
"learning_rate": 2.7009099133439588e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10847386717796326,
"step": 2250,
"valid_targets_mean": 6064.6,
"valid_targets_min": 5161
},
{
"epoch": 3.1406685236768803,
"grad_norm": 0.41876052780288764,
"learning_rate": 2.6944003899143424e-05,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09066791832447052,
"step": 2255,
"valid_targets_mean": 7388.1,
"valid_targets_min": 5795
},
{
"epoch": 3.147632311977716,
"grad_norm": 0.4035596406534088,
"learning_rate": 2.6878824912671526e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0864686593413353,
"step": 2260,
"valid_targets_mean": 7696.0,
"valid_targets_min": 4658
},
{
"epoch": 3.1545961002785514,
"grad_norm": 0.3924938647790918,
"learning_rate": 2.6813562960152754e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10020910203456879,
"step": 2265,
"valid_targets_mean": 7799.1,
"valid_targets_min": 5508
},
{
"epoch": 3.1615598885793874,
"grad_norm": 0.39783779066844704,
"learning_rate": 2.6748218828716637e-05,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0940442681312561,
"step": 2270,
"valid_targets_mean": 7341.6,
"valid_targets_min": 6454
},
{
"epoch": 3.168523676880223,
"grad_norm": 0.40685251066765943,
"learning_rate": 2.6682793306483875e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08199045807123184,
"step": 2275,
"valid_targets_mean": 6818.0,
"valid_targets_min": 4392
},
{
"epoch": 3.1754874651810585,
"grad_norm": 0.3774943376487801,
"learning_rate": 2.6617287182556818e-05,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08261384814977646,
"step": 2280,
"valid_targets_mean": 7857.6,
"valid_targets_min": 5394
},
{
"epoch": 3.182451253481894,
"grad_norm": 0.3962509851654937,
"learning_rate": 2.6551701247009974e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07782858610153198,
"step": 2285,
"valid_targets_mean": 8314.1,
"valid_targets_min": 4837
},
{
"epoch": 3.1894150417827296,
"grad_norm": 0.3805935986013425,
"learning_rate": 2.6486036290880447e-05,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07052335143089294,
"step": 2290,
"valid_targets_mean": 7368.2,
"valid_targets_min": 6027
},
{
"epoch": 3.1963788300835656,
"grad_norm": 0.4494256622684818,
"learning_rate": 2.6420293106158425e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09394653886556625,
"step": 2295,
"valid_targets_mean": 6435.0,
"valid_targets_min": 4238
},
{
"epoch": 3.203342618384401,
"grad_norm": 1.3891357549119348,
"learning_rate": 2.6354472485777627e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05725764483213425,
"step": 2300,
"valid_targets_mean": 247.8,
"valid_targets_min": 137
},
{
"epoch": 3.2103064066852367,
"grad_norm": 0.44440730067879897,
"learning_rate": 2.6288575223605703e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09099040925502777,
"step": 2305,
"valid_targets_mean": 6807.0,
"valid_targets_min": 5165
},
{
"epoch": 3.2172701949860723,
"grad_norm": 0.47854206372685043,
"learning_rate": 2.622260211443471e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10358612984418869,
"step": 2310,
"valid_targets_mean": 6989.9,
"valid_targets_min": 5104
},
{
"epoch": 3.2242339832869082,
"grad_norm": 0.40218643285685773,
"learning_rate": 2.615655395397149e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10578115284442902,
"step": 2315,
"valid_targets_mean": 6692.2,
"valid_targets_min": 5068
},
{
"epoch": 3.231197771587744,
"grad_norm": 0.4823984099669414,
"learning_rate": 2.6090431538828095e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11674507707357407,
"step": 2320,
"valid_targets_mean": 7419.6,
"valid_targets_min": 5578
},
{
"epoch": 3.2381615598885793,
"grad_norm": 0.3808006367102266,
"learning_rate": 2.6024235666512154e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09444583207368851,
"step": 2325,
"valid_targets_mean": 7536.5,
"valid_targets_min": 5075
},
{
"epoch": 3.245125348189415,
"grad_norm": 0.3735886845835376,
"learning_rate": 2.5957967135417272e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08822908252477646,
"step": 2330,
"valid_targets_mean": 7221.5,
"valid_targets_min": 5841
},
{
"epoch": 3.252089136490251,
"grad_norm": 0.38530492214279993,
"learning_rate": 2.5891626744813413e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0928116887807846,
"step": 2335,
"valid_targets_mean": 7287.5,
"valid_targets_min": 5151
},
{
"epoch": 3.2590529247910864,
"grad_norm": 0.431169270507617,
"learning_rate": 2.5825215294837213e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09144345670938492,
"step": 2340,
"valid_targets_mean": 6738.4,
"valid_targets_min": 4042
},
{
"epoch": 3.266016713091922,
"grad_norm": 0.42057933866822494,
"learning_rate": 2.5758733586482402e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10509088635444641,
"step": 2345,
"valid_targets_mean": 6331.0,
"valid_targets_min": 5496
},
{
"epoch": 3.2729805013927575,
"grad_norm": 0.43887987652105004,
"learning_rate": 2.5692182421590062e-05,
"loss": 0.1905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0931042730808258,
"step": 2350,
"valid_targets_mean": 6271.1,
"valid_targets_min": 4695
},
{
"epoch": 3.279944289693593,
"grad_norm": 0.6506631337130584,
"learning_rate": 2.5625562602839024e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09925953298807144,
"step": 2355,
"valid_targets_mean": 5790.8,
"valid_targets_min": 5021
},
{
"epoch": 3.286908077994429,
"grad_norm": 0.5048077739195413,
"learning_rate": 2.555887493373614e-05,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07177004218101501,
"step": 2360,
"valid_targets_mean": 3386.8,
"valid_targets_min": 2279
},
{
"epoch": 3.2938718662952646,
"grad_norm": 0.6120098262207729,
"learning_rate": 2.549212021860662e-05,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09277001023292542,
"step": 2365,
"valid_targets_mean": 6240.5,
"valid_targets_min": 5093
},
{
"epoch": 3.3008356545961,
"grad_norm": 0.7108808669473043,
"learning_rate": 2.542529926258433e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09597060084342957,
"step": 2370,
"valid_targets_mean": 6329.5,
"valid_targets_min": 4589
},
{
"epoch": 3.307799442896936,
"grad_norm": 0.3884309764014742,
"learning_rate": 2.5358412871602046e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0994221642613411,
"step": 2375,
"valid_targets_mean": 7589.2,
"valid_targets_min": 4963
},
{
"epoch": 3.3147632311977717,
"grad_norm": 0.43936327155895843,
"learning_rate": 2.5291461852381788e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07934075593948364,
"step": 2380,
"valid_targets_mean": 5577.9,
"valid_targets_min": 4458
},
{
"epoch": 3.3217270194986073,
"grad_norm": 0.4459328442427666,
"learning_rate": 2.522444701242505e-05,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0892050564289093,
"step": 2385,
"valid_targets_mean": 5432.5,
"valid_targets_min": 4433
},
{
"epoch": 3.328690807799443,
"grad_norm": 0.5161665476844713,
"learning_rate": 2.5157369160003066e-05,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09683055430650711,
"step": 2390,
"valid_targets_mean": 6361.8,
"valid_targets_min": 5201
},
{
"epoch": 3.3356545961002784,
"grad_norm": 0.45408075599291947,
"learning_rate": 2.509022910414708e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08833605796098709,
"step": 2395,
"valid_targets_mean": 5824.4,
"valid_targets_min": 5129
},
{
"epoch": 3.3426183844011144,
"grad_norm": 0.7702050101973215,
"learning_rate": 2.5023027654638576e-05,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10458929091691971,
"step": 2400,
"valid_targets_mean": 1637.6,
"valid_targets_min": 137
},
{
"epoch": 3.34958217270195,
"grad_norm": 0.4785675018453149,
"learning_rate": 2.4955765621999505e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09321224689483643,
"step": 2405,
"valid_targets_mean": 6474.6,
"valid_targets_min": 4751
},
{
"epoch": 3.3565459610027855,
"grad_norm": 0.413066098207994,
"learning_rate": 2.4888443817482517e-05,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10013020038604736,
"step": 2410,
"valid_targets_mean": 7186.2,
"valid_targets_min": 5358
},
{
"epoch": 3.363509749303621,
"grad_norm": 0.3906129731653948,
"learning_rate": 2.4821063053061184e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09480290114879608,
"step": 2415,
"valid_targets_mean": 7126.8,
"valid_targets_min": 4078
},
{
"epoch": 3.370473537604457,
"grad_norm": 0.45841696400076865,
"learning_rate": 2.4753624141420182e-05,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09096138924360275,
"step": 2420,
"valid_targets_mean": 7022.1,
"valid_targets_min": 4940
},
{
"epoch": 3.3774373259052926,
"grad_norm": 0.4351904530245512,
"learning_rate": 2.4686127895945517e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09502632170915604,
"step": 2425,
"valid_targets_mean": 5900.6,
"valid_targets_min": 4779
},
{
"epoch": 3.384401114206128,
"grad_norm": 0.47258906281645247,
"learning_rate": 2.4618575130714707e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09541469812393188,
"step": 2430,
"valid_targets_mean": 6290.1,
"valid_targets_min": 4620
},
{
"epoch": 3.3913649025069637,
"grad_norm": 0.886229632768184,
"learning_rate": 2.4550966660486944e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07395320385694504,
"step": 2435,
"valid_targets_mean": 1162.2,
"valid_targets_min": 788
},
{
"epoch": 3.3983286908077996,
"grad_norm": 0.7835854833673302,
"learning_rate": 2.4483303300693296e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08432234823703766,
"step": 2440,
"valid_targets_mean": 1500.6,
"valid_targets_min": 957
},
{
"epoch": 3.405292479108635,
"grad_norm": 0.7364784582289423,
"learning_rate": 2.4415585867426854e-05,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07511076331138611,
"step": 2445,
"valid_targets_mean": 1371.2,
"valid_targets_min": 796
},
{
"epoch": 3.4122562674094707,
"grad_norm": 0.9103744401835016,
"learning_rate": 2.434781517743289e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09593386203050613,
"step": 2450,
"valid_targets_mean": 1433.6,
"valid_targets_min": 697
},
{
"epoch": 3.4192200557103063,
"grad_norm": 0.7736223123121384,
"learning_rate": 2.4279992048099016e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07917076349258423,
"step": 2455,
"valid_targets_mean": 1578.9,
"valid_targets_min": 638
},
{
"epoch": 3.426183844011142,
"grad_norm": 0.7034601262769054,
"learning_rate": 2.4212117297445307e-05,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07970526069402695,
"step": 2460,
"valid_targets_mean": 1746.4,
"valid_targets_min": 727
},
{
"epoch": 3.433147632311978,
"grad_norm": 0.7382178076531261,
"learning_rate": 2.4144191744114457e-05,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06873296201229095,
"step": 2465,
"valid_targets_mean": 1309.9,
"valid_targets_min": 761
},
{
"epoch": 3.4401114206128134,
"grad_norm": 0.8425832615711547,
"learning_rate": 2.4076216207361904e-05,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09206151962280273,
"step": 2470,
"valid_targets_mean": 1368.6,
"valid_targets_min": 714
},
{
"epoch": 3.447075208913649,
"grad_norm": 0.8395407250078996,
"learning_rate": 2.4008191507045913e-05,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08047881722450256,
"step": 2475,
"valid_targets_mean": 1491.8,
"valid_targets_min": 867
},
{
"epoch": 3.4540389972144845,
"grad_norm": 0.7755881495928278,
"learning_rate": 2.3940118463617745e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09353938698768616,
"step": 2480,
"valid_targets_mean": 1994.0,
"valid_targets_min": 790
},
{
"epoch": 3.4610027855153205,
"grad_norm": 0.7814533436270437,
"learning_rate": 2.3871997898111707e-05,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08098438382148743,
"step": 2485,
"valid_targets_mean": 1523.4,
"valid_targets_min": 896
},
{
"epoch": 3.467966573816156,
"grad_norm": 0.8288270044083298,
"learning_rate": 2.3803830632135284e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08329111337661743,
"step": 2490,
"valid_targets_mean": 1790.1,
"valid_targets_min": 1009
},
{
"epoch": 3.4749303621169916,
"grad_norm": 0.7061032285936508,
"learning_rate": 2.3735617487859224e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06442536413669586,
"step": 2495,
"valid_targets_mean": 1394.0,
"valid_targets_min": 717
},
{
"epoch": 3.481894150417827,
"grad_norm": 0.9020364718977384,
"learning_rate": 2.3667359288007612e-05,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06079908832907677,
"step": 2500,
"valid_targets_mean": 1129.0,
"valid_targets_min": 659
},
{
"epoch": 3.488857938718663,
"grad_norm": 0.7566586323370277,
"learning_rate": 2.3599056855847937e-05,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07075653970241547,
"step": 2505,
"valid_targets_mean": 1466.9,
"valid_targets_min": 642
},
{
"epoch": 3.4958217270194987,
"grad_norm": 0.7734326889825535,
"learning_rate": 2.353071101518121e-05,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054345741868019104,
"step": 2510,
"valid_targets_mean": 1129.4,
"valid_targets_min": 765
},
{
"epoch": 3.502785515320334,
"grad_norm": 0.804981371612974,
"learning_rate": 2.346232259033196e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07415035367012024,
"step": 2515,
"valid_targets_mean": 1322.8,
"valid_targets_min": 631
},
{
"epoch": 3.5097493036211698,
"grad_norm": 0.9012347000535628,
"learning_rate": 2.3393892406138354e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09443515539169312,
"step": 2520,
"valid_targets_mean": 1612.0,
"valid_targets_min": 623
},
{
"epoch": 3.5167130919220053,
"grad_norm": 0.8529475358392916,
"learning_rate": 2.332542128794221e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060877248644828796,
"step": 2525,
"valid_targets_mean": 1402.1,
"valid_targets_min": 940
},
{
"epoch": 3.5236768802228413,
"grad_norm": 0.7346114867964298,
"learning_rate": 2.325691006157905e-05,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06927518546581268,
"step": 2530,
"valid_targets_mean": 1337.8,
"valid_targets_min": 776
},
{
"epoch": 3.530640668523677,
"grad_norm": 0.7848390780850379,
"learning_rate": 2.3188359553368157e-05,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08660085499286652,
"step": 2535,
"valid_targets_mean": 1525.5,
"valid_targets_min": 623
},
{
"epoch": 3.5376044568245124,
"grad_norm": 0.7918791101050114,
"learning_rate": 2.3119770590102585e-05,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08223545551300049,
"step": 2540,
"valid_targets_mean": 1441.0,
"valid_targets_min": 693
},
{
"epoch": 3.5445682451253484,
"grad_norm": 0.9253216126700171,
"learning_rate": 2.3051143999039198e-05,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042962588369846344,
"step": 2545,
"valid_targets_mean": 847.9,
"valid_targets_min": 611
},
{
"epoch": 3.551532033426184,
"grad_norm": 0.8194995897407035,
"learning_rate": 2.2982480607888693e-05,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07983898371458054,
"step": 2550,
"valid_targets_mean": 1524.9,
"valid_targets_min": 793
},
{
"epoch": 3.5584958217270195,
"grad_norm": 0.7123126085956808,
"learning_rate": 2.291378124480563e-05,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08361306041479111,
"step": 2555,
"valid_targets_mean": 1779.4,
"valid_targets_min": 563
},
{
"epoch": 3.565459610027855,
"grad_norm": 0.7375463773516223,
"learning_rate": 2.284504673837839e-05,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08410098403692245,
"step": 2560,
"valid_targets_mean": 1741.2,
"valid_targets_min": 1341
},
{
"epoch": 3.5724233983286906,
"grad_norm": 0.813717402129795,
"learning_rate": 2.277627791761927e-05,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0976366251707077,
"step": 2565,
"valid_targets_mean": 1875.6,
"valid_targets_min": 1107
},
{
"epoch": 3.5793871866295266,
"grad_norm": 0.7638558548512067,
"learning_rate": 2.270747561195441e-05,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07316169142723083,
"step": 2570,
"valid_targets_mean": 1419.5,
"valid_targets_min": 680
},
{
"epoch": 3.586350974930362,
"grad_norm": 0.7546648374433426,
"learning_rate": 2.2638640651213804e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10009348392486572,
"step": 2575,
"valid_targets_mean": 1968.2,
"valid_targets_min": 981
},
{
"epoch": 3.5933147632311977,
"grad_norm": 0.8517766302015852,
"learning_rate": 2.2569773865621324e-05,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07636626064777374,
"step": 2580,
"valid_targets_mean": 1568.9,
"valid_targets_min": 937
},
{
"epoch": 3.6002785515320337,
"grad_norm": 0.8067654097110404,
"learning_rate": 2.2500876085784665e-05,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08284150809049606,
"step": 2585,
"valid_targets_mean": 1645.2,
"valid_targets_min": 804
},
{
"epoch": 3.6072423398328692,
"grad_norm": 0.7691207000641539,
"learning_rate": 2.2431948142685352e-05,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07658159732818604,
"step": 2590,
"valid_targets_mean": 1574.9,
"valid_targets_min": 1019
},
{
"epoch": 3.614206128133705,
"grad_norm": 0.7783596723806455,
"learning_rate": 2.236299086766873e-05,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06561608612537384,
"step": 2595,
"valid_targets_mean": 1121.6,
"valid_targets_min": 882
},
{
"epoch": 3.6211699164345403,
"grad_norm": 0.7775958409848589,
"learning_rate": 2.2294005092433887e-05,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08176523447036743,
"step": 2600,
"valid_targets_mean": 1818.1,
"valid_targets_min": 1168
},
{
"epoch": 3.628133704735376,
"grad_norm": 0.828811804727648,
"learning_rate": 2.2224991649023675e-05,
"loss": 0.141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07202639430761337,
"step": 2605,
"valid_targets_mean": 1417.8,
"valid_targets_min": 678
},
{
"epoch": 3.635097493036212,
"grad_norm": 0.8282689257518919,
"learning_rate": 2.2155951369814644e-05,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058761902153491974,
"step": 2610,
"valid_targets_mean": 1051.0,
"valid_targets_min": 676
},
{
"epoch": 3.6420612813370474,
"grad_norm": 1.7079878973692406,
"learning_rate": 2.2086885087507027e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06798002123832703,
"step": 2615,
"valid_targets_mean": 1431.1,
"valid_targets_min": 794
},
{
"epoch": 3.649025069637883,
"grad_norm": 0.7717379455457729,
"learning_rate": 2.2017793635114667e-05,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07599664479494095,
"step": 2620,
"valid_targets_mean": 1486.9,
"valid_targets_min": 742
},
{
"epoch": 3.6559888579387185,
"grad_norm": 0.7698310794801155,
"learning_rate": 2.1948677845954985e-05,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08982954919338226,
"step": 2625,
"valid_targets_mean": 1734.5,
"valid_targets_min": 741
},
{
"epoch": 3.662952646239554,
"grad_norm": 0.8944739797043322,
"learning_rate": 2.1879538553638942e-05,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09024101495742798,
"step": 2630,
"valid_targets_mean": 1712.5,
"valid_targets_min": 1157
},
{
"epoch": 3.66991643454039,
"grad_norm": 0.7894287756846752,
"learning_rate": 2.1810376592060968e-05,
"loss": 0.1405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09558722376823425,
"step": 2635,
"valid_targets_mean": 1723.8,
"valid_targets_min": 862
},
{
"epoch": 3.6768802228412256,
"grad_norm": 0.8796292419764679,
"learning_rate": 2.174119279538891e-05,
"loss": 0.1612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09259238839149475,
"step": 2640,
"valid_targets_mean": 1633.1,
"valid_targets_min": 1019
},
{
"epoch": 3.683844011142061,
"grad_norm": 0.7361323056285416,
"learning_rate": 2.1671987998053954e-05,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0679299384355545,
"step": 2645,
"valid_targets_mean": 1376.1,
"valid_targets_min": 1058
},
{
"epoch": 3.690807799442897,
"grad_norm": 0.7916992537280872,
"learning_rate": 2.16027630347406e-05,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08028727769851685,
"step": 2650,
"valid_targets_mean": 1576.5,
"valid_targets_min": 618
},
{
"epoch": 3.6977715877437327,
"grad_norm": 0.8165492508178849,
"learning_rate": 2.1533518740376557e-05,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0871560126543045,
"step": 2655,
"valid_targets_mean": 1615.8,
"valid_targets_min": 629
},
{
"epoch": 3.7047353760445683,
"grad_norm": 0.8981802581015453,
"learning_rate": 2.146425595012269e-05,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08319033682346344,
"step": 2660,
"valid_targets_mean": 1881.2,
"valid_targets_min": 1167
},
{
"epoch": 3.711699164345404,
"grad_norm": 0.7955838043549589,
"learning_rate": 2.1394975499362947e-05,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07869289815425873,
"step": 2665,
"valid_targets_mean": 1367.2,
"valid_targets_min": 699
},
{
"epoch": 3.7186629526462394,
"grad_norm": 0.7732510809048744,
"learning_rate": 2.132567822369428e-05,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058514297008514404,
"step": 2670,
"valid_targets_mean": 1174.9,
"valid_targets_min": 679
},
{
"epoch": 3.7256267409470754,
"grad_norm": 0.7978233555615979,
"learning_rate": 2.1256364958916564e-05,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07325758785009384,
"step": 2675,
"valid_targets_mean": 1556.2,
"valid_targets_min": 504
},
{
"epoch": 3.732590529247911,
"grad_norm": 0.8402148455143513,
"learning_rate": 2.1187036541022533e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08283115178346634,
"step": 2680,
"valid_targets_mean": 1885.0,
"valid_targets_min": 1331
},
{
"epoch": 3.7395543175487465,
"grad_norm": 0.764780642210825,
"learning_rate": 2.1117693806187657e-05,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055060356855392456,
"step": 2685,
"valid_targets_mean": 1306.1,
"valid_targets_min": 661
},
{
"epoch": 3.7465181058495824,
"grad_norm": 0.7707860162726192,
"learning_rate": 2.104833759076011e-05,
"loss": 0.1562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05953007936477661,
"step": 2690,
"valid_targets_mean": 1330.1,
"valid_targets_min": 958
},
{
"epoch": 3.7534818941504176,
"grad_norm": 0.7132388417704622,
"learning_rate": 2.0978968731250648e-05,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057646650820970535,
"step": 2695,
"valid_targets_mean": 1465.0,
"valid_targets_min": 963
},
{
"epoch": 3.7604456824512535,
"grad_norm": 0.7777931157465899,
"learning_rate": 2.0909588064322524e-05,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07116229832172394,
"step": 2700,
"valid_targets_mean": 1428.0,
"valid_targets_min": 793
},
{
"epoch": 3.767409470752089,
"grad_norm": 0.7925330730772479,
"learning_rate": 2.08401964267814e-05,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.091750867664814,
"step": 2705,
"valid_targets_mean": 1633.1,
"valid_targets_min": 917
},
{
"epoch": 3.7743732590529246,
"grad_norm": 0.8377874283930322,
"learning_rate": 2.0770794655565278e-05,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06515245139598846,
"step": 2710,
"valid_targets_mean": 1246.5,
"valid_targets_min": 872
},
{
"epoch": 3.7813370473537606,
"grad_norm": 0.7500409300068362,
"learning_rate": 2.0701383587734334e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07608701288700104,
"step": 2715,
"valid_targets_mean": 1903.6,
"valid_targets_min": 1220
},
{
"epoch": 3.788300835654596,
"grad_norm": 0.8435711995319485,
"learning_rate": 2.0631964060460934e-05,
"loss": 0.1357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06794526427984238,
"step": 2720,
"valid_targets_mean": 1391.6,
"valid_targets_min": 712
},
{
"epoch": 3.7952646239554317,
"grad_norm": 0.8724016823017468,
"learning_rate": 2.0562536911019415e-05,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0759831964969635,
"step": 2725,
"valid_targets_mean": 1295.0,
"valid_targets_min": 605
},
{
"epoch": 3.8022284122562673,
"grad_norm": 0.7990588269247201,
"learning_rate": 2.049310297677609e-05,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05404563248157501,
"step": 2730,
"valid_targets_mean": 1414.8,
"valid_targets_min": 746
},
{
"epoch": 3.809192200557103,
"grad_norm": 0.9100646789026491,
"learning_rate": 2.0423663095179084e-05,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06111488863825798,
"step": 2735,
"valid_targets_mean": 1059.4,
"valid_targets_min": 723
},
{
"epoch": 3.816155988857939,
"grad_norm": 0.7835072806883097,
"learning_rate": 2.0354218103748253e-05,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08211217820644379,
"step": 2740,
"valid_targets_mean": 1634.2,
"valid_targets_min": 1327
},
{
"epoch": 3.8231197771587744,
"grad_norm": 0.8355043521576563,
"learning_rate": 2.028476884006508e-05,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07008926570415497,
"step": 2745,
"valid_targets_mean": 1412.5,
"valid_targets_min": 902
},
{
"epoch": 3.83008356545961,
"grad_norm": 0.8578826264946082,
"learning_rate": 2.02153161417626e-05,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07012935727834702,
"step": 2750,
"valid_targets_mean": 1558.8,
"valid_targets_min": 803
},
{
"epoch": 3.837047353760446,
"grad_norm": 0.8206701722875304,
"learning_rate": 2.0145860846515234e-05,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07594504952430725,
"step": 2755,
"valid_targets_mean": 1441.2,
"valid_targets_min": 1079
},
{
"epoch": 3.8440111420612815,
"grad_norm": 0.7481367084277267,
"learning_rate": 2.0076403792028757e-05,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06753340363502502,
"step": 2760,
"valid_targets_mean": 1449.8,
"valid_targets_min": 1263
},
{
"epoch": 3.850974930362117,
"grad_norm": 0.7968317810485137,
"learning_rate": 2.000694581603016e-05,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07419832050800323,
"step": 2765,
"valid_targets_mean": 1487.4,
"valid_targets_min": 844
},
{
"epoch": 3.8579387186629526,
"grad_norm": 0.8690761427120194,
"learning_rate": 1.993748775625752e-05,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06871486455202103,
"step": 2770,
"valid_targets_mean": 1421.4,
"valid_targets_min": 667
},
{
"epoch": 3.864902506963788,
"grad_norm": 0.8975013022838169,
"learning_rate": 1.986803045044996e-05,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08886584639549255,
"step": 2775,
"valid_targets_mean": 1822.6,
"valid_targets_min": 1041
},
{
"epoch": 3.871866295264624,
"grad_norm": 0.7977117949143756,
"learning_rate": 1.9798574736337487e-05,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06609257310628891,
"step": 2780,
"valid_targets_mean": 1327.4,
"valid_targets_min": 777
},
{
"epoch": 3.8788300835654597,
"grad_norm": 0.7438548739680065,
"learning_rate": 1.972912145163093e-05,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07537013292312622,
"step": 2785,
"valid_targets_mean": 1823.8,
"valid_targets_min": 1283
},
{
"epoch": 3.885793871866295,
"grad_norm": 0.928372055697338,
"learning_rate": 1.965967143401178e-05,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05227617174386978,
"step": 2790,
"valid_targets_mean": 924.0,
"valid_targets_min": 620
},
{
"epoch": 3.8927576601671308,
"grad_norm": 0.8016846902818193,
"learning_rate": 1.9590225521122167e-05,
"loss": 0.1455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06370696425437927,
"step": 2795,
"valid_targets_mean": 1480.2,
"valid_targets_min": 656
},
{
"epoch": 3.8997214484679663,
"grad_norm": 0.8062692815757603,
"learning_rate": 1.9520784550554683e-05,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059848278760910034,
"step": 2800,
"valid_targets_mean": 1415.5,
"valid_targets_min": 697
},
{
"epoch": 3.9066852367688023,
"grad_norm": 0.8353157154283097,
"learning_rate": 1.9451349359842332e-05,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07082884013652802,
"step": 2805,
"valid_targets_mean": 1655.8,
"valid_targets_min": 816
},
{
"epoch": 3.913649025069638,
"grad_norm": 0.7597621427921378,
"learning_rate": 1.938192078644839e-05,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06765986979007721,
"step": 2810,
"valid_targets_mean": 1553.0,
"valid_targets_min": 850
},
{
"epoch": 3.9206128133704734,
"grad_norm": 0.7816154228464142,
"learning_rate": 1.931249966775633e-05,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06977061927318573,
"step": 2815,
"valid_targets_mean": 1353.9,
"valid_targets_min": 747
},
{
"epoch": 3.9275766016713094,
"grad_norm": 0.8523628518802676,
"learning_rate": 1.92430868410597e-05,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0653572827577591,
"step": 2820,
"valid_targets_mean": 1420.9,
"valid_targets_min": 933
},
{
"epoch": 3.934540389972145,
"grad_norm": 0.801382105679613,
"learning_rate": 1.9173683143552057e-05,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07180759310722351,
"step": 2825,
"valid_targets_mean": 1394.9,
"valid_targets_min": 827
},
{
"epoch": 3.9415041782729805,
"grad_norm": 0.7523245478800936,
"learning_rate": 1.910428941231684e-05,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06203988194465637,
"step": 2830,
"valid_targets_mean": 1383.2,
"valid_targets_min": 909
},
{
"epoch": 3.948467966573816,
"grad_norm": 0.7403715943582305,
"learning_rate": 1.903490648431728e-05,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08447936922311783,
"step": 2835,
"valid_targets_mean": 1682.4,
"valid_targets_min": 1094
},
{
"epoch": 3.9554317548746516,
"grad_norm": 0.8253011305912571,
"learning_rate": 1.8965535196386326e-05,
"loss": 0.1358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06693306565284729,
"step": 2840,
"valid_targets_mean": 1118.4,
"valid_targets_min": 720
},
{
"epoch": 3.9623955431754876,
"grad_norm": 0.7530842490472827,
"learning_rate": 1.889617638521651e-05,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07407623529434204,
"step": 2845,
"valid_targets_mean": 1538.2,
"valid_targets_min": 610
},
{
"epoch": 3.969359331476323,
"grad_norm": 0.7546263356082901,
"learning_rate": 1.8826830887349902e-05,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07467672973871231,
"step": 2850,
"valid_targets_mean": 1570.1,
"valid_targets_min": 713
},
{
"epoch": 3.9763231197771587,
"grad_norm": 0.833106804892126,
"learning_rate": 1.8757499539167986e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07438725978136063,
"step": 2855,
"valid_targets_mean": 1537.8,
"valid_targets_min": 874
},
{
"epoch": 3.9832869080779947,
"grad_norm": 0.7504076181098892,
"learning_rate": 1.8688183176881596e-05,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07164924591779709,
"step": 2860,
"valid_targets_mean": 1471.2,
"valid_targets_min": 765
},
{
"epoch": 3.9902506963788302,
"grad_norm": 0.7785848799373203,
"learning_rate": 1.861888263652081e-05,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06348396092653275,
"step": 2865,
"valid_targets_mean": 1254.4,
"valid_targets_min": 816
},
{
"epoch": 3.997214484679666,
"grad_norm": 0.78598015466159,
"learning_rate": 1.8549598753924894e-05,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0708591490983963,
"step": 2870,
"valid_targets_mean": 1482.9,
"valid_targets_min": 1182
},
{
"epoch": 4.004178272980502,
"grad_norm": 0.7745411560000336,
"learning_rate": 1.8480332364732178e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09853234887123108,
"step": 2875,
"valid_targets_mean": 5435.1,
"valid_targets_min": 3516
},
{
"epoch": 4.011142061281337,
"grad_norm": 0.45693392884456113,
"learning_rate": 1.8411084304370014e-05,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09516393393278122,
"step": 2880,
"valid_targets_mean": 7654.2,
"valid_targets_min": 6354
},
{
"epoch": 4.018105849582173,
"grad_norm": 0.4319211248040884,
"learning_rate": 1.8341855408044697e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10908873379230499,
"step": 2885,
"valid_targets_mean": 7341.6,
"valid_targets_min": 5754
},
{
"epoch": 4.025069637883008,
"grad_norm": 0.35087638698700635,
"learning_rate": 1.8272646510731375e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08147092163562775,
"step": 2890,
"valid_targets_mean": 7666.2,
"valid_targets_min": 5666
},
{
"epoch": 4.032033426183844,
"grad_norm": 0.4079352838694494,
"learning_rate": 1.820345844716399e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09540951251983643,
"step": 2895,
"valid_targets_mean": 7469.0,
"valid_targets_min": 5646
},
{
"epoch": 4.03899721448468,
"grad_norm": 0.453891412990921,
"learning_rate": 1.81342920518252e-05,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1076955646276474,
"step": 2900,
"valid_targets_mean": 7046.9,
"valid_targets_min": 5571
},
{
"epoch": 4.045961002785515,
"grad_norm": 0.44912248872165283,
"learning_rate": 1.8065148158936323e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10332390666007996,
"step": 2905,
"valid_targets_mean": 7827.6,
"valid_targets_min": 5405
},
{
"epoch": 4.052924791086351,
"grad_norm": 0.3855281872703947,
"learning_rate": 1.799602760244728e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09584302455186844,
"step": 2910,
"valid_targets_mean": 7023.5,
"valid_targets_min": 5664
},
{
"epoch": 4.059888579387187,
"grad_norm": 0.39674294021757817,
"learning_rate": 1.7926931216026518e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08769885450601578,
"step": 2915,
"valid_targets_mean": 7069.8,
"valid_targets_min": 5103
},
{
"epoch": 4.066852367688022,
"grad_norm": 0.4247588326582294,
"learning_rate": 1.7857859833050983e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08552022278308868,
"step": 2920,
"valid_targets_mean": 6712.4,
"valid_targets_min": 5469
},
{
"epoch": 4.073816155988858,
"grad_norm": 0.4334738323877378,
"learning_rate": 1.7788814286596044e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0862928107380867,
"step": 2925,
"valid_targets_mean": 7289.2,
"valid_targets_min": 5513
},
{
"epoch": 4.080779944289693,
"grad_norm": 0.5671431858648565,
"learning_rate": 1.7719795409425443e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08433561772108078,
"step": 2930,
"valid_targets_mean": 7022.1,
"valid_targets_min": 5691
},
{
"epoch": 4.087743732590529,
"grad_norm": 0.5417102538090298,
"learning_rate": 1.765080403398127e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0926387831568718,
"step": 2935,
"valid_targets_mean": 6736.0,
"valid_targets_min": 5550
},
{
"epoch": 4.094707520891365,
"grad_norm": 0.3961734843289232,
"learning_rate": 1.758184099237393e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08144709467887878,
"step": 2940,
"valid_targets_mean": 6346.9,
"valid_targets_min": 5067
},
{
"epoch": 4.1016713091922,
"grad_norm": 0.3937587901125671,
"learning_rate": 1.7512907116372066e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08808314055204391,
"step": 2945,
"valid_targets_mean": 6784.0,
"valid_targets_min": 5618
},
{
"epoch": 4.108635097493036,
"grad_norm": 0.43597320037991466,
"learning_rate": 1.7444003237392567e-05,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10079539567232132,
"step": 2950,
"valid_targets_mean": 7568.4,
"valid_targets_min": 5856
},
{
"epoch": 4.1155988857938715,
"grad_norm": 0.3994536656356681,
"learning_rate": 1.737513018649053e-05,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08414926379919052,
"step": 2955,
"valid_targets_mean": 7198.5,
"valid_targets_min": 4793
},
{
"epoch": 4.1225626740947074,
"grad_norm": 0.4184797204828292,
"learning_rate": 1.7306288794349213e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08882571756839752,
"step": 2960,
"valid_targets_mean": 6680.5,
"valid_targets_min": 5350
},
{
"epoch": 4.129526462395543,
"grad_norm": 0.4148372539820588,
"learning_rate": 1.7237479891270054e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0935942679643631,
"step": 2965,
"valid_targets_mean": 6770.6,
"valid_targets_min": 5753
},
{
"epoch": 4.1364902506963785,
"grad_norm": 0.7626972756641216,
"learning_rate": 1.7168704307162625e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06254291534423828,
"step": 2970,
"valid_targets_mean": 1419.8,
"valid_targets_min": 289
},
{
"epoch": 4.1434540389972145,
"grad_norm": 0.4371572099046906,
"learning_rate": 1.7099962871534644e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09101256728172302,
"step": 2975,
"valid_targets_mean": 6784.2,
"valid_targets_min": 5042
},
{
"epoch": 4.1504178272980505,
"grad_norm": 0.4078695342570583,
"learning_rate": 1.703125641348197e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08425340801477432,
"step": 2980,
"valid_targets_mean": 6774.9,
"valid_targets_min": 3875
},
{
"epoch": 4.157381615598886,
"grad_norm": 0.43908909204234714,
"learning_rate": 1.696258576167856e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09084954857826233,
"step": 2985,
"valid_targets_mean": 7047.6,
"valid_targets_min": 6134
},
{
"epoch": 4.164345403899722,
"grad_norm": 0.3923313188578705,
"learning_rate": 1.6893951744366547e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09309709817171097,
"step": 2990,
"valid_targets_mean": 6886.6,
"valid_targets_min": 5869
},
{
"epoch": 4.171309192200557,
"grad_norm": 0.377006462886014,
"learning_rate": 1.6825355189346192e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08231081813573837,
"step": 2995,
"valid_targets_mean": 7559.8,
"valid_targets_min": 6145
},
{
"epoch": 4.178272980501393,
"grad_norm": 0.3411126289914851,
"learning_rate": 1.675679692396593e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07891160249710083,
"step": 3000,
"valid_targets_mean": 8920.5,
"valid_targets_min": 4780
},
{
"epoch": 4.185236768802229,
"grad_norm": 0.3592395577774327,
"learning_rate": 1.6688277775112377e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06996404379606247,
"step": 3005,
"valid_targets_mean": 7393.4,
"valid_targets_min": 5116
},
{
"epoch": 4.192200557103064,
"grad_norm": 0.34174396201498236,
"learning_rate": 1.6619798569200368e-05,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07682168483734131,
"step": 3010,
"valid_targets_mean": 8477.5,
"valid_targets_min": 4033
},
{
"epoch": 4.1991643454039,
"grad_norm": 0.40130345703058956,
"learning_rate": 1.6551360132162967e-05,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08580783009529114,
"step": 3015,
"valid_targets_mean": 6736.6,
"valid_targets_min": 4646
},
{
"epoch": 4.206128133704736,
"grad_norm": 0.43606325450974787,
"learning_rate": 1.6482963289441533e-05,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09041762351989746,
"step": 3020,
"valid_targets_mean": 7551.5,
"valid_targets_min": 5461
},
{
"epoch": 4.213091922005571,
"grad_norm": 0.45829099636483556,
"learning_rate": 1.6414608865975757e-05,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10397613048553467,
"step": 3025,
"valid_targets_mean": 7091.0,
"valid_targets_min": 4879
},
{
"epoch": 4.220055710306407,
"grad_norm": 0.42080713802214453,
"learning_rate": 1.6346297686193698e-05,
"loss": 0.1869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08283068239688873,
"step": 3030,
"valid_targets_mean": 6269.8,
"valid_targets_min": 4606
},
{
"epoch": 4.227019498607242,
"grad_norm": 0.4001310643885332,
"learning_rate": 1.6278030574001863e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08124437183141708,
"step": 3035,
"valid_targets_mean": 6818.4,
"valid_targets_min": 5525
},
{
"epoch": 4.233983286908078,
"grad_norm": 0.3928643150423594,
"learning_rate": 1.6209808352775227e-05,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08757513761520386,
"step": 3040,
"valid_targets_mean": 7365.4,
"valid_targets_min": 5000
},
{
"epoch": 4.240947075208914,
"grad_norm": 0.42455615486180276,
"learning_rate": 1.6141631845347368e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07783573120832443,
"step": 3045,
"valid_targets_mean": 6212.1,
"valid_targets_min": 3988
},
{
"epoch": 4.247910863509749,
"grad_norm": 0.42241913812780074,
"learning_rate": 1.607350187400049e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08539704978466034,
"step": 3050,
"valid_targets_mean": 8396.9,
"valid_targets_min": 6131
},
{
"epoch": 4.254874651810585,
"grad_norm": 0.4237454815884405,
"learning_rate": 1.6005419260455512e-05,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0880412757396698,
"step": 3055,
"valid_targets_mean": 7651.0,
"valid_targets_min": 4061
},
{
"epoch": 4.26183844011142,
"grad_norm": 0.37280072499256484,
"learning_rate": 1.593738482586219e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0859137699007988,
"step": 3060,
"valid_targets_mean": 7090.1,
"valid_targets_min": 5203
},
{
"epoch": 4.268802228412256,
"grad_norm": 0.41477357509750673,
"learning_rate": 1.5869399390789172e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08433390408754349,
"step": 3065,
"valid_targets_mean": 7001.0,
"valid_targets_min": 5362
},
{
"epoch": 4.275766016713092,
"grad_norm": 0.40793877263257894,
"learning_rate": 1.5801463775214118e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08703209459781647,
"step": 3070,
"valid_targets_mean": 6359.2,
"valid_targets_min": 5236
},
{
"epoch": 4.282729805013927,
"grad_norm": 0.44350806675129867,
"learning_rate": 1.573357879851381e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09586170315742493,
"step": 3075,
"valid_targets_mean": 5939.8,
"valid_targets_min": 4693
},
{
"epoch": 4.289693593314763,
"grad_norm": 1.146676173490332,
"learning_rate": 1.5665745279454294e-05,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030542651191353798,
"step": 3080,
"valid_targets_mean": 208.6,
"valid_targets_min": 134
},
{
"epoch": 4.296657381615599,
"grad_norm": 0.48379943817559756,
"learning_rate": 1.5597964036180955e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09201765060424805,
"step": 3085,
"valid_targets_mean": 6008.5,
"valid_targets_min": 4956
},
{
"epoch": 4.303621169916434,
"grad_norm": 0.4202491008226685,
"learning_rate": 1.553023588620869e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07570789754390717,
"step": 3090,
"valid_targets_mean": 6042.0,
"valid_targets_min": 4817
},
{
"epoch": 4.31058495821727,
"grad_norm": 0.42477738905964485,
"learning_rate": 1.5462561646412028e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08630920946598053,
"step": 3095,
"valid_targets_mean": 6608.6,
"valid_targets_min": 5102
},
{
"epoch": 4.3175487465181055,
"grad_norm": 0.42688040529738014,
"learning_rate": 1.5394942133015278e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08623873442411423,
"step": 3100,
"valid_targets_mean": 6670.1,
"valid_targets_min": 4869
},
{
"epoch": 4.3245125348189415,
"grad_norm": 0.42003992455965294,
"learning_rate": 1.5327378161582697e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07713023573160172,
"step": 3105,
"valid_targets_mean": 6088.4,
"valid_targets_min": 4946
},
{
"epoch": 4.3314763231197775,
"grad_norm": 0.4216278012962236,
"learning_rate": 1.5259870547008647e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08279541879892349,
"step": 3110,
"valid_targets_mean": 6228.4,
"valid_targets_min": 4856
},
{
"epoch": 4.338440111420613,
"grad_norm": 0.44787796967160803,
"learning_rate": 1.5192420103507765e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08231884241104126,
"step": 3115,
"valid_targets_mean": 5376.6,
"valid_targets_min": 4145
},
{
"epoch": 4.345403899721449,
"grad_norm": 0.4676976765001585,
"learning_rate": 1.5125027644605143e-05,
"loss": 0.1369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08625025302171707,
"step": 3120,
"valid_targets_mean": 6309.2,
"valid_targets_min": 5305
},
{
"epoch": 4.352367688022284,
"grad_norm": 0.4889513820698066,
"learning_rate": 1.50576939831265e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08322583138942719,
"step": 3125,
"valid_targets_mean": 6221.5,
"valid_targets_min": 4636
},
{
"epoch": 4.35933147632312,
"grad_norm": 0.4369115623225211,
"learning_rate": 1.4990419931188425e-05,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09070675075054169,
"step": 3130,
"valid_targets_mean": 6831.5,
"valid_targets_min": 5668
},
{
"epoch": 4.366295264623956,
"grad_norm": 0.42542268683362244,
"learning_rate": 1.4923206300188522e-05,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09038935601711273,
"step": 3135,
"valid_targets_mean": 6437.1,
"valid_targets_min": 5004
},
{
"epoch": 4.373259052924791,
"grad_norm": 0.5378332721568458,
"learning_rate": 1.4856053900795682e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08066794276237488,
"step": 3140,
"valid_targets_mean": 6205.8,
"valid_targets_min": 5341
},
{
"epoch": 4.380222841225627,
"grad_norm": 0.4295836677794995,
"learning_rate": 1.4788963542940251e-05,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09073355048894882,
"step": 3145,
"valid_targets_mean": 6748.0,
"valid_targets_min": 5363
},
{
"epoch": 4.387186629526463,
"grad_norm": 0.4850027247112984,
"learning_rate": 1.4721936035804307e-05,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07909142971038818,
"step": 3150,
"valid_targets_mean": 5210.5,
"valid_targets_min": 791
},
{
"epoch": 4.394150417827298,
"grad_norm": 0.7383337146665891,
"learning_rate": 1.4654972187811858e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06561724841594696,
"step": 3155,
"valid_targets_mean": 1279.5,
"valid_targets_min": 746
},
{
"epoch": 4.401114206128134,
"grad_norm": 0.8310596897559344,
"learning_rate": 1.4588072806619135e-05,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08013515174388885,
"step": 3160,
"valid_targets_mean": 1635.8,
"valid_targets_min": 661
},
{
"epoch": 4.408077994428969,
"grad_norm": 0.8516771248517533,
"learning_rate": 1.4521238699104828e-05,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07185165584087372,
"step": 3165,
"valid_targets_mean": 1420.2,
"valid_targets_min": 826
},
{
"epoch": 4.415041782729805,
"grad_norm": 0.825781158854519,
"learning_rate": 1.4454470671360337e-05,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06541028618812561,
"step": 3170,
"valid_targets_mean": 1399.9,
"valid_targets_min": 742
},
{
"epoch": 4.422005571030641,
"grad_norm": 0.8548496982709529,
"learning_rate": 1.4387769528680098e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060420047491788864,
"step": 3175,
"valid_targets_mean": 1309.9,
"valid_targets_min": 718
},
{
"epoch": 4.428969359331476,
"grad_norm": 0.8030341275951788,
"learning_rate": 1.4321136075551816e-05,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08500155806541443,
"step": 3180,
"valid_targets_mean": 1729.4,
"valid_targets_min": 764
},
{
"epoch": 4.435933147632312,
"grad_norm": 0.7574670919758995,
"learning_rate": 1.4254571115646795e-05,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06925354897975922,
"step": 3185,
"valid_targets_mean": 1651.4,
"valid_targets_min": 814
},
{
"epoch": 4.442896935933147,
"grad_norm": 0.8399886623759784,
"learning_rate": 1.4188075451810238e-05,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05408865213394165,
"step": 3190,
"valid_targets_mean": 1192.0,
"valid_targets_min": 610
},
{
"epoch": 4.449860724233983,
"grad_norm": 0.8256278183381764,
"learning_rate": 1.4121649886051567e-05,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07870268821716309,
"step": 3195,
"valid_targets_mean": 1879.0,
"valid_targets_min": 817
},
{
"epoch": 4.456824512534819,
"grad_norm": 0.7713275384072368,
"learning_rate": 1.4055295219534735e-05,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06405435502529144,
"step": 3200,
"valid_targets_mean": 1500.4,
"valid_targets_min": 837
},
{
"epoch": 4.463788300835654,
"grad_norm": 0.9706438394826296,
"learning_rate": 1.3989012252568596e-05,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09357143938541412,
"step": 3205,
"valid_targets_mean": 1661.8,
"valid_targets_min": 593
},
{
"epoch": 4.47075208913649,
"grad_norm": 0.7845778542370729,
"learning_rate": 1.3922801784597191e-05,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06827139109373093,
"step": 3210,
"valid_targets_mean": 1537.8,
"valid_targets_min": 704
},
{
"epoch": 4.477715877437326,
"grad_norm": 0.7759659105769868,
"learning_rate": 1.3856664614190186e-05,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0502796433866024,
"step": 3215,
"valid_targets_mean": 1227.0,
"valid_targets_min": 722
},
{
"epoch": 4.484679665738161,
"grad_norm": 0.8287147960258013,
"learning_rate": 1.3790601539033168e-05,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06461460888385773,
"step": 3220,
"valid_targets_mean": 1364.5,
"valid_targets_min": 642
},
{
"epoch": 4.491643454038997,
"grad_norm": 0.8589525229582935,
"learning_rate": 1.3724613355918077e-05,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06513009965419769,
"step": 3225,
"valid_targets_mean": 1358.5,
"valid_targets_min": 518
},
{
"epoch": 4.498607242339833,
"grad_norm": 0.8202013278047937,
"learning_rate": 1.3658700860733566e-05,
"loss": 0.1419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07893405854701996,
"step": 3230,
"valid_targets_mean": 1590.6,
"valid_targets_min": 728
},
{
"epoch": 4.505571030640668,
"grad_norm": 0.7966714906034105,
"learning_rate": 1.3592864848455415e-05,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0855114758014679,
"step": 3235,
"valid_targets_mean": 1791.4,
"valid_targets_min": 820
},
{
"epoch": 4.512534818941504,
"grad_norm": 0.8234446947551594,
"learning_rate": 1.3527106113136915e-05,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07350599765777588,
"step": 3240,
"valid_targets_mean": 1470.8,
"valid_targets_min": 818
},
{
"epoch": 4.5194986072423395,
"grad_norm": 0.909954505776544,
"learning_rate": 1.3461425447899345e-05,
"loss": 0.1328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05728901922702789,
"step": 3245,
"valid_targets_mean": 1278.6,
"valid_targets_min": 625
},
{
"epoch": 4.5264623955431755,
"grad_norm": 0.7815284768559326,
"learning_rate": 1.3395823644922357e-05,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08874043077230453,
"step": 3250,
"valid_targets_mean": 2313.5,
"valid_targets_min": 790
},
{
"epoch": 4.5334261838440115,
"grad_norm": 0.8603759963719848,
"learning_rate": 1.3330301495434439e-05,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09591110795736313,
"step": 3255,
"valid_targets_mean": 2231.9,
"valid_targets_min": 1335
},
{
"epoch": 4.540389972144847,
"grad_norm": 0.758467847298457,
"learning_rate": 1.3264859789703391e-05,
"loss": 0.1334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07577726244926453,
"step": 3260,
"valid_targets_mean": 1729.5,
"valid_targets_min": 719
},
{
"epoch": 4.547353760445683,
"grad_norm": 0.8154388753592663,
"learning_rate": 1.3199499317026741e-05,
"loss": 0.1302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052854329347610474,
"step": 3265,
"valid_targets_mean": 1222.9,
"valid_targets_min": 697
},
{
"epoch": 4.554317548746518,
"grad_norm": 0.8552854445354738,
"learning_rate": 1.3134220865722282e-05,
"loss": 0.1289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07314737141132355,
"step": 3270,
"valid_targets_mean": 1521.1,
"valid_targets_min": 998
},
{
"epoch": 4.561281337047354,
"grad_norm": 0.7820786112177985,
"learning_rate": 1.3069025223118539e-05,
"loss": 0.133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06754308938980103,
"step": 3275,
"valid_targets_mean": 1693.9,
"valid_targets_min": 629
},
{
"epoch": 4.56824512534819,
"grad_norm": 0.8755511497986203,
"learning_rate": 1.3003913175545271e-05,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07453906536102295,
"step": 3280,
"valid_targets_mean": 1630.2,
"valid_targets_min": 1078
},
{
"epoch": 4.575208913649025,
"grad_norm": 0.7758564032420037,
"learning_rate": 1.2938885508323989e-05,
"loss": 0.1376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06837262213230133,
"step": 3285,
"valid_targets_mean": 1843.0,
"valid_targets_min": 1075
},
{
"epoch": 4.582172701949861,
"grad_norm": 0.7809622207382767,
"learning_rate": 1.28739430057585e-05,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07848972082138062,
"step": 3290,
"valid_targets_mean": 1848.2,
"valid_targets_min": 1317
},
{
"epoch": 4.589136490250697,
"grad_norm": 0.7816839323875953,
"learning_rate": 1.2809086451125402e-05,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07772564888000488,
"step": 3295,
"valid_targets_mean": 1727.4,
"valid_targets_min": 957
},
{
"epoch": 4.596100278551532,
"grad_norm": 0.9203545388755756,
"learning_rate": 1.2744316626664702e-05,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060780055820941925,
"step": 3300,
"valid_targets_mean": 1115.4,
"valid_targets_min": 643
},
{
"epoch": 4.603064066852368,
"grad_norm": 0.896065872644034,
"learning_rate": 1.2679634313570324e-05,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07272806763648987,
"step": 3305,
"valid_targets_mean": 1547.2,
"valid_targets_min": 1111
},
{
"epoch": 4.610027855153203,
"grad_norm": 0.7733642462901773,
"learning_rate": 1.2615040291980729e-05,
"loss": 0.1273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061603400856256485,
"step": 3310,
"valid_targets_mean": 1450.0,
"valid_targets_min": 705
},
{
"epoch": 4.616991643454039,
"grad_norm": 0.8143367409475855,
"learning_rate": 1.2550535340969483e-05,
"loss": 0.1305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07132863998413086,
"step": 3315,
"valid_targets_mean": 1539.0,
"valid_targets_min": 1288
},
{
"epoch": 4.623955431754875,
"grad_norm": 0.8553022073322677,
"learning_rate": 1.2486120238535845e-05,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06410254538059235,
"step": 3320,
"valid_targets_mean": 1321.2,
"valid_targets_min": 753
},
{
"epoch": 4.63091922005571,
"grad_norm": 0.8567062695633868,
"learning_rate": 1.2421795761595424e-05,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0614665150642395,
"step": 3325,
"valid_targets_mean": 1480.0,
"valid_targets_min": 817
},
{
"epoch": 4.637883008356546,
"grad_norm": 0.8755257408477221,
"learning_rate": 1.2357562685970787e-05,
"loss": 0.1262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05426248908042908,
"step": 3330,
"valid_targets_mean": 1293.9,
"valid_targets_min": 974
},
{
"epoch": 4.644846796657381,
"grad_norm": 0.9722123694394161,
"learning_rate": 1.2293421786382094e-05,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07091125100851059,
"step": 3335,
"valid_targets_mean": 1529.2,
"valid_targets_min": 657
},
{
"epoch": 4.651810584958217,
"grad_norm": 0.9541829768814589,
"learning_rate": 1.2229373836437764e-05,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07790433615446091,
"step": 3340,
"valid_targets_mean": 1678.0,
"valid_targets_min": 880
},
{
"epoch": 4.658774373259053,
"grad_norm": 0.8576485652747621,
"learning_rate": 1.2165419608625157e-05,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07814347743988037,
"step": 3345,
"valid_targets_mean": 1609.4,
"valid_targets_min": 1050
},
{
"epoch": 4.665738161559888,
"grad_norm": 0.8917597302101115,
"learning_rate": 1.2101559874301217e-05,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05816866457462311,
"step": 3350,
"valid_targets_mean": 1449.0,
"valid_targets_min": 682
},
{
"epoch": 4.672701949860724,
"grad_norm": 0.832501950400249,
"learning_rate": 1.2037795403683212e-05,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06002386286854744,
"step": 3355,
"valid_targets_mean": 1344.0,
"valid_targets_min": 703
},
{
"epoch": 4.67966573816156,
"grad_norm": 0.8308585092709525,
"learning_rate": 1.1974126965839434e-05,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06484422087669373,
"step": 3360,
"valid_targets_mean": 1469.4,
"valid_targets_min": 934
},
{
"epoch": 4.686629526462395,
"grad_norm": 0.8444644777001103,
"learning_rate": 1.1910555328679896e-05,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1002117171883583,
"step": 3365,
"valid_targets_mean": 1829.1,
"valid_targets_min": 734
},
{
"epoch": 4.693593314763231,
"grad_norm": 0.7838276598240631,
"learning_rate": 1.18470812589471e-05,
"loss": 0.1276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08434125781059265,
"step": 3370,
"valid_targets_mean": 2010.8,
"valid_targets_min": 1437
},
{
"epoch": 4.7005571030640665,
"grad_norm": 0.8121696038208687,
"learning_rate": 1.1783705522206794e-05,
"loss": 0.1248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05047055333852768,
"step": 3375,
"valid_targets_mean": 1405.2,
"valid_targets_min": 551
},
{
"epoch": 4.7075208913649025,
"grad_norm": 0.9702607731512856,
"learning_rate": 1.1720428882838694e-05,
"loss": 0.1335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08291260153055191,
"step": 3380,
"valid_targets_mean": 1817.6,
"valid_targets_min": 931
},
{
"epoch": 4.7144846796657385,
"grad_norm": 0.820699694440321,
"learning_rate": 1.1657252104027314e-05,
"loss": 0.1277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06308387219905853,
"step": 3385,
"valid_targets_mean": 1599.1,
"valid_targets_min": 904
},
{
"epoch": 4.721448467966574,
"grad_norm": 0.829670605394756,
"learning_rate": 1.1594175947752749e-05,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07266199588775635,
"step": 3390,
"valid_targets_mean": 1774.8,
"valid_targets_min": 1158
},
{
"epoch": 4.72841225626741,
"grad_norm": 0.8896710009000609,
"learning_rate": 1.1531201174781459e-05,
"loss": 0.1211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05510660260915756,
"step": 3395,
"valid_targets_mean": 1229.2,
"valid_targets_min": 756
},
{
"epoch": 4.735376044568245,
"grad_norm": 1.1555963653569135,
"learning_rate": 1.1468328544657132e-05,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08370531350374222,
"step": 3400,
"valid_targets_mean": 1536.9,
"valid_targets_min": 854
},
{
"epoch": 4.742339832869081,
"grad_norm": 0.8354454053066505,
"learning_rate": 1.1405558815691466e-05,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07298648357391357,
"step": 3405,
"valid_targets_mean": 1739.5,
"valid_targets_min": 1462
},
{
"epoch": 4.749303621169917,
"grad_norm": 0.8260820753810716,
"learning_rate": 1.1342892744955112e-05,
"loss": 0.1282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05890219286084175,
"step": 3410,
"valid_targets_mean": 1475.9,
"valid_targets_min": 944
},
{
"epoch": 4.756267409470752,
"grad_norm": 0.8016656660345047,
"learning_rate": 1.1280331088268452e-05,
"loss": 0.1269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060654304921627045,
"step": 3415,
"valid_targets_mean": 1482.6,
"valid_targets_min": 1227
},
{
"epoch": 4.763231197771588,
"grad_norm": 0.7864044513954926,
"learning_rate": 1.1217874600192542e-05,
"loss": 0.1309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051892273128032684,
"step": 3420,
"valid_targets_mean": 1276.5,
"valid_targets_min": 740
},
{
"epoch": 4.770194986072424,
"grad_norm": 0.774017966732346,
"learning_rate": 1.1155524034019981e-05,
"loss": 0.131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07892292737960815,
"step": 3425,
"valid_targets_mean": 2024.8,
"valid_targets_min": 881
},
{
"epoch": 4.777158774373259,
"grad_norm": 0.8962743138721668,
"learning_rate": 1.1093280141765837e-05,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06519632786512375,
"step": 3430,
"valid_targets_mean": 1288.6,
"valid_targets_min": 636
},
{
"epoch": 4.784122562674095,
"grad_norm": 0.8008310946938783,
"learning_rate": 1.103114367415858e-05,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04663780331611633,
"step": 3435,
"valid_targets_mean": 1103.9,
"valid_targets_min": 814
},
{
"epoch": 4.791086350974931,
"grad_norm": 0.857674350118069,
"learning_rate": 1.0969115380631015e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061598315834999084,
"step": 3440,
"valid_targets_mean": 1392.9,
"valid_targets_min": 820
},
{
"epoch": 4.798050139275766,
"grad_norm": 0.8096519542290342,
"learning_rate": 1.090719600931126e-05,
"loss": 0.129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057360272854566574,
"step": 3445,
"valid_targets_mean": 1392.4,
"valid_targets_min": 661
},
{
"epoch": 4.805013927576602,
"grad_norm": 0.8515212322986098,
"learning_rate": 1.0845386307013703e-05,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06106788292527199,
"step": 3450,
"valid_targets_mean": 1441.8,
"valid_targets_min": 728
},
{
"epoch": 4.811977715877437,
"grad_norm": 0.8509639251731652,
"learning_rate": 1.078368701923003e-05,
"loss": 0.1248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060364048928022385,
"step": 3455,
"valid_targets_mean": 1413.5,
"valid_targets_min": 692
},
{
"epoch": 4.818941504178273,
"grad_norm": 0.8405241655525482,
"learning_rate": 1.0722098890120176e-05,
"loss": 0.1271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06148139387369156,
"step": 3460,
"valid_targets_mean": 1323.5,
"valid_targets_min": 840
},
{
"epoch": 4.825905292479108,
"grad_norm": 0.9119451778532717,
"learning_rate": 1.0660622662503389e-05,
"loss": 0.1347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06766475737094879,
"step": 3465,
"valid_targets_mean": 1488.4,
"valid_targets_min": 950
},
{
"epoch": 4.832869080779944,
"grad_norm": 0.7915913493434501,
"learning_rate": 1.0599259077849294e-05,
"loss": 0.1269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07292820513248444,
"step": 3470,
"valid_targets_mean": 1935.9,
"valid_targets_min": 878
},
{
"epoch": 4.83983286908078,
"grad_norm": 0.8489205471637494,
"learning_rate": 1.0538008876268887e-05,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06822683662176132,
"step": 3475,
"valid_targets_mean": 1502.1,
"valid_targets_min": 836
},
{
"epoch": 4.846796657381615,
"grad_norm": 0.8786148894939648,
"learning_rate": 1.0476872796505658e-05,
"loss": 0.1264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07060012221336365,
"step": 3480,
"valid_targets_mean": 1535.1,
"valid_targets_min": 1013
},
{
"epoch": 4.853760445682451,
"grad_norm": 0.8959033919138696,
"learning_rate": 1.0415851575926656e-05,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05586308240890503,
"step": 3485,
"valid_targets_mean": 1346.4,
"valid_targets_min": 748
},
{
"epoch": 4.860724233983287,
"grad_norm": 0.9017231573931604,
"learning_rate": 1.035494595051361e-05,
"loss": 0.1294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06896314024925232,
"step": 3490,
"valid_targets_mean": 1543.9,
"valid_targets_min": 729
},
{
"epoch": 4.867688022284122,
"grad_norm": 0.8540161387269878,
"learning_rate": 1.0294156654854053e-05,
"loss": 0.1372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058618832379579544,
"step": 3495,
"valid_targets_mean": 1541.9,
"valid_targets_min": 1219
},
{
"epoch": 4.874651810584958,
"grad_norm": 0.8673351138138804,
"learning_rate": 1.023348442213244e-05,
"loss": 0.1298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06518058478832245,
"step": 3500,
"valid_targets_mean": 1632.8,
"valid_targets_min": 916
},
{
"epoch": 4.881615598885794,
"grad_norm": 0.8662755506535637,
"learning_rate": 1.0172929984121333e-05,
"loss": 0.1292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0599341094493866,
"step": 3505,
"valid_targets_mean": 1349.9,
"valid_targets_min": 646
},
{
"epoch": 4.888579387186629,
"grad_norm": 0.8789665027258394,
"learning_rate": 1.0112494071172549e-05,
"loss": 0.1254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06385256350040436,
"step": 3510,
"valid_targets_mean": 1383.0,
"valid_targets_min": 906
},
{
"epoch": 4.895543175487465,
"grad_norm": 0.8475866768723133,
"learning_rate": 1.0052177412208401e-05,
"loss": 0.1225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059585411101579666,
"step": 3515,
"valid_targets_mean": 1577.5,
"valid_targets_min": 848
},
{
"epoch": 4.9025069637883005,
"grad_norm": 0.9212057570976543,
"learning_rate": 9.991980734712821e-06,
"loss": 0.1326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06198536604642868,
"step": 3520,
"valid_targets_mean": 1183.5,
"valid_targets_min": 692
},
{
"epoch": 4.9094707520891365,
"grad_norm": 0.8950552623059923,
"learning_rate": 9.931904764722661e-06,
"loss": 0.123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058858513832092285,
"step": 3525,
"valid_targets_mean": 1373.9,
"valid_targets_min": 821
},
{
"epoch": 4.9164345403899725,
"grad_norm": 0.7942490619902811,
"learning_rate": 9.871950226818907e-06,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05587601661682129,
"step": 3530,
"valid_targets_mean": 1428.1,
"valid_targets_min": 1013
},
{
"epoch": 4.923398328690808,
"grad_norm": 0.7959315882544532,
"learning_rate": 9.812117844117955e-06,
"loss": 0.1243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06044112890958786,
"step": 3535,
"valid_targets_mean": 1420.9,
"valid_targets_min": 781
},
{
"epoch": 4.930362116991644,
"grad_norm": 0.9261429168716236,
"learning_rate": 9.752408338262864e-06,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06673343479633331,
"step": 3540,
"valid_targets_mean": 1255.1,
"valid_targets_min": 548
},
{
"epoch": 4.937325905292479,
"grad_norm": 0.7859825717323234,
"learning_rate": 9.692822429414657e-06,
"loss": 0.1246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0637277364730835,
"step": 3545,
"valid_targets_mean": 1411.0,
"valid_targets_min": 694
},
{
"epoch": 4.944289693593315,
"grad_norm": 0.8542974067863182,
"learning_rate": 9.633360836243656e-06,
"loss": 0.1335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08179077506065369,
"step": 3550,
"valid_targets_mean": 1973.8,
"valid_targets_min": 1030
},
{
"epoch": 4.951253481894151,
"grad_norm": 0.7455850946114743,
"learning_rate": 9.57402427592081e-06,
"loss": 0.1209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05281627178192139,
"step": 3555,
"valid_targets_mean": 1580.2,
"valid_targets_min": 682
},
{
"epoch": 4.958217270194986,
"grad_norm": 0.8918246113696654,
"learning_rate": 9.514813464109023e-06,
"loss": 0.1229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06317047029733658,
"step": 3560,
"valid_targets_mean": 1425.4,
"valid_targets_min": 990
},
{
"epoch": 4.965181058495822,
"grad_norm": 0.8206588096352696,
"learning_rate": 9.455729114954542e-06,
"loss": 0.128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04826410859823227,
"step": 3565,
"valid_targets_mean": 1299.6,
"valid_targets_min": 639
},
{
"epoch": 4.972144846796658,
"grad_norm": 0.8215144309267559,
"learning_rate": 9.396771941078335e-06,
"loss": 0.1254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053259532898664474,
"step": 3570,
"valid_targets_mean": 1458.8,
"valid_targets_min": 721
},
{
"epoch": 4.979108635097493,
"grad_norm": 0.8423487434531587,
"learning_rate": 9.337942653567504e-06,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05987967178225517,
"step": 3575,
"valid_targets_mean": 1329.8,
"valid_targets_min": 874
},
{
"epoch": 4.986072423398329,
"grad_norm": 0.7786328247052688,
"learning_rate": 9.279241961966698e-06,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0674387663602829,
"step": 3580,
"valid_targets_mean": 1559.9,
"valid_targets_min": 686
},
{
"epoch": 4.993036211699164,
"grad_norm": 0.8885857987523331,
"learning_rate": 9.220670574269564e-06,
"loss": 0.1328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07278092205524445,
"step": 3585,
"valid_targets_mean": 1392.5,
"valid_targets_min": 713
},
{
"epoch": 5.0,
"grad_norm": 0.9810812179546335,
"learning_rate": 9.162229196910201e-06,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09730862826108932,
"step": 3590,
"valid_targets_mean": 6130.4,
"valid_targets_min": 920
},
{
"epoch": 5.006963788300836,
"grad_norm": 0.7395884420407827,
"learning_rate": 9.103918534754648e-06,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09225118160247803,
"step": 3595,
"valid_targets_mean": 7389.0,
"valid_targets_min": 5627
},
{
"epoch": 5.013927576601671,
"grad_norm": 0.7448900926657113,
"learning_rate": 9.045739291092377e-06,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05141618102788925,
"step": 3600,
"valid_targets_mean": 1294.8,
"valid_targets_min": 422
},
{
"epoch": 5.020891364902507,
"grad_norm": 0.43737029497845903,
"learning_rate": 8.987692167627807e-06,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09226194024085999,
"step": 3605,
"valid_targets_mean": 8539.9,
"valid_targets_min": 6761
},
{
"epoch": 5.027855153203342,
"grad_norm": 0.40244324306844387,
"learning_rate": 8.929777864471847e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0802266001701355,
"step": 3610,
"valid_targets_mean": 7579.0,
"valid_targets_min": 6174
},
{
"epoch": 5.034818941504178,
"grad_norm": 0.3948157476493201,
"learning_rate": 8.871997080133446e-06,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07746812701225281,
"step": 3615,
"valid_targets_mean": 7328.2,
"valid_targets_min": 4839
},
{
"epoch": 5.041782729805014,
"grad_norm": 0.42318640045066125,
"learning_rate": 8.814350511511187e-06,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09257575869560242,
"step": 3620,
"valid_targets_mean": 6838.2,
"valid_targets_min": 5034
},
{
"epoch": 5.048746518105849,
"grad_norm": 0.4452897616046545,
"learning_rate": 8.756838853884862e-06,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09431345760822296,
"step": 3625,
"valid_targets_mean": 7248.2,
"valid_targets_min": 5567
},
{
"epoch": 5.055710306406685,
"grad_norm": 0.4113841425843344,
"learning_rate": 8.699462800907063e-06,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07702521979808807,
"step": 3630,
"valid_targets_mean": 6234.0,
"valid_targets_min": 5603
},
{
"epoch": 5.062674094707521,
"grad_norm": 0.6816435531080544,
"learning_rate": 8.642223044594873e-06,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023794259876012802,
"step": 3635,
"valid_targets_mean": 602.0,
"valid_targets_min": 152
},
{
"epoch": 5.069637883008356,
"grad_norm": 0.40935977827091236,
"learning_rate": 8.585120275321493e-06,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08000779151916504,
"step": 3640,
"valid_targets_mean": 7299.9,
"valid_targets_min": 6158
},
{
"epoch": 5.076601671309192,
"grad_norm": 0.41147638157549343,
"learning_rate": 8.528155181807895e-06,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08062512427568436,
"step": 3645,
"valid_targets_mean": 6140.0,
"valid_targets_min": 4648
},
{
"epoch": 5.0835654596100275,
"grad_norm": 0.44547329868476815,
"learning_rate": 8.471328451114545e-06,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08527650684118271,
"step": 3650,
"valid_targets_mean": 6603.0,
"valid_targets_min": 4882
},
{
"epoch": 5.0905292479108635,
"grad_norm": 0.40170578080263875,
"learning_rate": 8.414640768633096e-06,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0836111456155777,
"step": 3655,
"valid_targets_mean": 8015.0,
"valid_targets_min": 6344
},
{
"epoch": 5.0974930362116995,
"grad_norm": 0.41169416175196893,
"learning_rate": 8.358092818078133e-06,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07325682044029236,
"step": 3660,
"valid_targets_mean": 6305.2,
"valid_targets_min": 4622
},
{
"epoch": 5.104456824512535,
"grad_norm": 0.40731776029002104,
"learning_rate": 8.301685281478923e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.089007668197155,
"step": 3665,
"valid_targets_mean": 7890.8,
"valid_targets_min": 5485
},
{
"epoch": 5.111420612813371,
"grad_norm": 0.4776234320230322,
"learning_rate": 8.24541883917119e-06,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07598386704921722,
"step": 3670,
"valid_targets_mean": 7016.6,
"valid_targets_min": 4960
},
{
"epoch": 5.118384401114207,
"grad_norm": 0.41863282757191406,
"learning_rate": 8.189294169788913e-06,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07902969419956207,
"step": 3675,
"valid_targets_mean": 6527.1,
"valid_targets_min": 5399
},
{
"epoch": 5.125348189415042,
"grad_norm": 0.47406483603656724,
"learning_rate": 8.133311950256127e-06,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08029402792453766,
"step": 3680,
"valid_targets_mean": 4995.0,
"valid_targets_min": 618
},
{
"epoch": 5.132311977715878,
"grad_norm": 0.4225431739550544,
"learning_rate": 8.077472855778774e-06,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09067791700363159,
"step": 3685,
"valid_targets_mean": 7219.4,
"valid_targets_min": 5764
},
{
"epoch": 5.139275766016713,
"grad_norm": 0.4015096498481741,
"learning_rate": 8.021777559836554e-06,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08319695293903351,
"step": 3690,
"valid_targets_mean": 7998.5,
"valid_targets_min": 5902
},
{
"epoch": 5.146239554317549,
"grad_norm": 0.38710682418396525,
"learning_rate": 7.966226734174799e-06,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06552509218454361,
"step": 3695,
"valid_targets_mean": 7377.4,
"valid_targets_min": 5015
},
{
"epoch": 5.153203342618385,
"grad_norm": 0.3983605888889487,
"learning_rate": 7.910821048796368e-06,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06865357607603073,
"step": 3700,
"valid_targets_mean": 6794.0,
"valid_targets_min": 5283
},
{
"epoch": 5.16016713091922,
"grad_norm": 0.44045948176479105,
"learning_rate": 7.855561171953594e-06,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09348156303167343,
"step": 3705,
"valid_targets_mean": 6656.4,
"valid_targets_min": 4364
},
{
"epoch": 5.167130919220056,
"grad_norm": 0.43728173137315074,
"learning_rate": 7.800447770140185e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07885047048330307,
"step": 3710,
"valid_targets_mean": 7178.4,
"valid_targets_min": 4448
},
{
"epoch": 5.174094707520891,
"grad_norm": 0.4411940412213923,
"learning_rate": 7.74548150808319e-06,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09826900064945221,
"step": 3715,
"valid_targets_mean": 7619.8,
"valid_targets_min": 5737
},
{
"epoch": 5.181058495821727,
"grad_norm": 0.3963098926707128,
"learning_rate": 7.690663048735009e-06,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06886550784111023,
"step": 3720,
"valid_targets_mean": 8754.4,
"valid_targets_min": 5752
},
{
"epoch": 5.188022284122563,
"grad_norm": 0.4431165807502115,
"learning_rate": 7.635993053265391e-06,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07675637304782867,
"step": 3725,
"valid_targets_mean": 6341.0,
"valid_targets_min": 4543
},
{
"epoch": 5.194986072423398,
"grad_norm": 0.4239858813074235,
"learning_rate": 7.581472181053435e-06,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08128580451011658,
"step": 3730,
"valid_targets_mean": 7181.9,
"valid_targets_min": 4563
},
{
"epoch": 5.201949860724234,
"grad_norm": 0.7649649723811223,
"learning_rate": 7.527101089679658e-06,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051468294113874435,
"step": 3735,
"valid_targets_mean": 1104.4,
"valid_targets_min": 161
},
{
"epoch": 5.20891364902507,
"grad_norm": 0.41405913060333405,
"learning_rate": 7.4728804349180575e-06,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07386703789234161,
"step": 3740,
"valid_targets_mean": 7018.2,
"valid_targets_min": 5424
},
{
"epoch": 5.215877437325905,
"grad_norm": 0.45338644264188654,
"learning_rate": 7.418810870728203e-06,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08742383122444153,
"step": 3745,
"valid_targets_mean": 7738.4,
"valid_targets_min": 5329
},
{
"epoch": 5.222841225626741,
"grad_norm": 0.4466036832294684,
"learning_rate": 7.364893049247351e-06,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0829770565032959,
"step": 3750,
"valid_targets_mean": 6426.6,
"valid_targets_min": 5560
},
{
"epoch": 5.229805013927576,
"grad_norm": 0.48777116575319945,
"learning_rate": 7.311127620782575e-06,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08484528213739395,
"step": 3755,
"valid_targets_mean": 6169.9,
"valid_targets_min": 3446
},
{
"epoch": 5.236768802228412,
"grad_norm": 0.4147145687544805,
"learning_rate": 7.2575152338029255e-06,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08592289686203003,
"step": 3760,
"valid_targets_mean": 7204.6,
"valid_targets_min": 5381
},
{
"epoch": 5.243732590529248,
"grad_norm": 0.4338983913748669,
"learning_rate": 7.204056534931607e-06,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08771762251853943,
"step": 3765,
"valid_targets_mean": 7600.4,
"valid_targets_min": 5241
},
{
"epoch": 5.250696378830083,
"grad_norm": 0.41445196900515596,
"learning_rate": 7.150752168938182e-06,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08908963948488235,
"step": 3770,
"valid_targets_mean": 7098.5,
"valid_targets_min": 5607
},
{
"epoch": 5.257660167130919,
"grad_norm": 0.463052253966403,
"learning_rate": 7.097602778730788e-06,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08907216787338257,
"step": 3775,
"valid_targets_mean": 6955.1,
"valid_targets_min": 5530
},
{
"epoch": 5.264623955431755,
"grad_norm": 0.4364902349015762,
"learning_rate": 7.044609005348389e-06,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08470651507377625,
"step": 3780,
"valid_targets_mean": 6748.1,
"valid_targets_min": 5364
},
{
"epoch": 5.27158774373259,
"grad_norm": 0.4667194728842975,
"learning_rate": 6.991771487953036e-06,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08043470978736877,
"step": 3785,
"valid_targets_mean": 6273.9,
"valid_targets_min": 5438
},
{
"epoch": 5.278551532033426,
"grad_norm": 0.42521567334703014,
"learning_rate": 6.939090863822188e-06,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07761454582214355,
"step": 3790,
"valid_targets_mean": 6419.5,
"valid_targets_min": 4879
},
{
"epoch": 5.2855153203342615,
"grad_norm": 0.43932142773608807,
"learning_rate": 6.8865677683409835e-06,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07779448479413986,
"step": 3795,
"valid_targets_mean": 6483.4,
"valid_targets_min": 4309
},
{
"epoch": 5.2924791086350975,
"grad_norm": 0.47079517415735234,
"learning_rate": 6.834202834994581e-06,
"loss": 0.1334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09646376967430115,
"step": 3800,
"valid_targets_mean": 6825.0,
"valid_targets_min": 5205
},
{
"epoch": 5.2994428969359335,
"grad_norm": 0.46289740146196456,
"learning_rate": 6.781996695360553e-06,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07646790146827698,
"step": 3805,
"valid_targets_mean": 6729.4,
"valid_targets_min": 5200
},
{
"epoch": 5.306406685236769,
"grad_norm": 0.44246422147197345,
"learning_rate": 6.729949979101256e-06,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07880687713623047,
"step": 3810,
"valid_targets_mean": 6094.0,
"valid_targets_min": 5302
},
{
"epoch": 5.313370473537605,
"grad_norm": 0.4386645916488665,
"learning_rate": 6.678063313956211e-06,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0853356197476387,
"step": 3815,
"valid_targets_mean": 7140.0,
"valid_targets_min": 5270
},
{
"epoch": 5.32033426183844,
"grad_norm": 0.3896192941415339,
"learning_rate": 6.626337325734564e-06,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07671719789505005,
"step": 3820,
"valid_targets_mean": 7425.0,
"valid_targets_min": 5281
},
{
"epoch": 5.327298050139276,
"grad_norm": 0.43882210400710403,
"learning_rate": 6.574772638307496e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10439842939376831,
"step": 3825,
"valid_targets_mean": 7063.4,
"valid_targets_min": 5386
},
{
"epoch": 5.334261838440112,
"grad_norm": 0.4328294638391199,
"learning_rate": 6.523369873600767e-06,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08555565774440765,
"step": 3830,
"valid_targets_mean": 6827.0,
"valid_targets_min": 4547
},
{
"epoch": 5.341225626740947,
"grad_norm": 0.5740969553533752,
"learning_rate": 6.472129651587147e-06,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03779056295752525,
"step": 3835,
"valid_targets_mean": 2047.0,
"valid_targets_min": 165
},
{
"epoch": 5.348189415041783,
"grad_norm": 0.4535247047853864,
"learning_rate": 6.421052590278976e-06,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07807661592960358,
"step": 3840,
"valid_targets_mean": 6754.1,
"valid_targets_min": 5196
},
{
"epoch": 5.355153203342619,
"grad_norm": 0.4691124981565333,
"learning_rate": 6.370139305720693e-06,
"loss": 0.1595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07937394082546234,
"step": 3845,
"valid_targets_mean": 5985.6,
"valid_targets_min": 5028
},
{
"epoch": 5.362116991643454,
"grad_norm": 0.4621292650890354,
"learning_rate": 6.319390411981421e-06,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07576687633991241,
"step": 3850,
"valid_targets_mean": 5963.9,
"valid_targets_min": 5237
},
{
"epoch": 5.36908077994429,
"grad_norm": 0.47453529144859713,
"learning_rate": 6.268806521147546e-06,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08445766568183899,
"step": 3855,
"valid_targets_mean": 6319.0,
"valid_targets_min": 5412
},
{
"epoch": 5.376044568245125,
"grad_norm": 0.41147646717777764,
"learning_rate": 6.218388243315343e-06,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06716381013393402,
"step": 3860,
"valid_targets_mean": 7125.8,
"valid_targets_min": 5080
},
{
"epoch": 5.383008356545961,
"grad_norm": 0.43779798115412527,
"learning_rate": 6.168136186583615e-06,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07958684861660004,
"step": 3865,
"valid_targets_mean": 6123.5,
"valid_targets_min": 4521
},
{
"epoch": 5.389972144846797,
"grad_norm": 0.966196621555397,
"learning_rate": 6.118050957046358e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09092744439840317,
"step": 3870,
"valid_targets_mean": 1886.0,
"valid_targets_min": 1111
},
{
"epoch": 5.396935933147632,
"grad_norm": 0.8077855185739582,
"learning_rate": 6.068133158785463e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07527165114879608,
"step": 3875,
"valid_targets_mean": 1497.6,
"valid_targets_min": 893
},
{
"epoch": 5.403899721448468,
"grad_norm": 0.7144983965195878,
"learning_rate": 6.018383393863412e-06,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049098506569862366,
"step": 3880,
"valid_targets_mean": 1356.0,
"valid_targets_min": 914
},
{
"epoch": 5.410863509749303,
"grad_norm": 0.8109690813075966,
"learning_rate": 5.968802262316009e-06,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054713502526283264,
"step": 3885,
"valid_targets_mean": 1324.5,
"valid_targets_min": 680
},
{
"epoch": 5.417827298050139,
"grad_norm": 0.8096672959801836,
"learning_rate": 5.919390362145172e-06,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06651387363672256,
"step": 3890,
"valid_targets_mean": 1931.8,
"valid_targets_min": 876
},
{
"epoch": 5.424791086350975,
"grad_norm": 0.9084117209145378,
"learning_rate": 5.870148289311719e-06,
"loss": 0.1281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05635681003332138,
"step": 3895,
"valid_targets_mean": 1292.2,
"valid_targets_min": 734
},
{
"epoch": 5.43175487465181,
"grad_norm": 0.8234461561242756,
"learning_rate": 5.8210766377281425e-06,
"loss": 0.1376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05349376052618027,
"step": 3900,
"valid_targets_mean": 1469.6,
"valid_targets_min": 655
},
{
"epoch": 5.438718662952646,
"grad_norm": 0.8349797022317297,
"learning_rate": 5.7721759992514835e-06,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06947162747383118,
"step": 3905,
"valid_targets_mean": 1548.4,
"valid_targets_min": 737
},
{
"epoch": 5.445682451253482,
"grad_norm": 0.8357949779321237,
"learning_rate": 5.7234469636761825e-06,
"loss": 0.1376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05619405210018158,
"step": 3910,
"valid_targets_mean": 1316.5,
"valid_targets_min": 759
},
{
"epoch": 5.452646239554317,
"grad_norm": 0.8320721049373022,
"learning_rate": 5.674890118726955e-06,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048418521881103516,
"step": 3915,
"valid_targets_mean": 1249.6,
"valid_targets_min": 753
},
{
"epoch": 5.459610027855153,
"grad_norm": 0.8918073241547342,
"learning_rate": 5.626506050051716e-06,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07567094266414642,
"step": 3920,
"valid_targets_mean": 1833.0,
"valid_targets_min": 927
},
{
"epoch": 5.4665738161559885,
"grad_norm": 0.864812696220783,
"learning_rate": 5.578295341214519e-06,
"loss": 0.1259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06043354421854019,
"step": 3925,
"valid_targets_mean": 1338.4,
"valid_targets_min": 679
},
{
"epoch": 5.4735376044568245,
"grad_norm": 0.854189693756131,
"learning_rate": 5.530258573688496e-06,
"loss": 0.124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05904326215386391,
"step": 3930,
"valid_targets_mean": 1244.6,
"valid_targets_min": 771
},
{
"epoch": 5.4805013927576605,
"grad_norm": 0.7843808631480862,
"learning_rate": 5.482396326848884e-06,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058021124452352524,
"step": 3935,
"valid_targets_mean": 1732.5,
"valid_targets_min": 986
},
{
"epoch": 5.487465181058496,
"grad_norm": 0.9558429957238452,
"learning_rate": 5.434709177965982e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05305638536810875,
"step": 3940,
"valid_targets_mean": 1389.9,
"valid_targets_min": 1103
},
{
"epoch": 5.494428969359332,
"grad_norm": 0.8557141687664696,
"learning_rate": 5.387197702198239e-06,
"loss": 0.1195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0624840185046196,
"step": 3945,
"valid_targets_mean": 1593.2,
"valid_targets_min": 675
},
{
"epoch": 5.501392757660167,
"grad_norm": 0.8442709657389822,
"learning_rate": 5.339862472585284e-06,
"loss": 0.1221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07162931561470032,
"step": 3950,
"valid_targets_mean": 1926.6,
"valid_targets_min": 974
},
{
"epoch": 5.508356545961003,
"grad_norm": 0.8922738009156526,
"learning_rate": 5.292704060041047e-06,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07262811809778214,
"step": 3955,
"valid_targets_mean": 1953.1,
"valid_targets_min": 869
},
{
"epoch": 5.515320334261839,
"grad_norm": 0.8628907763362105,
"learning_rate": 5.245723033346841e-06,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05248372256755829,
"step": 3960,
"valid_targets_mean": 1327.2,
"valid_targets_min": 1023
},
{
"epoch": 5.522284122562674,
"grad_norm": 1.0689981634779093,
"learning_rate": 5.198919959144504e-06,
"loss": 0.1263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06385475397109985,
"step": 3965,
"valid_targets_mean": 1717.9,
"valid_targets_min": 709
},
{
"epoch": 5.52924791086351,
"grad_norm": 0.8507547339269755,
"learning_rate": 5.152295401929581e-06,
"loss": 0.1222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04907778650522232,
"step": 3970,
"valid_targets_mean": 1139.9,
"valid_targets_min": 658
},
{
"epoch": 5.536211699164346,
"grad_norm": 0.8352935218223749,
"learning_rate": 5.10584992404453e-06,
"loss": 0.1204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05608684569597244,
"step": 3975,
"valid_targets_mean": 1444.8,
"valid_targets_min": 662
},
{
"epoch": 5.543175487465181,
"grad_norm": 0.8360060925828016,
"learning_rate": 5.059584085671896e-06,
"loss": 0.1211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04403482377529144,
"step": 3980,
"valid_targets_mean": 1242.2,
"valid_targets_min": 859
},
{
"epoch": 5.550139275766017,
"grad_norm": 0.8557031879654616,
"learning_rate": 5.0134984448275844e-06,
"loss": 0.11,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06525018811225891,
"step": 3985,
"valid_targets_mean": 1569.2,
"valid_targets_min": 950
},
{
"epoch": 5.557103064066853,
"grad_norm": 0.8940987834631933,
"learning_rate": 4.967593557354125e-06,
"loss": 0.1175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057968899607658386,
"step": 3990,
"valid_targets_mean": 1539.8,
"valid_targets_min": 686
},
{
"epoch": 5.564066852367688,
"grad_norm": 0.8803812608953893,
"learning_rate": 4.921869976913964e-06,
"loss": 0.1187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06881322711706161,
"step": 3995,
"valid_targets_mean": 1610.6,
"valid_targets_min": 702
},
{
"epoch": 5.571030640668524,
"grad_norm": 0.8857750625346741,
"learning_rate": 4.876328254982796e-06,
"loss": 0.1188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043028295040130615,
"step": 4000,
"valid_targets_mean": 1190.4,
"valid_targets_min": 779
},
{
"epoch": 5.577994428969359,
"grad_norm": 0.8537850227769329,
"learning_rate": 4.8309689408429015e-06,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06296706199645996,
"step": 4005,
"valid_targets_mean": 1467.1,
"valid_targets_min": 822
},
{
"epoch": 5.584958217270195,
"grad_norm": 0.8285166830028964,
"learning_rate": 4.785792581576523e-06,
"loss": 0.1172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05445345491170883,
"step": 4010,
"valid_targets_mean": 1350.5,
"valid_targets_min": 868
},
{
"epoch": 5.591922005571031,
"grad_norm": 0.8667031190956394,
"learning_rate": 4.740799722059269e-06,
"loss": 0.1196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04850904271006584,
"step": 4015,
"valid_targets_mean": 1283.5,
"valid_targets_min": 781
},
{
"epoch": 5.598885793871866,
"grad_norm": 0.8366685664142771,
"learning_rate": 4.6959909049535665e-06,
"loss": 0.1198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05181458219885826,
"step": 4020,
"valid_targets_mean": 1303.2,
"valid_targets_min": 793
},
{
"epoch": 5.605849582172702,
"grad_norm": 0.7495096178648898,
"learning_rate": 4.651366670702054e-06,
"loss": 0.1211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047033414244651794,
"step": 4025,
"valid_targets_mean": 1309.1,
"valid_targets_min": 806
},
{
"epoch": 5.612813370473537,
"grad_norm": 0.811123052386617,
"learning_rate": 4.606927557521128e-06,
"loss": 0.117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04835967719554901,
"step": 4030,
"valid_targets_mean": 1397.6,
"valid_targets_min": 803
},
{
"epoch": 5.619777158774373,
"grad_norm": 0.851744557513053,
"learning_rate": 4.562674101394413e-06,
"loss": 0.1157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04473861679434776,
"step": 4035,
"valid_targets_mean": 1187.8,
"valid_targets_min": 660
},
{
"epoch": 5.626740947075209,
"grad_norm": 0.8083228291949228,
"learning_rate": 4.518606836066328e-06,
"loss": 0.107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05075952038168907,
"step": 4040,
"valid_targets_mean": 1547.0,
"valid_targets_min": 853
},
{
"epoch": 5.633704735376044,
"grad_norm": 0.924317112722506,
"learning_rate": 4.474726293035614e-06,
"loss": 0.1172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0637693852186203,
"step": 4045,
"valid_targets_mean": 1704.2,
"valid_targets_min": 719
},
{
"epoch": 5.64066852367688,
"grad_norm": 0.8765664950505369,
"learning_rate": 4.43103300154893e-06,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044058702886104584,
"step": 4050,
"valid_targets_mean": 1255.0,
"valid_targets_min": 765
},
{
"epoch": 5.647632311977716,
"grad_norm": 0.8847967785711801,
"learning_rate": 4.3875274885944965e-06,
"loss": 0.1184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06218354403972626,
"step": 4055,
"valid_targets_mean": 1550.8,
"valid_targets_min": 875
},
{
"epoch": 5.654596100278551,
"grad_norm": 0.8774671561905153,
"learning_rate": 4.344210278895729e-06,
"loss": 0.1121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0588260255753994,
"step": 4060,
"valid_targets_mean": 1362.0,
"valid_targets_min": 739
},
{
"epoch": 5.661559888579387,
"grad_norm": 0.8793053210734343,
"learning_rate": 4.301081894904882e-06,
"loss": 0.117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06402565538883209,
"step": 4065,
"valid_targets_mean": 1666.8,
"valid_targets_min": 760
},
{
"epoch": 5.6685236768802225,
"grad_norm": 0.8736445128719057,
"learning_rate": 4.258142856796779e-06,
"loss": 0.111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04810625687241554,
"step": 4070,
"valid_targets_mean": 1319.6,
"valid_targets_min": 1046
},
{
"epoch": 5.6754874651810585,
"grad_norm": 0.9146961523812506,
"learning_rate": 4.21539368246253e-06,
"loss": 0.1235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06791988015174866,
"step": 4075,
"valid_targets_mean": 1727.9,
"valid_targets_min": 851
},
{
"epoch": 5.6824512534818945,
"grad_norm": 0.8950204260314059,
"learning_rate": 4.172834887503277e-06,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06217281520366669,
"step": 4080,
"valid_targets_mean": 1643.2,
"valid_targets_min": 907
},
{
"epoch": 5.68941504178273,
"grad_norm": 0.8625659343005182,
"learning_rate": 4.1304669852239865e-06,
"loss": 0.1242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052721407264471054,
"step": 4085,
"valid_targets_mean": 1478.5,
"valid_targets_min": 764
},
{
"epoch": 5.696378830083566,
"grad_norm": 0.8423037084637137,
"learning_rate": 4.088290486627249e-06,
"loss": 0.1117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051760852336883545,
"step": 4090,
"valid_targets_mean": 1522.6,
"valid_targets_min": 822
},
{
"epoch": 5.703342618384401,
"grad_norm": 0.7986133696863431,
"learning_rate": 4.046305900407123e-06,
"loss": 0.1089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05744687840342522,
"step": 4095,
"valid_targets_mean": 1589.0,
"valid_targets_min": 982
},
{
"epoch": 5.710306406685237,
"grad_norm": 0.8247019511544061,
"learning_rate": 4.004513732943001e-06,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05563589930534363,
"step": 4100,
"valid_targets_mean": 1574.8,
"valid_targets_min": 816
},
{
"epoch": 5.717270194986073,
"grad_norm": 0.8220162581325487,
"learning_rate": 3.962914488293487e-06,
"loss": 0.1119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05360320955514908,
"step": 4105,
"valid_targets_mean": 1422.0,
"valid_targets_min": 721
},
{
"epoch": 5.724233983286908,
"grad_norm": 0.8640387086170787,
"learning_rate": 3.921508668190337e-06,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04421108961105347,
"step": 4110,
"valid_targets_mean": 1150.6,
"valid_targets_min": 741
},
{
"epoch": 5.731197771587744,
"grad_norm": 0.9963080986309333,
"learning_rate": 3.8802967720323944e-06,
"loss": 0.116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0667385682463646,
"step": 4115,
"valid_targets_mean": 1684.2,
"valid_targets_min": 734
},
{
"epoch": 5.73816155988858,
"grad_norm": 0.9033327920465504,
"learning_rate": 3.839279296879566e-06,
"loss": 0.122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07596944272518158,
"step": 4120,
"valid_targets_mean": 1937.1,
"valid_targets_min": 744
},
{
"epoch": 5.745125348189415,
"grad_norm": 0.9201337682269749,
"learning_rate": 3.7984567374468495e-06,
"loss": 0.1182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06649009138345718,
"step": 4125,
"valid_targets_mean": 1842.2,
"valid_targets_min": 620
},
{
"epoch": 5.752089136490251,
"grad_norm": 0.8638321399247245,
"learning_rate": 3.757829586098334e-06,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06432803720235825,
"step": 4130,
"valid_targets_mean": 1637.6,
"valid_targets_min": 785
},
{
"epoch": 5.759052924791086,
"grad_norm": 0.8229387884326227,
"learning_rate": 3.717398332841269e-06,
"loss": 0.1196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06425435841083527,
"step": 4135,
"valid_targets_mean": 1969.9,
"valid_targets_min": 740
},
{
"epoch": 5.766016713091922,
"grad_norm": 0.9669615015698776,
"learning_rate": 3.6771634653201726e-06,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054495103657245636,
"step": 4140,
"valid_targets_mean": 1432.1,
"valid_targets_min": 711
},
{
"epoch": 5.772980501392758,
"grad_norm": 0.7975239579352195,
"learning_rate": 3.6371254688109493e-06,
"loss": 0.1163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06108352169394493,
"step": 4145,
"valid_targets_mean": 1695.6,
"valid_targets_min": 1122
},
{
"epoch": 5.779944289693593,
"grad_norm": 0.8324320935247468,
"learning_rate": 3.5972848262150084e-06,
"loss": 0.1145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06076567620038986,
"step": 4150,
"valid_targets_mean": 1524.5,
"valid_targets_min": 722
},
{
"epoch": 5.786908077994429,
"grad_norm": 0.8295223085601157,
"learning_rate": 3.5576420180534666e-06,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052539028227329254,
"step": 4155,
"valid_targets_mean": 1289.2,
"valid_targets_min": 661
},
{
"epoch": 5.793871866295264,
"grad_norm": 0.8688174214233373,
"learning_rate": 3.518197522461344e-06,
"loss": 0.1093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05658646672964096,
"step": 4160,
"valid_targets_mean": 1519.5,
"valid_targets_min": 1011
},
{
"epoch": 5.8008356545961,
"grad_norm": 0.8560277889635767,
"learning_rate": 3.4789518151817926e-06,
"loss": 0.1182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0627206489443779,
"step": 4165,
"valid_targets_mean": 1731.4,
"valid_targets_min": 1277
},
{
"epoch": 5.807799442896936,
"grad_norm": 0.8221705464226036,
"learning_rate": 3.43990536956037e-06,
"loss": 0.1132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05920272320508957,
"step": 4170,
"valid_targets_mean": 1486.1,
"valid_targets_min": 807
},
{
"epoch": 5.814763231197771,
"grad_norm": 0.8332753209312879,
"learning_rate": 3.4010586565393176e-06,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057332780212163925,
"step": 4175,
"valid_targets_mean": 1549.9,
"valid_targets_min": 679
},
{
"epoch": 5.821727019498607,
"grad_norm": 0.8619887271447355,
"learning_rate": 3.36241214465189e-06,
"loss": 0.116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05862189084291458,
"step": 4180,
"valid_targets_mean": 1656.0,
"valid_targets_min": 1294
},
{
"epoch": 5.828690807799443,
"grad_norm": 0.8103161574226729,
"learning_rate": 3.323966300016699e-06,
"loss": 0.1199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053418777883052826,
"step": 4185,
"valid_targets_mean": 1368.8,
"valid_targets_min": 790
},
{
"epoch": 5.835654596100278,
"grad_norm": 0.8465138226795567,
"learning_rate": 3.285721586332089e-06,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06450681388378143,
"step": 4190,
"valid_targets_mean": 1765.8,
"valid_targets_min": 592
},
{
"epoch": 5.842618384401114,
"grad_norm": 0.8341389356508091,
"learning_rate": 3.247678464870556e-06,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0624236986041069,
"step": 4195,
"valid_targets_mean": 1586.8,
"valid_targets_min": 662
},
{
"epoch": 5.84958217270195,
"grad_norm": 0.9648828608657739,
"learning_rate": 3.2098373944731696e-06,
"loss": 0.114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05213096737861633,
"step": 4200,
"valid_targets_mean": 1336.9,
"valid_targets_min": 622
},
{
"epoch": 5.8565459610027855,
"grad_norm": 0.8693836846048845,
"learning_rate": 3.1721988315440467e-06,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03882891684770584,
"step": 4205,
"valid_targets_mean": 1097.1,
"valid_targets_min": 625
},
{
"epoch": 5.8635097493036215,
"grad_norm": 0.8889935458275575,
"learning_rate": 3.1347632300448528e-06,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05130942910909653,
"step": 4210,
"valid_targets_mean": 1484.9,
"valid_targets_min": 888
},
{
"epoch": 5.870473537604457,
"grad_norm": 0.8950418860834436,
"learning_rate": 3.0975310414893147e-06,
"loss": 0.1216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06308726966381073,
"step": 4215,
"valid_targets_mean": 1757.0,
"valid_targets_min": 635
},
{
"epoch": 5.8774373259052926,
"grad_norm": 0.9448517682773246,
"learning_rate": 3.060502714937772e-06,
"loss": 0.116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06284761428833008,
"step": 4220,
"valid_targets_mean": 1476.1,
"valid_targets_min": 522
},
{
"epoch": 5.884401114206128,
"grad_norm": 0.8513582848638479,
"learning_rate": 3.023678696991774e-06,
"loss": 0.1155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04917547106742859,
"step": 4225,
"valid_targets_mean": 1230.9,
"valid_targets_min": 697
},
{
"epoch": 5.891364902506964,
"grad_norm": 0.8380241944756079,
"learning_rate": 2.9870594317887012e-06,
"loss": 0.109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060824502259492874,
"step": 4230,
"valid_targets_mean": 1671.0,
"valid_targets_min": 1010
},
{
"epoch": 5.8983286908078,
"grad_norm": 0.9611502718725131,
"learning_rate": 2.950645360996378e-06,
"loss": 0.111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05260036140680313,
"step": 4235,
"valid_targets_mean": 1411.0,
"valid_targets_min": 769
},
{
"epoch": 5.905292479108635,
"grad_norm": 0.8900339205155612,
"learning_rate": 2.914436923807773e-06,
"loss": 0.115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04677753150463104,
"step": 4240,
"valid_targets_mean": 1298.6,
"valid_targets_min": 745
},
{
"epoch": 5.912256267409471,
"grad_norm": 0.8870011470624816,
"learning_rate": 2.878434556935672e-06,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042783405631780624,
"step": 4245,
"valid_targets_mean": 1118.9,
"valid_targets_min": 680
},
{
"epoch": 5.919220055710307,
"grad_norm": 0.8118186588287939,
"learning_rate": 2.8426386946074625e-06,
"loss": 0.1112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07259643822908401,
"step": 4250,
"valid_targets_mean": 1905.9,
"valid_targets_min": 1347
},
{
"epoch": 5.926183844011142,
"grad_norm": 0.9846435636971836,
"learning_rate": 2.807049768559844e-06,
"loss": 0.1197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08297774195671082,
"step": 4255,
"valid_targets_mean": 1636.0,
"valid_targets_min": 851
},
{
"epoch": 5.933147632311978,
"grad_norm": 0.89306065477576,
"learning_rate": 2.771668208033642e-06,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05090225487947464,
"step": 4260,
"valid_targets_mean": 1457.2,
"valid_targets_min": 903
},
{
"epoch": 5.940111420612814,
"grad_norm": 0.8381846762533809,
"learning_rate": 2.7364944397686356e-06,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05966182425618172,
"step": 4265,
"valid_targets_mean": 1674.4,
"valid_targets_min": 1240
},
{
"epoch": 5.947075208913649,
"grad_norm": 0.6975382895103197,
"learning_rate": 2.7015288879984013e-06,
"loss": 0.1174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05049895867705345,
"step": 4270,
"valid_targets_mean": 1697.1,
"valid_targets_min": 917
},
{
"epoch": 5.954038997214485,
"grad_norm": 0.8183978547191294,
"learning_rate": 2.6667719744452037e-06,
"loss": 0.1058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05475775897502899,
"step": 4275,
"valid_targets_mean": 1580.9,
"valid_targets_min": 930
},
{
"epoch": 5.96100278551532,
"grad_norm": 0.8177442897301394,
"learning_rate": 2.6322241183149057e-06,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059341538697481155,
"step": 4280,
"valid_targets_mean": 1655.1,
"valid_targets_min": 1227
},
{
"epoch": 5.967966573816156,
"grad_norm": 0.8272238546293612,
"learning_rate": 2.5978857362919054e-06,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05763782560825348,
"step": 4285,
"valid_targets_mean": 1565.8,
"valid_targets_min": 870
},
{
"epoch": 5.974930362116992,
"grad_norm": 0.9573734999330009,
"learning_rate": 2.5637572425341174e-06,
"loss": 0.122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06584827601909637,
"step": 4290,
"valid_targets_mean": 1564.6,
"valid_targets_min": 822
},
{
"epoch": 5.981894150417827,
"grad_norm": 1.1210065324101028,
"learning_rate": 2.529839048667997e-06,
"loss": 0.1222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05611727386713028,
"step": 4295,
"valid_targets_mean": 1540.5,
"valid_targets_min": 1214
},
{
"epoch": 5.988857938718663,
"grad_norm": 0.8877917752913989,
"learning_rate": 2.4961315637835346e-06,
"loss": 0.1124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05314347892999649,
"step": 4300,
"valid_targets_mean": 1268.6,
"valid_targets_min": 591
},
{
"epoch": 5.995821727019498,
"grad_norm": 0.9062573425634036,
"learning_rate": 2.4626351944293435e-06,
"loss": 0.1205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04725968837738037,
"step": 4305,
"valid_targets_mean": 1232.5,
"valid_targets_min": 646
},
{
"epoch": 6.002785515320334,
"grad_norm": 0.9480677409493633,
"learning_rate": 2.4293503446077638e-06,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08825192600488663,
"step": 4310,
"valid_targets_mean": 8514.0,
"valid_targets_min": 6788
},
{
"epoch": 6.00974930362117,
"grad_norm": 0.8792429695725503,
"learning_rate": 2.3962774157699853e-06,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09347966313362122,
"step": 4315,
"valid_targets_mean": 6668.0,
"valid_targets_min": 5933
},
{
"epoch": 6.016713091922005,
"grad_norm": 0.7256186554172626,
"learning_rate": 2.363416806811196e-06,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07888566702604294,
"step": 4320,
"valid_targets_mean": 4107.0,
"valid_targets_min": 161
},
{
"epoch": 6.023676880222841,
"grad_norm": 0.5337563605817399,
"learning_rate": 2.3307689140657796e-06,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07886291295289993,
"step": 4325,
"valid_targets_mean": 7946.0,
"valid_targets_min": 5596
},
{
"epoch": 6.030640668523677,
"grad_norm": 0.5250064440886613,
"learning_rate": 2.29833413130252e-06,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08924835920333862,
"step": 4330,
"valid_targets_mean": 7392.8,
"valid_targets_min": 5629
},
{
"epoch": 6.037604456824512,
"grad_norm": 1.706269156371303,
"learning_rate": 2.2661128497198905e-06,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08858384191989899,
"step": 4335,
"valid_targets_mean": 6879.6,
"valid_targets_min": 5113
},
{
"epoch": 6.044568245125348,
"grad_norm": 0.4944795196550045,
"learning_rate": 2.234105457941289e-06,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08616100996732712,
"step": 4340,
"valid_targets_mean": 6919.5,
"valid_targets_min": 5080
},
{
"epoch": 6.0515320334261835,
"grad_norm": 0.46269857441542933,
"learning_rate": 2.202312342010382e-06,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0758790597319603,
"step": 4345,
"valid_targets_mean": 6377.0,
"valid_targets_min": 3939
},
{
"epoch": 6.0584958217270195,
"grad_norm": 0.46714693312176175,
"learning_rate": 2.170733885386431e-06,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08216223120689392,
"step": 4350,
"valid_targets_mean": 6392.2,
"valid_targets_min": 4355
},
{
"epoch": 6.0654596100278555,
"grad_norm": 0.6249782828216601,
"learning_rate": 2.1393704689396812e-06,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08479143679141998,
"step": 4355,
"valid_targets_mean": 5196.5,
"valid_targets_min": 137
},
{
"epoch": 6.072423398328691,
"grad_norm": 0.43679042233173293,
"learning_rate": 2.108222470946757e-06,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07390058040618896,
"step": 4360,
"valid_targets_mean": 7344.4,
"valid_targets_min": 5244
},
{
"epoch": 6.079387186629527,
"grad_norm": 0.43303393100622734,
"learning_rate": 2.077290267086105e-06,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06864619255065918,
"step": 4365,
"valid_targets_mean": 7921.0,
"valid_targets_min": 5311
},
{
"epoch": 6.086350974930362,
"grad_norm": 0.4246006529195599,
"learning_rate": 2.04657423043346e-06,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08542105555534363,
"step": 4370,
"valid_targets_mean": 7931.2,
"valid_targets_min": 6015
},
{
"epoch": 6.093314763231198,
"grad_norm": 0.4106570417894629,
"learning_rate": 2.016074731457356e-06,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07517217099666595,
"step": 4375,
"valid_targets_mean": 7640.8,
"valid_targets_min": 5248
},
{
"epoch": 6.100278551532034,
"grad_norm": 0.4148098516880654,
"learning_rate": 1.9857921380146462e-06,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07737202942371368,
"step": 4380,
"valid_targets_mean": 7249.6,
"valid_targets_min": 5217
},
{
"epoch": 6.107242339832869,
"grad_norm": 0.4436920181563948,
"learning_rate": 1.955726815346053e-06,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08977077901363373,
"step": 4385,
"valid_targets_mean": 7619.9,
"valid_targets_min": 5094
},
{
"epoch": 6.114206128133705,
"grad_norm": 0.40942198769595695,
"learning_rate": 1.9258791260717944e-06,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07487683743238449,
"step": 4390,
"valid_targets_mean": 7732.8,
"valid_targets_min": 5842
},
{
"epoch": 6.121169916434541,
"grad_norm": 0.4096948039067667,
"learning_rate": 1.896249430187198e-06,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08216005563735962,
"step": 4395,
"valid_targets_mean": 7952.9,
"valid_targets_min": 5494
},
{
"epoch": 6.128133704735376,
"grad_norm": 0.5382913217347769,
"learning_rate": 1.866838085058349e-06,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08534446358680725,
"step": 4400,
"valid_targets_mean": 8001.0,
"valid_targets_min": 5454
},
{
"epoch": 6.135097493036212,
"grad_norm": 0.4993178623034378,
"learning_rate": 1.837645445417786e-06,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05737616866827011,
"step": 4405,
"valid_targets_mean": 2985.1,
"valid_targets_min": 1896
},
{
"epoch": 6.142061281337047,
"grad_norm": 0.5514824724986366,
"learning_rate": 1.8086718633602252e-06,
"loss": 0.1294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07018405199050903,
"step": 4410,
"valid_targets_mean": 6714.6,
"valid_targets_min": 4917
},
{
"epoch": 6.149025069637883,
"grad_norm": 0.4252531390576798,
"learning_rate": 1.7799176883383152e-06,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08560578525066376,
"step": 4415,
"valid_targets_mean": 7595.2,
"valid_targets_min": 5488
},
{
"epoch": 6.155988857938719,
"grad_norm": 0.5092771217817552,
"learning_rate": 1.751383267158413e-06,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08620335161685944,
"step": 4420,
"valid_targets_mean": 7046.1,
"valid_targets_min": 5579
},
{
"epoch": 6.162952646239554,
"grad_norm": 0.4716862438880787,
"learning_rate": 1.7230689439764136e-06,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07925520837306976,
"step": 4425,
"valid_targets_mean": 7108.0,
"valid_targets_min": 4963
},
{
"epoch": 6.16991643454039,
"grad_norm": 0.45619274881293254,
"learning_rate": 1.694975060293591e-06,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08042465150356293,
"step": 4430,
"valid_targets_mean": 6810.1,
"valid_targets_min": 5666
},
{
"epoch": 6.176880222841225,
"grad_norm": 0.3901334892783887,
"learning_rate": 1.6671019549524724e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07437565922737122,
"step": 4435,
"valid_targets_mean": 8068.5,
"valid_targets_min": 5524
},
{
"epoch": 6.183844011142061,
"grad_norm": 0.40732855082482716,
"learning_rate": 1.63944996413278e-06,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06510244309902191,
"step": 4440,
"valid_targets_mean": 6553.8,
"valid_targets_min": 3621
},
{
"epoch": 6.190807799442897,
"grad_norm": 0.42124118933928567,
"learning_rate": 1.612019421347335e-06,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07448364794254303,
"step": 4445,
"valid_targets_mean": 6762.5,
"valid_targets_min": 4968
},
{
"epoch": 6.197771587743732,
"grad_norm": 0.4383555593223217,
"learning_rate": 1.5848106574380694e-06,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07571583241224289,
"step": 4450,
"valid_targets_mean": 6143.9,
"valid_targets_min": 4917
},
{
"epoch": 6.204735376044568,
"grad_norm": 0.5466494230157721,
"learning_rate": 1.5578240005720147e-06,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10035134851932526,
"step": 4455,
"valid_targets_mean": 4583.8,
"valid_targets_min": 215
},
{
"epoch": 6.211699164345404,
"grad_norm": 0.4040453396697649,
"learning_rate": 1.5310597762373624e-06,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08089716732501984,
"step": 4460,
"valid_targets_mean": 7317.1,
"valid_targets_min": 4948
},
{
"epoch": 6.218662952646239,
"grad_norm": 0.4727586903795262,
"learning_rate": 1.504518307239522e-06,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08399631083011627,
"step": 4465,
"valid_targets_mean": 6437.6,
"valid_targets_min": 4510
},
{
"epoch": 6.225626740947075,
"grad_norm": 0.47933738314929225,
"learning_rate": 1.478199913697227e-06,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09280038625001907,
"step": 4470,
"valid_targets_mean": 7707.9,
"valid_targets_min": 5796
},
{
"epoch": 6.2325905292479105,
"grad_norm": 0.41595542358539167,
"learning_rate": 1.4521049130386854e-06,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07995796948671341,
"step": 4475,
"valid_targets_mean": 7900.9,
"valid_targets_min": 5643
},
{
"epoch": 6.2395543175487465,
"grad_norm": 0.4778381922849063,
"learning_rate": 1.4262336199977545e-06,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08848213404417038,
"step": 4480,
"valid_targets_mean": 7627.2,
"valid_targets_min": 5742
},
{
"epoch": 6.2465181058495824,
"grad_norm": 0.4136225741751865,
"learning_rate": 1.4005863466101265e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09422549605369568,
"step": 4485,
"valid_targets_mean": 8725.6,
"valid_targets_min": 5141
},
{
"epoch": 6.2534818941504176,
"grad_norm": 0.5089693736225027,
"learning_rate": 1.375163402209576e-06,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09053859859704971,
"step": 4490,
"valid_targets_mean": 6967.8,
"valid_targets_min": 6088
},
{
"epoch": 6.2604456824512535,
"grad_norm": 0.4130639739472889,
"learning_rate": 1.3499650934242325e-06,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07545335590839386,
"step": 4495,
"valid_targets_mean": 7140.1,
"valid_targets_min": 4834
},
{
"epoch": 6.2674094707520895,
"grad_norm": 0.43000993148245376,
"learning_rate": 1.3249917241728704e-06,
"loss": 0.162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07579700648784637,
"step": 4500,
"valid_targets_mean": 6706.9,
"valid_targets_min": 5108
},
{
"epoch": 6.274373259052925,
"grad_norm": 0.5160601513181945,
"learning_rate": 1.3002435956612614e-06,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08105462789535522,
"step": 4505,
"valid_targets_mean": 5931.4,
"valid_targets_min": 4708
},
{
"epoch": 6.281337047353761,
"grad_norm": 0.44759379754062206,
"learning_rate": 1.2757210063785186e-06,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07396161556243896,
"step": 4510,
"valid_targets_mean": 7145.6,
"valid_targets_min": 5280
},
{
"epoch": 6.288300835654596,
"grad_norm": 0.7344682406855992,
"learning_rate": 1.2514242520935182e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04381747171282768,
"step": 4515,
"valid_targets_mean": 1554.9,
"valid_targets_min": 592
},
{
"epoch": 6.295264623955432,
"grad_norm": 0.46744454281739256,
"learning_rate": 1.2273536258513174e-06,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09317928552627563,
"step": 4520,
"valid_targets_mean": 7069.5,
"valid_targets_min": 4765
},
{
"epoch": 6.302228412256268,
"grad_norm": 0.44624650053434495,
"learning_rate": 1.2035094179696305e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08074669539928436,
"step": 4525,
"valid_targets_mean": 6193.4,
"valid_targets_min": 5587
},
{
"epoch": 6.309192200557103,
"grad_norm": 0.45433035530886273,
"learning_rate": 1.1798919160353183e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0842660665512085,
"step": 4530,
"valid_targets_mean": 6612.2,
"valid_targets_min": 4894
},
{
"epoch": 6.316155988857939,
"grad_norm": 0.4219263161331273,
"learning_rate": 1.1565014049009227e-06,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07519182562828064,
"step": 4535,
"valid_targets_mean": 6605.9,
"valid_targets_min": 3795
},
{
"epoch": 6.323119777158775,
"grad_norm": 0.428099298209557,
"learning_rate": 1.1333381666812326e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08015845715999603,
"step": 4540,
"valid_targets_mean": 7186.8,
"valid_targets_min": 4890
},
{
"epoch": 6.33008356545961,
"grad_norm": 0.5405733766441226,
"learning_rate": 1.110402480749886e-06,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08327323198318481,
"step": 4545,
"valid_targets_mean": 6544.4,
"valid_targets_min": 4615
},
{
"epoch": 6.337047353760446,
"grad_norm": 0.48862459251110824,
"learning_rate": 1.0876946237359887e-06,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0856969878077507,
"step": 4550,
"valid_targets_mean": 6339.2,
"valid_targets_min": 4798
},
{
"epoch": 6.344011142061281,
"grad_norm": 0.5591305131293233,
"learning_rate": 1.0652148695207809e-06,
"loss": 0.1176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08373311161994934,
"step": 4555,
"valid_targets_mean": 4558.8,
"valid_targets_min": 148
},
{
"epoch": 6.350974930362117,
"grad_norm": 0.4694300456582176,
"learning_rate": 1.042963489234341e-06,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08754730969667435,
"step": 4560,
"valid_targets_mean": 6807.9,
"valid_targets_min": 5164
},
{
"epoch": 6.357938718662953,
"grad_norm": 0.4564231493271595,
"learning_rate": 1.0209407512523194e-06,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07847484946250916,
"step": 4565,
"valid_targets_mean": 7011.8,
"valid_targets_min": 4974
},
{
"epoch": 6.364902506963788,
"grad_norm": 0.44585558276766535,
"learning_rate": 9.99146921192682e-07,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07176651060581207,
"step": 4570,
"valid_targets_mean": 5794.2,
"valid_targets_min": 4809
},
{
"epoch": 6.371866295264624,
"grad_norm": 0.4586375643278151,
"learning_rate": 9.775822619125242e-07,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06948361545801163,
"step": 4575,
"valid_targets_mean": 6401.8,
"valid_targets_min": 4842
},
{
"epoch": 6.378830083565459,
"grad_norm": 0.4501958201734831,
"learning_rate": 9.562470335048912e-07,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07945942133665085,
"step": 4580,
"valid_targets_mean": 6182.1,
"valid_targets_min": 5116
},
{
"epoch": 6.385793871866295,
"grad_norm": 0.4327240600935404,
"learning_rate": 9.351414932956482e-07,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0714079886674881,
"step": 4585,
"valid_targets_mean": 6165.1,
"valid_targets_min": 5764
},
{
"epoch": 6.392757660167131,
"grad_norm": 0.8047252344536302,
"learning_rate": 9.142658958403694e-07,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05607593059539795,
"step": 4590,
"valid_targets_mean": 1428.2,
"valid_targets_min": 1062
},
{
"epoch": 6.399721448467966,
"grad_norm": 0.8195753374003149,
"learning_rate": 8.936204929212766e-07,
"loss": 0.1329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06777313351631165,
"step": 4595,
"valid_targets_mean": 1663.0,
"valid_targets_min": 960
},
{
"epoch": 6.406685236768802,
"grad_norm": 0.833685966360577,
"learning_rate": 8.732055335441902e-07,
"loss": 0.1253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06374421715736389,
"step": 4600,
"valid_targets_mean": 1476.5,
"valid_targets_min": 933
},
{
"epoch": 6.413649025069638,
"grad_norm": 0.780358085772891,
"learning_rate": 8.530212639355384e-07,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06148510053753853,
"step": 4605,
"valid_targets_mean": 1478.1,
"valid_targets_min": 881
},
{
"epoch": 6.420612813370473,
"grad_norm": 0.890308955107473,
"learning_rate": 8.330679275393816e-07,
"loss": 0.1272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07429173588752747,
"step": 4610,
"valid_targets_mean": 1640.6,
"valid_targets_min": 869
},
{
"epoch": 6.427576601671309,
"grad_norm": 0.9489952322841751,
"learning_rate": 8.133457650144705e-07,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06858045607805252,
"step": 4615,
"valid_targets_mean": 1709.0,
"valid_targets_min": 1090
},
{
"epoch": 6.4345403899721445,
"grad_norm": 0.8409646954850704,
"learning_rate": 7.938550142313594e-07,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046157389879226685,
"step": 4620,
"valid_targets_mean": 1157.9,
"valid_targets_min": 761
},
{
"epoch": 6.4415041782729805,
"grad_norm": 0.7487722194005665,
"learning_rate": 7.7459591026952e-07,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05890098214149475,
"step": 4625,
"valid_targets_mean": 1553.6,
"valid_targets_min": 1241
},
{
"epoch": 6.4484679665738165,
"grad_norm": 0.7904874191930988,
"learning_rate": 7.555686854145184e-07,
"loss": 0.117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05734875053167343,
"step": 4630,
"valid_targets_mean": 1538.1,
"valid_targets_min": 733
},
{
"epoch": 6.455431754874652,
"grad_norm": 0.792386346804611,
"learning_rate": 7.367735691552047e-07,
"loss": 0.1231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03880469501018524,
"step": 4635,
"valid_targets_mean": 1250.6,
"valid_targets_min": 835
},
{
"epoch": 6.462395543175488,
"grad_norm": 0.860965341679149,
"learning_rate": 7.182107881809486e-07,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06356509774923325,
"step": 4640,
"valid_targets_mean": 1596.2,
"valid_targets_min": 1046
},
{
"epoch": 6.469359331476323,
"grad_norm": 0.8718675926426537,
"learning_rate": 6.998805663789077e-07,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05807361379265785,
"step": 4645,
"valid_targets_mean": 1646.5,
"valid_targets_min": 797
},
{
"epoch": 6.476323119777159,
"grad_norm": 0.8164546555462905,
"learning_rate": 6.817831248313279e-07,
"loss": 0.1123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05345907807350159,
"step": 4650,
"valid_targets_mean": 1448.9,
"valid_targets_min": 570
},
{
"epoch": 6.483286908077995,
"grad_norm": 0.7688143714918261,
"learning_rate": 6.639186818128696e-07,
"loss": 0.1069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04237380996346474,
"step": 4655,
"valid_targets_mean": 1164.1,
"valid_targets_min": 548
},
{
"epoch": 6.49025069637883,
"grad_norm": 0.8494248149460677,
"learning_rate": 6.462874527879859e-07,
"loss": 0.108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05192333832383156,
"step": 4660,
"valid_targets_mean": 1338.0,
"valid_targets_min": 682
},
{
"epoch": 6.497214484679666,
"grad_norm": 0.9725150847641078,
"learning_rate": 6.288896504083019e-07,
"loss": 0.1176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06402169167995453,
"step": 4665,
"valid_targets_mean": 1632.8,
"valid_targets_min": 896
},
{
"epoch": 6.504178272980502,
"grad_norm": 0.8615786174263845,
"learning_rate": 6.117254845100884e-07,
"loss": 0.115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0654836893081665,
"step": 4670,
"valid_targets_mean": 1806.5,
"valid_targets_min": 597
},
{
"epoch": 6.511142061281337,
"grad_norm": 0.8339197139282923,
"learning_rate": 5.947951621116899e-07,
"loss": 0.1197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049058057367801666,
"step": 4675,
"valid_targets_mean": 1289.9,
"valid_targets_min": 706
},
{
"epoch": 6.518105849582173,
"grad_norm": 0.7968481465627608,
"learning_rate": 5.78098887411056e-07,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04030627757310867,
"step": 4680,
"valid_targets_mean": 1354.1,
"valid_targets_min": 754
},
{
"epoch": 6.525069637883008,
"grad_norm": 0.7476070454913744,
"learning_rate": 5.616368617832657e-07,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049573637545108795,
"step": 4685,
"valid_targets_mean": 1461.9,
"valid_targets_min": 819
},
{
"epoch": 6.532033426183844,
"grad_norm": 1.0053730974789308,
"learning_rate": 5.454092837781e-07,
"loss": 0.1164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041574910283088684,
"step": 4690,
"valid_targets_mean": 1225.5,
"valid_targets_min": 684
},
{
"epoch": 6.53899721448468,
"grad_norm": 0.9520563364369184,
"learning_rate": 5.294163491176507e-07,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05617387592792511,
"step": 4695,
"valid_targets_mean": 1282.2,
"valid_targets_min": 711
},
{
"epoch": 6.545961002785515,
"grad_norm": 1.2484349046028755,
"learning_rate": 5.136582506939558e-07,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06170322746038437,
"step": 4700,
"valid_targets_mean": 1634.8,
"valid_targets_min": 1190
},
{
"epoch": 6.552924791086351,
"grad_norm": 0.8277215108085088,
"learning_rate": 4.981351785666788e-07,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05962364748120308,
"step": 4705,
"valid_targets_mean": 1615.9,
"valid_targets_min": 774
},
{
"epoch": 6.559888579387186,
"grad_norm": 1.256443333024305,
"learning_rate": 4.828473199608086e-07,
"loss": 0.1114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.062144938856363297,
"step": 4710,
"valid_targets_mean": 1848.4,
"valid_targets_min": 734
},
{
"epoch": 6.566852367688022,
"grad_norm": 0.8519945991274293,
"learning_rate": 4.6779485926440994e-07,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06112103536725044,
"step": 4715,
"valid_targets_mean": 1570.6,
"valid_targets_min": 1011
},
{
"epoch": 6.573816155988858,
"grad_norm": 0.8867015908107557,
"learning_rate": 4.529779780263899e-07,
"loss": 0.1188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06696411967277527,
"step": 4720,
"valid_targets_mean": 1697.0,
"valid_targets_min": 803
},
{
"epoch": 6.580779944289693,
"grad_norm": 0.8971331539026275,
"learning_rate": 4.3839685495431494e-07,
"loss": 0.1156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05167017877101898,
"step": 4725,
"valid_targets_mean": 1307.1,
"valid_targets_min": 782
},
{
"epoch": 6.587743732590529,
"grad_norm": 0.8240677573070857,
"learning_rate": 4.240516659122529e-07,
"loss": 0.1112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05892687290906906,
"step": 4730,
"valid_targets_mean": 1596.6,
"valid_targets_min": 646
},
{
"epoch": 6.594707520891365,
"grad_norm": 0.8777230504903879,
"learning_rate": 4.099425839186588e-07,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07540211081504822,
"step": 4735,
"valid_targets_mean": 1817.5,
"valid_targets_min": 922
},
{
"epoch": 6.6016713091922,
"grad_norm": 0.9233129928932025,
"learning_rate": 3.960697791442725e-07,
"loss": 0.1185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06853315234184265,
"step": 4740,
"valid_targets_mean": 1822.2,
"valid_targets_min": 796
},
{
"epoch": 6.608635097493036,
"grad_norm": 0.8365359905989758,
"learning_rate": 3.824334189100864e-07,
"loss": 0.1067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05597367510199547,
"step": 4745,
"valid_targets_mean": 1542.4,
"valid_targets_min": 903
},
{
"epoch": 6.615598885793872,
"grad_norm": 0.8653881395676635,
"learning_rate": 3.6903366768530347e-07,
"loss": 0.1093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059465356171131134,
"step": 4750,
"valid_targets_mean": 1459.5,
"valid_targets_min": 780
},
{
"epoch": 6.6225626740947074,
"grad_norm": 1.0220209875020088,
"learning_rate": 3.558706870853801e-07,
"loss": 0.1059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05482107773423195,
"step": 4755,
"valid_targets_mean": 1581.1,
"valid_targets_min": 783
},
{
"epoch": 6.629526462395543,
"grad_norm": 0.8895541017805985,
"learning_rate": 3.42944635870055e-07,
"loss": 0.1085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04831491783261299,
"step": 4760,
"valid_targets_mean": 1342.1,
"valid_targets_min": 662
},
{
"epoch": 6.6364902506963785,
"grad_norm": 0.85022678615267,
"learning_rate": 3.302556699414461e-07,
"loss": 0.1065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04755166172981262,
"step": 4765,
"valid_targets_mean": 1269.1,
"valid_targets_min": 724
},
{
"epoch": 6.6434540389972145,
"grad_norm": 0.9159333691892194,
"learning_rate": 3.178039423421675e-07,
"loss": 0.1092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05955637991428375,
"step": 4770,
"valid_targets_mean": 1510.1,
"valid_targets_min": 966
},
{
"epoch": 6.65041782729805,
"grad_norm": 0.8794943394432526,
"learning_rate": 3.055896032534844e-07,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04700024425983429,
"step": 4775,
"valid_targets_mean": 1327.8,
"valid_targets_min": 773
},
{
"epoch": 6.657381615598886,
"grad_norm": 1.0648559373125812,
"learning_rate": 2.9361279999349456e-07,
"loss": 0.1072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0473455972969532,
"step": 4780,
"valid_targets_mean": 1353.2,
"valid_targets_min": 807
},
{
"epoch": 6.664345403899722,
"grad_norm": 0.8462867733368669,
"learning_rate": 2.8187367701536514e-07,
"loss": 0.1106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0411439947783947,
"step": 4785,
"valid_targets_mean": 1142.5,
"valid_targets_min": 782
},
{
"epoch": 6.671309192200557,
"grad_norm": 0.8759881208699287,
"learning_rate": 2.7037237590557874e-07,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06818887591362,
"step": 4790,
"valid_targets_mean": 1849.9,
"valid_targets_min": 634
},
{
"epoch": 6.678272980501393,
"grad_norm": 0.8652916414354441,
"learning_rate": 2.591090353822279e-07,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05813930183649063,
"step": 4795,
"valid_targets_mean": 1599.6,
"valid_targets_min": 573
},
{
"epoch": 6.685236768802229,
"grad_norm": 0.8289668185741821,
"learning_rate": 2.480837912933476e-07,
"loss": 0.1141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06298094987869263,
"step": 4800,
"valid_targets_mean": 1994.9,
"valid_targets_min": 1102
},
{
"epoch": 6.692200557103064,
"grad_norm": 0.8437774991054501,
"learning_rate": 2.372967766152745e-07,
"loss": 0.1149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04422305151820183,
"step": 4805,
"valid_targets_mean": 1239.2,
"valid_targets_min": 841
},
{
"epoch": 6.6991643454039,
"grad_norm": 0.8335016224230695,
"learning_rate": 2.2674812145103253e-07,
"loss": 0.1059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04819972813129425,
"step": 4810,
"valid_targets_mean": 1467.5,
"valid_targets_min": 956
},
{
"epoch": 6.706128133704736,
"grad_norm": 0.9023177270948384,
"learning_rate": 2.16437953028783e-07,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05732536315917969,
"step": 4815,
"valid_targets_mean": 1300.9,
"valid_targets_min": 857
},
{
"epoch": 6.713091922005571,
"grad_norm": 0.8464182537507942,
"learning_rate": 2.0636639570027706e-07,
"loss": 0.1107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054763518273830414,
"step": 4820,
"valid_targets_mean": 1389.8,
"valid_targets_min": 808
},
{
"epoch": 6.720055710306407,
"grad_norm": 0.8724602751899221,
"learning_rate": 1.9653357093935677e-07,
"loss": 0.1042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05148616060614586,
"step": 4825,
"valid_targets_mean": 1303.8,
"valid_targets_min": 677
},
{
"epoch": 6.727019498607242,
"grad_norm": 0.892862606177971,
"learning_rate": 1.8693959734049194e-07,
"loss": 0.1064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04439748823642731,
"step": 4830,
"valid_targets_mean": 1220.1,
"valid_targets_min": 727
},
{
"epoch": 6.733983286908078,
"grad_norm": 0.8006054734140239,
"learning_rate": 1.7758459061735235e-07,
"loss": 0.1099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04145853966474533,
"step": 4835,
"valid_targets_mean": 1262.0,
"valid_targets_min": 726
},
{
"epoch": 6.740947075208914,
"grad_norm": 0.9012716233194072,
"learning_rate": 1.6846866360140434e-07,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06492114067077637,
"step": 4840,
"valid_targets_mean": 1615.0,
"valid_targets_min": 669
},
{
"epoch": 6.747910863509749,
"grad_norm": 0.8349181470475844,
"learning_rate": 1.595919262405632e-07,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05895448848605156,
"step": 4845,
"valid_targets_mean": 1806.5,
"valid_targets_min": 792
},
{
"epoch": 6.754874651810585,
"grad_norm": 0.8116954418998069,
"learning_rate": 1.5095448559785176e-07,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05427628010511398,
"step": 4850,
"valid_targets_mean": 1627.6,
"valid_targets_min": 736
},
{
"epoch": 6.76183844011142,
"grad_norm": 0.8820001141515799,
"learning_rate": 1.425564458501194e-07,
"loss": 0.1152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07305572926998138,
"step": 4855,
"valid_targets_mean": 1822.9,
"valid_targets_min": 694
},
{
"epoch": 6.768802228412256,
"grad_norm": 0.8785588698821919,
"learning_rate": 1.3439790828678523e-07,
"loss": 0.1075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06912118941545486,
"step": 4860,
"valid_targets_mean": 1848.9,
"valid_targets_min": 1437
},
{
"epoch": 6.775766016713092,
"grad_norm": 0.8363864610673993,
"learning_rate": 1.2647897130860566e-07,
"loss": 0.1113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06591206789016724,
"step": 4865,
"valid_targets_mean": 1852.4,
"valid_targets_min": 809
},
{
"epoch": 6.782729805013927,
"grad_norm": 0.8474827648363192,
"learning_rate": 1.187997304265065e-07,
"loss": 0.108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05124801769852638,
"step": 4870,
"valid_targets_mean": 1375.5,
"valid_targets_min": 790
},
{
"epoch": 6.789693593314763,
"grad_norm": 0.8696793467523222,
"learning_rate": 1.1136027826040841e-07,
"loss": 0.102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048445772379636765,
"step": 4875,
"valid_targets_mean": 1338.8,
"valid_targets_min": 750
},
{
"epoch": 6.796657381615599,
"grad_norm": 0.9202757557686742,
"learning_rate": 1.041607045381321e-07,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06679531186819077,
"step": 4880,
"valid_targets_mean": 1778.8,
"valid_targets_min": 826
},
{
"epoch": 6.803621169916434,
"grad_norm": 0.8516595011162112,
"learning_rate": 9.720109609429928e-08,
"loss": 0.1121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05206713080406189,
"step": 4885,
"valid_targets_mean": 1600.8,
"valid_targets_min": 907
},
{
"epoch": 6.81058495821727,
"grad_norm": 0.8400966183501765,
"learning_rate": 9.04815368692935e-08,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05995471403002739,
"step": 4890,
"valid_targets_mean": 1474.5,
"valid_targets_min": 1093
},
{
"epoch": 6.8175487465181055,
"grad_norm": 0.8562520722201993,
"learning_rate": 8.400210790824536e-08,
"loss": 0.109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06154263764619827,
"step": 4895,
"valid_targets_mean": 1577.2,
"valid_targets_min": 1119
},
{
"epoch": 6.8245125348189415,
"grad_norm": 0.8814865307617711,
"learning_rate": 7.776288736005776e-08,
"loss": 0.1132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06116368994116783,
"step": 4900,
"valid_targets_mean": 1512.1,
"valid_targets_min": 700
},
{
"epoch": 6.8314763231197775,
"grad_norm": 0.816015444670367,
"learning_rate": 7.176395047645557e-08,
"loss": 0.11,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0455644354224205,
"step": 4905,
"valid_targets_mean": 1288.2,
"valid_targets_min": 810
},
{
"epoch": 6.838440111420613,
"grad_norm": 0.9432317625659447,
"learning_rate": 6.600536961109072e-08,
"loss": 0.1136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052437908947467804,
"step": 4910,
"valid_targets_mean": 1328.9,
"valid_targets_min": 635
},
{
"epoch": 6.845403899721449,
"grad_norm": 0.8794044449829441,
"learning_rate": 6.048721421865633e-08,
"loss": 0.1057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059289056807756424,
"step": 4915,
"valid_targets_mean": 1542.5,
"valid_targets_min": 673
},
{
"epoch": 6.852367688022284,
"grad_norm": 0.9326004661735458,
"learning_rate": 5.5209550854058435e-08,
"loss": 0.1152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06115001440048218,
"step": 4920,
"valid_targets_mean": 1215.6,
"valid_targets_min": 641
},
{
"epoch": 6.85933147632312,
"grad_norm": 0.8767540104775717,
"learning_rate": 5.017244317160997e-08,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04882102459669113,
"step": 4925,
"valid_targets_mean": 1222.6,
"valid_targets_min": 701
},
{
"epoch": 6.866295264623956,
"grad_norm": 0.8971771361885165,
"learning_rate": 4.537595192425803e-08,
"loss": 0.1211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0595490038394928,
"step": 4930,
"valid_targets_mean": 1850.6,
"valid_targets_min": 1202
},
{
"epoch": 6.873259052924791,
"grad_norm": 0.8299434208974764,
"learning_rate": 4.0820134962864525e-08,
"loss": 0.1095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044841837137937546,
"step": 4935,
"valid_targets_mean": 1265.5,
"valid_targets_min": 657
},
{
"epoch": 6.880222841225627,
"grad_norm": 0.901095866607732,
"learning_rate": 3.650504723549109e-08,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05367933213710785,
"step": 4940,
"valid_targets_mean": 1388.0,
"valid_targets_min": 672
},
{
"epoch": 6.887186629526463,
"grad_norm": 0.8315063396628217,
"learning_rate": 3.243074078675301e-08,
"loss": 0.1088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06695376336574554,
"step": 4945,
"valid_targets_mean": 1813.6,
"valid_targets_min": 1019
},
{
"epoch": 6.894150417827298,
"grad_norm": 0.8625526799833706,
"learning_rate": 2.85972647571775e-08,
"loss": 0.1029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044332314282655716,
"step": 4950,
"valid_targets_mean": 1114.6,
"valid_targets_min": 732
},
{
"epoch": 6.901114206128134,
"grad_norm": 1.0040487494315289,
"learning_rate": 2.5004665382619698e-08,
"loss": 0.1126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0398283377289772,
"step": 4955,
"valid_targets_mean": 1194.5,
"valid_targets_min": 634
},
{
"epoch": 6.908077994428969,
"grad_norm": 0.8569836647676721,
"learning_rate": 2.1652985993705355e-08,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0556265227496624,
"step": 4960,
"valid_targets_mean": 1756.5,
"valid_targets_min": 905
},
{
"epoch": 6.915041782729805,
"grad_norm": 0.8794612149843942,
"learning_rate": 1.8542267015297932e-08,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06186116486787796,
"step": 4965,
"valid_targets_mean": 1554.9,
"valid_targets_min": 596
},
{
"epoch": 6.922005571030641,
"grad_norm": 0.8682797357172517,
"learning_rate": 1.5672545966025633e-08,
"loss": 0.105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0438067801296711,
"step": 4970,
"valid_targets_mean": 1214.6,
"valid_targets_min": 687
},
{
"epoch": 6.928969359331476,
"grad_norm": 0.8529938938679981,
"learning_rate": 1.3043857457819553e-08,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06511755287647247,
"step": 4975,
"valid_targets_mean": 1955.1,
"valid_targets_min": 1199
},
{
"epoch": 6.935933147632312,
"grad_norm": 0.8325142431206025,
"learning_rate": 1.0656233195498466e-08,
"loss": 0.1088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059841353446245193,
"step": 4980,
"valid_targets_mean": 1758.6,
"valid_targets_min": 1214
},
{
"epoch": 6.942896935933147,
"grad_norm": 0.8532395148660459,
"learning_rate": 8.509701976382456e-09,
"loss": 0.1079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06080895662307739,
"step": 4985,
"valid_targets_mean": 1711.5,
"valid_targets_min": 1122
},
{
"epoch": 6.949860724233983,
"grad_norm": 0.8576769303500783,
"learning_rate": 6.6042896899576324e-09,
"loss": 0.1106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051803942769765854,
"step": 4990,
"valid_targets_mean": 1489.6,
"valid_targets_min": 850
},
{
"epoch": 6.956824512534819,
"grad_norm": 0.7839478511204715,
"learning_rate": 4.940019317547506e-09,
"loss": 0.0999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049742192029953,
"step": 4995,
"valid_targets_mean": 1572.4,
"valid_targets_min": 1318
},
{
"epoch": 6.963788300835654,
"grad_norm": 0.8785812149835993,
"learning_rate": 3.516910932048756e-09,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060333505272865295,
"step": 5000,
"valid_targets_mean": 1500.0,
"valid_targets_min": 1043
},
{
"epoch": 6.97075208913649,
"grad_norm": 0.8822603333113546,
"learning_rate": 2.3349816976825367e-09,
"loss": 0.1113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06858158856630325,
"step": 5005,
"valid_targets_mean": 1774.9,
"valid_targets_min": 920
},
{
"epoch": 6.977715877437326,
"grad_norm": 0.8367535436815119,
"learning_rate": 1.3942458697924211e-09,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05870440602302551,
"step": 5010,
"valid_targets_mean": 1547.1,
"valid_targets_min": 847
},
{
"epoch": 6.984679665738161,
"grad_norm": 0.7917458458759404,
"learning_rate": 6.947147946645416e-10,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05920833349227905,
"step": 5015,
"valid_targets_mean": 1769.4,
"valid_targets_min": 738
},
{
"epoch": 6.991643454038997,
"grad_norm": 0.9106170116332665,
"learning_rate": 2.3639690939880613e-10,
"loss": 0.1124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06107974797487259,
"step": 5020,
"valid_targets_mean": 1540.1,
"valid_targets_min": 594
},
{
"epoch": 6.998607242339833,
"grad_norm": 1.1797464944725595,
"learning_rate": 1.929774180231547e-11,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06046333163976669,
"step": 5025,
"valid_targets_mean": 2228.6,
"valid_targets_min": 1393
},
{
"epoch": 7.0,
"step": 5026,
"total_flos": 1.6519984675532308e+18,
"train_loss": 0.0,
"train_runtime": 1.7845,
"train_samples_per_second": 45043.632,
"train_steps_per_second": 2816.453
}
],
"logging_steps": 5,
"max_steps": 5026,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.6519984675532308e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}