swesmith-bugsseq / trainer_state.json
penfever's picture
End of training
7acd8db verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 6187,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.005659309564233163,
"grad_norm": 13.932631974720623,
"learning_rate": 2.584814216478191e-07,
"loss": 0.6701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3416905999183655,
"step": 5,
"valid_targets_mean": 7214.4,
"valid_targets_min": 4847
},
{
"epoch": 0.011318619128466326,
"grad_norm": 13.104201365603958,
"learning_rate": 5.815831987075929e-07,
"loss": 0.6193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30890709161758423,
"step": 10,
"valid_targets_mean": 6417.1,
"valid_targets_min": 4480
},
{
"epoch": 0.01697792869269949,
"grad_norm": 12.986646595432257,
"learning_rate": 9.046849757673668e-07,
"loss": 0.6611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3296949863433838,
"step": 15,
"valid_targets_mean": 7605.4,
"valid_targets_min": 5236
},
{
"epoch": 0.022637238256932653,
"grad_norm": 12.202975712757784,
"learning_rate": 1.2277867528271405e-06,
"loss": 0.6527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29244548082351685,
"step": 20,
"valid_targets_mean": 5827.9,
"valid_targets_min": 4727
},
{
"epoch": 0.028296547821165818,
"grad_norm": 8.284738278527138,
"learning_rate": 1.5508885298869145e-06,
"loss": 0.6323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3284326195716858,
"step": 25,
"valid_targets_mean": 6448.2,
"valid_targets_min": 4211
},
{
"epoch": 0.03395585738539898,
"grad_norm": 6.699927356351593,
"learning_rate": 1.8739903069466882e-06,
"loss": 0.5787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3189699649810791,
"step": 30,
"valid_targets_mean": 6108.1,
"valid_targets_min": 4279
},
{
"epoch": 0.039615166949632144,
"grad_norm": 5.491375033981934,
"learning_rate": 2.197092084006462e-06,
"loss": 0.5324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2483714073896408,
"step": 35,
"valid_targets_mean": 5962.4,
"valid_targets_min": 4589
},
{
"epoch": 0.045274476513865305,
"grad_norm": 5.479122606853314,
"learning_rate": 2.5201938610662364e-06,
"loss": 0.5064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21808978915214539,
"step": 40,
"valid_targets_mean": 3503.2,
"valid_targets_min": 2015
},
{
"epoch": 0.050933786078098474,
"grad_norm": 2.1266074610168677,
"learning_rate": 2.84329563812601e-06,
"loss": 0.4299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1883259415626526,
"step": 45,
"valid_targets_mean": 6102.5,
"valid_targets_min": 4778
},
{
"epoch": 0.056593095642331635,
"grad_norm": 1.5323390515097495,
"learning_rate": 3.166397415185784e-06,
"loss": 0.4095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19586817920207977,
"step": 50,
"valid_targets_mean": 5868.2,
"valid_targets_min": 4612
},
{
"epoch": 0.0622524052065648,
"grad_norm": 1.159860405025848,
"learning_rate": 3.489499192245558e-06,
"loss": 0.4175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21410322189331055,
"step": 55,
"valid_targets_mean": 6105.8,
"valid_targets_min": 4491
},
{
"epoch": 0.06791171477079797,
"grad_norm": 0.894038373410666,
"learning_rate": 3.812600969305332e-06,
"loss": 0.3799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17711375653743744,
"step": 60,
"valid_targets_mean": 6962.0,
"valid_targets_min": 4754
},
{
"epoch": 0.07357102433503113,
"grad_norm": 0.8624955501056109,
"learning_rate": 4.1357027463651056e-06,
"loss": 0.3707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1949971616268158,
"step": 65,
"valid_targets_mean": 6035.1,
"valid_targets_min": 4787
},
{
"epoch": 0.07923033389926429,
"grad_norm": 0.7091607001817442,
"learning_rate": 4.458804523424879e-06,
"loss": 0.361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18302902579307556,
"step": 70,
"valid_targets_mean": 6028.5,
"valid_targets_min": 5213
},
{
"epoch": 0.08488964346349745,
"grad_norm": 0.585307554413562,
"learning_rate": 4.781906300484653e-06,
"loss": 0.3432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14917157590389252,
"step": 75,
"valid_targets_mean": 6814.1,
"valid_targets_min": 4664
},
{
"epoch": 0.09054895302773061,
"grad_norm": 0.6376342595638888,
"learning_rate": 5.105008077544427e-06,
"loss": 0.3567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16629627346992493,
"step": 80,
"valid_targets_mean": 6281.5,
"valid_targets_min": 4996
},
{
"epoch": 0.09620826259196379,
"grad_norm": 0.5883660151243281,
"learning_rate": 5.4281098546042014e-06,
"loss": 0.3411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16139009594917297,
"step": 85,
"valid_targets_mean": 6628.9,
"valid_targets_min": 4582
},
{
"epoch": 0.10186757215619695,
"grad_norm": 0.5306968778726449,
"learning_rate": 5.751211631663974e-06,
"loss": 0.3247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1460968554019928,
"step": 90,
"valid_targets_mean": 6536.6,
"valid_targets_min": 5205
},
{
"epoch": 0.10752688172043011,
"grad_norm": 0.5036303188428934,
"learning_rate": 6.074313408723749e-06,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15533623099327087,
"step": 95,
"valid_targets_mean": 7031.0,
"valid_targets_min": 5098
},
{
"epoch": 0.11318619128466327,
"grad_norm": 0.516720651939086,
"learning_rate": 6.397415185783522e-06,
"loss": 0.3164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1776922047138214,
"step": 100,
"valid_targets_mean": 6514.2,
"valid_targets_min": 5016
},
{
"epoch": 0.11884550084889643,
"grad_norm": 0.538952735082876,
"learning_rate": 6.7205169628432965e-06,
"loss": 0.347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20050251483917236,
"step": 105,
"valid_targets_mean": 6330.0,
"valid_targets_min": 965
},
{
"epoch": 0.1245048104131296,
"grad_norm": 0.5135956002010927,
"learning_rate": 7.043618739903069e-06,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15224193036556244,
"step": 110,
"valid_targets_mean": 6293.1,
"valid_targets_min": 5218
},
{
"epoch": 0.13016411997736277,
"grad_norm": 0.4731793435324797,
"learning_rate": 7.366720516962844e-06,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13703802227973938,
"step": 115,
"valid_targets_mean": 6957.4,
"valid_targets_min": 4213
},
{
"epoch": 0.13582342954159593,
"grad_norm": 0.5989726776221539,
"learning_rate": 7.689822294022618e-06,
"loss": 0.3197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16760709881782532,
"step": 120,
"valid_targets_mean": 5888.5,
"valid_targets_min": 4923
},
{
"epoch": 0.1414827391058291,
"grad_norm": 0.4926854131506727,
"learning_rate": 8.012924071082391e-06,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19979137182235718,
"step": 125,
"valid_targets_mean": 7822.9,
"valid_targets_min": 4993
},
{
"epoch": 0.14714204867006225,
"grad_norm": 0.6268142920401387,
"learning_rate": 8.336025848142165e-06,
"loss": 0.3279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16050826013088226,
"step": 130,
"valid_targets_mean": 6098.6,
"valid_targets_min": 4872
},
{
"epoch": 0.15280135823429541,
"grad_norm": 0.6293607807525029,
"learning_rate": 8.659127625201939e-06,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15364673733711243,
"step": 135,
"valid_targets_mean": 6892.2,
"valid_targets_min": 4706
},
{
"epoch": 0.15846066779852858,
"grad_norm": 0.6156398588670324,
"learning_rate": 8.982229402261713e-06,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13796129822731018,
"step": 140,
"valid_targets_mean": 6352.0,
"valid_targets_min": 4889
},
{
"epoch": 0.16411997736276174,
"grad_norm": 0.5767454589802685,
"learning_rate": 9.305331179321486e-06,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13889192044734955,
"step": 145,
"valid_targets_mean": 5948.9,
"valid_targets_min": 3888
},
{
"epoch": 0.1697792869269949,
"grad_norm": 0.6287336280725723,
"learning_rate": 9.62843295638126e-06,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13580778241157532,
"step": 150,
"valid_targets_mean": 5846.2,
"valid_targets_min": 4051
},
{
"epoch": 0.17543859649122806,
"grad_norm": 0.4685830287171293,
"learning_rate": 9.951534733441036e-06,
"loss": 0.2856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14092932641506195,
"step": 155,
"valid_targets_mean": 7319.2,
"valid_targets_min": 5230
},
{
"epoch": 0.18109790605546122,
"grad_norm": 0.5282874259897358,
"learning_rate": 1.0274636510500808e-05,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14267754554748535,
"step": 160,
"valid_targets_mean": 8235.1,
"valid_targets_min": 4997
},
{
"epoch": 0.1867572156196944,
"grad_norm": 0.5395936939838358,
"learning_rate": 1.0597738287560582e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14883150160312653,
"step": 165,
"valid_targets_mean": 6402.5,
"valid_targets_min": 5364
},
{
"epoch": 0.19241652518392757,
"grad_norm": 0.5333879494600592,
"learning_rate": 1.0920840064620357e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1588222235441208,
"step": 170,
"valid_targets_mean": 7117.4,
"valid_targets_min": 3391
},
{
"epoch": 0.19807583474816073,
"grad_norm": 0.4867516211322162,
"learning_rate": 1.124394184168013e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1317976713180542,
"step": 175,
"valid_targets_mean": 7542.8,
"valid_targets_min": 4829
},
{
"epoch": 0.2037351443123939,
"grad_norm": 0.5420891751146504,
"learning_rate": 1.1567043618739904e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1280643194913864,
"step": 180,
"valid_targets_mean": 6284.4,
"valid_targets_min": 5180
},
{
"epoch": 0.20939445387662706,
"grad_norm": 0.6661403521505342,
"learning_rate": 1.1890145395799677e-05,
"loss": 0.2847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14606133103370667,
"step": 185,
"valid_targets_mean": 5806.2,
"valid_targets_min": 5101
},
{
"epoch": 0.21505376344086022,
"grad_norm": 0.5210883149895804,
"learning_rate": 1.2213247172859452e-05,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12868677079677582,
"step": 190,
"valid_targets_mean": 6697.9,
"valid_targets_min": 4527
},
{
"epoch": 0.22071307300509338,
"grad_norm": 0.5097320565529695,
"learning_rate": 1.2536348949919226e-05,
"loss": 0.2713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15265926718711853,
"step": 195,
"valid_targets_mean": 6410.4,
"valid_targets_min": 3082
},
{
"epoch": 0.22637238256932654,
"grad_norm": 0.49409646681977326,
"learning_rate": 1.2859450726979e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1307762712240219,
"step": 200,
"valid_targets_mean": 6847.1,
"valid_targets_min": 4685
},
{
"epoch": 0.2320316921335597,
"grad_norm": 0.5881665700498941,
"learning_rate": 1.3182552504038773e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13722704350948334,
"step": 205,
"valid_targets_mean": 6194.0,
"valid_targets_min": 4644
},
{
"epoch": 0.23769100169779286,
"grad_norm": 0.5147963094755471,
"learning_rate": 1.3505654281098549e-05,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12045536190271378,
"step": 210,
"valid_targets_mean": 6283.8,
"valid_targets_min": 4433
},
{
"epoch": 0.24335031126202603,
"grad_norm": 1.0878536917736155,
"learning_rate": 1.382875605815832e-05,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12820014357566833,
"step": 215,
"valid_targets_mean": 5917.2,
"valid_targets_min": 4857
},
{
"epoch": 0.2490096208262592,
"grad_norm": 0.5533070005440421,
"learning_rate": 1.4151857835218094e-05,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1599322259426117,
"step": 220,
"valid_targets_mean": 6986.4,
"valid_targets_min": 5101
},
{
"epoch": 0.2546689303904924,
"grad_norm": 0.8360192901625697,
"learning_rate": 1.4474959612277868e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1139596477150917,
"step": 225,
"valid_targets_mean": 5299.5,
"valid_targets_min": 4442
},
{
"epoch": 0.26032823995472554,
"grad_norm": 0.5113052700220211,
"learning_rate": 1.4798061389337644e-05,
"loss": 0.2341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10088923573493958,
"step": 230,
"valid_targets_mean": 6133.9,
"valid_targets_min": 5130
},
{
"epoch": 0.2659875495189587,
"grad_norm": 0.556777937085549,
"learning_rate": 1.5121163166397417e-05,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13561654090881348,
"step": 235,
"valid_targets_mean": 6477.4,
"valid_targets_min": 4162
},
{
"epoch": 0.27164685908319186,
"grad_norm": 0.5097652957820101,
"learning_rate": 1.544426494345719e-05,
"loss": 0.2444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11574803292751312,
"step": 240,
"valid_targets_mean": 6350.4,
"valid_targets_min": 3940
},
{
"epoch": 0.277306168647425,
"grad_norm": 0.5471177439544483,
"learning_rate": 1.5767366720516963e-05,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14649951457977295,
"step": 245,
"valid_targets_mean": 6625.1,
"valid_targets_min": 4642
},
{
"epoch": 0.2829654782116582,
"grad_norm": 0.6360629397684805,
"learning_rate": 1.609046849757674e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13972824811935425,
"step": 250,
"valid_targets_mean": 4907.0,
"valid_targets_min": 4431
},
{
"epoch": 0.28862478777589134,
"grad_norm": 0.5114528328133985,
"learning_rate": 1.641357027463651e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13421732187271118,
"step": 255,
"valid_targets_mean": 6465.0,
"valid_targets_min": 5333
},
{
"epoch": 0.2942840973401245,
"grad_norm": 0.5662488412896973,
"learning_rate": 1.6736672051696286e-05,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13066646456718445,
"step": 260,
"valid_targets_mean": 5650.5,
"valid_targets_min": 4769
},
{
"epoch": 0.29994340690435767,
"grad_norm": 0.596415912061785,
"learning_rate": 1.7059773828756058e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1249205470085144,
"step": 265,
"valid_targets_mean": 5540.0,
"valid_targets_min": 4281
},
{
"epoch": 0.30560271646859083,
"grad_norm": 0.5414221324867248,
"learning_rate": 1.7382875605815834e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1712135374546051,
"step": 270,
"valid_targets_mean": 6499.0,
"valid_targets_min": 4844
},
{
"epoch": 0.311262026032824,
"grad_norm": 0.4800403021295474,
"learning_rate": 1.770597738287561e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11049605160951614,
"step": 275,
"valid_targets_mean": 5736.5,
"valid_targets_min": 5227
},
{
"epoch": 0.31692133559705715,
"grad_norm": 0.4602797707086169,
"learning_rate": 1.802907915993538e-05,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09841249883174896,
"step": 280,
"valid_targets_mean": 5857.2,
"valid_targets_min": 2461
},
{
"epoch": 0.3225806451612903,
"grad_norm": 0.5144413634754103,
"learning_rate": 1.8352180936995153e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11220520734786987,
"step": 285,
"valid_targets_mean": 5793.4,
"valid_targets_min": 2815
},
{
"epoch": 0.3282399547255235,
"grad_norm": 0.518213039234328,
"learning_rate": 1.867528271405493e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10794945061206818,
"step": 290,
"valid_targets_mean": 6588.8,
"valid_targets_min": 4875
},
{
"epoch": 0.33389926428975664,
"grad_norm": 0.5028338131244561,
"learning_rate": 1.8998384491114704e-05,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11335889995098114,
"step": 295,
"valid_targets_mean": 5984.8,
"valid_targets_min": 4901
},
{
"epoch": 0.3395585738539898,
"grad_norm": 0.5014172240561889,
"learning_rate": 1.9321486268174476e-05,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11073829233646393,
"step": 300,
"valid_targets_mean": 6067.4,
"valid_targets_min": 3786
},
{
"epoch": 0.34521788341822296,
"grad_norm": 0.5159175569899495,
"learning_rate": 1.9644588045234248e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12275815010070801,
"step": 305,
"valid_targets_mean": 5852.5,
"valid_targets_min": 5057
},
{
"epoch": 0.3508771929824561,
"grad_norm": 0.4920285069970866,
"learning_rate": 1.9967689822294024e-05,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13101038336753845,
"step": 310,
"valid_targets_mean": 6362.2,
"valid_targets_min": 3952
},
{
"epoch": 0.3565365025466893,
"grad_norm": 0.5829499325070455,
"learning_rate": 2.0290791599353796e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12691429257392883,
"step": 315,
"valid_targets_mean": 5360.2,
"valid_targets_min": 4267
},
{
"epoch": 0.36219581211092244,
"grad_norm": 0.5106185491779682,
"learning_rate": 2.0613893376413575e-05,
"loss": 0.2606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14615000784397125,
"step": 320,
"valid_targets_mean": 6842.1,
"valid_targets_min": 4785
},
{
"epoch": 0.3678551216751556,
"grad_norm": 0.46986873220654096,
"learning_rate": 2.0936995153473347e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11088338494300842,
"step": 325,
"valid_targets_mean": 6188.5,
"valid_targets_min": 5438
},
{
"epoch": 0.3735144312393888,
"grad_norm": 0.5155604844270958,
"learning_rate": 2.1260096930533122e-05,
"loss": 0.2337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12904900312423706,
"step": 330,
"valid_targets_mean": 5848.6,
"valid_targets_min": 4734
},
{
"epoch": 0.379173740803622,
"grad_norm": 0.5286196270158149,
"learning_rate": 2.1583198707592894e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10007612407207489,
"step": 335,
"valid_targets_mean": 6278.2,
"valid_targets_min": 5636
},
{
"epoch": 0.38483305036785515,
"grad_norm": 0.6422666761769791,
"learning_rate": 2.1906300484652666e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10531717538833618,
"step": 340,
"valid_targets_mean": 6168.9,
"valid_targets_min": 4206
},
{
"epoch": 0.3904923599320883,
"grad_norm": 0.4809008293583508,
"learning_rate": 2.2229402261712442e-05,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1038937121629715,
"step": 345,
"valid_targets_mean": 6226.5,
"valid_targets_min": 4535
},
{
"epoch": 0.39615166949632147,
"grad_norm": 0.4200796846107823,
"learning_rate": 2.2552504038772214e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11499610543251038,
"step": 350,
"valid_targets_mean": 7821.6,
"valid_targets_min": 5471
},
{
"epoch": 0.40181097906055463,
"grad_norm": 0.46601849681120616,
"learning_rate": 2.2875605815831986e-05,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10218453407287598,
"step": 355,
"valid_targets_mean": 6843.0,
"valid_targets_min": 5243
},
{
"epoch": 0.4074702886247878,
"grad_norm": 0.5592711031433829,
"learning_rate": 2.3198707592891765e-05,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.138760507106781,
"step": 360,
"valid_targets_mean": 6658.6,
"valid_targets_min": 4906
},
{
"epoch": 0.41312959818902095,
"grad_norm": 0.4764946128159071,
"learning_rate": 2.3521809369951537e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1221180111169815,
"step": 365,
"valid_targets_mean": 6799.5,
"valid_targets_min": 5168
},
{
"epoch": 0.4187889077532541,
"grad_norm": 0.5633069925985472,
"learning_rate": 2.3844911147011312e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13051849603652954,
"step": 370,
"valid_targets_mean": 5376.2,
"valid_targets_min": 3130
},
{
"epoch": 0.4244482173174873,
"grad_norm": 0.980342272097954,
"learning_rate": 2.4168012924071084e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11312370002269745,
"step": 375,
"valid_targets_mean": 2843.1,
"valid_targets_min": 1990
},
{
"epoch": 0.43010752688172044,
"grad_norm": 0.822944627042817,
"learning_rate": 2.449111470113086e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1140211820602417,
"step": 380,
"valid_targets_mean": 2532.2,
"valid_targets_min": 324
},
{
"epoch": 0.4357668364459536,
"grad_norm": 0.6701905365467292,
"learning_rate": 2.4814216478190632e-05,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08650068193674088,
"step": 385,
"valid_targets_mean": 2359.2,
"valid_targets_min": 982
},
{
"epoch": 0.44142614601018676,
"grad_norm": 0.5747277053205969,
"learning_rate": 2.5137318255250404e-05,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0882439985871315,
"step": 390,
"valid_targets_mean": 3640.0,
"valid_targets_min": 2479
},
{
"epoch": 0.4470854555744199,
"grad_norm": 0.5225775305209468,
"learning_rate": 2.546042003231018e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057190995663404465,
"step": 395,
"valid_targets_mean": 3079.5,
"valid_targets_min": 811
},
{
"epoch": 0.4527447651386531,
"grad_norm": 0.5826735610560169,
"learning_rate": 2.5783521809369955e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0974460318684578,
"step": 400,
"valid_targets_mean": 3113.4,
"valid_targets_min": 1431
},
{
"epoch": 0.45840407470288624,
"grad_norm": 1.0037976393338115,
"learning_rate": 2.610662358642973e-05,
"loss": 0.2261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1623167097568512,
"step": 405,
"valid_targets_mean": 1990.9,
"valid_targets_min": 702
},
{
"epoch": 0.4640633842671194,
"grad_norm": 0.5191241155436422,
"learning_rate": 2.6429725363489502e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08460583537817001,
"step": 410,
"valid_targets_mean": 3221.6,
"valid_targets_min": 621
},
{
"epoch": 0.46972269383135257,
"grad_norm": 0.677644881422118,
"learning_rate": 2.6752827140549274e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0884869396686554,
"step": 415,
"valid_targets_mean": 2591.4,
"valid_targets_min": 846
},
{
"epoch": 0.47538200339558573,
"grad_norm": 0.6341714358056391,
"learning_rate": 2.707592891760905e-05,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10547944158315659,
"step": 420,
"valid_targets_mean": 3738.9,
"valid_targets_min": 1369
},
{
"epoch": 0.4810413129598189,
"grad_norm": 0.5089106640165426,
"learning_rate": 2.7399030694668822e-05,
"loss": 0.1232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07162182033061981,
"step": 425,
"valid_targets_mean": 2715.4,
"valid_targets_min": 754
},
{
"epoch": 0.48670062252405205,
"grad_norm": 0.6511128875447165,
"learning_rate": 2.7722132471728597e-05,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09212324023246765,
"step": 430,
"valid_targets_mean": 2725.9,
"valid_targets_min": 776
},
{
"epoch": 0.4923599320882852,
"grad_norm": 0.468238315396383,
"learning_rate": 2.804523424878837e-05,
"loss": 0.146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09181820601224899,
"step": 435,
"valid_targets_mean": 3194.4,
"valid_targets_min": 754
},
{
"epoch": 0.4980192416525184,
"grad_norm": 0.8727612672516372,
"learning_rate": 2.8368336025848148e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2480352222919464,
"step": 440,
"valid_targets_mean": 2053.8,
"valid_targets_min": 664
},
{
"epoch": 0.5036785512167515,
"grad_norm": 0.5210005323173948,
"learning_rate": 2.869143780290792e-05,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08143844455480576,
"step": 445,
"valid_targets_mean": 3771.4,
"valid_targets_min": 2542
},
{
"epoch": 0.5093378607809848,
"grad_norm": 0.5379047687704024,
"learning_rate": 2.9014539579967692e-05,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09487590193748474,
"step": 450,
"valid_targets_mean": 3486.2,
"valid_targets_min": 2988
},
{
"epoch": 0.5149971703452179,
"grad_norm": 0.5672323966032542,
"learning_rate": 2.9337641357027468e-05,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08703413605690002,
"step": 455,
"valid_targets_mean": 3779.4,
"valid_targets_min": 3281
},
{
"epoch": 0.5206564799094511,
"grad_norm": 0.6137232437450363,
"learning_rate": 2.966074313408724e-05,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07755735516548157,
"step": 460,
"valid_targets_mean": 3471.1,
"valid_targets_min": 2189
},
{
"epoch": 0.5263157894736842,
"grad_norm": 0.5015341485462157,
"learning_rate": 2.9983844911147012e-05,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06586933135986328,
"step": 465,
"valid_targets_mean": 3483.6,
"valid_targets_min": 1788
},
{
"epoch": 0.5319750990379174,
"grad_norm": 0.7406309314592703,
"learning_rate": 3.0306946688206787e-05,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09322462230920792,
"step": 470,
"valid_targets_mean": 2562.1,
"valid_targets_min": 597
},
{
"epoch": 0.5376344086021505,
"grad_norm": 0.7033983658453125,
"learning_rate": 3.063004846526656e-05,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07036390900611877,
"step": 475,
"valid_targets_mean": 2272.8,
"valid_targets_min": 701
},
{
"epoch": 0.5432937181663837,
"grad_norm": 0.6806014114354145,
"learning_rate": 3.095315024232634e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11313560605049133,
"step": 480,
"valid_targets_mean": 2971.0,
"valid_targets_min": 1652
},
{
"epoch": 0.5489530277306168,
"grad_norm": 0.47880028331211966,
"learning_rate": 3.127625201938611e-05,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07742761820554733,
"step": 485,
"valid_targets_mean": 3747.4,
"valid_targets_min": 1908
},
{
"epoch": 0.55461233729485,
"grad_norm": 0.6132600376986139,
"learning_rate": 3.159935379644588e-05,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058801814913749695,
"step": 490,
"valid_targets_mean": 3247.8,
"valid_targets_min": 971
},
{
"epoch": 0.5602716468590832,
"grad_norm": 0.5322542810337509,
"learning_rate": 3.1922455573505654e-05,
"loss": 0.2013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0757409855723381,
"step": 495,
"valid_targets_mean": 3422.2,
"valid_targets_min": 2552
},
{
"epoch": 0.5659309564233164,
"grad_norm": 0.555861116706065,
"learning_rate": 3.224555735056543e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061425432562828064,
"step": 500,
"valid_targets_mean": 2948.9,
"valid_targets_min": 753
},
{
"epoch": 0.5715902659875495,
"grad_norm": 0.692458977719794,
"learning_rate": 3.2568659127625205e-05,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06144799664616585,
"step": 505,
"valid_targets_mean": 1090.5,
"valid_targets_min": 568
},
{
"epoch": 0.5772495755517827,
"grad_norm": 0.6074379759592959,
"learning_rate": 3.289176090468498e-05,
"loss": 0.3801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16443628072738647,
"step": 510,
"valid_targets_mean": 2921.1,
"valid_targets_min": 1070
},
{
"epoch": 0.5829088851160158,
"grad_norm": 0.7139647841577196,
"learning_rate": 3.321486268174475e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07074105739593506,
"step": 515,
"valid_targets_mean": 2052.1,
"valid_targets_min": 329
},
{
"epoch": 0.588568194680249,
"grad_norm": 0.9997802597595687,
"learning_rate": 3.353796445880453e-05,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08975844085216522,
"step": 520,
"valid_targets_mean": 998.2,
"valid_targets_min": 608
},
{
"epoch": 0.5942275042444821,
"grad_norm": 0.5353719487561314,
"learning_rate": 3.38610662358643e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08616983890533447,
"step": 525,
"valid_targets_mean": 4405.9,
"valid_targets_min": 2772
},
{
"epoch": 0.5998868138087153,
"grad_norm": 0.37012257410615623,
"learning_rate": 3.418416801292407e-05,
"loss": 0.1257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03389976918697357,
"step": 530,
"valid_targets_mean": 5138.2,
"valid_targets_min": 3778
},
{
"epoch": 0.6055461233729486,
"grad_norm": 0.42309989480020843,
"learning_rate": 3.450726978998385e-05,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07327836751937866,
"step": 535,
"valid_targets_mean": 4641.0,
"valid_targets_min": 2336
},
{
"epoch": 0.6112054329371817,
"grad_norm": 0.4767188679502289,
"learning_rate": 3.483037156704362e-05,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09635117650032043,
"step": 540,
"valid_targets_mean": 3962.1,
"valid_targets_min": 2161
},
{
"epoch": 0.6168647425014149,
"grad_norm": 0.4625024398234958,
"learning_rate": 3.5153473344103395e-05,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07724954187870026,
"step": 545,
"valid_targets_mean": 3271.8,
"valid_targets_min": 798
},
{
"epoch": 0.622524052065648,
"grad_norm": 0.5338159680740975,
"learning_rate": 3.547657512116317e-05,
"loss": 0.131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05782943218946457,
"step": 550,
"valid_targets_mean": 1915.8,
"valid_targets_min": 533
},
{
"epoch": 0.6281833616298812,
"grad_norm": 0.5326298581049448,
"learning_rate": 3.579967689822294e-05,
"loss": 0.1356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06620592623949051,
"step": 555,
"valid_targets_mean": 2589.2,
"valid_targets_min": 833
},
{
"epoch": 0.6338426711941143,
"grad_norm": 0.3929364751105547,
"learning_rate": 3.612277867528272e-05,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06302763521671295,
"step": 560,
"valid_targets_mean": 3888.0,
"valid_targets_min": 3391
},
{
"epoch": 0.6395019807583475,
"grad_norm": 0.6449559476750033,
"learning_rate": 3.644588045234249e-05,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0976746454834938,
"step": 565,
"valid_targets_mean": 1517.1,
"valid_targets_min": 732
},
{
"epoch": 0.6451612903225806,
"grad_norm": 0.7287905778647281,
"learning_rate": 3.676898222940227e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09375546127557755,
"step": 570,
"valid_targets_mean": 1623.9,
"valid_targets_min": 538
},
{
"epoch": 0.6508205998868138,
"grad_norm": 0.9334597399750638,
"learning_rate": 3.709208400646204e-05,
"loss": 0.1198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07705486565828323,
"step": 575,
"valid_targets_mean": 1158.1,
"valid_targets_min": 720
},
{
"epoch": 0.656479909451047,
"grad_norm": 0.520582326302511,
"learning_rate": 3.741518578352181e-05,
"loss": 0.1293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0693022832274437,
"step": 580,
"valid_targets_mean": 2982.2,
"valid_targets_min": 2328
},
{
"epoch": 0.6621392190152802,
"grad_norm": 0.5193502586396022,
"learning_rate": 3.7738287560581585e-05,
"loss": 0.1211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05764622613787651,
"step": 585,
"valid_targets_mean": 2637.0,
"valid_targets_min": 684
},
{
"epoch": 0.6677985285795133,
"grad_norm": 0.5086958802467102,
"learning_rate": 3.806138933764136e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0691675916314125,
"step": 590,
"valid_targets_mean": 3441.4,
"valid_targets_min": 2795
},
{
"epoch": 0.6734578381437465,
"grad_norm": 0.4850447820432571,
"learning_rate": 3.838449111470113e-05,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07534271478652954,
"step": 595,
"valid_targets_mean": 3286.4,
"valid_targets_min": 744
},
{
"epoch": 0.6791171477079796,
"grad_norm": 0.48421566338639804,
"learning_rate": 3.870759289176091e-05,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05804857611656189,
"step": 600,
"valid_targets_mean": 3976.5,
"valid_targets_min": 3279
},
{
"epoch": 0.6847764572722128,
"grad_norm": 0.7226548407603152,
"learning_rate": 3.903069466882068e-05,
"loss": 0.1573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07041174173355103,
"step": 605,
"valid_targets_mean": 1140.4,
"valid_targets_min": 536
},
{
"epoch": 0.6904357668364459,
"grad_norm": 0.571223926526635,
"learning_rate": 3.935379644588046e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06768079102039337,
"step": 610,
"valid_targets_mean": 2468.8,
"valid_targets_min": 853
},
{
"epoch": 0.6960950764006791,
"grad_norm": 0.5652274695532502,
"learning_rate": 3.967689822294023e-05,
"loss": 0.1402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0701763778924942,
"step": 615,
"valid_targets_mean": 3205.8,
"valid_targets_min": 2621
},
{
"epoch": 0.7017543859649122,
"grad_norm": 0.7631423275049859,
"learning_rate": 4e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07661966979503632,
"step": 620,
"valid_targets_mean": 1332.4,
"valid_targets_min": 728
},
{
"epoch": 0.7074136955291455,
"grad_norm": 0.7426645119465096,
"learning_rate": 3.999992044178504e-05,
"loss": 0.1402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07438753545284271,
"step": 625,
"valid_targets_mean": 1538.9,
"valid_targets_min": 618
},
{
"epoch": 0.7130730050933786,
"grad_norm": 0.434165182746641,
"learning_rate": 3.9999681767773104e-05,
"loss": 0.1428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08520899713039398,
"step": 630,
"valid_targets_mean": 4142.9,
"valid_targets_min": 907
},
{
"epoch": 0.7187323146576118,
"grad_norm": 0.6276743040350341,
"learning_rate": 3.999928397986304e-05,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11276379972696304,
"step": 635,
"valid_targets_mean": 3060.4,
"valid_targets_min": 577
},
{
"epoch": 0.7243916242218449,
"grad_norm": 0.4341449304787945,
"learning_rate": 3.9998727081219585e-05,
"loss": 0.1182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056107230484485626,
"step": 640,
"valid_targets_mean": 3732.2,
"valid_targets_min": 726
},
{
"epoch": 0.7300509337860781,
"grad_norm": 0.40263084785984393,
"learning_rate": 3.999801107627332e-05,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0675823912024498,
"step": 645,
"valid_targets_mean": 4288.9,
"valid_targets_min": 2252
},
{
"epoch": 0.7357102433503112,
"grad_norm": 0.5991957808916428,
"learning_rate": 3.9997135970720655e-05,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07685792446136475,
"step": 650,
"valid_targets_mean": 2427.5,
"valid_targets_min": 531
},
{
"epoch": 0.7413695529145444,
"grad_norm": 0.5224063375277248,
"learning_rate": 3.9996101771523766e-05,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061697687953710556,
"step": 655,
"valid_targets_mean": 2126.6,
"valid_targets_min": 744
},
{
"epoch": 0.7470288624787776,
"grad_norm": 0.4345176533930879,
"learning_rate": 3.999490848691057e-05,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06378062069416046,
"step": 660,
"valid_targets_mean": 3755.5,
"valid_targets_min": 3024
},
{
"epoch": 0.7526881720430108,
"grad_norm": 0.4569816247653973,
"learning_rate": 3.999355612637461e-05,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07932804524898529,
"step": 665,
"valid_targets_mean": 3352.0,
"valid_targets_min": 2366
},
{
"epoch": 0.758347481607244,
"grad_norm": 0.5751225435233932,
"learning_rate": 3.999204470067504e-05,
"loss": 0.1319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07831130921840668,
"step": 670,
"valid_targets_mean": 956.8,
"valid_targets_min": 509
},
{
"epoch": 0.7640067911714771,
"grad_norm": 0.48072853866166537,
"learning_rate": 3.9990374221836484e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06048751622438431,
"step": 675,
"valid_targets_mean": 3013.6,
"valid_targets_min": 1158
},
{
"epoch": 0.7696661007357103,
"grad_norm": 0.40749695301719024,
"learning_rate": 3.998854470314898e-05,
"loss": 0.1127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05904872715473175,
"step": 680,
"valid_targets_mean": 3860.5,
"valid_targets_min": 3044
},
{
"epoch": 0.7753254102999434,
"grad_norm": 0.4479181701407655,
"learning_rate": 3.9986556159167846e-05,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04606478661298752,
"step": 685,
"valid_targets_mean": 2286.4,
"valid_targets_min": 539
},
{
"epoch": 0.7809847198641766,
"grad_norm": 0.4692149977774639,
"learning_rate": 3.998440860571358e-05,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059417132288217545,
"step": 690,
"valid_targets_mean": 2865.5,
"valid_targets_min": 912
},
{
"epoch": 0.7866440294284097,
"grad_norm": 0.6595632418113099,
"learning_rate": 3.998210205987175e-05,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08933501690626144,
"step": 695,
"valid_targets_mean": 2087.4,
"valid_targets_min": 872
},
{
"epoch": 0.7923033389926429,
"grad_norm": 0.43788134024153513,
"learning_rate": 3.9979636539992805e-05,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05341676250100136,
"step": 700,
"valid_targets_mean": 3380.1,
"valid_targets_min": 2254
},
{
"epoch": 0.797962648556876,
"grad_norm": 0.8001613859076356,
"learning_rate": 3.9977012065692e-05,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09082688391208649,
"step": 705,
"valid_targets_mean": 1274.0,
"valid_targets_min": 605
},
{
"epoch": 0.8036219581211093,
"grad_norm": 0.5094244900852393,
"learning_rate": 3.997422865784916e-05,
"loss": 0.1327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07657082378864288,
"step": 710,
"valid_targets_mean": 2289.0,
"valid_targets_min": 1117
},
{
"epoch": 0.8092812676853424,
"grad_norm": 0.4600031239543275,
"learning_rate": 3.99712863386086e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06370458006858826,
"step": 715,
"valid_targets_mean": 3169.9,
"valid_targets_min": 1132
},
{
"epoch": 0.8149405772495756,
"grad_norm": 0.5229218472624875,
"learning_rate": 3.9968185131378876e-05,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04839629679918289,
"step": 720,
"valid_targets_mean": 2107.4,
"valid_targets_min": 524
},
{
"epoch": 0.8205998868138087,
"grad_norm": 0.5010534381484323,
"learning_rate": 3.996492506083264e-05,
"loss": 0.1242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05224666744470596,
"step": 725,
"valid_targets_mean": 1705.8,
"valid_targets_min": 516
},
{
"epoch": 0.8262591963780419,
"grad_norm": 0.5503804393257022,
"learning_rate": 3.9961506152906445e-05,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07331585884094238,
"step": 730,
"valid_targets_mean": 2088.2,
"valid_targets_min": 342
},
{
"epoch": 0.831918505942275,
"grad_norm": 0.35323711189740525,
"learning_rate": 3.995792843480051e-05,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06214073300361633,
"step": 735,
"valid_targets_mean": 3528.1,
"valid_targets_min": 1935
},
{
"epoch": 0.8375778155065082,
"grad_norm": 0.5249098117659579,
"learning_rate": 3.9954191934978494e-05,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043227165937423706,
"step": 740,
"valid_targets_mean": 1818.2,
"valid_targets_min": 564
},
{
"epoch": 0.8432371250707413,
"grad_norm": 0.3299099340846902,
"learning_rate": 3.995029668316735e-05,
"loss": 0.1254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06274382770061493,
"step": 745,
"valid_targets_mean": 5238.9,
"valid_targets_min": 3653
},
{
"epoch": 0.8488964346349746,
"grad_norm": 0.36575794432079584,
"learning_rate": 3.9946242710356994e-05,
"loss": 0.1216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040668781846761703,
"step": 750,
"valid_targets_mean": 2983.4,
"valid_targets_min": 684
},
{
"epoch": 0.8545557441992077,
"grad_norm": 0.5075588125856926,
"learning_rate": 3.994203004880012e-05,
"loss": 0.1079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06988832354545593,
"step": 755,
"valid_targets_mean": 3324.8,
"valid_targets_min": 726
},
{
"epoch": 0.8602150537634409,
"grad_norm": 0.39852501254916606,
"learning_rate": 3.9937658732011905e-05,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0661604031920433,
"step": 760,
"valid_targets_mean": 4154.5,
"valid_targets_min": 3469
},
{
"epoch": 0.865874363327674,
"grad_norm": 0.686455143981827,
"learning_rate": 3.993312879476976e-05,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19141210615634918,
"step": 765,
"valid_targets_mean": 2561.6,
"valid_targets_min": 1536
},
{
"epoch": 0.8715336728919072,
"grad_norm": 0.43519246110287957,
"learning_rate": 3.992844027311307e-05,
"loss": 0.1279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06963059306144714,
"step": 770,
"valid_targets_mean": 2912.4,
"valid_targets_min": 582
},
{
"epoch": 0.8771929824561403,
"grad_norm": 0.3610697013476402,
"learning_rate": 3.992359320434287e-05,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049161579459905624,
"step": 775,
"valid_targets_mean": 3388.5,
"valid_targets_min": 633
},
{
"epoch": 0.8828522920203735,
"grad_norm": 0.4253116172505089,
"learning_rate": 3.9918587627021566e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05305824428796768,
"step": 780,
"valid_targets_mean": 3263.6,
"valid_targets_min": 1130
},
{
"epoch": 0.8885116015846066,
"grad_norm": 0.41320327540238194,
"learning_rate": 3.991342358097265e-05,
"loss": 0.1198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0637916624546051,
"step": 785,
"valid_targets_mean": 2866.5,
"valid_targets_min": 492
},
{
"epoch": 0.8941709111488398,
"grad_norm": 0.828001679310075,
"learning_rate": 3.990810110728034e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10161933302879333,
"step": 790,
"valid_targets_mean": 2353.8,
"valid_targets_min": 1045
},
{
"epoch": 0.8998302207130731,
"grad_norm": 0.38967894220881866,
"learning_rate": 3.99026202482893e-05,
"loss": 0.1218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04142877459526062,
"step": 795,
"valid_targets_mean": 3043.9,
"valid_targets_min": 647
},
{
"epoch": 0.9054895302773062,
"grad_norm": 0.7579700154789877,
"learning_rate": 3.989698104760425e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11227335035800934,
"step": 800,
"valid_targets_mean": 2093.0,
"valid_targets_min": 806
},
{
"epoch": 0.9111488398415394,
"grad_norm": 0.6550049745460668,
"learning_rate": 3.989118355008968e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06615293025970459,
"step": 805,
"valid_targets_mean": 1208.8,
"valid_targets_min": 575
},
{
"epoch": 0.9168081494057725,
"grad_norm": 0.5313531127641108,
"learning_rate": 3.988522780186943e-05,
"loss": 0.127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058285586535930634,
"step": 810,
"valid_targets_mean": 3447.5,
"valid_targets_min": 2784
},
{
"epoch": 0.9224674589700057,
"grad_norm": 0.42281770147833686,
"learning_rate": 3.987911385032638e-05,
"loss": 0.1282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05373559519648552,
"step": 815,
"valid_targets_mean": 3721.6,
"valid_targets_min": 2525
},
{
"epoch": 0.9281267685342388,
"grad_norm": 0.4127768410682695,
"learning_rate": 3.987284174410203e-05,
"loss": 0.1285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05588556081056595,
"step": 820,
"valid_targets_mean": 2665.2,
"valid_targets_min": 767
},
{
"epoch": 0.933786078098472,
"grad_norm": 0.4894787437319876,
"learning_rate": 3.986641153309615e-05,
"loss": 0.1176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052959829568862915,
"step": 825,
"valid_targets_mean": 2277.6,
"valid_targets_min": 870
},
{
"epoch": 0.9394453876627051,
"grad_norm": 0.7402127878724636,
"learning_rate": 3.985982326846634e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09184592217206955,
"step": 830,
"valid_targets_mean": 1535.8,
"valid_targets_min": 758
},
{
"epoch": 0.9451046972269384,
"grad_norm": 0.46799832031998007,
"learning_rate": 3.985307700262765e-05,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059100307524204254,
"step": 835,
"valid_targets_mean": 2024.1,
"valid_targets_min": 797
},
{
"epoch": 0.9507640067911715,
"grad_norm": 0.3657972143765407,
"learning_rate": 3.984617278925218e-05,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05874822288751602,
"step": 840,
"valid_targets_mean": 3299.5,
"valid_targets_min": 1606
},
{
"epoch": 0.9564233163554047,
"grad_norm": 0.433457585178867,
"learning_rate": 3.9839110683268624e-05,
"loss": 0.1294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0675329715013504,
"step": 845,
"valid_targets_mean": 3055.0,
"valid_targets_min": 678
},
{
"epoch": 0.9620826259196378,
"grad_norm": 0.3318398548480011,
"learning_rate": 3.9831890740861826e-05,
"loss": 0.1292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06505134701728821,
"step": 850,
"valid_targets_mean": 4980.6,
"valid_targets_min": 1078
},
{
"epoch": 0.967741935483871,
"grad_norm": 0.3441479953856927,
"learning_rate": 3.982451301947236e-05,
"loss": 0.1129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04246465489268303,
"step": 855,
"valid_targets_mean": 2680.8,
"valid_targets_min": 706
},
{
"epoch": 0.9734012450481041,
"grad_norm": 0.6698327188776084,
"learning_rate": 3.981697757779606e-05,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08046382665634155,
"step": 860,
"valid_targets_mean": 1580.4,
"valid_targets_min": 580
},
{
"epoch": 0.9790605546123373,
"grad_norm": 0.6426747257677874,
"learning_rate": 3.980928447578356e-05,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10326772928237915,
"step": 865,
"valid_targets_mean": 2592.1,
"valid_targets_min": 780
},
{
"epoch": 0.9847198641765704,
"grad_norm": 0.4076799742075529,
"learning_rate": 3.98014337746398e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04925592988729477,
"step": 870,
"valid_targets_mean": 3478.2,
"valid_targets_min": 2861
},
{
"epoch": 0.9903791737408036,
"grad_norm": 0.40044366441837925,
"learning_rate": 3.9793425536823555e-05,
"loss": 0.1271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06652865558862686,
"step": 875,
"valid_targets_mean": 3846.5,
"valid_targets_min": 2453
},
{
"epoch": 0.9960384833050367,
"grad_norm": 0.43952559861608015,
"learning_rate": 3.978525982604695e-05,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07187198102474213,
"step": 880,
"valid_targets_mean": 3881.8,
"valid_targets_min": 3389
},
{
"epoch": 1.0011318619128466,
"grad_norm": 0.6856007855669121,
"learning_rate": 3.977693670727491e-05,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13266420364379883,
"step": 885,
"valid_targets_mean": 6935.0,
"valid_targets_min": 5295
},
{
"epoch": 1.0067911714770799,
"grad_norm": 0.43379131857748404,
"learning_rate": 3.9768456246724675e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1459798812866211,
"step": 890,
"valid_targets_mean": 7672.9,
"valid_targets_min": 5066
},
{
"epoch": 1.0124504810413129,
"grad_norm": 0.4683116079781387,
"learning_rate": 3.97598185118653e-05,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12084569036960602,
"step": 895,
"valid_targets_mean": 7347.6,
"valid_targets_min": 4923
},
{
"epoch": 1.018109790605546,
"grad_norm": 0.48855719634434,
"learning_rate": 3.975102357141704e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11077947914600372,
"step": 900,
"valid_targets_mean": 5446.8,
"valid_targets_min": 3922
},
{
"epoch": 1.0237691001697793,
"grad_norm": 0.42798402935325797,
"learning_rate": 3.974207149535088e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1109333485364914,
"step": 905,
"valid_targets_mean": 6924.9,
"valid_targets_min": 4797
},
{
"epoch": 1.0294284097340125,
"grad_norm": 0.4351702732960488,
"learning_rate": 3.9732962354887936e-05,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12490881234407425,
"step": 910,
"valid_targets_mean": 6443.5,
"valid_targets_min": 3853
},
{
"epoch": 1.0350877192982457,
"grad_norm": 0.47752325780331667,
"learning_rate": 3.972369622249891e-05,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1165180504322052,
"step": 915,
"valid_targets_mean": 5446.5,
"valid_targets_min": 4487
},
{
"epoch": 1.0407470288624787,
"grad_norm": 0.55468198932523,
"learning_rate": 3.9714273171903486e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11226481199264526,
"step": 920,
"valid_targets_mean": 6210.2,
"valid_targets_min": 4137
},
{
"epoch": 1.046406338426712,
"grad_norm": 0.5656955802461123,
"learning_rate": 3.970469327806978e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20384201407432556,
"step": 925,
"valid_targets_mean": 5404.4,
"valid_targets_min": 698
},
{
"epoch": 1.0520656479909452,
"grad_norm": 0.42478256890845617,
"learning_rate": 3.969495661721372e-05,
"loss": 0.2205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13021141290664673,
"step": 930,
"valid_targets_mean": 7197.6,
"valid_targets_min": 4499
},
{
"epoch": 1.0577249575551784,
"grad_norm": 0.47440889374120215,
"learning_rate": 3.9685063266798434e-05,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15133237838745117,
"step": 935,
"valid_targets_mean": 5538.4,
"valid_targets_min": 4291
},
{
"epoch": 1.0633842671194114,
"grad_norm": 0.45853285772484853,
"learning_rate": 3.967501330553366e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09450241178274155,
"step": 940,
"valid_targets_mean": 5531.4,
"valid_targets_min": 4050
},
{
"epoch": 1.0690435766836446,
"grad_norm": 0.4165165821206238,
"learning_rate": 3.966480681337508e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12836091220378876,
"step": 945,
"valid_targets_mean": 7526.6,
"valid_targets_min": 5196
},
{
"epoch": 1.0747028862478778,
"grad_norm": 0.4439127191876095,
"learning_rate": 3.965444387152375e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.103563092648983,
"step": 950,
"valid_targets_mean": 6248.9,
"valid_targets_min": 4749
},
{
"epoch": 1.080362195812111,
"grad_norm": 0.5042962353960474,
"learning_rate": 3.9643924562425365e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05952709913253784,
"step": 955,
"valid_targets_mean": 3248.5,
"valid_targets_min": 1908
},
{
"epoch": 1.086021505376344,
"grad_norm": 0.4245617765773125,
"learning_rate": 3.963324896976968e-05,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10588788986206055,
"step": 960,
"valid_targets_mean": 6225.6,
"valid_targets_min": 4808
},
{
"epoch": 1.0916808149405772,
"grad_norm": 0.44302682414413963,
"learning_rate": 3.962241717848979e-05,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10773646831512451,
"step": 965,
"valid_targets_mean": 5383.0,
"valid_targets_min": 3774
},
{
"epoch": 1.0973401245048104,
"grad_norm": 0.4090806507981392,
"learning_rate": 3.961142927476151e-05,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11196926236152649,
"step": 970,
"valid_targets_mean": 6291.4,
"valid_targets_min": 5335
},
{
"epoch": 1.1029994340690437,
"grad_norm": 0.3734040338697041,
"learning_rate": 3.960028534600264e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11295393109321594,
"step": 975,
"valid_targets_mean": 7749.1,
"valid_targets_min": 6205
},
{
"epoch": 1.1086587436332767,
"grad_norm": 0.3906381278203426,
"learning_rate": 3.9588985480872275e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10481761395931244,
"step": 980,
"valid_targets_mean": 6882.1,
"valid_targets_min": 4428
},
{
"epoch": 1.1143180531975099,
"grad_norm": 0.4456420223942386,
"learning_rate": 3.9577529769270137e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11185906827449799,
"step": 985,
"valid_targets_mean": 5751.8,
"valid_targets_min": 4458
},
{
"epoch": 1.119977362761743,
"grad_norm": 0.4397561377985395,
"learning_rate": 3.9565918302335816e-05,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09672285616397858,
"step": 990,
"valid_targets_mean": 6003.9,
"valid_targets_min": 4458
},
{
"epoch": 1.1256366723259763,
"grad_norm": 0.4329998383462111,
"learning_rate": 3.955415117244807e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09833373129367828,
"step": 995,
"valid_targets_mean": 6033.8,
"valid_targets_min": 4066
},
{
"epoch": 1.1312959818902093,
"grad_norm": 0.41841572645344943,
"learning_rate": 3.9542228473224086e-05,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11922608315944672,
"step": 1000,
"valid_targets_mean": 6601.0,
"valid_targets_min": 4708
},
{
"epoch": 1.1369552914544425,
"grad_norm": 0.4315438341662908,
"learning_rate": 3.953015029951874e-05,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12108911573886871,
"step": 1005,
"valid_targets_mean": 6092.1,
"valid_targets_min": 4789
},
{
"epoch": 1.1426146010186757,
"grad_norm": 0.40535781524675796,
"learning_rate": 3.9517916747423804e-05,
"loss": 0.2533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12264654040336609,
"step": 1010,
"valid_targets_mean": 6474.6,
"valid_targets_min": 4224
},
{
"epoch": 1.148273910582909,
"grad_norm": 0.41571559354767595,
"learning_rate": 3.9505527914267255e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11821147054433823,
"step": 1015,
"valid_targets_mean": 6312.4,
"valid_targets_min": 4617
},
{
"epoch": 1.1539332201471422,
"grad_norm": 0.40714327444148485,
"learning_rate": 3.949298389861243e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11297283321619034,
"step": 1020,
"valid_targets_mean": 6333.8,
"valid_targets_min": 4783
},
{
"epoch": 1.1595925297113752,
"grad_norm": 0.45247118108391804,
"learning_rate": 3.948028480025728e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11267365515232086,
"step": 1025,
"valid_targets_mean": 7380.1,
"valid_targets_min": 6020
},
{
"epoch": 1.1652518392756084,
"grad_norm": 0.4357879080967964,
"learning_rate": 3.9467430720233555e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11564698815345764,
"step": 1030,
"valid_targets_mean": 6009.0,
"valid_targets_min": 3049
},
{
"epoch": 1.1709111488398416,
"grad_norm": 0.4468978613451375,
"learning_rate": 3.945442176080604e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10168086737394333,
"step": 1035,
"valid_targets_mean": 5973.1,
"valid_targets_min": 4822
},
{
"epoch": 1.1765704584040746,
"grad_norm": 0.4644751057173812,
"learning_rate": 3.944125802547168e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.104912169277668,
"step": 1040,
"valid_targets_mean": 5754.9,
"valid_targets_min": 2910
},
{
"epoch": 1.1822297679683078,
"grad_norm": 0.4750656628065809,
"learning_rate": 3.942793961895881e-05,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12494048476219177,
"step": 1045,
"valid_targets_mean": 6414.6,
"valid_targets_min": 4791
},
{
"epoch": 1.187889077532541,
"grad_norm": 0.46661891824647705,
"learning_rate": 3.941446664722629e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11205330491065979,
"step": 1050,
"valid_targets_mean": 5675.9,
"valid_targets_min": 3983
},
{
"epoch": 1.1935483870967742,
"grad_norm": 0.3693476342351284,
"learning_rate": 3.940083921746268e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08969860523939133,
"step": 1055,
"valid_targets_mean": 6975.5,
"valid_targets_min": 4383
},
{
"epoch": 1.1992076966610075,
"grad_norm": 0.3893171784380533,
"learning_rate": 3.938705743808538e-05,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1054840236902237,
"step": 1060,
"valid_targets_mean": 6417.1,
"valid_targets_min": 3182
},
{
"epoch": 1.2048670062252405,
"grad_norm": 0.4534363275965842,
"learning_rate": 3.9373121418739765e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11998751014471054,
"step": 1065,
"valid_targets_mean": 6218.6,
"valid_targets_min": 5077
},
{
"epoch": 1.2105263157894737,
"grad_norm": 0.49747070693615936,
"learning_rate": 3.935903127029832e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11035722494125366,
"step": 1070,
"valid_targets_mean": 4774.9,
"valid_targets_min": 3663
},
{
"epoch": 1.216185625353707,
"grad_norm": 0.4539470299738808,
"learning_rate": 3.934478710485975e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11278726160526276,
"step": 1075,
"valid_targets_mean": 6316.8,
"valid_targets_min": 4105
},
{
"epoch": 1.22184493491794,
"grad_norm": 0.4150450186888815,
"learning_rate": 3.9330389035748086e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09741287678480148,
"step": 1080,
"valid_targets_mean": 6528.9,
"valid_targets_min": 4537
},
{
"epoch": 1.227504244482173,
"grad_norm": 0.4102218195249173,
"learning_rate": 3.9315837177511816e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09937061369419098,
"step": 1085,
"valid_targets_mean": 6416.8,
"valid_targets_min": 2494
},
{
"epoch": 1.2331635540464063,
"grad_norm": 0.4554765624706927,
"learning_rate": 3.93011316459229e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1132006049156189,
"step": 1090,
"valid_targets_mean": 6070.9,
"valid_targets_min": 4921
},
{
"epoch": 1.2388228636106395,
"grad_norm": 0.46305531026666913,
"learning_rate": 3.928627255797593e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11665916442871094,
"step": 1095,
"valid_targets_mean": 6701.4,
"valid_targets_min": 5285
},
{
"epoch": 1.2444821731748728,
"grad_norm": 0.4177211742532018,
"learning_rate": 3.927126003188717e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10000447928905487,
"step": 1100,
"valid_targets_mean": 6273.9,
"valid_targets_min": 4464
},
{
"epoch": 1.2501414827391057,
"grad_norm": 0.4227921157715367,
"learning_rate": 3.925609418709358e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09662619233131409,
"step": 1105,
"valid_targets_mean": 5554.8,
"valid_targets_min": 4439
},
{
"epoch": 1.255800792303339,
"grad_norm": 0.39346061104081265,
"learning_rate": 3.924077514425193e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09001141786575317,
"step": 1110,
"valid_targets_mean": 6043.0,
"valid_targets_min": 4686
},
{
"epoch": 1.2614601018675722,
"grad_norm": 0.4138966359666768,
"learning_rate": 3.922530302523779e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09198030829429626,
"step": 1115,
"valid_targets_mean": 5912.5,
"valid_targets_min": 3381
},
{
"epoch": 1.2671194114318054,
"grad_norm": 0.379265006887859,
"learning_rate": 3.920967795314456e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09785998612642288,
"step": 1120,
"valid_targets_mean": 6495.5,
"valid_targets_min": 5309
},
{
"epoch": 1.2727787209960386,
"grad_norm": 0.41391321836622774,
"learning_rate": 3.919390005228254e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10846744477748871,
"step": 1125,
"valid_targets_mean": 6483.9,
"valid_targets_min": 5161
},
{
"epoch": 1.2784380305602716,
"grad_norm": 0.49875136898167355,
"learning_rate": 3.9177969448177884e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10463844239711761,
"step": 1130,
"valid_targets_mean": 5958.9,
"valid_targets_min": 4666
},
{
"epoch": 1.2840973401245048,
"grad_norm": 0.6505825282340078,
"learning_rate": 3.916188626757164e-05,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.125363290309906,
"step": 1135,
"valid_targets_mean": 1691.5,
"valid_targets_min": 1440
},
{
"epoch": 1.289756649688738,
"grad_norm": 0.4550942995720742,
"learning_rate": 3.9145650638418724e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09323972463607788,
"step": 1140,
"valid_targets_mean": 5299.1,
"valid_targets_min": 4547
},
{
"epoch": 1.295415959252971,
"grad_norm": 0.48730645845105025,
"learning_rate": 3.91292626898869e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10699446499347687,
"step": 1145,
"valid_targets_mean": 6003.5,
"valid_targets_min": 5031
},
{
"epoch": 1.3010752688172043,
"grad_norm": 0.36627880501682747,
"learning_rate": 3.911272255235576e-05,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09872409701347351,
"step": 1150,
"valid_targets_mean": 8169.6,
"valid_targets_min": 5487
},
{
"epoch": 1.3067345783814375,
"grad_norm": 0.39046063875124754,
"learning_rate": 3.909603035741568e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10074116289615631,
"step": 1155,
"valid_targets_mean": 6474.9,
"valid_targets_min": 4253
},
{
"epoch": 1.3123938879456707,
"grad_norm": 0.4056457954329597,
"learning_rate": 3.90791862378668e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1214001476764679,
"step": 1160,
"valid_targets_mean": 7021.0,
"valid_targets_min": 4990
},
{
"epoch": 1.318053197509904,
"grad_norm": 0.4295987244796204,
"learning_rate": 3.906219032771791e-05,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1252824068069458,
"step": 1165,
"valid_targets_mean": 6356.0,
"valid_targets_min": 4385
},
{
"epoch": 1.323712507074137,
"grad_norm": 0.38071643326705473,
"learning_rate": 3.904504276218545e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11139969527721405,
"step": 1170,
"valid_targets_mean": 6815.1,
"valid_targets_min": 5164
},
{
"epoch": 1.3293718166383701,
"grad_norm": 0.4511869701543047,
"learning_rate": 3.902774367769238e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07966958731412888,
"step": 1175,
"valid_targets_mean": 5588.5,
"valid_targets_min": 4098
},
{
"epoch": 1.3350311262026033,
"grad_norm": 0.40443974143086536,
"learning_rate": 3.901029321186715e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10711172968149185,
"step": 1180,
"valid_targets_mean": 6167.6,
"valid_targets_min": 4801
},
{
"epoch": 1.3406904357668363,
"grad_norm": 0.5025063120071397,
"learning_rate": 3.8992691503542526e-05,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22311510145664215,
"step": 1185,
"valid_targets_mean": 6224.9,
"valid_targets_min": 4772
},
{
"epoch": 1.3463497453310695,
"grad_norm": 0.43096078673252874,
"learning_rate": 3.8974938692754565e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11844121664762497,
"step": 1190,
"valid_targets_mean": 6549.2,
"valid_targets_min": 5025
},
{
"epoch": 1.3520090548953028,
"grad_norm": 0.4411764049541238,
"learning_rate": 3.895703492074147e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1157045066356659,
"step": 1195,
"valid_targets_mean": 6680.8,
"valid_targets_min": 4818
},
{
"epoch": 1.357668364459536,
"grad_norm": 0.4327381745312927,
"learning_rate": 3.893898032994244e-05,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10466340184211731,
"step": 1200,
"valid_targets_mean": 5835.1,
"valid_targets_min": 4111
},
{
"epoch": 1.3633276740237692,
"grad_norm": 0.41626129249832783,
"learning_rate": 3.892077506399659e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10042882710695267,
"step": 1205,
"valid_targets_mean": 7029.9,
"valid_targets_min": 2275
},
{
"epoch": 1.3689869835880022,
"grad_norm": 0.3941078540715684,
"learning_rate": 3.890241926774176e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08970265835523605,
"step": 1210,
"valid_targets_mean": 5621.2,
"valid_targets_min": 4826
},
{
"epoch": 1.3746462931522354,
"grad_norm": 0.4328651679860648,
"learning_rate": 3.888391308721339e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09326186776161194,
"step": 1215,
"valid_targets_mean": 6858.8,
"valid_targets_min": 4710
},
{
"epoch": 1.3803056027164686,
"grad_norm": 0.3858063007563162,
"learning_rate": 3.8865256669643345e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13152405619621277,
"step": 1220,
"valid_targets_mean": 7012.5,
"valid_targets_min": 5421
},
{
"epoch": 1.3859649122807016,
"grad_norm": 0.3744177832844025,
"learning_rate": 3.884645016345876e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09377632290124893,
"step": 1225,
"valid_targets_mean": 6967.6,
"valid_targets_min": 4949
},
{
"epoch": 1.3916242218449348,
"grad_norm": 0.3859158266030199,
"learning_rate": 3.882749371828084e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10139726847410202,
"step": 1230,
"valid_targets_mean": 6348.5,
"valid_targets_min": 4831
},
{
"epoch": 1.397283531409168,
"grad_norm": 0.40628323849120285,
"learning_rate": 3.880838748492367e-05,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12447110563516617,
"step": 1235,
"valid_targets_mean": 6597.2,
"valid_targets_min": 4018
},
{
"epoch": 1.4029428409734013,
"grad_norm": 0.3728400695414987,
"learning_rate": 3.878913161539304e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07373258471488953,
"step": 1240,
"valid_targets_mean": 6420.9,
"valid_targets_min": 5034
},
{
"epoch": 1.4086021505376345,
"grad_norm": 0.41679011568104735,
"learning_rate": 3.876972626288521e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11582024395465851,
"step": 1245,
"valid_targets_mean": 6962.4,
"valid_targets_min": 5442
},
{
"epoch": 1.4142614601018675,
"grad_norm": 0.44005462344702845,
"learning_rate": 3.87501715817857e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1077890619635582,
"step": 1250,
"valid_targets_mean": 5610.9,
"valid_targets_min": 4609
},
{
"epoch": 1.4199207696661007,
"grad_norm": 0.46782563125127635,
"learning_rate": 3.873046772766806e-05,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10515996068716049,
"step": 1255,
"valid_targets_mean": 5038.4,
"valid_targets_min": 2301
},
{
"epoch": 1.425580079230334,
"grad_norm": 0.6393525154542397,
"learning_rate": 3.871061485729264e-05,
"loss": 0.1925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11196956783533096,
"step": 1260,
"valid_targets_mean": 1449.8,
"valid_targets_min": 363
},
{
"epoch": 1.4312393887945671,
"grad_norm": 0.3961715756785153,
"learning_rate": 3.8690613128605325e-05,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07758249342441559,
"step": 1265,
"valid_targets_mean": 3729.8,
"valid_targets_min": 3074
},
{
"epoch": 1.4368986983588004,
"grad_norm": 0.514411411172113,
"learning_rate": 3.867046270073631e-05,
"loss": 0.1211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06430846452713013,
"step": 1270,
"valid_targets_mean": 2272.8,
"valid_targets_min": 700
},
{
"epoch": 1.4425580079230333,
"grad_norm": 0.4844248582697401,
"learning_rate": 3.8650163733998796e-05,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057508524507284164,
"step": 1275,
"valid_targets_mean": 2997.5,
"valid_targets_min": 803
},
{
"epoch": 1.4482173174872666,
"grad_norm": 0.4495056164678961,
"learning_rate": 3.862971638988774e-05,
"loss": 0.1155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06564734131097794,
"step": 1280,
"valid_targets_mean": 2655.5,
"valid_targets_min": 920
},
{
"epoch": 1.4538766270514998,
"grad_norm": 0.4256726932838878,
"learning_rate": 3.860912083107856e-05,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06890624016523361,
"step": 1285,
"valid_targets_mean": 3263.8,
"valid_targets_min": 806
},
{
"epoch": 1.4595359366157328,
"grad_norm": 0.7987833397224602,
"learning_rate": 3.8588377221425846e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10396931320428848,
"step": 1290,
"valid_targets_mean": 1644.4,
"valid_targets_min": 718
},
{
"epoch": 1.465195246179966,
"grad_norm": 0.41071930776105053,
"learning_rate": 3.8567485725962054e-05,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0699780210852623,
"step": 1295,
"valid_targets_mean": 3399.4,
"valid_targets_min": 1133
},
{
"epoch": 1.4708545557441992,
"grad_norm": 0.4669417191292071,
"learning_rate": 3.8546446510896196e-05,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052286192774772644,
"step": 1300,
"valid_targets_mean": 1808.9,
"valid_targets_min": 859
},
{
"epoch": 1.4765138653084324,
"grad_norm": 0.279190024858727,
"learning_rate": 3.8525259743612504e-05,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04190339148044586,
"step": 1305,
"valid_targets_mean": 5541.4,
"valid_targets_min": 5150
},
{
"epoch": 1.4821731748726656,
"grad_norm": 0.3783760567491969,
"learning_rate": 3.850392559266912e-05,
"loss": 0.1072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07370060682296753,
"step": 1310,
"valid_targets_mean": 4000.1,
"valid_targets_min": 502
},
{
"epoch": 1.4878324844368986,
"grad_norm": 0.37009657456448125,
"learning_rate": 3.848244422779675e-05,
"loss": 0.114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06480339169502258,
"step": 1315,
"valid_targets_mean": 3906.9,
"valid_targets_min": 600
},
{
"epoch": 1.4934917940011319,
"grad_norm": 0.4432314283510275,
"learning_rate": 3.8460815819897275e-05,
"loss": 0.1126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05141071975231171,
"step": 1320,
"valid_targets_mean": 2979.5,
"valid_targets_min": 518
},
{
"epoch": 1.499151103565365,
"grad_norm": 0.4118835024522952,
"learning_rate": 3.8439040541042477e-05,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06730692833662033,
"step": 1325,
"valid_targets_mean": 3522.5,
"valid_targets_min": 549
},
{
"epoch": 1.504810413129598,
"grad_norm": 0.3453526365894916,
"learning_rate": 3.8417118564472566e-05,
"loss": 0.1057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04490172117948532,
"step": 1330,
"valid_targets_mean": 3878.5,
"valid_targets_min": 3170
},
{
"epoch": 1.5104697226938315,
"grad_norm": 0.5973143983949719,
"learning_rate": 3.8395050064594886e-05,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07379209250211716,
"step": 1335,
"valid_targets_mean": 1656.0,
"valid_targets_min": 644
},
{
"epoch": 1.5161290322580645,
"grad_norm": 0.3322282229333689,
"learning_rate": 3.8372835216982474e-05,
"loss": 0.0988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030613193288445473,
"step": 1340,
"valid_targets_mean": 2891.8,
"valid_targets_min": 720
},
{
"epoch": 1.5217883418222977,
"grad_norm": 0.4763357740709184,
"learning_rate": 3.83504741983727e-05,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05212488770484924,
"step": 1345,
"valid_targets_mean": 1775.6,
"valid_targets_min": 516
},
{
"epoch": 1.527447651386531,
"grad_norm": 0.5616103799879494,
"learning_rate": 3.832796718666583e-05,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0769435241818428,
"step": 1350,
"valid_targets_mean": 2018.6,
"valid_targets_min": 557
},
{
"epoch": 1.533106960950764,
"grad_norm": 0.43822923169816463,
"learning_rate": 3.830531436092363e-05,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07701824605464935,
"step": 1355,
"valid_targets_mean": 3398.1,
"valid_targets_min": 1086
},
{
"epoch": 1.5387662705149971,
"grad_norm": 0.4317930795508292,
"learning_rate": 3.828251590136795e-05,
"loss": 0.1319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07521131634712219,
"step": 1360,
"valid_targets_mean": 2532.9,
"valid_targets_min": 1008
},
{
"epoch": 1.5444255800792304,
"grad_norm": 0.5245145698637755,
"learning_rate": 3.8259571989379256e-05,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046158429235219955,
"step": 1365,
"valid_targets_mean": 3481.1,
"valid_targets_min": 2756
},
{
"epoch": 1.5500848896434634,
"grad_norm": 0.3296178101522478,
"learning_rate": 3.8236482807495214e-05,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04727683216333389,
"step": 1370,
"valid_targets_mean": 4113.5,
"valid_targets_min": 3798
},
{
"epoch": 1.5557441992076968,
"grad_norm": 0.8548617148468368,
"learning_rate": 3.8213248539409236e-05,
"loss": 0.1335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11022968590259552,
"step": 1375,
"valid_targets_mean": 1058.6,
"valid_targets_min": 598
},
{
"epoch": 1.5614035087719298,
"grad_norm": 0.41271716216436005,
"learning_rate": 3.8189869369969016e-05,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04818184673786163,
"step": 1380,
"valid_targets_mean": 2403.5,
"valid_targets_min": 754
},
{
"epoch": 1.567062818336163,
"grad_norm": 0.34511489195605416,
"learning_rate": 3.816634548517505e-05,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06006976217031479,
"step": 1385,
"valid_targets_mean": 4045.8,
"valid_targets_min": 3390
},
{
"epoch": 1.5727221279003962,
"grad_norm": 0.6490300241903905,
"learning_rate": 3.814267707217917e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16865617036819458,
"step": 1390,
"valid_targets_mean": 2255.9,
"valid_targets_min": 1052
},
{
"epoch": 1.5783814374646292,
"grad_norm": 0.4099557009711887,
"learning_rate": 3.8118864319283025e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07171247899532318,
"step": 1395,
"valid_targets_mean": 3214.0,
"valid_targets_min": 2176
},
{
"epoch": 1.5840407470288624,
"grad_norm": 0.48507846475715394,
"learning_rate": 3.809490741593665e-05,
"loss": 0.1303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057411808520555496,
"step": 1400,
"valid_targets_mean": 2396.0,
"valid_targets_min": 1074
},
{
"epoch": 1.5897000565930957,
"grad_norm": 0.46213090035219073,
"learning_rate": 3.807080655273689e-05,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06575348228216171,
"step": 1405,
"valid_targets_mean": 3271.8,
"valid_targets_min": 1212
},
{
"epoch": 1.5953593661573287,
"grad_norm": 0.4504573910708974,
"learning_rate": 3.8046561921425895e-05,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07250872254371643,
"step": 1410,
"valid_targets_mean": 3990.8,
"valid_targets_min": 2258
},
{
"epoch": 1.601018675721562,
"grad_norm": 0.31830121418698293,
"learning_rate": 3.802217371488964e-05,
"loss": 0.0989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06969204545021057,
"step": 1415,
"valid_targets_mean": 3730.2,
"valid_targets_min": 1466
},
{
"epoch": 1.606677985285795,
"grad_norm": 0.38404044511110647,
"learning_rate": 3.799764212715633e-05,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06129370257258415,
"step": 1420,
"valid_targets_mean": 3557.1,
"valid_targets_min": 560
},
{
"epoch": 1.6123372948500283,
"grad_norm": 0.3782342128182197,
"learning_rate": 3.7972967353394906e-05,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06335802376270294,
"step": 1425,
"valid_targets_mean": 3222.9,
"valid_targets_min": 1189
},
{
"epoch": 1.6179966044142615,
"grad_norm": 0.3631388391112149,
"learning_rate": 3.794814958991346e-05,
"loss": 0.1072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048005443066358566,
"step": 1430,
"valid_targets_mean": 3665.2,
"valid_targets_min": 2257
},
{
"epoch": 1.6236559139784945,
"grad_norm": 0.36678907072924855,
"learning_rate": 3.792318903415769e-05,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04388028010725975,
"step": 1435,
"valid_targets_mean": 3314.4,
"valid_targets_min": 886
},
{
"epoch": 1.629315223542728,
"grad_norm": 0.3876337194785037,
"learning_rate": 3.789808588470932e-05,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05543633550405502,
"step": 1440,
"valid_targets_mean": 3377.5,
"valid_targets_min": 2409
},
{
"epoch": 1.634974533106961,
"grad_norm": 0.37020115100592305,
"learning_rate": 3.787284034128453e-05,
"loss": 0.1046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04897238314151764,
"step": 1445,
"valid_targets_mean": 3241.8,
"valid_targets_min": 820
},
{
"epoch": 1.6406338426711942,
"grad_norm": 0.9398974150849458,
"learning_rate": 3.784745260473235e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13083994388580322,
"step": 1450,
"valid_targets_mean": 2264.2,
"valid_targets_min": 813
},
{
"epoch": 1.6462931522354274,
"grad_norm": 0.3455411095404806,
"learning_rate": 3.782192287703309e-05,
"loss": 0.1016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0457475408911705,
"step": 1455,
"valid_targets_mean": 3651.9,
"valid_targets_min": 2877
},
{
"epoch": 1.6519524617996604,
"grad_norm": 0.5320280185554186,
"learning_rate": 3.7796251361296695e-05,
"loss": 0.1038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06856375932693481,
"step": 1460,
"valid_targets_mean": 2384.0,
"valid_targets_min": 667
},
{
"epoch": 1.6576117713638936,
"grad_norm": 0.33107100848601195,
"learning_rate": 3.777043826176117e-05,
"loss": 0.0984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046754010021686554,
"step": 1465,
"valid_targets_mean": 3488.6,
"valid_targets_min": 2353
},
{
"epoch": 1.6632710809281268,
"grad_norm": 0.3889838725270318,
"learning_rate": 3.7744483783790924e-05,
"loss": 0.1037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0684385597705841,
"step": 1470,
"valid_targets_mean": 3189.9,
"valid_targets_min": 549
},
{
"epoch": 1.6689303904923598,
"grad_norm": 0.3441656776900516,
"learning_rate": 3.771838813387516e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048582062125205994,
"step": 1475,
"valid_targets_mean": 3826.5,
"valid_targets_min": 3340
},
{
"epoch": 1.6745897000565932,
"grad_norm": 0.4277143254856908,
"learning_rate": 3.7692151519626196e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0704786479473114,
"step": 1480,
"valid_targets_mean": 2178.2,
"valid_targets_min": 647
},
{
"epoch": 1.6802490096208262,
"grad_norm": 0.47124270373672383,
"learning_rate": 3.766577414977786e-05,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06369224935770035,
"step": 1485,
"valid_targets_mean": 1558.9,
"valid_targets_min": 804
},
{
"epoch": 1.6859083191850595,
"grad_norm": 0.753103958134033,
"learning_rate": 3.763925623418379e-05,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12379364669322968,
"step": 1490,
"valid_targets_mean": 1855.1,
"valid_targets_min": 702
},
{
"epoch": 1.6915676287492927,
"grad_norm": 0.48046832764275127,
"learning_rate": 3.7612597983815797e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08387649059295654,
"step": 1495,
"valid_targets_mean": 2858.1,
"valid_targets_min": 945
},
{
"epoch": 1.6972269383135257,
"grad_norm": 0.49583149151554834,
"learning_rate": 3.7585799610762166e-05,
"loss": 0.1184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07928980141878128,
"step": 1500,
"valid_targets_mean": 2879.5,
"valid_targets_min": 703
},
{
"epoch": 1.7028862478777589,
"grad_norm": 0.42423476563437235,
"learning_rate": 3.755886132822596e-05,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06221155822277069,
"step": 1505,
"valid_targets_mean": 3950.5,
"valid_targets_min": 3051
},
{
"epoch": 1.708545557441992,
"grad_norm": 0.5882449890510761,
"learning_rate": 3.753178335052335e-05,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08767211437225342,
"step": 1510,
"valid_targets_mean": 1759.8,
"valid_targets_min": 523
},
{
"epoch": 1.714204867006225,
"grad_norm": 0.3446555532092815,
"learning_rate": 3.750456589308189e-05,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05195833742618561,
"step": 1515,
"valid_targets_mean": 2138.2,
"valid_targets_min": 468
},
{
"epoch": 1.7198641765704585,
"grad_norm": 0.25061409519259453,
"learning_rate": 3.7477209172438824e-05,
"loss": 0.1152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03194167837500572,
"step": 1520,
"valid_targets_mean": 4428.1,
"valid_targets_min": 885
},
{
"epoch": 1.7255234861346915,
"grad_norm": 0.369656846375251,
"learning_rate": 3.744971340623932e-05,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04173450544476509,
"step": 1525,
"valid_targets_mean": 2478.5,
"valid_targets_min": 546
},
{
"epoch": 1.7311827956989247,
"grad_norm": 0.33231186695325116,
"learning_rate": 3.74220788132348e-05,
"loss": 0.1024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05705367028713226,
"step": 1530,
"valid_targets_mean": 3910.5,
"valid_targets_min": 981
},
{
"epoch": 1.736842105263158,
"grad_norm": 0.48276957868170417,
"learning_rate": 3.739430561328116e-05,
"loss": 0.1193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06112513691186905,
"step": 1535,
"valid_targets_mean": 1519.9,
"valid_targets_min": 697
},
{
"epoch": 1.742501414827391,
"grad_norm": 0.41746150621793054,
"learning_rate": 3.736639402733699e-05,
"loss": 0.1237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05486248433589935,
"step": 1540,
"valid_targets_mean": 3473.4,
"valid_targets_min": 2777
},
{
"epoch": 1.7481607243916242,
"grad_norm": 0.42139772843391654,
"learning_rate": 3.733834427746192e-05,
"loss": 0.1234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061300329864025116,
"step": 1545,
"valid_targets_mean": 3932.4,
"valid_targets_min": 3061
},
{
"epoch": 1.7538200339558574,
"grad_norm": 0.340496756363664,
"learning_rate": 3.7310156586814736e-05,
"loss": 0.1077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054317034780979156,
"step": 1550,
"valid_targets_mean": 2882.2,
"valid_targets_min": 868
},
{
"epoch": 1.7594793435200904,
"grad_norm": 0.437913008532826,
"learning_rate": 3.7281831179651674e-05,
"loss": 0.1112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04469527676701546,
"step": 1555,
"valid_targets_mean": 2506.6,
"valid_targets_min": 752
},
{
"epoch": 1.7651386530843238,
"grad_norm": 0.4597022925107832,
"learning_rate": 3.725336828132462e-05,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055792104452848434,
"step": 1560,
"valid_targets_mean": 3418.9,
"valid_targets_min": 1141
},
{
"epoch": 1.7707979626485568,
"grad_norm": 0.3140091225890798,
"learning_rate": 3.722476811827931e-05,
"loss": 0.0944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052371345460414886,
"step": 1565,
"valid_targets_mean": 3901.2,
"valid_targets_min": 3540
},
{
"epoch": 1.77645727221279,
"grad_norm": 0.3873586711176246,
"learning_rate": 3.719603091805354e-05,
"loss": 0.1227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048507675528526306,
"step": 1570,
"valid_targets_mean": 2808.2,
"valid_targets_min": 773
},
{
"epoch": 1.7821165817770233,
"grad_norm": 0.4072289949420176,
"learning_rate": 3.716715690927534e-05,
"loss": 0.1174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03962133452296257,
"step": 1575,
"valid_targets_mean": 3550.5,
"valid_targets_min": 2587
},
{
"epoch": 1.7877758913412563,
"grad_norm": 0.423490356907719,
"learning_rate": 3.713814632166117e-05,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05531451851129532,
"step": 1580,
"valid_targets_mean": 2700.6,
"valid_targets_min": 773
},
{
"epoch": 1.7934352009054897,
"grad_norm": 0.4459507286833836,
"learning_rate": 3.7108999386014094e-05,
"loss": 0.1187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06484959274530411,
"step": 1585,
"valid_targets_mean": 3615.9,
"valid_targets_min": 2962
},
{
"epoch": 1.7990945104697227,
"grad_norm": 0.5974029415055255,
"learning_rate": 3.707971633422192e-05,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06666037440299988,
"step": 1590,
"valid_targets_mean": 1766.6,
"valid_targets_min": 649
},
{
"epoch": 1.804753820033956,
"grad_norm": 0.5371457964206325,
"learning_rate": 3.705029739925539e-05,
"loss": 0.1221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06027115881443024,
"step": 1595,
"valid_targets_mean": 1668.4,
"valid_targets_min": 708
},
{
"epoch": 1.8104131295981891,
"grad_norm": 0.4105963034912273,
"learning_rate": 3.702074281516629e-05,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051896438002586365,
"step": 1600,
"valid_targets_mean": 2129.5,
"valid_targets_min": 617
},
{
"epoch": 1.8160724391624221,
"grad_norm": 0.4304740098082602,
"learning_rate": 3.699105281708562e-05,
"loss": 0.1141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05431009829044342,
"step": 1605,
"valid_targets_mean": 2495.0,
"valid_targets_min": 720
},
{
"epoch": 1.8217317487266553,
"grad_norm": 0.5735926965861751,
"learning_rate": 3.69612276412217e-05,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06785906851291656,
"step": 1610,
"valid_targets_mean": 1537.8,
"valid_targets_min": 628
},
{
"epoch": 1.8273910582908885,
"grad_norm": 0.5898530064935896,
"learning_rate": 3.693126752485833e-05,
"loss": 0.1319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10182633996009827,
"step": 1615,
"valid_targets_mean": 2155.2,
"valid_targets_min": 821
},
{
"epoch": 1.8330503678551215,
"grad_norm": 0.30947250284869365,
"learning_rate": 3.6901172706352804e-05,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03451775759458542,
"step": 1620,
"valid_targets_mean": 3628.1,
"valid_targets_min": 2863
},
{
"epoch": 1.838709677419355,
"grad_norm": 0.3690235938558517,
"learning_rate": 3.687094342513416e-05,
"loss": 0.1025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03967660665512085,
"step": 1625,
"valid_targets_mean": 3585.2,
"valid_targets_min": 1773
},
{
"epoch": 1.844368986983588,
"grad_norm": 0.4516985285671224,
"learning_rate": 3.6840579921701155e-05,
"loss": 0.1156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06410881876945496,
"step": 1630,
"valid_targets_mean": 2356.6,
"valid_targets_min": 721
},
{
"epoch": 1.8500282965478212,
"grad_norm": 0.359767615703714,
"learning_rate": 3.68100824376204e-05,
"loss": 0.0951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06105772778391838,
"step": 1635,
"valid_targets_mean": 5092.5,
"valid_targets_min": 4222
},
{
"epoch": 1.8556876061120544,
"grad_norm": 0.34713169199052546,
"learning_rate": 3.6779451215524425e-05,
"loss": 0.0952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05121070519089699,
"step": 1640,
"valid_targets_mean": 4604.0,
"valid_targets_min": 2020
},
{
"epoch": 1.8613469156762874,
"grad_norm": 0.3719471726084662,
"learning_rate": 3.6748686499109784e-05,
"loss": 0.1164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04059560224413872,
"step": 1645,
"valid_targets_mean": 3097.9,
"valid_targets_min": 739
},
{
"epoch": 1.8670062252405206,
"grad_norm": 0.4061457385537339,
"learning_rate": 3.6717788533135056e-05,
"loss": 0.135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058897800743579865,
"step": 1650,
"valid_targets_mean": 3696.1,
"valid_targets_min": 2945
},
{
"epoch": 1.8726655348047538,
"grad_norm": 0.3617521099651027,
"learning_rate": 3.6686757563418945e-05,
"loss": 0.1112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061327625066041946,
"step": 1655,
"valid_targets_mean": 3112.8,
"valid_targets_min": 704
},
{
"epoch": 1.8783248443689868,
"grad_norm": 0.3604517782802872,
"learning_rate": 3.665559383683832e-05,
"loss": 0.1148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05376065522432327,
"step": 1660,
"valid_targets_mean": 2490.9,
"valid_targets_min": 774
},
{
"epoch": 1.8839841539332203,
"grad_norm": 0.33553954553952914,
"learning_rate": 3.6624297601326205e-05,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043106965720653534,
"step": 1665,
"valid_targets_mean": 2570.2,
"valid_targets_min": 485
},
{
"epoch": 1.8896434634974533,
"grad_norm": 0.3897113819731708,
"learning_rate": 3.659286910586988e-05,
"loss": 0.1074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04850570484995842,
"step": 1670,
"valid_targets_mean": 3087.4,
"valid_targets_min": 1048
},
{
"epoch": 1.8953027730616865,
"grad_norm": 0.37895239456846863,
"learning_rate": 3.656130860050883e-05,
"loss": 0.119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052234359085559845,
"step": 1675,
"valid_targets_mean": 2753.6,
"valid_targets_min": 722
},
{
"epoch": 1.9009620826259197,
"grad_norm": 0.5106105258979503,
"learning_rate": 3.652961633633282e-05,
"loss": 0.1193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06938277184963226,
"step": 1680,
"valid_targets_mean": 1836.2,
"valid_targets_min": 865
},
{
"epoch": 1.9066213921901527,
"grad_norm": 0.521228149558116,
"learning_rate": 3.649779256547984e-05,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060481246560811996,
"step": 1685,
"valid_targets_mean": 2377.5,
"valid_targets_min": 675
},
{
"epoch": 1.912280701754386,
"grad_norm": 0.39880685753741063,
"learning_rate": 3.6465837541134114e-05,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0540006123483181,
"step": 1690,
"valid_targets_mean": 3323.0,
"valid_targets_min": 782
},
{
"epoch": 1.9179400113186191,
"grad_norm": 0.42108885956864084,
"learning_rate": 3.643375151752414e-05,
"loss": 0.1091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05214047059416771,
"step": 1695,
"valid_targets_mean": 2581.8,
"valid_targets_min": 795
},
{
"epoch": 1.9235993208828521,
"grad_norm": 0.4156569687453574,
"learning_rate": 3.6401534749920566e-05,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0582006499171257,
"step": 1700,
"valid_targets_mean": 3264.6,
"valid_targets_min": 2017
},
{
"epoch": 1.9292586304470856,
"grad_norm": 0.3723182247552374,
"learning_rate": 3.636918749463426e-05,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04763641208410263,
"step": 1705,
"valid_targets_mean": 2319.6,
"valid_targets_min": 798
},
{
"epoch": 1.9349179400113186,
"grad_norm": 0.3569396345560108,
"learning_rate": 3.633671000901422e-05,
"loss": 0.0985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05561841279268265,
"step": 1710,
"valid_targets_mean": 3299.6,
"valid_targets_min": 860
},
{
"epoch": 1.9405772495755518,
"grad_norm": 0.4168083888615434,
"learning_rate": 3.63041025514455e-05,
"loss": 0.1396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0583263598382473,
"step": 1715,
"valid_targets_mean": 3302.4,
"valid_targets_min": 878
},
{
"epoch": 1.946236559139785,
"grad_norm": 0.3357389283054348,
"learning_rate": 3.627136538134723e-05,
"loss": 0.0957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039092086255550385,
"step": 1720,
"valid_targets_mean": 3832.2,
"valid_targets_min": 2602
},
{
"epoch": 1.951895868704018,
"grad_norm": 0.4848350300498934,
"learning_rate": 3.623849875917049e-05,
"loss": 0.1133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06840664148330688,
"step": 1725,
"valid_targets_mean": 2736.5,
"valid_targets_min": 945
},
{
"epoch": 1.9575551782682514,
"grad_norm": 0.4192988003009786,
"learning_rate": 3.620550294639625e-05,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06918597221374512,
"step": 1730,
"valid_targets_mean": 3831.1,
"valid_targets_min": 3128
},
{
"epoch": 1.9632144878324844,
"grad_norm": 0.346024934816044,
"learning_rate": 3.6172378205533316e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05582546442747116,
"step": 1735,
"valid_targets_mean": 3966.2,
"valid_targets_min": 2529
},
{
"epoch": 1.9688737973967176,
"grad_norm": 0.3488468452500612,
"learning_rate": 3.613912480011621e-05,
"loss": 0.0953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06639085710048676,
"step": 1740,
"valid_targets_mean": 4704.8,
"valid_targets_min": 892
},
{
"epoch": 1.9745331069609509,
"grad_norm": 0.27640089567785464,
"learning_rate": 3.610574299470308e-05,
"loss": 0.1067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03565194457769394,
"step": 1745,
"valid_targets_mean": 4471.1,
"valid_targets_min": 1657
},
{
"epoch": 1.9801924165251839,
"grad_norm": 0.557304325917542,
"learning_rate": 3.6072233054873634e-05,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14241379499435425,
"step": 1750,
"valid_targets_mean": 1989.8,
"valid_targets_min": 709
},
{
"epoch": 1.985851726089417,
"grad_norm": 0.3099094861639918,
"learning_rate": 3.6038595247226946e-05,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04021911323070526,
"step": 1755,
"valid_targets_mean": 3226.5,
"valid_targets_min": 527
},
{
"epoch": 1.9915110356536503,
"grad_norm": 0.3484031043449807,
"learning_rate": 3.600482983937943e-05,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06430061161518097,
"step": 1760,
"valid_targets_mean": 3531.0,
"valid_targets_min": 2318
},
{
"epoch": 1.9971703452178833,
"grad_norm": 0.3315201233960109,
"learning_rate": 3.597093709996263e-05,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05331774055957794,
"step": 1765,
"valid_targets_mean": 3520.9,
"valid_targets_min": 2883
},
{
"epoch": 2.0022637238256933,
"grad_norm": 0.4650942658007115,
"learning_rate": 3.593691729862114e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10227910429239273,
"step": 1770,
"valid_targets_mean": 5904.0,
"valid_targets_min": 4967
},
{
"epoch": 2.0079230333899263,
"grad_norm": 0.3688430969903834,
"learning_rate": 3.5902770706010414e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11695493757724762,
"step": 1775,
"valid_targets_mean": 8641.4,
"valid_targets_min": 5164
},
{
"epoch": 2.0135823429541597,
"grad_norm": 0.36292308857695155,
"learning_rate": 3.586849759379466e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09385283291339874,
"step": 1780,
"valid_targets_mean": 6838.2,
"valid_targets_min": 5200
},
{
"epoch": 2.0192416525183927,
"grad_norm": 0.3826950676721889,
"learning_rate": 3.583409823464464e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07843857258558273,
"step": 1785,
"valid_targets_mean": 5411.6,
"valid_targets_min": 3853
},
{
"epoch": 2.0249009620826257,
"grad_norm": 0.39590639769636465,
"learning_rate": 3.5799572902235506e-05,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10466514527797699,
"step": 1790,
"valid_targets_mean": 5598.0,
"valid_targets_min": 4669
},
{
"epoch": 2.030560271646859,
"grad_norm": 0.42021932727305517,
"learning_rate": 3.576492187124465e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10257241129875183,
"step": 1795,
"valid_targets_mean": 5953.0,
"valid_targets_min": 4216
},
{
"epoch": 2.036219581211092,
"grad_norm": 0.3824309948575738,
"learning_rate": 3.5730145417349486e-05,
"loss": 0.1988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10280093550682068,
"step": 1800,
"valid_targets_mean": 5914.0,
"valid_targets_min": 4589
},
{
"epoch": 2.0418788907753256,
"grad_norm": 0.3774424672724206,
"learning_rate": 3.569524381722527e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09702812880277634,
"step": 1805,
"valid_targets_mean": 6515.4,
"valid_targets_min": 4588
},
{
"epoch": 2.0475382003395586,
"grad_norm": 0.3463163873793305,
"learning_rate": 3.5660217348542905e-05,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09045751392841339,
"step": 1810,
"valid_targets_mean": 7015.2,
"valid_targets_min": 4530
},
{
"epoch": 2.0531975099037916,
"grad_norm": 0.38005898031225666,
"learning_rate": 3.562506628996672e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10554981231689453,
"step": 1815,
"valid_targets_mean": 6202.6,
"valid_targets_min": 4837
},
{
"epoch": 2.058856819468025,
"grad_norm": 0.49281621300824496,
"learning_rate": 3.558979092115227e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.062259264290332794,
"step": 1820,
"valid_targets_mean": 1720.9,
"valid_targets_min": 229
},
{
"epoch": 2.064516129032258,
"grad_norm": 0.38979368137302145,
"learning_rate": 3.555439152274408e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09573017060756683,
"step": 1825,
"valid_targets_mean": 5963.8,
"valid_targets_min": 4216
},
{
"epoch": 2.0701754385964914,
"grad_norm": 0.37983119309515756,
"learning_rate": 3.551886837637346e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09074237197637558,
"step": 1830,
"valid_targets_mean": 5973.9,
"valid_targets_min": 4835
},
{
"epoch": 2.0758347481607244,
"grad_norm": 0.3558752312487743,
"learning_rate": 3.548322176465622e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0832388773560524,
"step": 1835,
"valid_targets_mean": 6669.8,
"valid_targets_min": 4995
},
{
"epoch": 2.0814940577249574,
"grad_norm": 0.44946142448140997,
"learning_rate": 3.544745197119042e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12601280212402344,
"step": 1840,
"valid_targets_mean": 5705.5,
"valid_targets_min": 4108
},
{
"epoch": 2.087153367289191,
"grad_norm": 0.4096707797369472,
"learning_rate": 3.541155928055418e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1199854165315628,
"step": 1845,
"valid_targets_mean": 6594.0,
"valid_targets_min": 4527
},
{
"epoch": 2.092812676853424,
"grad_norm": 0.4480155154525078,
"learning_rate": 3.537554397830331e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10273626446723938,
"step": 1850,
"valid_targets_mean": 3100.9,
"valid_targets_min": 2104
},
{
"epoch": 2.098471986417657,
"grad_norm": 0.376634058661012,
"learning_rate": 3.533940635096915e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08255627006292343,
"step": 1855,
"valid_targets_mean": 5817.8,
"valid_targets_min": 4757
},
{
"epoch": 2.1041312959818903,
"grad_norm": 0.40073821404298404,
"learning_rate": 3.530314668605621e-05,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11327770352363586,
"step": 1860,
"valid_targets_mean": 6333.0,
"valid_targets_min": 5056
},
{
"epoch": 2.1097906055461233,
"grad_norm": 0.3734001545981099,
"learning_rate": 3.5266765272039895e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08531501889228821,
"step": 1865,
"valid_targets_mean": 5956.0,
"valid_targets_min": 2834
},
{
"epoch": 2.1154499151103567,
"grad_norm": 0.3967893930386219,
"learning_rate": 3.523026239836426e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12767675518989563,
"step": 1870,
"valid_targets_mean": 6984.6,
"valid_targets_min": 5744
},
{
"epoch": 2.1211092246745897,
"grad_norm": 0.4034811625677781,
"learning_rate": 3.5193638355439635e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08648249506950378,
"step": 1875,
"valid_targets_mean": 7290.2,
"valid_targets_min": 5640
},
{
"epoch": 2.1267685342388227,
"grad_norm": 0.4225969920586299,
"learning_rate": 3.515689343464038e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09000758826732635,
"step": 1880,
"valid_targets_mean": 7036.0,
"valid_targets_min": 5210
},
{
"epoch": 2.132427843803056,
"grad_norm": 0.4180663507921894,
"learning_rate": 3.512002792830252e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1279435157775879,
"step": 1885,
"valid_targets_mean": 7138.5,
"valid_targets_min": 5292
},
{
"epoch": 2.138087153367289,
"grad_norm": 0.4082154228625417,
"learning_rate": 3.508304212972145e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10258790850639343,
"step": 1890,
"valid_targets_mean": 6134.2,
"valid_targets_min": 3531
},
{
"epoch": 2.143746462931522,
"grad_norm": 0.4001627333855726,
"learning_rate": 3.504593633314957e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1019192785024643,
"step": 1895,
"valid_targets_mean": 5968.2,
"valid_targets_min": 4640
},
{
"epoch": 2.1494057724957556,
"grad_norm": 0.3939812237785384,
"learning_rate": 3.500871083379398e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0974932610988617,
"step": 1900,
"valid_targets_mean": 6249.6,
"valid_targets_min": 4328
},
{
"epoch": 2.1550650820599886,
"grad_norm": 0.425061630606132,
"learning_rate": 3.497136592781411e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10714038461446762,
"step": 1905,
"valid_targets_mean": 6002.4,
"valid_targets_min": 3123
},
{
"epoch": 2.160724391624222,
"grad_norm": 0.3909594756495503,
"learning_rate": 3.493390191231937e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09464001655578613,
"step": 1910,
"valid_targets_mean": 6372.2,
"valid_targets_min": 4256
},
{
"epoch": 2.166383701188455,
"grad_norm": 0.4753346300038162,
"learning_rate": 3.4896319085366764e-05,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10602079331874847,
"step": 1915,
"valid_targets_mean": 5927.8,
"valid_targets_min": 4753
},
{
"epoch": 2.172043010752688,
"grad_norm": 0.40365757025068216,
"learning_rate": 3.485861774595857e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09577983617782593,
"step": 1920,
"valid_targets_mean": 6106.1,
"valid_targets_min": 5370
},
{
"epoch": 2.1777023203169215,
"grad_norm": 0.4429082540303591,
"learning_rate": 3.482079819403991e-05,
"loss": 0.198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10737248510122299,
"step": 1925,
"valid_targets_mean": 6240.6,
"valid_targets_min": 4608
},
{
"epoch": 2.1833616298811545,
"grad_norm": 0.4604460702396511,
"learning_rate": 3.4782860730496385e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09162674099206924,
"step": 1930,
"valid_targets_mean": 5733.2,
"valid_targets_min": 3801
},
{
"epoch": 2.1890209394453874,
"grad_norm": 0.38939580594223905,
"learning_rate": 3.474480565715168e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10398145765066147,
"step": 1935,
"valid_targets_mean": 6430.1,
"valid_targets_min": 4754
},
{
"epoch": 2.194680249009621,
"grad_norm": 0.33698859572698064,
"learning_rate": 3.470663327676517e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0752083882689476,
"step": 1940,
"valid_targets_mean": 7375.2,
"valid_targets_min": 6417
},
{
"epoch": 2.200339558573854,
"grad_norm": 0.4562817386757838,
"learning_rate": 3.466834389302951e-05,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1071748435497284,
"step": 1945,
"valid_targets_mean": 6281.0,
"valid_targets_min": 3468
},
{
"epoch": 2.2059988681380873,
"grad_norm": 0.4019776315767542,
"learning_rate": 3.4629937810568185e-05,
"loss": 0.1965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09497380256652832,
"step": 1950,
"valid_targets_mean": 6532.4,
"valid_targets_min": 5221
},
{
"epoch": 2.2116581777023203,
"grad_norm": 0.49926857648549444,
"learning_rate": 3.459141533493315e-05,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08050023019313812,
"step": 1955,
"valid_targets_mean": 5552.6,
"valid_targets_min": 4438
},
{
"epoch": 2.2173174872665533,
"grad_norm": 0.4249799624141297,
"learning_rate": 3.455277677260231e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10170389711856842,
"step": 1960,
"valid_targets_mean": 5878.1,
"valid_targets_min": 3915
},
{
"epoch": 2.2229767968307867,
"grad_norm": 0.3284937764800396,
"learning_rate": 3.451402243097721e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07613489031791687,
"step": 1965,
"valid_targets_mean": 7082.6,
"valid_targets_min": 4135
},
{
"epoch": 2.2286361063950197,
"grad_norm": 0.4244872944881361,
"learning_rate": 3.4475152618380456e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0987371951341629,
"step": 1970,
"valid_targets_mean": 5936.4,
"valid_targets_min": 3947
},
{
"epoch": 2.234295415959253,
"grad_norm": 0.40889945828872726,
"learning_rate": 3.443616764405334e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12065830081701279,
"step": 1975,
"valid_targets_mean": 6836.2,
"valid_targets_min": 4865
},
{
"epoch": 2.239954725523486,
"grad_norm": 0.5840265740345978,
"learning_rate": 3.4397067818153345e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09379205107688904,
"step": 1980,
"valid_targets_mean": 6539.4,
"valid_targets_min": 4643
},
{
"epoch": 2.245614035087719,
"grad_norm": 0.37861827661541286,
"learning_rate": 3.435785345175173e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09451638907194138,
"step": 1985,
"valid_targets_mean": 6613.6,
"valid_targets_min": 4959
},
{
"epoch": 2.2512733446519526,
"grad_norm": 0.39489041786405854,
"learning_rate": 3.431852485683098e-05,
"loss": 0.2048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10732698440551758,
"step": 1990,
"valid_targets_mean": 6044.1,
"valid_targets_min": 4652
},
{
"epoch": 2.2569326542161856,
"grad_norm": 0.38898383798039116,
"learning_rate": 3.4279082346282396e-05,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0827295109629631,
"step": 1995,
"valid_targets_mean": 5893.9,
"valid_targets_min": 4938
},
{
"epoch": 2.2625919637804186,
"grad_norm": 0.376704751319281,
"learning_rate": 3.423952623390352e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07669830322265625,
"step": 2000,
"valid_targets_mean": 5849.6,
"valid_targets_min": 4546
},
{
"epoch": 2.268251273344652,
"grad_norm": 0.3910964440500796,
"learning_rate": 3.419985683439574e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08727534115314484,
"step": 2005,
"valid_targets_mean": 5751.5,
"valid_targets_min": 3200
},
{
"epoch": 2.273910582908885,
"grad_norm": 0.37774305187779456,
"learning_rate": 3.416007446336172e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09513689577579498,
"step": 2010,
"valid_targets_mean": 6149.6,
"valid_targets_min": 5010
},
{
"epoch": 2.279569892473118,
"grad_norm": 0.7245046622730861,
"learning_rate": 3.4120179437302885e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10477955639362335,
"step": 2015,
"valid_targets_mean": 6551.2,
"valid_targets_min": 4904
},
{
"epoch": 2.2852292020373515,
"grad_norm": 0.43974321457580223,
"learning_rate": 3.408017207361696e-05,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13391438126564026,
"step": 2020,
"valid_targets_mean": 5728.9,
"valid_targets_min": 4812
},
{
"epoch": 2.2908885116015845,
"grad_norm": 0.4190046872972955,
"learning_rate": 3.4040052690595376e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07912546396255493,
"step": 2025,
"valid_targets_mean": 5047.9,
"valid_targets_min": 3629
},
{
"epoch": 2.296547821165818,
"grad_norm": 0.4117794454695208,
"learning_rate": 3.399982160742079e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09514860808849335,
"step": 2030,
"valid_targets_mean": 6260.0,
"valid_targets_min": 4324
},
{
"epoch": 2.302207130730051,
"grad_norm": 0.3485537640844097,
"learning_rate": 3.3959479144164515e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08208595216274261,
"step": 2035,
"valid_targets_mean": 7853.1,
"valid_targets_min": 4920
},
{
"epoch": 2.3078664402942843,
"grad_norm": 0.40215304288985815,
"learning_rate": 3.3919025621783996e-05,
"loss": 0.1973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08957590162754059,
"step": 2040,
"valid_targets_mean": 6231.0,
"valid_targets_min": 4882
},
{
"epoch": 2.3135257498585173,
"grad_norm": 0.3994007707086233,
"learning_rate": 3.387846136212022e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08934713900089264,
"step": 2045,
"valid_targets_mean": 7472.9,
"valid_targets_min": 3943
},
{
"epoch": 2.3191850594227503,
"grad_norm": 0.39411875696086646,
"learning_rate": 3.3837786687895214e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09899666160345078,
"step": 2050,
"valid_targets_mean": 6840.2,
"valid_targets_min": 5034
},
{
"epoch": 2.3248443689869838,
"grad_norm": 0.41432286699353016,
"learning_rate": 3.3797001922709416e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09966832399368286,
"step": 2055,
"valid_targets_mean": 6458.5,
"valid_targets_min": 4461
},
{
"epoch": 2.3305036785512168,
"grad_norm": 0.3696592168950713,
"learning_rate": 3.375610739103913e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0865120217204094,
"step": 2060,
"valid_targets_mean": 6645.4,
"valid_targets_min": 5188
},
{
"epoch": 2.3361629881154498,
"grad_norm": 0.38218748203757885,
"learning_rate": 3.371510341823396e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09908951073884964,
"step": 2065,
"valid_targets_mean": 6002.9,
"valid_targets_min": 5009
},
{
"epoch": 2.341822297679683,
"grad_norm": 0.4216291403746872,
"learning_rate": 3.3673990330514197e-05,
"loss": 0.2348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10168929398059845,
"step": 2070,
"valid_targets_mean": 6025.9,
"valid_targets_min": 4551
},
{
"epoch": 2.347481607243916,
"grad_norm": 0.38801428996393683,
"learning_rate": 3.363276845496822e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09701313078403473,
"step": 2075,
"valid_targets_mean": 7210.0,
"valid_targets_min": 4492
},
{
"epoch": 2.353140916808149,
"grad_norm": 0.38850555570599626,
"learning_rate": 3.359143811954992e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09031613916158676,
"step": 2080,
"valid_targets_mean": 7051.4,
"valid_targets_min": 4718
},
{
"epoch": 2.3588002263723826,
"grad_norm": 0.38719154647188286,
"learning_rate": 3.354999965307606e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09918487071990967,
"step": 2085,
"valid_targets_mean": 6686.0,
"valid_targets_min": 4827
},
{
"epoch": 2.3644595359366156,
"grad_norm": 0.36238981373390344,
"learning_rate": 3.3508453385223684e-05,
"loss": 0.1879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0751459077000618,
"step": 2090,
"valid_targets_mean": 5311.9,
"valid_targets_min": 3828
},
{
"epoch": 2.370118845500849,
"grad_norm": 0.39766759905835697,
"learning_rate": 3.346679964652749e-05,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07942270487546921,
"step": 2095,
"valid_targets_mean": 7078.9,
"valid_targets_min": 4594
},
{
"epoch": 2.375778155065082,
"grad_norm": 0.39459968327080425,
"learning_rate": 3.342503876837718e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07656831294298172,
"step": 2100,
"valid_targets_mean": 6393.8,
"valid_targets_min": 4509
},
{
"epoch": 2.381437464629315,
"grad_norm": 0.3758001299296689,
"learning_rate": 3.3383171083014856e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10427580773830414,
"step": 2105,
"valid_targets_mean": 7848.9,
"valid_targets_min": 5649
},
{
"epoch": 2.3870967741935485,
"grad_norm": 0.3903744879220785,
"learning_rate": 3.3341196923532336e-05,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07996858656406403,
"step": 2110,
"valid_targets_mean": 6623.4,
"valid_targets_min": 4343
},
{
"epoch": 2.3927560837577815,
"grad_norm": 0.3953141794689289,
"learning_rate": 3.329911662386855e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08288268744945526,
"step": 2115,
"valid_targets_mean": 6255.9,
"valid_targets_min": 4660
},
{
"epoch": 2.398415393322015,
"grad_norm": 0.34363852176252085,
"learning_rate": 3.3256930518806845e-05,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09071113914251328,
"step": 2120,
"valid_targets_mean": 8243.0,
"valid_targets_min": 6281
},
{
"epoch": 2.404074702886248,
"grad_norm": 0.360214785751071,
"learning_rate": 3.321463894397235e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08923101425170898,
"step": 2125,
"valid_targets_mean": 7083.5,
"valid_targets_min": 4657
},
{
"epoch": 2.409734012450481,
"grad_norm": 0.4200445006113312,
"learning_rate": 3.317224223582927e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10604465007781982,
"step": 2130,
"valid_targets_mean": 6399.8,
"valid_targets_min": 5098
},
{
"epoch": 2.4153933220147144,
"grad_norm": 0.46264235033494944,
"learning_rate": 3.312974073167825e-05,
"loss": 0.1899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10362359136343002,
"step": 2135,
"valid_targets_mean": 5257.4,
"valid_targets_min": 1879
},
{
"epoch": 2.4210526315789473,
"grad_norm": 0.43111753430771954,
"learning_rate": 3.30871347696537e-05,
"loss": 0.192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10390962660312653,
"step": 2140,
"valid_targets_mean": 5260.5,
"valid_targets_min": 3619
},
{
"epoch": 2.4267119411431803,
"grad_norm": 0.41865096806641583,
"learning_rate": 3.3044424688721016e-05,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06864843517541885,
"step": 2145,
"valid_targets_mean": 3976.1,
"valid_targets_min": 3545
},
{
"epoch": 2.432371250707414,
"grad_norm": 0.3573869762021644,
"learning_rate": 3.300161082867398e-05,
"loss": 0.1091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04815223067998886,
"step": 2150,
"valid_targets_mean": 3099.4,
"valid_targets_min": 1024
},
{
"epoch": 2.4380305602716468,
"grad_norm": 0.34190173531670653,
"learning_rate": 3.295869353013204e-05,
"loss": 0.0982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02967439591884613,
"step": 2155,
"valid_targets_mean": 3441.1,
"valid_targets_min": 2927
},
{
"epoch": 2.44368986983588,
"grad_norm": 0.43983243600032806,
"learning_rate": 3.291567313453754e-05,
"loss": 0.1198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07892259210348129,
"step": 2160,
"valid_targets_mean": 3442.0,
"valid_targets_min": 2213
},
{
"epoch": 2.449349179400113,
"grad_norm": 0.46751571452574264,
"learning_rate": 3.287254998415308e-05,
"loss": 0.0987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060992803424596786,
"step": 2165,
"valid_targets_mean": 2907.4,
"valid_targets_min": 1134
},
{
"epoch": 2.455008488964346,
"grad_norm": 0.4395489284393833,
"learning_rate": 3.282932442205875e-05,
"loss": 0.1062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06305012106895447,
"step": 2170,
"valid_targets_mean": 2523.4,
"valid_targets_min": 663
},
{
"epoch": 2.4606677985285796,
"grad_norm": 0.6628613828680201,
"learning_rate": 3.2785996792149397e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07510661333799362,
"step": 2175,
"valid_targets_mean": 1893.8,
"valid_targets_min": 535
},
{
"epoch": 2.4663271080928126,
"grad_norm": 0.4089669303969591,
"learning_rate": 3.274256743913192e-05,
"loss": 0.1036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04284790903329849,
"step": 2180,
"valid_targets_mean": 1971.8,
"valid_targets_min": 811
},
{
"epoch": 2.471986417657046,
"grad_norm": 0.4732750376584821,
"learning_rate": 3.2699036708522486e-05,
"loss": 0.1234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07278202474117279,
"step": 2185,
"valid_targets_mean": 2785.5,
"valid_targets_min": 2392
},
{
"epoch": 2.477645727221279,
"grad_norm": 0.2586276180787425,
"learning_rate": 3.265540494664383e-05,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032237522304058075,
"step": 2190,
"valid_targets_mean": 4540.6,
"valid_targets_min": 3285
},
{
"epoch": 2.483305036785512,
"grad_norm": 0.373237775006757,
"learning_rate": 3.261167250062246e-05,
"loss": 0.097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0476677343249321,
"step": 2195,
"valid_targets_mean": 2926.8,
"valid_targets_min": 764
},
{
"epoch": 2.4889643463497455,
"grad_norm": 0.3674744465113664,
"learning_rate": 3.25678397183859e-05,
"loss": 0.1021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056619517505168915,
"step": 2200,
"valid_targets_mean": 3378.6,
"valid_targets_min": 1290
},
{
"epoch": 2.4946236559139785,
"grad_norm": 0.4594754544351409,
"learning_rate": 3.252390694865995e-05,
"loss": 0.0997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057963818311691284,
"step": 2205,
"valid_targets_mean": 2432.4,
"valid_targets_min": 720
},
{
"epoch": 2.5002829654782115,
"grad_norm": 0.3192949581204995,
"learning_rate": 3.247987454096588e-05,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04614349454641342,
"step": 2210,
"valid_targets_mean": 3896.0,
"valid_targets_min": 2336
},
{
"epoch": 2.505942275042445,
"grad_norm": 0.33644471032634066,
"learning_rate": 3.2435742845617664e-05,
"loss": 0.0947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04669766128063202,
"step": 2215,
"valid_targets_mean": 2912.5,
"valid_targets_min": 1049
},
{
"epoch": 2.511601584606678,
"grad_norm": 0.34479623408810645,
"learning_rate": 3.2391512213719195e-05,
"loss": 0.1078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0345931239426136,
"step": 2220,
"valid_targets_mean": 3087.8,
"valid_targets_min": 1086
},
{
"epoch": 2.517260894170911,
"grad_norm": 0.36688535674523926,
"learning_rate": 3.23471829971615e-05,
"loss": 0.0884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04897375777363777,
"step": 2225,
"valid_targets_mean": 3296.5,
"valid_targets_min": 732
},
{
"epoch": 2.5229202037351444,
"grad_norm": 0.5957001879370355,
"learning_rate": 3.230275554861988e-05,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07079662382602692,
"step": 2230,
"valid_targets_mean": 1688.5,
"valid_targets_min": 770
},
{
"epoch": 2.5285795132993774,
"grad_norm": 0.43461041178958076,
"learning_rate": 3.2258230221551216e-05,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04917736351490021,
"step": 2235,
"valid_targets_mean": 2574.8,
"valid_targets_min": 592
},
{
"epoch": 2.534238822863611,
"grad_norm": 0.42565232202035636,
"learning_rate": 3.221360737019105e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055679723620414734,
"step": 2240,
"valid_targets_mean": 3089.1,
"valid_targets_min": 2224
},
{
"epoch": 2.539898132427844,
"grad_norm": 0.4171403916689987,
"learning_rate": 3.216888734955082e-05,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042909517884254456,
"step": 2245,
"valid_targets_mean": 2364.5,
"valid_targets_min": 511
},
{
"epoch": 2.5455574419920772,
"grad_norm": 0.4453123084365863,
"learning_rate": 3.2124070515415026e-05,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06102481111884117,
"step": 2250,
"valid_targets_mean": 3775.5,
"valid_targets_min": 2328
},
{
"epoch": 2.5512167515563102,
"grad_norm": 0.3935444374091009,
"learning_rate": 3.20791572243384e-05,
"loss": 0.0943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043448153883218765,
"step": 2255,
"valid_targets_mean": 2867.1,
"valid_targets_min": 669
},
{
"epoch": 2.556876061120543,
"grad_norm": 0.6248731534527211,
"learning_rate": 3.2034147833643085e-05,
"loss": 0.1241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07770198583602905,
"step": 2260,
"valid_targets_mean": 1722.5,
"valid_targets_min": 802
},
{
"epoch": 2.5625353706847767,
"grad_norm": 0.6695756417777585,
"learning_rate": 3.1989042701415735e-05,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07981681078672409,
"step": 2265,
"valid_targets_mean": 1527.9,
"valid_targets_min": 357
},
{
"epoch": 2.5681946802490097,
"grad_norm": 0.37224281178132096,
"learning_rate": 3.194384218650475e-05,
"loss": 0.112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05012982338666916,
"step": 2270,
"valid_targets_mean": 3831.6,
"valid_targets_min": 2808
},
{
"epoch": 2.5738539898132426,
"grad_norm": 0.500568844305321,
"learning_rate": 3.1898546648517344e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13740640878677368,
"step": 2275,
"valid_targets_mean": 2953.2,
"valid_targets_min": 652
},
{
"epoch": 2.579513299377476,
"grad_norm": 0.3736709958108341,
"learning_rate": 3.185315644781674e-05,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05496054142713547,
"step": 2280,
"valid_targets_mean": 3963.6,
"valid_targets_min": 3573
},
{
"epoch": 2.585172608941709,
"grad_norm": 0.5090649187854307,
"learning_rate": 3.1807671945519275e-05,
"loss": 0.1208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06333998590707779,
"step": 2285,
"valid_targets_mean": 2137.1,
"valid_targets_min": 822
},
{
"epoch": 2.590831918505942,
"grad_norm": 0.5165232888652537,
"learning_rate": 3.1762093503491515e-05,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16781306266784668,
"step": 2290,
"valid_targets_mean": 2582.1,
"valid_targets_min": 965
},
{
"epoch": 2.5964912280701755,
"grad_norm": 0.3296689482507935,
"learning_rate": 3.171642148434743e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043995440006256104,
"step": 2295,
"valid_targets_mean": 4182.0,
"valid_targets_min": 636
},
{
"epoch": 2.6021505376344085,
"grad_norm": 0.399676787291068,
"learning_rate": 3.167065625144544e-05,
"loss": 0.0972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07242860645055771,
"step": 2300,
"valid_targets_mean": 4735.0,
"valid_targets_min": 2733
},
{
"epoch": 2.6078098471986415,
"grad_norm": 0.3909386303098651,
"learning_rate": 3.1624798168885566e-05,
"loss": 0.1069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0652426928281784,
"step": 2305,
"valid_targets_mean": 4307.1,
"valid_targets_min": 2571
},
{
"epoch": 2.613469156762875,
"grad_norm": 0.30890902026855777,
"learning_rate": 3.157884760150653e-05,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03641439974308014,
"step": 2310,
"valid_targets_mean": 3207.2,
"valid_targets_min": 970
},
{
"epoch": 2.619128466327108,
"grad_norm": 0.41688683844062174,
"learning_rate": 3.153280491488285e-05,
"loss": 0.0973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038325291126966476,
"step": 2315,
"valid_targets_mean": 2923.8,
"valid_targets_min": 748
},
{
"epoch": 2.6247877758913414,
"grad_norm": 0.4141664805039355,
"learning_rate": 3.148667047532191e-05,
"loss": 0.099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06093056499958038,
"step": 2320,
"valid_targets_mean": 3834.1,
"valid_targets_min": 3568
},
{
"epoch": 2.6304470854555744,
"grad_norm": 0.5296100301519969,
"learning_rate": 3.1440444649861084e-05,
"loss": 0.1014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05555908381938934,
"step": 2325,
"valid_targets_mean": 2406.8,
"valid_targets_min": 1820
},
{
"epoch": 2.636106395019808,
"grad_norm": 0.4344050252582694,
"learning_rate": 3.139412780626478e-05,
"loss": 0.0865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0589946024119854,
"step": 2330,
"valid_targets_mean": 2587.6,
"valid_targets_min": 772
},
{
"epoch": 2.641765704584041,
"grad_norm": 0.4764837983611368,
"learning_rate": 3.134772031302156e-05,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07396160066127777,
"step": 2335,
"valid_targets_mean": 3260.0,
"valid_targets_min": 1289
},
{
"epoch": 2.647425014148274,
"grad_norm": 0.37816499084386906,
"learning_rate": 3.130122253934113e-05,
"loss": 0.08,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045197054743766785,
"step": 2340,
"valid_targets_mean": 3723.0,
"valid_targets_min": 3122
},
{
"epoch": 2.6530843237125072,
"grad_norm": 0.3706727023566082,
"learning_rate": 3.125463485515149e-05,
"loss": 0.0921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049566566944122314,
"step": 2345,
"valid_targets_mean": 3712.5,
"valid_targets_min": 1451
},
{
"epoch": 2.6587436332767402,
"grad_norm": 0.3661474166395112,
"learning_rate": 3.1207957631095944e-05,
"loss": 0.0876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04905054345726967,
"step": 2350,
"valid_targets_mean": 3632.8,
"valid_targets_min": 792
},
{
"epoch": 2.6644029428409732,
"grad_norm": 0.47433911573934034,
"learning_rate": 3.116119123853014e-05,
"loss": 0.1083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044324200600385666,
"step": 2355,
"valid_targets_mean": 1992.4,
"valid_targets_min": 795
},
{
"epoch": 2.6700622524052067,
"grad_norm": 0.3405483587292372,
"learning_rate": 3.1114336049519165e-05,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048648297786712646,
"step": 2360,
"valid_targets_mean": 3431.4,
"valid_targets_min": 1196
},
{
"epoch": 2.6757215619694397,
"grad_norm": 0.528089751667171,
"learning_rate": 3.106739243683453e-05,
"loss": 0.1259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05340038612484932,
"step": 2365,
"valid_targets_mean": 1836.1,
"valid_targets_min": 575
},
{
"epoch": 2.6813808715336727,
"grad_norm": 0.655807946929079,
"learning_rate": 3.1020360773951225e-05,
"loss": 0.1159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08533156663179398,
"step": 2370,
"valid_targets_mean": 1908.8,
"valid_targets_min": 609
},
{
"epoch": 2.687040181097906,
"grad_norm": 0.479137600509888,
"learning_rate": 3.097324143504479e-05,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0396895632147789,
"step": 2375,
"valid_targets_mean": 1497.2,
"valid_targets_min": 542
},
{
"epoch": 2.692699490662139,
"grad_norm": 0.35572554367136605,
"learning_rate": 3.092603479498826e-05,
"loss": 0.1389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046362824738025665,
"step": 2380,
"valid_targets_mean": 3701.8,
"valid_targets_min": 2440
},
{
"epoch": 2.6983588002263725,
"grad_norm": 0.4294308993861767,
"learning_rate": 3.087874122934924e-05,
"loss": 0.1059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03990578651428223,
"step": 2385,
"valid_targets_mean": 1648.2,
"valid_targets_min": 629
},
{
"epoch": 2.7040181097906055,
"grad_norm": 0.5487991767733832,
"learning_rate": 3.0831361114386905e-05,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05739689990878105,
"step": 2390,
"valid_targets_mean": 3953.0,
"valid_targets_min": 3701
},
{
"epoch": 2.709677419354839,
"grad_norm": 0.42836710916085596,
"learning_rate": 3.078389482704897e-05,
"loss": 0.1096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05183224380016327,
"step": 2395,
"valid_targets_mean": 1700.9,
"valid_targets_min": 485
},
{
"epoch": 2.715336728919072,
"grad_norm": 0.47163155795442635,
"learning_rate": 3.0736342744968764e-05,
"loss": 0.1038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0850541889667511,
"step": 2400,
"valid_targets_mean": 2381.9,
"valid_targets_min": 605
},
{
"epoch": 2.720996038483305,
"grad_norm": 0.3348814947703484,
"learning_rate": 3.068870524646215e-05,
"loss": 0.0907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03373149782419205,
"step": 2405,
"valid_targets_mean": 2713.5,
"valid_targets_min": 848
},
{
"epoch": 2.7266553480475384,
"grad_norm": 0.31717139487830104,
"learning_rate": 3.064098271052457e-05,
"loss": 0.0912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04711340367794037,
"step": 2410,
"valid_targets_mean": 5106.4,
"valid_targets_min": 4456
},
{
"epoch": 2.7323146576117714,
"grad_norm": 0.37159333535295175,
"learning_rate": 3.059317551682801e-05,
"loss": 0.0948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05447401478886604,
"step": 2415,
"valid_targets_mean": 3905.5,
"valid_targets_min": 1864
},
{
"epoch": 2.7379739671760044,
"grad_norm": 0.36008589768281596,
"learning_rate": 3.0545284045717956e-05,
"loss": 0.1091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04373928904533386,
"step": 2420,
"valid_targets_mean": 3313.8,
"valid_targets_min": 1361
},
{
"epoch": 2.743633276740238,
"grad_norm": 0.41946488267172877,
"learning_rate": 3.0497308678210413e-05,
"loss": 0.1078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05137067288160324,
"step": 2425,
"valid_targets_mean": 3500.1,
"valid_targets_min": 1814
},
{
"epoch": 2.749292586304471,
"grad_norm": 0.4741519627348511,
"learning_rate": 3.044924979598882e-05,
"loss": 0.1162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049934521317481995,
"step": 2430,
"valid_targets_mean": 1559.0,
"valid_targets_min": 759
},
{
"epoch": 2.754951895868704,
"grad_norm": 0.3075634231736509,
"learning_rate": 3.0401107781401092e-05,
"loss": 0.0835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039611075073480606,
"step": 2435,
"valid_targets_mean": 3942.6,
"valid_targets_min": 2719
},
{
"epoch": 2.7606112054329373,
"grad_norm": 0.5009109914391133,
"learning_rate": 3.0352883017456497e-05,
"loss": 0.1061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040671542286872864,
"step": 2440,
"valid_targets_mean": 1133.4,
"valid_targets_min": 664
},
{
"epoch": 2.7662705149971702,
"grad_norm": 0.35783834790167424,
"learning_rate": 3.0304575887822635e-05,
"loss": 0.1039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03562743961811066,
"step": 2445,
"valid_targets_mean": 2489.8,
"valid_targets_min": 1584
},
{
"epoch": 2.7719298245614032,
"grad_norm": 0.36757407384846696,
"learning_rate": 3.0256186776822415e-05,
"loss": 0.0836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0379403755068779,
"step": 2450,
"valid_targets_mean": 2685.4,
"valid_targets_min": 1003
},
{
"epoch": 2.7775891341256367,
"grad_norm": 0.3558843724226644,
"learning_rate": 3.0207716069430968e-05,
"loss": 0.1064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04235576093196869,
"step": 2455,
"valid_targets_mean": 3180.8,
"valid_targets_min": 560
},
{
"epoch": 2.7832484436898697,
"grad_norm": 0.36637576971355346,
"learning_rate": 3.015916415127259e-05,
"loss": 0.1036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05197940021753311,
"step": 2460,
"valid_targets_mean": 3285.9,
"valid_targets_min": 1049
},
{
"epoch": 2.788907753254103,
"grad_norm": 0.48073478238853684,
"learning_rate": 3.011053140861768e-05,
"loss": 0.1218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06219557300209999,
"step": 2465,
"valid_targets_mean": 2464.9,
"valid_targets_min": 771
},
{
"epoch": 2.794567062818336,
"grad_norm": 0.4222816152964138,
"learning_rate": 3.006181822837964e-05,
"loss": 0.1025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0535898320376873,
"step": 2470,
"valid_targets_mean": 2959.5,
"valid_targets_min": 825
},
{
"epoch": 2.8002263723825696,
"grad_norm": 0.5137217888589967,
"learning_rate": 3.0013024998111856e-05,
"loss": 0.116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06423379480838776,
"step": 2475,
"valid_targets_mean": 2602.1,
"valid_targets_min": 829
},
{
"epoch": 2.8058856819468025,
"grad_norm": 0.6608430897923827,
"learning_rate": 2.9964152106004546e-05,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.062066759914159775,
"step": 2480,
"valid_targets_mean": 2106.1,
"valid_targets_min": 650
},
{
"epoch": 2.8115449915110355,
"grad_norm": 0.4491563125079627,
"learning_rate": 2.9915199940881723e-05,
"loss": 0.1081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060543835163116455,
"step": 2485,
"valid_targets_mean": 2946.0,
"valid_targets_min": 729
},
{
"epoch": 2.817204301075269,
"grad_norm": 0.2901989643151657,
"learning_rate": 2.9866168892198067e-05,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03691372275352478,
"step": 2490,
"valid_targets_mean": 3853.5,
"valid_targets_min": 3152
},
{
"epoch": 2.822863610639502,
"grad_norm": 0.31715286077111987,
"learning_rate": 2.9817059350035858e-05,
"loss": 0.0958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03336600959300995,
"step": 2495,
"valid_targets_mean": 3448.2,
"valid_targets_min": 2543
},
{
"epoch": 2.828522920203735,
"grad_norm": 0.44423757895685106,
"learning_rate": 2.9767871705101834e-05,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05750303715467453,
"step": 2500,
"valid_targets_mean": 2674.9,
"valid_targets_min": 446
},
{
"epoch": 2.8341822297679684,
"grad_norm": 0.3714047560342441,
"learning_rate": 2.9718606348724135e-05,
"loss": 0.0877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042779020965099335,
"step": 2505,
"valid_targets_mean": 2807.6,
"valid_targets_min": 681
},
{
"epoch": 2.8398415393322014,
"grad_norm": 0.45565095764546504,
"learning_rate": 2.966926367284913e-05,
"loss": 0.0975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06783543527126312,
"step": 2510,
"valid_targets_mean": 5567.5,
"valid_targets_min": 3772
},
{
"epoch": 2.8455008488964344,
"grad_norm": 0.31870357464902527,
"learning_rate": 2.9619844070038336e-05,
"loss": 0.0965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04572061821818352,
"step": 2515,
"valid_targets_mean": 3662.4,
"valid_targets_min": 484
},
{
"epoch": 2.851160158460668,
"grad_norm": 0.28353049541003644,
"learning_rate": 2.957034793346531e-05,
"loss": 0.0819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035324037075042725,
"step": 2520,
"valid_targets_mean": 3900.0,
"valid_targets_min": 861
},
{
"epoch": 2.856819468024901,
"grad_norm": 0.41454732495960667,
"learning_rate": 2.9520775656912467e-05,
"loss": 0.0969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07399703562259674,
"step": 2525,
"valid_targets_mean": 4100.8,
"valid_targets_min": 3268
},
{
"epoch": 2.8624787775891343,
"grad_norm": 0.3594007437946367,
"learning_rate": 2.9471127634767992e-05,
"loss": 0.097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04679866135120392,
"step": 2530,
"valid_targets_mean": 3277.8,
"valid_targets_min": 559
},
{
"epoch": 2.8681380871533673,
"grad_norm": 0.38766671277978854,
"learning_rate": 2.9421404262022687e-05,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044593460857868195,
"step": 2535,
"valid_targets_mean": 2986.2,
"valid_targets_min": 689
},
{
"epoch": 2.8737973967176007,
"grad_norm": 0.5541215791435989,
"learning_rate": 2.9371605934266826e-05,
"loss": 0.1239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06732194870710373,
"step": 2540,
"valid_targets_mean": 1831.6,
"valid_targets_min": 616
},
{
"epoch": 2.8794567062818337,
"grad_norm": 0.4653944890140849,
"learning_rate": 2.9321733047687028e-05,
"loss": 0.0785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052152834832668304,
"step": 2545,
"valid_targets_mean": 2087.0,
"valid_targets_min": 602
},
{
"epoch": 2.8851160158460667,
"grad_norm": 0.3697902152532082,
"learning_rate": 2.9271785999063058e-05,
"loss": 0.1201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05232277512550354,
"step": 2550,
"valid_targets_mean": 3992.1,
"valid_targets_min": 3551
},
{
"epoch": 2.8907753254103,
"grad_norm": 0.4102298567601552,
"learning_rate": 2.922176518576473e-05,
"loss": 0.0956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03710225224494934,
"step": 2555,
"valid_targets_mean": 2115.1,
"valid_targets_min": 596
},
{
"epoch": 2.896434634974533,
"grad_norm": 0.3506315433787024,
"learning_rate": 2.9171671005748705e-05,
"loss": 0.1021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04065260291099548,
"step": 2560,
"valid_targets_mean": 3488.0,
"valid_targets_min": 799
},
{
"epoch": 2.902093944538766,
"grad_norm": 0.43876156646589926,
"learning_rate": 2.9121503857555337e-05,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0732661634683609,
"step": 2565,
"valid_targets_mean": 3078.9,
"valid_targets_min": 706
},
{
"epoch": 2.9077532541029996,
"grad_norm": 0.4989205776297815,
"learning_rate": 2.9071264140305504e-05,
"loss": 0.1475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05086730048060417,
"step": 2570,
"valid_targets_mean": 1957.6,
"valid_targets_min": 710
},
{
"epoch": 2.9134125636672326,
"grad_norm": 0.411276296598042,
"learning_rate": 2.9020952253697417e-05,
"loss": 0.1099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045306913554668427,
"step": 2575,
"valid_targets_mean": 3112.4,
"valid_targets_min": 647
},
{
"epoch": 2.9190718732314656,
"grad_norm": 0.5328660391020346,
"learning_rate": 2.8970568598003485e-05,
"loss": 0.1019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047358643263578415,
"step": 2580,
"valid_targets_mean": 1494.9,
"valid_targets_min": 716
},
{
"epoch": 2.924731182795699,
"grad_norm": 0.3852799501619404,
"learning_rate": 2.8920113574067063e-05,
"loss": 0.0956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05453154444694519,
"step": 2585,
"valid_targets_mean": 3669.5,
"valid_targets_min": 3122
},
{
"epoch": 2.930390492359932,
"grad_norm": 0.4503646099363286,
"learning_rate": 2.8869587583299315e-05,
"loss": 0.0979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051441676914691925,
"step": 2590,
"valid_targets_mean": 2399.1,
"valid_targets_min": 832
},
{
"epoch": 2.936049801924165,
"grad_norm": 0.5372867608649338,
"learning_rate": 2.8818991027676014e-05,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04305317997932434,
"step": 2595,
"valid_targets_mean": 1216.9,
"valid_targets_min": 635
},
{
"epoch": 2.9417091114883984,
"grad_norm": 0.40304566483129606,
"learning_rate": 2.876832430973432e-05,
"loss": 0.1187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048321161419153214,
"step": 2600,
"valid_targets_mean": 3078.1,
"valid_targets_min": 756
},
{
"epoch": 2.9473684210526314,
"grad_norm": 0.4502755032894269,
"learning_rate": 2.8717587832569598e-05,
"loss": 0.0881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059124238789081573,
"step": 2605,
"valid_targets_mean": 2387.1,
"valid_targets_min": 744
},
{
"epoch": 2.953027730616865,
"grad_norm": 0.3427640277748679,
"learning_rate": 2.8666781999832198e-05,
"loss": 0.0946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03376740589737892,
"step": 2610,
"valid_targets_mean": 2088.4,
"valid_targets_min": 529
},
{
"epoch": 2.958687040181098,
"grad_norm": 0.44946510033221493,
"learning_rate": 2.8615907215724266e-05,
"loss": 0.1061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06872159242630005,
"step": 2615,
"valid_targets_mean": 3932.1,
"valid_targets_min": 2017
},
{
"epoch": 2.9643463497453313,
"grad_norm": 0.2666267217286435,
"learning_rate": 2.8564963884996494e-05,
"loss": 0.0894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03546273708343506,
"step": 2620,
"valid_targets_mean": 4790.0,
"valid_targets_min": 516
},
{
"epoch": 2.9700056593095643,
"grad_norm": 0.364616438660843,
"learning_rate": 2.851395241294493e-05,
"loss": 0.088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041498977690935135,
"step": 2625,
"valid_targets_mean": 2245.1,
"valid_targets_min": 772
},
{
"epoch": 2.9756649688737973,
"grad_norm": 0.348973673917049,
"learning_rate": 2.8462873205407747e-05,
"loss": 0.0944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046205684542655945,
"step": 2630,
"valid_targets_mean": 3851.0,
"valid_targets_min": 2196
},
{
"epoch": 2.9813242784380307,
"grad_norm": 0.46190471072869965,
"learning_rate": 2.8411726668761998e-05,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13584215939044952,
"step": 2635,
"valid_targets_mean": 3094.1,
"valid_targets_min": 2759
},
{
"epoch": 2.9869835880022637,
"grad_norm": 0.3227746990944905,
"learning_rate": 2.8360513209920388e-05,
"loss": 0.1048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03658788651227951,
"step": 2640,
"valid_targets_mean": 3760.2,
"valid_targets_min": 3175
},
{
"epoch": 2.9926428975664967,
"grad_norm": 0.3837603633008106,
"learning_rate": 2.8309233236328074e-05,
"loss": 0.1043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03533530980348587,
"step": 2645,
"valid_targets_mean": 2446.5,
"valid_targets_min": 759
},
{
"epoch": 2.99830220713073,
"grad_norm": 0.4993258903053454,
"learning_rate": 2.8257887155959352e-05,
"loss": 0.1022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10851038992404938,
"step": 2650,
"valid_targets_mean": 2332.5,
"valid_targets_min": 927
},
{
"epoch": 3.0033955857385397,
"grad_norm": 0.4474466581519664,
"learning_rate": 2.8206475377314486e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08224907517433167,
"step": 2655,
"valid_targets_mean": 6116.6,
"valid_targets_min": 4858
},
{
"epoch": 3.009054895302773,
"grad_norm": 0.3834057659347809,
"learning_rate": 2.8154998309416404e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08942107111215591,
"step": 2660,
"valid_targets_mean": 6616.0,
"valid_targets_min": 4759
},
{
"epoch": 3.014714204867006,
"grad_norm": 0.38251126769579447,
"learning_rate": 2.8103456361807473e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08066676557064056,
"step": 2665,
"valid_targets_mean": 5258.1,
"valid_targets_min": 4373
},
{
"epoch": 3.0203735144312396,
"grad_norm": 0.400000478072429,
"learning_rate": 2.8051849944546225e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09580092132091522,
"step": 2670,
"valid_targets_mean": 5849.6,
"valid_targets_min": 4813
},
{
"epoch": 3.0260328239954726,
"grad_norm": 0.43763746681992655,
"learning_rate": 2.80001794682041e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09335286170244217,
"step": 2675,
"valid_targets_mean": 5604.5,
"valid_targets_min": 3983
},
{
"epoch": 3.0316921335597056,
"grad_norm": 0.48759592075455604,
"learning_rate": 2.7948445343862188e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08601689338684082,
"step": 2680,
"valid_targets_mean": 6438.2,
"valid_targets_min": 5154
},
{
"epoch": 3.037351443123939,
"grad_norm": 0.4005248763640473,
"learning_rate": 2.7896647983107952e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07797376066446304,
"step": 2685,
"valid_targets_mean": 5509.6,
"valid_targets_min": 5040
},
{
"epoch": 3.043010752688172,
"grad_norm": 0.4567820303407952,
"learning_rate": 2.784478779803194e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11923784762620926,
"step": 2690,
"valid_targets_mean": 6410.5,
"valid_targets_min": 5066
},
{
"epoch": 3.048670062252405,
"grad_norm": 0.4018410434737254,
"learning_rate": 2.7792865201224536e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07983622699975967,
"step": 2695,
"valid_targets_mean": 6616.2,
"valid_targets_min": 4500
},
{
"epoch": 3.0543293718166384,
"grad_norm": 0.42280164910105855,
"learning_rate": 2.7740880605772644e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10148809850215912,
"step": 2700,
"valid_targets_mean": 7507.6,
"valid_targets_min": 5455
},
{
"epoch": 3.0599886813808714,
"grad_norm": 0.40674098351312155,
"learning_rate": 2.7688834425256426e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09895728528499603,
"step": 2705,
"valid_targets_mean": 7383.8,
"valid_targets_min": 4715
},
{
"epoch": 3.065647990945105,
"grad_norm": 0.36990046485579053,
"learning_rate": 2.7636727073746015e-05,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0861731767654419,
"step": 2710,
"valid_targets_mean": 6624.9,
"valid_targets_min": 5315
},
{
"epoch": 3.071307300509338,
"grad_norm": 0.3662529670090019,
"learning_rate": 2.7584558965798183e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09385193884372711,
"step": 2715,
"valid_targets_mean": 7394.5,
"valid_targets_min": 4353
},
{
"epoch": 3.076966610073571,
"grad_norm": 0.476285721677575,
"learning_rate": 2.7532330516453094e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08194148540496826,
"step": 2720,
"valid_targets_mean": 6296.0,
"valid_targets_min": 4890
},
{
"epoch": 3.0826259196378043,
"grad_norm": 0.4001613005928641,
"learning_rate": 2.7480042141230963e-05,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0721985325217247,
"step": 2725,
"valid_targets_mean": 5848.5,
"valid_targets_min": 4560
},
{
"epoch": 3.0882852292020373,
"grad_norm": 0.4520142971167075,
"learning_rate": 2.7427694256128776e-05,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09193578362464905,
"step": 2730,
"valid_targets_mean": 5550.9,
"valid_targets_min": 3640
},
{
"epoch": 3.0939445387662703,
"grad_norm": 0.5140528274529098,
"learning_rate": 2.737528727761696e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09765416383743286,
"step": 2735,
"valid_targets_mean": 5894.4,
"valid_targets_min": 3967
},
{
"epoch": 3.0996038483305037,
"grad_norm": 0.3994772187194201,
"learning_rate": 2.7322821622636077e-05,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08106030523777008,
"step": 2740,
"valid_targets_mean": 6153.9,
"valid_targets_min": 4521
},
{
"epoch": 3.1052631578947367,
"grad_norm": 0.4273215647315338,
"learning_rate": 2.7270297708593517e-05,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08103308826684952,
"step": 2745,
"valid_targets_mean": 6440.5,
"valid_targets_min": 5067
},
{
"epoch": 3.11092246745897,
"grad_norm": 0.4133850486345733,
"learning_rate": 2.7217715953360166e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07770150154829025,
"step": 2750,
"valid_targets_mean": 6049.2,
"valid_targets_min": 4385
},
{
"epoch": 3.116581777023203,
"grad_norm": 0.34763851050877514,
"learning_rate": 2.716507677526707e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07968132197856903,
"step": 2755,
"valid_targets_mean": 7771.6,
"valid_targets_min": 4566
},
{
"epoch": 3.122241086587436,
"grad_norm": 0.3658412345569811,
"learning_rate": 2.711238059310215e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08296516537666321,
"step": 2760,
"valid_targets_mean": 6633.6,
"valid_targets_min": 5067
},
{
"epoch": 3.1279003961516696,
"grad_norm": 0.4022203908775496,
"learning_rate": 2.7059627826106817e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08426246792078018,
"step": 2765,
"valid_targets_mean": 6862.6,
"valid_targets_min": 5178
},
{
"epoch": 3.1335597057159026,
"grad_norm": 0.36101301045305095,
"learning_rate": 2.700681889397267e-05,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08576173335313797,
"step": 2770,
"valid_targets_mean": 6075.1,
"valid_targets_min": 3854
},
{
"epoch": 3.139219015280136,
"grad_norm": 0.38940482167263113,
"learning_rate": 2.6953954216838148e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.103759765625,
"step": 2775,
"valid_targets_mean": 6840.1,
"valid_targets_min": 4743
},
{
"epoch": 3.144878324844369,
"grad_norm": 0.42119432839413173,
"learning_rate": 2.6901034215285182e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11053457856178284,
"step": 2780,
"valid_targets_mean": 6480.9,
"valid_targets_min": 4761
},
{
"epoch": 3.150537634408602,
"grad_norm": 0.38769543749848867,
"learning_rate": 2.684805931033586e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08253707736730576,
"step": 2785,
"valid_targets_mean": 6224.5,
"valid_targets_min": 4789
},
{
"epoch": 3.1561969439728355,
"grad_norm": 0.4282214287537209,
"learning_rate": 2.679502992344907e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08985629677772522,
"step": 2790,
"valid_targets_mean": 6686.4,
"valid_targets_min": 5403
},
{
"epoch": 3.1618562535370685,
"grad_norm": 0.41290216643054406,
"learning_rate": 2.6741946476517146e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08517882227897644,
"step": 2795,
"valid_targets_mean": 6285.0,
"valid_targets_min": 4970
},
{
"epoch": 3.1675155631013014,
"grad_norm": 0.3814241100551298,
"learning_rate": 2.6688809391862523e-05,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09944672882556915,
"step": 2800,
"valid_targets_mean": 6926.9,
"valid_targets_min": 5299
},
{
"epoch": 3.173174872665535,
"grad_norm": 0.3698913524612867,
"learning_rate": 2.663561909223435e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08579894155263901,
"step": 2805,
"valid_targets_mean": 6121.8,
"valid_targets_min": 4951
},
{
"epoch": 3.178834182229768,
"grad_norm": 0.37507158309419764,
"learning_rate": 2.6582376000805165e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08966280519962311,
"step": 2810,
"valid_targets_mean": 8113.1,
"valid_targets_min": 4794
},
{
"epoch": 3.1844934917940013,
"grad_norm": 0.41938823779454215,
"learning_rate": 2.6529080541167495e-05,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09570719301700592,
"step": 2815,
"valid_targets_mean": 5281.6,
"valid_targets_min": 593
},
{
"epoch": 3.1901528013582343,
"grad_norm": 0.3576745054687525,
"learning_rate": 2.6475733137330507e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07610517740249634,
"step": 2820,
"valid_targets_mean": 7339.1,
"valid_targets_min": 4595
},
{
"epoch": 3.1958121109224673,
"grad_norm": 0.37485748388357865,
"learning_rate": 2.6422334213716624e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07846750319004059,
"step": 2825,
"valid_targets_mean": 6674.0,
"valid_targets_min": 5411
},
{
"epoch": 3.2014714204867007,
"grad_norm": 0.39479740390012996,
"learning_rate": 2.6368884195158143e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0896659716963768,
"step": 2830,
"valid_targets_mean": 6596.2,
"valid_targets_min": 4451
},
{
"epoch": 3.2071307300509337,
"grad_norm": 0.40341629615302077,
"learning_rate": 2.6315383506893876e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09459621459245682,
"step": 2835,
"valid_targets_mean": 7159.2,
"valid_targets_min": 5568
},
{
"epoch": 3.212790039615167,
"grad_norm": 0.3918402890328763,
"learning_rate": 2.6261832574565752e-05,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10028786957263947,
"step": 2840,
"valid_targets_mean": 6923.1,
"valid_targets_min": 4839
},
{
"epoch": 3.2184493491794,
"grad_norm": 0.44570531285265286,
"learning_rate": 2.6208231824215417e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07951401174068451,
"step": 2845,
"valid_targets_mean": 4921.4,
"valid_targets_min": 3517
},
{
"epoch": 3.224108658743633,
"grad_norm": 0.39736569597017907,
"learning_rate": 2.6154581682280892e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07940314710140228,
"step": 2850,
"valid_targets_mean": 5929.9,
"valid_targets_min": 3551
},
{
"epoch": 3.2297679683078666,
"grad_norm": 0.43576786309433435,
"learning_rate": 2.610088257559311e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07687495648860931,
"step": 2855,
"valid_targets_mean": 5854.9,
"valid_targets_min": 4614
},
{
"epoch": 3.2354272778720996,
"grad_norm": 0.39667426144543194,
"learning_rate": 2.604713493137259e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0954388827085495,
"step": 2860,
"valid_targets_mean": 6779.1,
"valid_targets_min": 5050
},
{
"epoch": 3.2410865874363326,
"grad_norm": 0.39211282940314196,
"learning_rate": 2.5993339177226002e-05,
"loss": 0.1676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08446860313415527,
"step": 2865,
"valid_targets_mean": 5993.4,
"valid_targets_min": 4734
},
{
"epoch": 3.246745897000566,
"grad_norm": 0.37180973272400625,
"learning_rate": 2.593949574114274e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08481285721063614,
"step": 2870,
"valid_targets_mean": 6826.9,
"valid_targets_min": 4966
},
{
"epoch": 3.252405206564799,
"grad_norm": 0.38890138005202446,
"learning_rate": 2.5885605051491592e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.076046884059906,
"step": 2875,
"valid_targets_mean": 6366.5,
"valid_targets_min": 4510
},
{
"epoch": 3.258064516129032,
"grad_norm": 0.3764722912174805,
"learning_rate": 2.583166753701725e-05,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06771224737167358,
"step": 2880,
"valid_targets_mean": 5248.9,
"valid_targets_min": 4430
},
{
"epoch": 3.2637238256932655,
"grad_norm": 0.3707213763979597,
"learning_rate": 2.5777683626836964e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07067465782165527,
"step": 2885,
"valid_targets_mean": 5854.6,
"valid_targets_min": 4701
},
{
"epoch": 3.2693831352574985,
"grad_norm": 0.38176253383761427,
"learning_rate": 2.5723653750437083e-05,
"loss": 0.1562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08251985907554626,
"step": 2890,
"valid_targets_mean": 6520.2,
"valid_targets_min": 4501
},
{
"epoch": 3.275042444821732,
"grad_norm": 0.3696783228124919,
"learning_rate": 2.5669578337669653e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08970288187265396,
"step": 2895,
"valid_targets_mean": 6796.4,
"valid_targets_min": 3640
},
{
"epoch": 3.280701754385965,
"grad_norm": 0.5997009652550589,
"learning_rate": 2.5615457818749007e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08683329820632935,
"step": 2900,
"valid_targets_mean": 6024.8,
"valid_targets_min": 5024
},
{
"epoch": 3.286361063950198,
"grad_norm": 0.3970354064915422,
"learning_rate": 2.5561292624248344e-05,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09823933243751526,
"step": 2905,
"valid_targets_mean": 6549.4,
"valid_targets_min": 4715
},
{
"epoch": 3.2920203735144313,
"grad_norm": 0.4040600633209962,
"learning_rate": 2.5507083185096267e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0729404091835022,
"step": 2910,
"valid_targets_mean": 5681.1,
"valid_targets_min": 4730
},
{
"epoch": 3.2976796830786643,
"grad_norm": 0.40529122982296795,
"learning_rate": 2.545282993257341e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08735214918851852,
"step": 2915,
"valid_targets_mean": 5787.6,
"valid_targets_min": 4657
},
{
"epoch": 3.3033389926428978,
"grad_norm": 0.38732883346244273,
"learning_rate": 2.5398533298308956e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08877654373645782,
"step": 2920,
"valid_targets_mean": 6862.9,
"valid_targets_min": 5599
},
{
"epoch": 3.3089983022071308,
"grad_norm": 0.5611570775932486,
"learning_rate": 2.534419371427724e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11140226572751999,
"step": 2925,
"valid_targets_mean": 6471.2,
"valid_targets_min": 4948
},
{
"epoch": 3.3146576117713638,
"grad_norm": 0.43561660126955126,
"learning_rate": 2.5289811612794297e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09498600661754608,
"step": 2930,
"valid_targets_mean": 7644.9,
"valid_targets_min": 4876
},
{
"epoch": 3.320316921335597,
"grad_norm": 0.39243379533926886,
"learning_rate": 2.5235387426514405e-05,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07330992817878723,
"step": 2935,
"valid_targets_mean": 5750.1,
"valid_targets_min": 3599
},
{
"epoch": 3.32597623089983,
"grad_norm": 0.3950361179379625,
"learning_rate": 2.5180921588426693e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10302229225635529,
"step": 2940,
"valid_targets_mean": 7335.2,
"valid_targets_min": 4800
},
{
"epoch": 3.331635540464063,
"grad_norm": 0.34118533977997895,
"learning_rate": 2.5126414531851634e-05,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06809462606906891,
"step": 2945,
"valid_targets_mean": 7088.9,
"valid_targets_min": 4228
},
{
"epoch": 3.3372948500282966,
"grad_norm": 0.40089882561464724,
"learning_rate": 2.507186669043764e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08894894272089005,
"step": 2950,
"valid_targets_mean": 6421.2,
"valid_targets_min": 5314
},
{
"epoch": 3.3429541595925296,
"grad_norm": 0.3809360499548981,
"learning_rate": 2.5017278498157608e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08135772496461868,
"step": 2955,
"valid_targets_mean": 6345.4,
"valid_targets_min": 4634
},
{
"epoch": 3.348613469156763,
"grad_norm": 0.401319262721283,
"learning_rate": 2.496265038930545e-05,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07413016259670258,
"step": 2960,
"valid_targets_mean": 5758.2,
"valid_targets_min": 4521
},
{
"epoch": 3.354272778720996,
"grad_norm": 0.4181749873395065,
"learning_rate": 2.4907982798492647e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07992276549339294,
"step": 2965,
"valid_targets_mean": 5346.1,
"valid_targets_min": 4180
},
{
"epoch": 3.359932088285229,
"grad_norm": 0.37821898461591213,
"learning_rate": 2.485327616064479e-05,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09109698235988617,
"step": 2970,
"valid_targets_mean": 7561.1,
"valid_targets_min": 4791
},
{
"epoch": 3.3655913978494625,
"grad_norm": 0.42463483961812915,
"learning_rate": 2.4798530910998126e-05,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07687358558177948,
"step": 2975,
"valid_targets_mean": 6135.1,
"valid_targets_min": 4670
},
{
"epoch": 3.3712507074136955,
"grad_norm": 0.4168973212704639,
"learning_rate": 2.474374748509609e-05,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08751700818538666,
"step": 2980,
"valid_targets_mean": 6526.8,
"valid_targets_min": 4806
},
{
"epoch": 3.376910016977929,
"grad_norm": 0.4377975902513151,
"learning_rate": 2.4688926318785845e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07013484835624695,
"step": 2985,
"valid_targets_mean": 5486.9,
"valid_targets_min": 4453
},
{
"epoch": 3.382569326542162,
"grad_norm": 0.37451008367015687,
"learning_rate": 2.4634067848214797e-05,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09076303988695145,
"step": 2990,
"valid_targets_mean": 7182.4,
"valid_targets_min": 5687
},
{
"epoch": 3.388228636106395,
"grad_norm": 0.39214339758244726,
"learning_rate": 2.4579172509827146e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07283439487218857,
"step": 2995,
"valid_targets_mean": 6945.2,
"valid_targets_min": 4964
},
{
"epoch": 3.3938879456706283,
"grad_norm": 0.34687787029362777,
"learning_rate": 2.4524240740360404e-05,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08273832499980927,
"step": 3000,
"valid_targets_mean": 7281.2,
"valid_targets_min": 5625
},
{
"epoch": 3.3995472552348613,
"grad_norm": 0.39512915127755643,
"learning_rate": 2.4469272976841925e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07421189546585083,
"step": 3005,
"valid_targets_mean": 6706.9,
"valid_targets_min": 5006
},
{
"epoch": 3.4052065647990943,
"grad_norm": 0.3837267214169814,
"learning_rate": 2.441426965658543e-05,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08413764834403992,
"step": 3010,
"valid_targets_mean": 6947.8,
"valid_targets_min": 5252
},
{
"epoch": 3.4108658743633278,
"grad_norm": 0.3987996482159172,
"learning_rate": 2.4359231217187508e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08512748777866364,
"step": 3015,
"valid_targets_mean": 6373.1,
"valid_targets_min": 5071
},
{
"epoch": 3.4165251839275608,
"grad_norm": 0.42740405345315763,
"learning_rate": 2.430415809652416e-05,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09217800945043564,
"step": 3020,
"valid_targets_mean": 6664.0,
"valid_targets_min": 3440
},
{
"epoch": 3.4221844934917938,
"grad_norm": 0.4565520082770164,
"learning_rate": 2.4249050732747302e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05961686745285988,
"step": 3025,
"valid_targets_mean": 3621.8,
"valid_targets_min": 393
},
{
"epoch": 3.427843803056027,
"grad_norm": 0.46328547075081156,
"learning_rate": 2.4193909564281288e-05,
"loss": 0.1266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04435160011053085,
"step": 3030,
"valid_targets_mean": 2602.0,
"valid_targets_min": 816
},
{
"epoch": 3.43350311262026,
"grad_norm": 0.37137173861478123,
"learning_rate": 2.4138735029819418e-05,
"loss": 0.0901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04348450154066086,
"step": 3035,
"valid_targets_mean": 3217.9,
"valid_targets_min": 2461
},
{
"epoch": 3.4391624221844936,
"grad_norm": 0.39992157414840956,
"learning_rate": 2.408352756832042e-05,
"loss": 0.0875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04790376126766205,
"step": 3040,
"valid_targets_mean": 3767.2,
"valid_targets_min": 2571
},
{
"epoch": 3.4448217317487266,
"grad_norm": 0.35293050494196204,
"learning_rate": 2.402828761900502e-05,
"loss": 0.1059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042876340448856354,
"step": 3045,
"valid_targets_mean": 3830.4,
"valid_targets_min": 2582
},
{
"epoch": 3.4504810413129596,
"grad_norm": 0.5742800954287768,
"learning_rate": 2.3973015621352382e-05,
"loss": 0.0869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036809295415878296,
"step": 3050,
"valid_targets_mean": 3032.0,
"valid_targets_min": 1198
},
{
"epoch": 3.456140350877193,
"grad_norm": 0.7703852038293989,
"learning_rate": 2.3917712015096664e-05,
"loss": 0.1064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06168600916862488,
"step": 3055,
"valid_targets_mean": 974.9,
"valid_targets_min": 525
},
{
"epoch": 3.461799660441426,
"grad_norm": 0.4488567722071903,
"learning_rate": 2.386237724022348e-05,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052345506846904755,
"step": 3060,
"valid_targets_mean": 3010.8,
"valid_targets_min": 954
},
{
"epoch": 3.4674589700056595,
"grad_norm": 0.4394392338230334,
"learning_rate": 2.3807011736966414e-05,
"loss": 0.095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0646510049700737,
"step": 3065,
"valid_targets_mean": 3078.4,
"valid_targets_min": 863
},
{
"epoch": 3.4731182795698925,
"grad_norm": 0.33509251616177965,
"learning_rate": 2.3751615945803547e-05,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04230031371116638,
"step": 3070,
"valid_targets_mean": 2921.1,
"valid_targets_min": 540
},
{
"epoch": 3.4787775891341255,
"grad_norm": 0.2933598862510744,
"learning_rate": 2.3696190307453883e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03300682455301285,
"step": 3075,
"valid_targets_mean": 4658.5,
"valid_targets_min": 1008
},
{
"epoch": 3.484436898698359,
"grad_norm": 0.3443708556168441,
"learning_rate": 2.364073526287392e-05,
"loss": 0.0871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042443834245204926,
"step": 3080,
"valid_targets_mean": 3757.0,
"valid_targets_min": 818
},
{
"epoch": 3.490096208262592,
"grad_norm": 0.32342934598558776,
"learning_rate": 2.358525125325409e-05,
"loss": 0.0911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03649405390024185,
"step": 3085,
"valid_targets_mean": 4063.0,
"valid_targets_min": 2642
},
{
"epoch": 3.495755517826825,
"grad_norm": 0.5233099293331086,
"learning_rate": 2.352973872001527e-05,
"loss": 0.1005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09330583363771439,
"step": 3090,
"valid_targets_mean": 2844.0,
"valid_targets_min": 614
},
{
"epoch": 3.5014148273910584,
"grad_norm": 0.3713693899571308,
"learning_rate": 2.347419810480527e-05,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03937401995062828,
"step": 3095,
"valid_targets_mean": 3617.4,
"valid_targets_min": 2537
},
{
"epoch": 3.5070741369552914,
"grad_norm": 0.5342177275371015,
"learning_rate": 2.34186298494953e-05,
"loss": 0.0902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05524876341223717,
"step": 3100,
"valid_targets_mean": 1941.8,
"valid_targets_min": 674
},
{
"epoch": 3.5127334465195243,
"grad_norm": 0.32478754183719977,
"learning_rate": 2.3363034396176486e-05,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03607283532619476,
"step": 3105,
"valid_targets_mean": 3252.2,
"valid_targets_min": 987
},
{
"epoch": 3.518392756083758,
"grad_norm": 0.34568450638192383,
"learning_rate": 2.3307412187156334e-05,
"loss": 0.0796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036379989236593246,
"step": 3110,
"valid_targets_mean": 3654.8,
"valid_targets_min": 2616
},
{
"epoch": 3.524052065647991,
"grad_norm": 0.446074380238172,
"learning_rate": 2.3251763664955208e-05,
"loss": 0.1069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040246620774269104,
"step": 3115,
"valid_targets_mean": 2054.1,
"valid_targets_min": 714
},
{
"epoch": 3.5297113752122242,
"grad_norm": 0.46251594514856853,
"learning_rate": 2.3196089272302813e-05,
"loss": 0.1032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047611210495233536,
"step": 3120,
"valid_targets_mean": 2018.1,
"valid_targets_min": 893
},
{
"epoch": 3.535370684776457,
"grad_norm": 0.43018554505934625,
"learning_rate": 2.3140389452134677e-05,
"loss": 0.1043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053366247564554214,
"step": 3125,
"valid_targets_mean": 3815.4,
"valid_targets_min": 3061
},
{
"epoch": 3.5410299943406907,
"grad_norm": 0.38989614452081606,
"learning_rate": 2.3084664647588636e-05,
"loss": 0.1001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05068257078528404,
"step": 3130,
"valid_targets_mean": 3584.0,
"valid_targets_min": 1810
},
{
"epoch": 3.5466893039049237,
"grad_norm": 0.33899258716770153,
"learning_rate": 2.3028915302001286e-05,
"loss": 0.1381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03708091750741005,
"step": 3135,
"valid_targets_mean": 3354.2,
"valid_targets_min": 902
},
{
"epoch": 3.5523486134691566,
"grad_norm": 0.479265531070496,
"learning_rate": 2.297314185890446e-05,
"loss": 0.0872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04440346360206604,
"step": 3140,
"valid_targets_mean": 2775.8,
"valid_targets_min": 711
},
{
"epoch": 3.55800792303339,
"grad_norm": 0.670543564360072,
"learning_rate": 2.291734476202173e-05,
"loss": 0.1195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05753045901656151,
"step": 3145,
"valid_targets_mean": 1493.0,
"valid_targets_min": 643
},
{
"epoch": 3.563667232597623,
"grad_norm": 0.5391448054021986,
"learning_rate": 2.286152445526482e-05,
"loss": 0.1134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04792678728699684,
"step": 3150,
"valid_targets_mean": 2481.8,
"valid_targets_min": 538
},
{
"epoch": 3.569326542161856,
"grad_norm": 0.4195015177774701,
"learning_rate": 2.2805681382730142e-05,
"loss": 0.0912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028936494141817093,
"step": 3155,
"valid_targets_mean": 2257.2,
"valid_targets_min": 664
},
{
"epoch": 3.5749858517260895,
"grad_norm": 0.5865427341283793,
"learning_rate": 2.2749815988695208e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09612908959388733,
"step": 3160,
"valid_targets_mean": 2451.9,
"valid_targets_min": 1180
},
{
"epoch": 3.5806451612903225,
"grad_norm": 0.4682729700077621,
"learning_rate": 2.2693928717615118e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03941601514816284,
"step": 3165,
"valid_targets_mean": 1885.5,
"valid_targets_min": 756
},
{
"epoch": 3.5863044708545555,
"grad_norm": 0.342242583693858,
"learning_rate": 2.2638020014119033e-05,
"loss": 0.1034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03896958753466606,
"step": 3170,
"valid_targets_mean": 3355.1,
"valid_targets_min": 2963
},
{
"epoch": 3.591963780418789,
"grad_norm": 0.6921453617996776,
"learning_rate": 2.2582090323006603e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1678619682788849,
"step": 3175,
"valid_targets_mean": 2357.1,
"valid_targets_min": 1153
},
{
"epoch": 3.597623089983022,
"grad_norm": 0.31611802316350174,
"learning_rate": 2.2526140089244483e-05,
"loss": 0.108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04150187224149704,
"step": 3180,
"valid_targets_mean": 4602.2,
"valid_targets_min": 3507
},
{
"epoch": 3.6032823995472554,
"grad_norm": 0.3350914314311627,
"learning_rate": 2.247016975796274e-05,
"loss": 0.0901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04903364181518555,
"step": 3185,
"valid_targets_mean": 4597.1,
"valid_targets_min": 3835
},
{
"epoch": 3.6089417091114884,
"grad_norm": 0.40270627304143364,
"learning_rate": 2.2414179774451333e-05,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04972846806049347,
"step": 3190,
"valid_targets_mean": 3571.6,
"valid_targets_min": 784
},
{
"epoch": 3.614601018675722,
"grad_norm": 0.415917999569666,
"learning_rate": 2.2358170584156577e-05,
"loss": 0.0865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034407228231430054,
"step": 3195,
"valid_targets_mean": 1951.9,
"valid_targets_min": 779
},
{
"epoch": 3.620260328239955,
"grad_norm": 0.5217860854709225,
"learning_rate": 2.2302142632677605e-05,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042375870048999786,
"step": 3200,
"valid_targets_mean": 2124.8,
"valid_targets_min": 674
},
{
"epoch": 3.625919637804188,
"grad_norm": 0.44254199276435036,
"learning_rate": 2.2246096365762782e-05,
"loss": 0.0831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04500596970319748,
"step": 3205,
"valid_targets_mean": 2388.5,
"valid_targets_min": 712
},
{
"epoch": 3.6315789473684212,
"grad_norm": 0.3665353563421478,
"learning_rate": 2.2190032229306215e-05,
"loss": 0.0894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04064202308654785,
"step": 3210,
"valid_targets_mean": 3521.6,
"valid_targets_min": 2422
},
{
"epoch": 3.6372382569326542,
"grad_norm": 0.34605379460700103,
"learning_rate": 2.2133950669344156e-05,
"loss": 0.0767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02806910313665867,
"step": 3215,
"valid_targets_mean": 3248.5,
"valid_targets_min": 576
},
{
"epoch": 3.6428975664968872,
"grad_norm": 0.30931044690920806,
"learning_rate": 2.207785213205149e-05,
"loss": 0.135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023745758458971977,
"step": 3220,
"valid_targets_mean": 3581.9,
"valid_targets_min": 772
},
{
"epoch": 3.6485568760611207,
"grad_norm": 0.43922432142537926,
"learning_rate": 2.202173706373817e-05,
"loss": 0.0751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03783226013183594,
"step": 3225,
"valid_targets_mean": 2654.1,
"valid_targets_min": 722
},
{
"epoch": 3.6542161856253537,
"grad_norm": 0.3477209012773255,
"learning_rate": 2.1965605910845654e-05,
"loss": 0.0779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04104755073785782,
"step": 3230,
"valid_targets_mean": 3685.9,
"valid_targets_min": 2788
},
{
"epoch": 3.6598754951895867,
"grad_norm": 0.3768374199903355,
"learning_rate": 2.1909459119943384e-05,
"loss": 0.0805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0392816886305809,
"step": 3235,
"valid_targets_mean": 2503.4,
"valid_targets_min": 614
},
{
"epoch": 3.66553480475382,
"grad_norm": 0.6007344213267962,
"learning_rate": 2.1853297137725204e-05,
"loss": 0.1136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11411529779434204,
"step": 3240,
"valid_targets_mean": 1719.4,
"valid_targets_min": 608
},
{
"epoch": 3.671194114318053,
"grad_norm": 0.3754157879242706,
"learning_rate": 2.1797120411005807e-05,
"loss": 0.0982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042109765112400055,
"step": 3245,
"valid_targets_mean": 3966.6,
"valid_targets_min": 3150
},
{
"epoch": 3.676853423882286,
"grad_norm": 0.5445762559868512,
"learning_rate": 2.1740929386717222e-05,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05597252771258354,
"step": 3250,
"valid_targets_mean": 2366.1,
"valid_targets_min": 718
},
{
"epoch": 3.6825127334465195,
"grad_norm": 0.42769001995635586,
"learning_rate": 2.1684724511905193e-05,
"loss": 0.0934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04565860331058502,
"step": 3255,
"valid_targets_mean": 3555.2,
"valid_targets_min": 1333
},
{
"epoch": 3.688172043010753,
"grad_norm": 0.44318255157550557,
"learning_rate": 2.1628506233725678e-05,
"loss": 0.1119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041587576270103455,
"step": 3260,
"valid_targets_mean": 2041.2,
"valid_targets_min": 693
},
{
"epoch": 3.693831352574986,
"grad_norm": 0.4537669446711333,
"learning_rate": 2.1572274999441265e-05,
"loss": 0.1235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036606110632419586,
"step": 3265,
"valid_targets_mean": 1494.2,
"valid_targets_min": 803
},
{
"epoch": 3.699490662139219,
"grad_norm": 0.38686037920354616,
"learning_rate": 2.151603125641761e-05,
"loss": 0.0984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07212714850902557,
"step": 3270,
"valid_targets_mean": 2762.1,
"valid_targets_min": 902
},
{
"epoch": 3.7051499717034524,
"grad_norm": 0.47568407094967713,
"learning_rate": 2.1459775452119898e-05,
"loss": 0.1123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04315885156393051,
"step": 3275,
"valid_targets_mean": 3572.5,
"valid_targets_min": 2393
},
{
"epoch": 3.7108092812676854,
"grad_norm": 0.35866653739893223,
"learning_rate": 2.1403508034109262e-05,
"loss": 0.0951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030487315729260445,
"step": 3280,
"valid_targets_mean": 3086.6,
"valid_targets_min": 804
},
{
"epoch": 3.7164685908319184,
"grad_norm": 0.344859782354928,
"learning_rate": 2.1347229450039237e-05,
"loss": 0.0932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0409947969019413,
"step": 3285,
"valid_targets_mean": 5223.5,
"valid_targets_min": 4147
},
{
"epoch": 3.722127900396152,
"grad_norm": 0.39780389555566287,
"learning_rate": 2.12909401476522e-05,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052354902029037476,
"step": 3290,
"valid_targets_mean": 4369.2,
"valid_targets_min": 871
},
{
"epoch": 3.727787209960385,
"grad_norm": 0.28502767625047915,
"learning_rate": 2.1234640574775783e-05,
"loss": 0.0771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02787552773952484,
"step": 3295,
"valid_targets_mean": 4207.1,
"valid_targets_min": 896
},
{
"epoch": 3.733446519524618,
"grad_norm": 0.35279233295246115,
"learning_rate": 2.1178331179319336e-05,
"loss": 0.088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043562762439250946,
"step": 3300,
"valid_targets_mean": 3603.9,
"valid_targets_min": 2862
},
{
"epoch": 3.7391058290888513,
"grad_norm": 0.6045679331388665,
"learning_rate": 2.112201240927037e-05,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06445741653442383,
"step": 3305,
"valid_targets_mean": 1776.4,
"valid_targets_min": 497
},
{
"epoch": 3.7447651386530842,
"grad_norm": 0.41700082787673637,
"learning_rate": 2.1065684712690954e-05,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05462094396352768,
"step": 3310,
"valid_targets_mean": 4063.8,
"valid_targets_min": 3217
},
{
"epoch": 3.7504244482173172,
"grad_norm": 0.47105077925347255,
"learning_rate": 2.1009348537714194e-05,
"loss": 0.1009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04253324121236801,
"step": 3315,
"valid_targets_mean": 2245.1,
"valid_targets_min": 901
},
{
"epoch": 3.7560837577815507,
"grad_norm": 0.3781290654660693,
"learning_rate": 2.0953004332540644e-05,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03992723301053047,
"step": 3320,
"valid_targets_mean": 3350.9,
"valid_targets_min": 905
},
{
"epoch": 3.7617430673457837,
"grad_norm": 0.4585858979255781,
"learning_rate": 2.089665254543473e-05,
"loss": 0.0975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06727780401706696,
"step": 3325,
"valid_targets_mean": 3223.2,
"valid_targets_min": 1181
},
{
"epoch": 3.767402376910017,
"grad_norm": 0.42217539231813284,
"learning_rate": 2.0840293624721234e-05,
"loss": 0.0882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03888125717639923,
"step": 3330,
"valid_targets_mean": 3718.1,
"valid_targets_min": 3184
},
{
"epoch": 3.77306168647425,
"grad_norm": 0.579536581426898,
"learning_rate": 2.0783928018781644e-05,
"loss": 0.0833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07282514870166779,
"step": 3335,
"valid_targets_mean": 2082.6,
"valid_targets_min": 650
},
{
"epoch": 3.7787209960384835,
"grad_norm": 0.517663613067983,
"learning_rate": 2.0727556176050676e-05,
"loss": 0.0882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046402908861637115,
"step": 3340,
"valid_targets_mean": 1639.8,
"valid_targets_min": 827
},
{
"epoch": 3.7843803056027165,
"grad_norm": 0.534794827416597,
"learning_rate": 2.0671178545012643e-05,
"loss": 0.0945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05245472490787506,
"step": 3345,
"valid_targets_mean": 1642.2,
"valid_targets_min": 940
},
{
"epoch": 3.7900396151669495,
"grad_norm": 0.37804680274866975,
"learning_rate": 2.0614795574197907e-05,
"loss": 0.101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03373146057128906,
"step": 3350,
"valid_targets_mean": 2931.0,
"valid_targets_min": 958
},
{
"epoch": 3.795698924731183,
"grad_norm": 0.5595591873372421,
"learning_rate": 2.0558407712179334e-05,
"loss": 0.0925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03488003835082054,
"step": 3355,
"valid_targets_mean": 1184.4,
"valid_targets_min": 495
},
{
"epoch": 3.801358234295416,
"grad_norm": 0.5049597929263119,
"learning_rate": 2.050201540756868e-05,
"loss": 0.1026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031919289380311966,
"step": 3360,
"valid_targets_mean": 1703.6,
"valid_targets_min": 655
},
{
"epoch": 3.807017543859649,
"grad_norm": 0.6514065995671096,
"learning_rate": 2.0445619109013054e-05,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1003175750374794,
"step": 3365,
"valid_targets_mean": 2292.5,
"valid_targets_min": 521
},
{
"epoch": 3.8126768534238824,
"grad_norm": 0.43132665183117197,
"learning_rate": 2.038921926519134e-05,
"loss": 0.0871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052312783896923065,
"step": 3370,
"valid_targets_mean": 3474.4,
"valid_targets_min": 1909
},
{
"epoch": 3.8183361629881154,
"grad_norm": 0.31564328422784954,
"learning_rate": 2.033281632481063e-05,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03723391890525818,
"step": 3375,
"valid_targets_mean": 3427.6,
"valid_targets_min": 841
},
{
"epoch": 3.8239954725523484,
"grad_norm": 0.39519327642614127,
"learning_rate": 2.027641073660265e-05,
"loss": 0.0889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04752538353204727,
"step": 3380,
"valid_targets_mean": 3007.1,
"valid_targets_min": 2144
},
{
"epoch": 3.829654782116582,
"grad_norm": 0.456054856186123,
"learning_rate": 2.0220002949320187e-05,
"loss": 0.1151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05250108242034912,
"step": 3385,
"valid_targets_mean": 3419.9,
"valid_targets_min": 2215
},
{
"epoch": 3.835314091680815,
"grad_norm": 0.33797200336103456,
"learning_rate": 2.0163593411733533e-05,
"loss": 0.0715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04054778814315796,
"step": 3390,
"valid_targets_mean": 3754.9,
"valid_targets_min": 723
},
{
"epoch": 3.8409734012450483,
"grad_norm": 0.3296089900649167,
"learning_rate": 2.0107182572626897e-05,
"loss": 0.0893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04143691062927246,
"step": 3395,
"valid_targets_mean": 4612.4,
"valid_targets_min": 1253
},
{
"epoch": 3.8466327108092813,
"grad_norm": 0.315842382743557,
"learning_rate": 2.0050770880794843e-05,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04056167230010033,
"step": 3400,
"valid_targets_mean": 3894.0,
"valid_targets_min": 995
},
{
"epoch": 3.8522920203735147,
"grad_norm": 0.29138446818333136,
"learning_rate": 1.9994358785038736e-05,
"loss": 0.0707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04306381940841675,
"step": 3405,
"valid_targets_mean": 4775.1,
"valid_targets_min": 3539
},
{
"epoch": 3.8579513299377477,
"grad_norm": 0.4118629229039932,
"learning_rate": 1.9937946734163117e-05,
"loss": 0.0945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05121958628296852,
"step": 3410,
"valid_targets_mean": 4235.9,
"valid_targets_min": 2839
},
{
"epoch": 3.8636106395019807,
"grad_norm": 0.32989201224002446,
"learning_rate": 1.98815351769722e-05,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02642885595560074,
"step": 3415,
"valid_targets_mean": 2090.6,
"valid_targets_min": 424
},
{
"epoch": 3.869269949066214,
"grad_norm": 0.4092120038133833,
"learning_rate": 1.982512456226628e-05,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05555412918329239,
"step": 3420,
"valid_targets_mean": 2603.4,
"valid_targets_min": 541
},
{
"epoch": 3.874929258630447,
"grad_norm": 0.38568525926824204,
"learning_rate": 1.976871533883812e-05,
"loss": 0.1064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03278844431042671,
"step": 3425,
"valid_targets_mean": 3360.5,
"valid_targets_min": 1938
},
{
"epoch": 3.88058856819468,
"grad_norm": 0.44242322902590053,
"learning_rate": 1.971230795546944e-05,
"loss": 0.0865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11511512100696564,
"step": 3430,
"valid_targets_mean": 2122.4,
"valid_targets_min": 722
},
{
"epoch": 3.8862478777589136,
"grad_norm": 0.38417822688245,
"learning_rate": 1.965590286092731e-05,
"loss": 0.0925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045143697410821915,
"step": 3435,
"valid_targets_mean": 3572.6,
"valid_targets_min": 2919
},
{
"epoch": 3.8919071873231466,
"grad_norm": 0.42311205060593304,
"learning_rate": 1.9599500503960596e-05,
"loss": 0.0849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03667496144771576,
"step": 3440,
"valid_targets_mean": 1793.4,
"valid_targets_min": 559
},
{
"epoch": 3.8975664968873796,
"grad_norm": 0.49304330387414225,
"learning_rate": 1.954310133329639e-05,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06212100386619568,
"step": 3445,
"valid_targets_mean": 2699.0,
"valid_targets_min": 811
},
{
"epoch": 3.903225806451613,
"grad_norm": 0.6981683111926872,
"learning_rate": 1.948670579763641e-05,
"loss": 0.1126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07180996239185333,
"step": 3450,
"valid_targets_mean": 1462.5,
"valid_targets_min": 685
},
{
"epoch": 3.908885116015846,
"grad_norm": 0.3665019195997859,
"learning_rate": 1.9430314345653486e-05,
"loss": 0.1174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028401896357536316,
"step": 3455,
"valid_targets_mean": 2990.6,
"valid_targets_min": 593
},
{
"epoch": 3.914544425580079,
"grad_norm": 0.36683102464115874,
"learning_rate": 1.9373927425987928e-05,
"loss": 0.0964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041700564324855804,
"step": 3460,
"valid_targets_mean": 3558.8,
"valid_targets_min": 1041
},
{
"epoch": 3.9202037351443124,
"grad_norm": 0.4262467475407333,
"learning_rate": 1.9317545487244016e-05,
"loss": 0.0949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05397236347198486,
"step": 3465,
"valid_targets_mean": 3713.2,
"valid_targets_min": 2556
},
{
"epoch": 3.9258630447085454,
"grad_norm": 0.45865992664307026,
"learning_rate": 1.926116897798639e-05,
"loss": 0.0838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05742509290575981,
"step": 3470,
"valid_targets_mean": 3734.9,
"valid_targets_min": 3385
},
{
"epoch": 3.931522354272779,
"grad_norm": 0.3807270985107737,
"learning_rate": 1.9204798346736485e-05,
"loss": 0.083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0385202094912529,
"step": 3475,
"valid_targets_mean": 3136.2,
"valid_targets_min": 541
},
{
"epoch": 3.937181663837012,
"grad_norm": 0.697305609254891,
"learning_rate": 1.914843404196899e-05,
"loss": 0.083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056570932269096375,
"step": 3480,
"valid_targets_mean": 1219.4,
"valid_targets_min": 598
},
{
"epoch": 3.9428409734012453,
"grad_norm": 0.4381515795574387,
"learning_rate": 1.9092076512108253e-05,
"loss": 0.0993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04982505738735199,
"step": 3485,
"valid_targets_mean": 3262.6,
"valid_targets_min": 1069
},
{
"epoch": 3.9485002829654783,
"grad_norm": 0.5458296366412162,
"learning_rate": 1.903572620552471e-05,
"loss": 0.0802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0361316055059433,
"step": 3490,
"valid_targets_mean": 1540.1,
"valid_targets_min": 680
},
{
"epoch": 3.9541595925297113,
"grad_norm": 0.40347912681769865,
"learning_rate": 1.8979383570531358e-05,
"loss": 0.0804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04016882926225662,
"step": 3495,
"valid_targets_mean": 2487.0,
"valid_targets_min": 774
},
{
"epoch": 3.9598189020939447,
"grad_norm": 0.3597195559569826,
"learning_rate": 1.8923049055380128e-05,
"loss": 0.0945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043545953929424286,
"step": 3500,
"valid_targets_mean": 4372.6,
"valid_targets_min": 1474
},
{
"epoch": 3.9654782116581777,
"grad_norm": 0.25634379370918176,
"learning_rate": 1.8866723108258376e-05,
"loss": 0.0747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03357706218957901,
"step": 3505,
"valid_targets_mean": 5496.2,
"valid_targets_min": 4657
},
{
"epoch": 3.9711375212224107,
"grad_norm": 0.3334762985004109,
"learning_rate": 1.8810406177285282e-05,
"loss": 0.081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042172081768512726,
"step": 3510,
"valid_targets_mean": 3943.8,
"valid_targets_min": 675
},
{
"epoch": 3.976796830786644,
"grad_norm": 0.35172500208172275,
"learning_rate": 1.8754098710508294e-05,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046609655022621155,
"step": 3515,
"valid_targets_mean": 3760.4,
"valid_targets_min": 2463
},
{
"epoch": 3.982456140350877,
"grad_norm": 0.8796896661404067,
"learning_rate": 1.869780115589957e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03977133333683014,
"step": 3520,
"valid_targets_mean": 2844.4,
"valid_targets_min": 605
},
{
"epoch": 3.98811544991511,
"grad_norm": 0.35543893040609253,
"learning_rate": 1.8641513961352396e-05,
"loss": 0.079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037588320672512054,
"step": 3525,
"valid_targets_mean": 3247.4,
"valid_targets_min": 1014
},
{
"epoch": 3.9937747594793436,
"grad_norm": 0.3704753246940243,
"learning_rate": 1.858523757467765e-05,
"loss": 0.0912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042072445154190063,
"step": 3530,
"valid_targets_mean": 3545.2,
"valid_targets_min": 2807
},
{
"epoch": 3.9994340690435766,
"grad_norm": 0.5344737197927087,
"learning_rate": 1.8528972443600226e-05,
"loss": 0.1144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11486827582120895,
"step": 3535,
"valid_targets_mean": 2912.9,
"valid_targets_min": 1214
},
{
"epoch": 4.005659309564233,
"grad_norm": 0.5008124596440419,
"learning_rate": 1.8472719015755452e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09267597645521164,
"step": 3540,
"valid_targets_mean": 7214.4,
"valid_targets_min": 4847
},
{
"epoch": 4.011318619128466,
"grad_norm": 0.3939702908833795,
"learning_rate": 1.8416477738685567e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0846470445394516,
"step": 3545,
"valid_targets_mean": 6417.1,
"valid_targets_min": 4480
},
{
"epoch": 4.016977928692699,
"grad_norm": 0.3835188973433748,
"learning_rate": 1.8360249059836123e-05,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08836297690868378,
"step": 3550,
"valid_targets_mean": 7605.4,
"valid_targets_min": 5236
},
{
"epoch": 4.022637238256933,
"grad_norm": 0.40270414663569104,
"learning_rate": 1.830403342655246e-05,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07130195200443268,
"step": 3555,
"valid_targets_mean": 5827.9,
"valid_targets_min": 4727
},
{
"epoch": 4.028296547821165,
"grad_norm": 0.4331187042742476,
"learning_rate": 1.824783128607612e-05,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0947471559047699,
"step": 3560,
"valid_targets_mean": 6448.2,
"valid_targets_min": 4211
},
{
"epoch": 4.033955857385399,
"grad_norm": 0.4728306033797111,
"learning_rate": 1.8191643085541296e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09749437868595123,
"step": 3565,
"valid_targets_mean": 6108.1,
"valid_targets_min": 4279
},
{
"epoch": 4.039615166949632,
"grad_norm": 0.3742686771616783,
"learning_rate": 1.813546927197129e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07242477685213089,
"step": 3570,
"valid_targets_mean": 5962.4,
"valid_targets_min": 4589
},
{
"epoch": 4.045274476513866,
"grad_norm": 0.47923860816844743,
"learning_rate": 1.8079310292274928e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08282826095819473,
"step": 3575,
"valid_targets_mean": 3503.2,
"valid_targets_min": 2015
},
{
"epoch": 4.050933786078098,
"grad_norm": 0.35980349731828126,
"learning_rate": 1.8023166593243026e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06773898005485535,
"step": 3580,
"valid_targets_mean": 6102.5,
"valid_targets_min": 4778
},
{
"epoch": 4.056593095642332,
"grad_norm": 0.3825978995401686,
"learning_rate": 1.7967038621544845e-05,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07666116952896118,
"step": 3585,
"valid_targets_mean": 5868.2,
"valid_targets_min": 4612
},
{
"epoch": 4.062252405206565,
"grad_norm": 0.40696919494833955,
"learning_rate": 1.791092682372449e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08827384561300278,
"step": 3590,
"valid_targets_mean": 6105.8,
"valid_targets_min": 4491
},
{
"epoch": 4.067911714770798,
"grad_norm": 0.39421380445121584,
"learning_rate": 1.7854831646197426e-05,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08447161316871643,
"step": 3595,
"valid_targets_mean": 6962.0,
"valid_targets_min": 4754
},
{
"epoch": 4.073571024335031,
"grad_norm": 0.37473359119575794,
"learning_rate": 1.7798753535246856e-05,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07447396218776703,
"step": 3600,
"valid_targets_mean": 6035.1,
"valid_targets_min": 4787
},
{
"epoch": 4.079230333899265,
"grad_norm": 0.4227213769477523,
"learning_rate": 1.7742692937020234e-05,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07278391718864441,
"step": 3605,
"valid_targets_mean": 6028.5,
"valid_targets_min": 5213
},
{
"epoch": 4.084889643463497,
"grad_norm": 0.38524214879156815,
"learning_rate": 1.768665029752567e-05,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06999488174915314,
"step": 3610,
"valid_targets_mean": 6814.1,
"valid_targets_min": 4664
},
{
"epoch": 4.090548953027731,
"grad_norm": 0.3972869029235263,
"learning_rate": 1.763062606262839e-05,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07294754683971405,
"step": 3615,
"valid_targets_mean": 6281.5,
"valid_targets_min": 4996
},
{
"epoch": 4.096208262591964,
"grad_norm": 0.3931822579344668,
"learning_rate": 1.7574620678047215e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07363331317901611,
"step": 3620,
"valid_targets_mean": 6628.9,
"valid_targets_min": 4582
},
{
"epoch": 4.101867572156197,
"grad_norm": 0.3601228835997598,
"learning_rate": 1.751863458935099e-05,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06443273276090622,
"step": 3625,
"valid_targets_mean": 6536.6,
"valid_targets_min": 5205
},
{
"epoch": 4.10752688172043,
"grad_norm": 0.37681366926978777,
"learning_rate": 1.746266824195504e-05,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07399990409612656,
"step": 3630,
"valid_targets_mean": 7031.0,
"valid_targets_min": 5098
},
{
"epoch": 4.1131861912846635,
"grad_norm": 0.4129281253908889,
"learning_rate": 1.7406722081117632e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09378090500831604,
"step": 3635,
"valid_targets_mean": 6514.2,
"valid_targets_min": 5016
},
{
"epoch": 4.118845500848896,
"grad_norm": 0.40046677747273324,
"learning_rate": 1.7350796551936432e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11042913794517517,
"step": 3640,
"valid_targets_mean": 6330.0,
"valid_targets_min": 965
},
{
"epoch": 4.124504810413129,
"grad_norm": 0.38272577252010453,
"learning_rate": 1.7294892099344975e-05,
"loss": 0.1475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07567565888166428,
"step": 3645,
"valid_targets_mean": 6293.1,
"valid_targets_min": 5218
},
{
"epoch": 4.130164119977363,
"grad_norm": 0.4075941121248639,
"learning_rate": 1.7239009168109108e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07180091738700867,
"step": 3650,
"valid_targets_mean": 6957.4,
"valid_targets_min": 4213
},
{
"epoch": 4.135823429541596,
"grad_norm": 0.4459180719896231,
"learning_rate": 1.7183148202823445e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09024065732955933,
"step": 3655,
"valid_targets_mean": 5888.5,
"valid_targets_min": 4923
},
{
"epoch": 4.141482739105829,
"grad_norm": 0.417345833444335,
"learning_rate": 1.7127309647907867e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11535342037677765,
"step": 3660,
"valid_targets_mean": 7822.9,
"valid_targets_min": 4993
},
{
"epoch": 4.147142048670062,
"grad_norm": 0.4092836996069491,
"learning_rate": 1.7071493947603942e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08515796065330505,
"step": 3665,
"valid_targets_mean": 6098.6,
"valid_targets_min": 4872
},
{
"epoch": 4.152801358234296,
"grad_norm": 0.3829832784465982,
"learning_rate": 1.7015701545971417e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08360423147678375,
"step": 3670,
"valid_targets_mean": 6892.2,
"valid_targets_min": 4706
},
{
"epoch": 4.158460667798528,
"grad_norm": 0.45523292925046316,
"learning_rate": 1.695993288688469e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07692007720470428,
"step": 3675,
"valid_targets_mean": 6352.0,
"valid_targets_min": 4889
},
{
"epoch": 4.164119977362762,
"grad_norm": 0.4255022530499619,
"learning_rate": 1.6904188414029248e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07571934908628464,
"step": 3680,
"valid_targets_mean": 5948.9,
"valid_targets_min": 3888
},
{
"epoch": 4.169779286926995,
"grad_norm": 0.4095787920769221,
"learning_rate": 1.6848468570898172e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07443135976791382,
"step": 3685,
"valid_targets_mean": 5846.2,
"valid_targets_min": 4051
},
{
"epoch": 4.175438596491228,
"grad_norm": 0.3788095484158347,
"learning_rate": 1.6792773800788583e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08252878487110138,
"step": 3690,
"valid_targets_mean": 7319.2,
"valid_targets_min": 5230
},
{
"epoch": 4.181097906055461,
"grad_norm": 0.38497942903312243,
"learning_rate": 1.673710454679813e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08583734184503555,
"step": 3695,
"valid_targets_mean": 8235.1,
"valid_targets_min": 4997
},
{
"epoch": 4.186757215619695,
"grad_norm": 0.4446341909959979,
"learning_rate": 1.668146125182147e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08628219366073608,
"step": 3700,
"valid_targets_mean": 6402.5,
"valid_targets_min": 5364
},
{
"epoch": 4.192416525183927,
"grad_norm": 0.40330962971590845,
"learning_rate": 1.6625844358546715e-05,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09064686298370361,
"step": 3705,
"valid_targets_mean": 7117.4,
"valid_targets_min": 3391
},
{
"epoch": 4.198075834748161,
"grad_norm": 0.36576009736166315,
"learning_rate": 1.657025430945195e-05,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07560627907514572,
"step": 3710,
"valid_targets_mean": 7542.8,
"valid_targets_min": 4829
},
{
"epoch": 4.203735144312394,
"grad_norm": 0.5393492990188449,
"learning_rate": 1.651469154680167e-05,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0772615298628807,
"step": 3715,
"valid_targets_mean": 6284.4,
"valid_targets_min": 5180
},
{
"epoch": 4.2093944538766275,
"grad_norm": 0.4471781144605719,
"learning_rate": 1.6459156512643303e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08217886090278625,
"step": 3720,
"valid_targets_mean": 5806.2,
"valid_targets_min": 5101
},
{
"epoch": 4.21505376344086,
"grad_norm": 0.4336240077848953,
"learning_rate": 1.640364964880367e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07309036701917648,
"step": 3725,
"valid_targets_mean": 6697.9,
"valid_targets_min": 4527
},
{
"epoch": 4.2207130730050935,
"grad_norm": 0.40323628644582493,
"learning_rate": 1.6348171396885468e-05,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08748327940702438,
"step": 3730,
"valid_targets_mean": 6410.4,
"valid_targets_min": 3082
},
{
"epoch": 4.226372382569327,
"grad_norm": 0.4095929036243839,
"learning_rate": 1.6292722198263766e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07573725283145905,
"step": 3735,
"valid_targets_mean": 6847.1,
"valid_targets_min": 4685
},
{
"epoch": 4.2320316921335595,
"grad_norm": 0.43963984326487965,
"learning_rate": 1.623730249408249e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08435098826885223,
"step": 3740,
"valid_targets_mean": 6194.0,
"valid_targets_min": 4644
},
{
"epoch": 4.237691001697793,
"grad_norm": 0.3929935896020955,
"learning_rate": 1.618191272525092e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06960330903530121,
"step": 3745,
"valid_targets_mean": 6283.8,
"valid_targets_min": 4433
},
{
"epoch": 4.243350311262026,
"grad_norm": 0.5154631432189906,
"learning_rate": 1.612655333244016e-05,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07508840411901474,
"step": 3750,
"valid_targets_mean": 5917.2,
"valid_targets_min": 4857
},
{
"epoch": 4.249009620826259,
"grad_norm": 0.4376479061623972,
"learning_rate": 1.6071224756079666e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0977800190448761,
"step": 3755,
"valid_targets_mean": 6986.4,
"valid_targets_min": 5101
},
{
"epoch": 4.254668930390492,
"grad_norm": 0.445663905724086,
"learning_rate": 1.6015927436353713e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06677838414907455,
"step": 3760,
"valid_targets_mean": 5299.5,
"valid_targets_min": 4442
},
{
"epoch": 4.260328239954726,
"grad_norm": 0.37709369412424565,
"learning_rate": 1.59606618131979e-05,
"loss": 0.1346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05814947187900543,
"step": 3765,
"valid_targets_mean": 6133.9,
"valid_targets_min": 5130
},
{
"epoch": 4.265987549518958,
"grad_norm": 0.42340455157424106,
"learning_rate": 1.5905428326295663e-05,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08240945637226105,
"step": 3770,
"valid_targets_mean": 6477.4,
"valid_targets_min": 4162
},
{
"epoch": 4.271646859083192,
"grad_norm": 0.3764871118641996,
"learning_rate": 1.585022741507477e-05,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06925308704376221,
"step": 3775,
"valid_targets_mean": 6350.4,
"valid_targets_min": 3940
},
{
"epoch": 4.277306168647425,
"grad_norm": 0.4362310563771639,
"learning_rate": 1.579505951870381e-05,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08733298629522324,
"step": 3780,
"valid_targets_mean": 6625.1,
"valid_targets_min": 4642
},
{
"epoch": 4.282965478211658,
"grad_norm": 0.4268228683981418,
"learning_rate": 1.573992507608872e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08933217823505402,
"step": 3785,
"valid_targets_mean": 4907.0,
"valid_targets_min": 4431
},
{
"epoch": 4.288624787775891,
"grad_norm": 0.42302991710871685,
"learning_rate": 1.568482452586929e-05,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08254139870405197,
"step": 3790,
"valid_targets_mean": 6465.0,
"valid_targets_min": 5333
},
{
"epoch": 4.294284097340125,
"grad_norm": 0.4151763737853865,
"learning_rate": 1.5629758306415652e-05,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0802953690290451,
"step": 3795,
"valid_targets_mean": 5650.5,
"valid_targets_min": 4769
},
{
"epoch": 4.299943406904358,
"grad_norm": 0.4311186422126902,
"learning_rate": 1.5574726855824827e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07794877886772156,
"step": 3800,
"valid_targets_mean": 5540.0,
"valid_targets_min": 4281
},
{
"epoch": 4.305602716468591,
"grad_norm": 0.4543300622427506,
"learning_rate": 1.5519730611917206e-05,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11111429333686829,
"step": 3805,
"valid_targets_mean": 6499.0,
"valid_targets_min": 4844
},
{
"epoch": 4.311262026032824,
"grad_norm": 0.39997302398510315,
"learning_rate": 1.546477001223309e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07029193639755249,
"step": 3810,
"valid_targets_mean": 5736.5,
"valid_targets_min": 5227
},
{
"epoch": 4.3169213355970575,
"grad_norm": 0.3686385730004549,
"learning_rate": 1.5409845494029208e-05,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06129857152700424,
"step": 3815,
"valid_targets_mean": 5857.2,
"valid_targets_min": 2461
},
{
"epoch": 4.32258064516129,
"grad_norm": 0.4060862356848946,
"learning_rate": 1.5354957494275207e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07067536562681198,
"step": 3820,
"valid_targets_mean": 5793.4,
"valid_targets_min": 2815
},
{
"epoch": 4.3282399547255235,
"grad_norm": 0.4038576482109372,
"learning_rate": 1.5300106449650234e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06821887195110321,
"step": 3825,
"valid_targets_mean": 6588.8,
"valid_targets_min": 4875
},
{
"epoch": 4.333899264289757,
"grad_norm": 0.41338552584688865,
"learning_rate": 1.524529279653939e-05,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07139618694782257,
"step": 3830,
"valid_targets_mean": 5984.8,
"valid_targets_min": 4901
},
{
"epoch": 4.3395585738539895,
"grad_norm": 0.3626865453067956,
"learning_rate": 1.5190516971030324e-05,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06856446713209152,
"step": 3835,
"valid_targets_mean": 6067.4,
"valid_targets_min": 3786
},
{
"epoch": 4.345217883418223,
"grad_norm": 0.40474411941293037,
"learning_rate": 1.5135779408909732e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07661972939968109,
"step": 3840,
"valid_targets_mean": 5852.5,
"valid_targets_min": 5057
},
{
"epoch": 4.350877192982456,
"grad_norm": 0.4529750374758651,
"learning_rate": 1.5081080545659874e-05,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0812104269862175,
"step": 3845,
"valid_targets_mean": 6362.2,
"valid_targets_min": 3952
},
{
"epoch": 4.356536502546689,
"grad_norm": 0.47063382640866086,
"learning_rate": 1.5026420816455156e-05,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07746419310569763,
"step": 3850,
"valid_targets_mean": 5360.2,
"valid_targets_min": 4267
},
{
"epoch": 4.362195812110922,
"grad_norm": 0.42248565285269357,
"learning_rate": 1.4971800656158624e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09461343288421631,
"step": 3855,
"valid_targets_mean": 6842.1,
"valid_targets_min": 4785
},
{
"epoch": 4.367855121675156,
"grad_norm": 0.38764246155158855,
"learning_rate": 1.4917220499318506e-05,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06870239973068237,
"step": 3860,
"valid_targets_mean": 6188.5,
"valid_targets_min": 5438
},
{
"epoch": 4.373514431239389,
"grad_norm": 0.43502410000194525,
"learning_rate": 1.4862680780164805e-05,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08560039103031158,
"step": 3865,
"valid_targets_mean": 5848.6,
"valid_targets_min": 4734
},
{
"epoch": 4.379173740803622,
"grad_norm": 0.35644987083560775,
"learning_rate": 1.4808181932605787e-05,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06139899417757988,
"step": 3870,
"valid_targets_mean": 6278.2,
"valid_targets_min": 5636
},
{
"epoch": 4.384833050367855,
"grad_norm": 0.3918664932129097,
"learning_rate": 1.4753724390224551e-05,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0662948489189148,
"step": 3875,
"valid_targets_mean": 6168.9,
"valid_targets_min": 4206
},
{
"epoch": 4.390492359932089,
"grad_norm": 0.40240258367128745,
"learning_rate": 1.4699308586275591e-05,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06691467016935349,
"step": 3880,
"valid_targets_mean": 6226.5,
"valid_targets_min": 4535
},
{
"epoch": 4.396151669496321,
"grad_norm": 0.35360407851709585,
"learning_rate": 1.464493495368132e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07321492582559586,
"step": 3885,
"valid_targets_mean": 7821.6,
"valid_targets_min": 5471
},
{
"epoch": 4.401810979060555,
"grad_norm": 0.4168799254478002,
"learning_rate": 1.459060392502866e-05,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06479287147521973,
"step": 3890,
"valid_targets_mean": 6843.0,
"valid_targets_min": 5243
},
{
"epoch": 4.407470288624788,
"grad_norm": 0.45280990702426094,
"learning_rate": 1.4536315932565575e-05,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08667883276939392,
"step": 3895,
"valid_targets_mean": 6658.6,
"valid_targets_min": 4906
},
{
"epoch": 4.413129598189021,
"grad_norm": 0.5170654478744513,
"learning_rate": 1.448207140819764e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07833343744277954,
"step": 3900,
"valid_targets_mean": 6799.5,
"valid_targets_min": 5168
},
{
"epoch": 4.418788907753254,
"grad_norm": 0.4585375937990011,
"learning_rate": 1.4427870783484613e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08121506869792938,
"step": 3905,
"valid_targets_mean": 5376.2,
"valid_targets_min": 3130
},
{
"epoch": 4.4244482173174875,
"grad_norm": 0.443331932431525,
"learning_rate": 1.4373714489636985e-05,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04741574078798294,
"step": 3910,
"valid_targets_mean": 2843.1,
"valid_targets_min": 1990
},
{
"epoch": 4.43010752688172,
"grad_norm": 0.48401226868031233,
"learning_rate": 1.4319602957512564e-05,
"loss": 0.106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04668089747428894,
"step": 3915,
"valid_targets_mean": 2532.2,
"valid_targets_min": 324
},
{
"epoch": 4.4357668364459535,
"grad_norm": 0.3954237444400868,
"learning_rate": 1.4265536617613043e-05,
"loss": 0.0807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04219325631856918,
"step": 3920,
"valid_targets_mean": 2359.2,
"valid_targets_min": 982
},
{
"epoch": 4.441426146010187,
"grad_norm": 0.5155838952571494,
"learning_rate": 1.4211515900080568e-05,
"loss": 0.078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04493227228522301,
"step": 3925,
"valid_targets_mean": 3640.0,
"valid_targets_min": 2479
},
{
"epoch": 4.44708545557442,
"grad_norm": 0.3246724348372543,
"learning_rate": 1.4157541234694324e-05,
"loss": 0.0906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028960149735212326,
"step": 3930,
"valid_targets_mean": 3079.5,
"valid_targets_min": 811
},
{
"epoch": 4.452744765138653,
"grad_norm": 0.4095150256981928,
"learning_rate": 1.4103613050867117e-05,
"loss": 0.0837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047411803156137466,
"step": 3935,
"valid_targets_mean": 3113.4,
"valid_targets_min": 1431
},
{
"epoch": 4.458404074702886,
"grad_norm": 0.6391321063571365,
"learning_rate": 1.4049731777641948e-05,
"loss": 0.1193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.086330845952034,
"step": 3940,
"valid_targets_mean": 1990.9,
"valid_targets_min": 702
},
{
"epoch": 4.46406338426712,
"grad_norm": 0.38922644742240664,
"learning_rate": 1.3995897843688615e-05,
"loss": 0.1011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047160811722278595,
"step": 3945,
"valid_targets_mean": 3221.6,
"valid_targets_min": 621
},
{
"epoch": 4.469722693831352,
"grad_norm": 0.6462094372397308,
"learning_rate": 1.3942111677300276e-05,
"loss": 0.0907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05346031114459038,
"step": 3950,
"valid_targets_mean": 2591.4,
"valid_targets_min": 846
},
{
"epoch": 4.475382003395586,
"grad_norm": 0.4061055434466861,
"learning_rate": 1.388837370639008e-05,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06589578837156296,
"step": 3955,
"valid_targets_mean": 3738.9,
"valid_targets_min": 1369
},
{
"epoch": 4.481041312959819,
"grad_norm": 0.3849733546616827,
"learning_rate": 1.3834684358487731e-05,
"loss": 0.0646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039215341210365295,
"step": 3960,
"valid_targets_mean": 2715.4,
"valid_targets_min": 754
},
{
"epoch": 4.486700622524052,
"grad_norm": 0.4253804496012952,
"learning_rate": 1.3781044060736089e-05,
"loss": 0.0812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04853950813412666,
"step": 3965,
"valid_targets_mean": 2725.9,
"valid_targets_min": 776
},
{
"epoch": 4.492359932088285,
"grad_norm": 0.3578152154235922,
"learning_rate": 1.3727453239887796e-05,
"loss": 0.0802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052317701280117035,
"step": 3970,
"valid_targets_mean": 3194.4,
"valid_targets_min": 754
},
{
"epoch": 4.498019241652519,
"grad_norm": 0.6391115960853455,
"learning_rate": 1.367391232230185e-05,
"loss": 0.1237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17157770693302155,
"step": 3975,
"valid_targets_mean": 2053.8,
"valid_targets_min": 664
},
{
"epoch": 4.503678551216751,
"grad_norm": 0.40231212097613134,
"learning_rate": 1.3620421733940234e-05,
"loss": 0.0756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04370037838816643,
"step": 3980,
"valid_targets_mean": 3771.4,
"valid_targets_min": 2542
},
{
"epoch": 4.509337860780985,
"grad_norm": 0.4723821784200535,
"learning_rate": 1.356698190036453e-05,
"loss": 0.0813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051801249384880066,
"step": 3985,
"valid_targets_mean": 3486.2,
"valid_targets_min": 2988
},
{
"epoch": 4.514997170345218,
"grad_norm": 0.4080233853264302,
"learning_rate": 1.3513593246732506e-05,
"loss": 0.0751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046337466686964035,
"step": 3990,
"valid_targets_mean": 3779.4,
"valid_targets_min": 3281
},
{
"epoch": 4.5206564799094515,
"grad_norm": 0.44644169226312036,
"learning_rate": 1.3460256197794768e-05,
"loss": 0.0822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04264343902468681,
"step": 3995,
"valid_targets_mean": 3471.1,
"valid_targets_min": 2189
},
{
"epoch": 4.526315789473684,
"grad_norm": 0.4063499834323027,
"learning_rate": 1.3406971177891343e-05,
"loss": 0.0849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03730551153421402,
"step": 4000,
"valid_targets_mean": 3483.6,
"valid_targets_min": 1788
},
{
"epoch": 4.5319750990379175,
"grad_norm": 0.5680761401310686,
"learning_rate": 1.3353738610948347e-05,
"loss": 0.0964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05603942275047302,
"step": 4005,
"valid_targets_mean": 2562.1,
"valid_targets_min": 597
},
{
"epoch": 4.53763440860215,
"grad_norm": 0.4615652741114608,
"learning_rate": 1.3300558920474586e-05,
"loss": 0.0904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04337063431739807,
"step": 4010,
"valid_targets_mean": 2272.8,
"valid_targets_min": 701
},
{
"epoch": 4.5432937181663835,
"grad_norm": 0.475199804932793,
"learning_rate": 1.3247432529558175e-05,
"loss": 0.1182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07559002190828323,
"step": 4015,
"valid_targets_mean": 2971.0,
"valid_targets_min": 1652
},
{
"epoch": 4.548953027730617,
"grad_norm": 0.3985376653121622,
"learning_rate": 1.3194359860863201e-05,
"loss": 0.0938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03962837532162666,
"step": 4020,
"valid_targets_mean": 3747.4,
"valid_targets_min": 1908
},
{
"epoch": 4.55461233729485,
"grad_norm": 0.4095101597017151,
"learning_rate": 1.3141341336626336e-05,
"loss": 0.0767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03326389938592911,
"step": 4025,
"valid_targets_mean": 3247.8,
"valid_targets_min": 971
},
{
"epoch": 4.560271646859083,
"grad_norm": 0.44270290029488385,
"learning_rate": 1.3088377378653503e-05,
"loss": 0.1158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04294685274362564,
"step": 4030,
"valid_targets_mean": 3422.2,
"valid_targets_min": 2552
},
{
"epoch": 4.565930956423316,
"grad_norm": 0.39806191121450035,
"learning_rate": 1.3035468408316501e-05,
"loss": 0.0944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03280611336231232,
"step": 4035,
"valid_targets_mean": 2948.9,
"valid_targets_min": 753
},
{
"epoch": 4.57159026598755,
"grad_norm": 0.5454580231471242,
"learning_rate": 1.2982614846549639e-05,
"loss": 0.0899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036681562662124634,
"step": 4040,
"valid_targets_mean": 1090.5,
"valid_targets_min": 568
},
{
"epoch": 4.577249575551782,
"grad_norm": 0.5272571498175689,
"learning_rate": 1.2929817113846428e-05,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11161740869283676,
"step": 4045,
"valid_targets_mean": 2921.1,
"valid_targets_min": 1070
},
{
"epoch": 4.582908885116016,
"grad_norm": 0.5114999200280982,
"learning_rate": 1.287707563025621e-05,
"loss": 0.0928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04125947877764702,
"step": 4050,
"valid_targets_mean": 2052.1,
"valid_targets_min": 329
},
{
"epoch": 4.588568194680249,
"grad_norm": 0.6794177641022152,
"learning_rate": 1.2824390815380805e-05,
"loss": 0.0947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05280480161309242,
"step": 4055,
"valid_targets_mean": 998.2,
"valid_targets_min": 608
},
{
"epoch": 4.594227504244482,
"grad_norm": 0.43483819154934944,
"learning_rate": 1.2771763088371202e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050098396837711334,
"step": 4060,
"valid_targets_mean": 4405.9,
"valid_targets_min": 2772
},
{
"epoch": 4.599886813808715,
"grad_norm": 0.3413473904426111,
"learning_rate": 1.2719192867924197e-05,
"loss": 0.077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021962987259030342,
"step": 4065,
"valid_targets_mean": 5138.2,
"valid_targets_min": 3778
},
{
"epoch": 4.605546123372949,
"grad_norm": 0.37623027963803085,
"learning_rate": 1.2666680572279083e-05,
"loss": 0.0903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04053713008761406,
"step": 4070,
"valid_targets_mean": 4641.0,
"valid_targets_min": 2336
},
{
"epoch": 4.611205432937181,
"grad_norm": 0.4165917942784783,
"learning_rate": 1.2614226619214317e-05,
"loss": 0.0874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05364896357059479,
"step": 4075,
"valid_targets_mean": 3962.1,
"valid_targets_min": 2161
},
{
"epoch": 4.616864742501415,
"grad_norm": 0.4068046168922619,
"learning_rate": 1.2561831426044173e-05,
"loss": 0.0774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04479540139436722,
"step": 4080,
"valid_targets_mean": 3271.8,
"valid_targets_min": 798
},
{
"epoch": 4.622524052065648,
"grad_norm": 0.48384948537626565,
"learning_rate": 1.250949540961547e-05,
"loss": 0.0774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03350779414176941,
"step": 4085,
"valid_targets_mean": 1915.8,
"valid_targets_min": 533
},
{
"epoch": 4.6281833616298815,
"grad_norm": 0.46288391779242044,
"learning_rate": 1.2457218986304196e-05,
"loss": 0.077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038839347660541534,
"step": 4090,
"valid_targets_mean": 2589.2,
"valid_targets_min": 833
},
{
"epoch": 4.633842671194114,
"grad_norm": 0.35155068112360527,
"learning_rate": 1.2405002572012252e-05,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036818526685237885,
"step": 4095,
"valid_targets_mean": 3888.0,
"valid_targets_min": 3391
},
{
"epoch": 4.6395019807583475,
"grad_norm": 0.5592411123462357,
"learning_rate": 1.2352846582164117e-05,
"loss": 0.0832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06276963651180267,
"step": 4100,
"valid_targets_mean": 1517.1,
"valid_targets_min": 732
},
{
"epoch": 4.645161290322581,
"grad_norm": 0.6587717790794467,
"learning_rate": 1.2300751431703523e-05,
"loss": 0.1068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05123891681432724,
"step": 4105,
"valid_targets_mean": 1623.9,
"valid_targets_min": 538
},
{
"epoch": 4.6508205998868135,
"grad_norm": 0.5410366205486246,
"learning_rate": 1.2248717535090196e-05,
"loss": 0.065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04050035774707794,
"step": 4110,
"valid_targets_mean": 1158.1,
"valid_targets_min": 720
},
{
"epoch": 4.656479909451047,
"grad_norm": 0.46500986147482537,
"learning_rate": 1.2196745306296522e-05,
"loss": 0.0731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0410282164812088,
"step": 4115,
"valid_targets_mean": 2982.2,
"valid_targets_min": 2328
},
{
"epoch": 4.66213921901528,
"grad_norm": 0.46392092870275686,
"learning_rate": 1.2144835158804282e-05,
"loss": 0.0685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03278231620788574,
"step": 4120,
"valid_targets_mean": 2637.0,
"valid_targets_min": 684
},
{
"epoch": 4.667798528579513,
"grad_norm": 0.41902047710660106,
"learning_rate": 1.2092987505601346e-05,
"loss": 0.1186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043621864169836044,
"step": 4125,
"valid_targets_mean": 3441.4,
"valid_targets_min": 2795
},
{
"epoch": 4.673457838143746,
"grad_norm": 0.4456436609381996,
"learning_rate": 1.2041202759178381e-05,
"loss": 0.0871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0421648807823658,
"step": 4130,
"valid_targets_mean": 3286.4,
"valid_targets_min": 744
},
{
"epoch": 4.67911714770798,
"grad_norm": 0.3824039606101949,
"learning_rate": 1.198948133152559e-05,
"loss": 0.094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03015786036849022,
"step": 4135,
"valid_targets_mean": 3976.5,
"valid_targets_min": 3279
},
{
"epoch": 4.684776457272212,
"grad_norm": 0.6000628647624624,
"learning_rate": 1.1937823634129416e-05,
"loss": 0.0867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0420723631978035,
"step": 4140,
"valid_targets_mean": 1140.4,
"valid_targets_min": 536
},
{
"epoch": 4.690435766836446,
"grad_norm": 0.5812001606124553,
"learning_rate": 1.1886230077969278e-05,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04249496012926102,
"step": 4145,
"valid_targets_mean": 2468.8,
"valid_targets_min": 853
},
{
"epoch": 4.696095076400679,
"grad_norm": 0.46335769498418267,
"learning_rate": 1.1834701073514306e-05,
"loss": 0.0843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0430687814950943,
"step": 4150,
"valid_targets_mean": 3205.8,
"valid_targets_min": 2621
},
{
"epoch": 4.701754385964913,
"grad_norm": 0.6333180992883152,
"learning_rate": 1.1783237030720049e-05,
"loss": 0.1106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04079118371009827,
"step": 4155,
"valid_targets_mean": 1332.4,
"valid_targets_min": 728
},
{
"epoch": 4.707413695529145,
"grad_norm": 0.5690407519442315,
"learning_rate": 1.1731838359025261e-05,
"loss": 0.0772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04055098071694374,
"step": 4160,
"valid_targets_mean": 1538.9,
"valid_targets_min": 618
},
{
"epoch": 4.713073005093379,
"grad_norm": 0.35164824124775307,
"learning_rate": 1.1680505467348584e-05,
"loss": 0.0827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045088913291692734,
"step": 4165,
"valid_targets_mean": 4142.9,
"valid_targets_min": 907
},
{
"epoch": 4.718732314657612,
"grad_norm": 0.6006000307194947,
"learning_rate": 1.162923876408535e-05,
"loss": 0.0884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059268467128276825,
"step": 4170,
"valid_targets_mean": 3060.4,
"valid_targets_min": 577
},
{
"epoch": 4.724391624221845,
"grad_norm": 0.3963810037110701,
"learning_rate": 1.1578038657104295e-05,
"loss": 0.0701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032515622675418854,
"step": 4175,
"valid_targets_mean": 3732.2,
"valid_targets_min": 726
},
{
"epoch": 4.730050933786078,
"grad_norm": 0.4059488375077736,
"learning_rate": 1.1526905553744337e-05,
"loss": 0.0672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03996988385915756,
"step": 4180,
"valid_targets_mean": 4288.9,
"valid_targets_min": 2252
},
{
"epoch": 4.7357102433503115,
"grad_norm": 0.4600670199394049,
"learning_rate": 1.1475839860811301e-05,
"loss": 0.0777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04087667912244797,
"step": 4185,
"valid_targets_mean": 2427.5,
"valid_targets_min": 531
},
{
"epoch": 4.741369552914544,
"grad_norm": 0.46001203112270483,
"learning_rate": 1.142484198457475e-05,
"loss": 0.0955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03880181163549423,
"step": 4190,
"valid_targets_mean": 2126.6,
"valid_targets_min": 744
},
{
"epoch": 4.7470288624787775,
"grad_norm": 0.4411981906244772,
"learning_rate": 1.1373912330764671e-05,
"loss": 0.0894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03835024684667587,
"step": 4195,
"valid_targets_mean": 3755.5,
"valid_targets_min": 3024
},
{
"epoch": 4.752688172043011,
"grad_norm": 0.3773991905548678,
"learning_rate": 1.1323051304568292e-05,
"loss": 0.0805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04429854452610016,
"step": 4200,
"valid_targets_mean": 3352.0,
"valid_targets_min": 2366
},
{
"epoch": 4.7583474816072435,
"grad_norm": 0.5035610691167854,
"learning_rate": 1.1272259310626872e-05,
"loss": 0.0782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04907100647687912,
"step": 4205,
"valid_targets_mean": 956.8,
"valid_targets_min": 509
},
{
"epoch": 4.764006791171477,
"grad_norm": 0.45983183893965734,
"learning_rate": 1.122153675303244e-05,
"loss": 0.0881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03519134968519211,
"step": 4210,
"valid_targets_mean": 3013.6,
"valid_targets_min": 1158
},
{
"epoch": 4.76966610073571,
"grad_norm": 0.33209367748663793,
"learning_rate": 1.1170884035324607e-05,
"loss": 0.0661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034753963351249695,
"step": 4215,
"valid_targets_mean": 3860.5,
"valid_targets_min": 3044
},
{
"epoch": 4.775325410299944,
"grad_norm": 0.3847170268802759,
"learning_rate": 1.1120301560487365e-05,
"loss": 0.0819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02686852589249611,
"step": 4220,
"valid_targets_mean": 2286.4,
"valid_targets_min": 539
},
{
"epoch": 4.780984719864176,
"grad_norm": 0.6034937690417163,
"learning_rate": 1.1069789730945849e-05,
"loss": 0.083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03560284525156021,
"step": 4225,
"valid_targets_mean": 2865.5,
"valid_targets_min": 912
},
{
"epoch": 4.78664402942841,
"grad_norm": 0.6053259730967792,
"learning_rate": 1.1019348948563154e-05,
"loss": 0.0882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04834606498479843,
"step": 4230,
"valid_targets_mean": 2087.4,
"valid_targets_min": 872
},
{
"epoch": 4.792303338992643,
"grad_norm": 0.40623321419478176,
"learning_rate": 1.096897961463714e-05,
"loss": 0.0838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026839591562747955,
"step": 4235,
"valid_targets_mean": 3380.1,
"valid_targets_min": 2254
},
{
"epoch": 4.797962648556876,
"grad_norm": 0.7531250762705376,
"learning_rate": 1.0918682129897244e-05,
"loss": 0.0856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05346660315990448,
"step": 4240,
"valid_targets_mean": 1274.0,
"valid_targets_min": 605
},
{
"epoch": 4.803621958121109,
"grad_norm": 0.4541710056333317,
"learning_rate": 1.0868456894501276e-05,
"loss": 0.0772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044228989630937576,
"step": 4245,
"valid_targets_mean": 2289.0,
"valid_targets_min": 1117
},
{
"epoch": 4.809281267685343,
"grad_norm": 0.48951262028685094,
"learning_rate": 1.0818304308032232e-05,
"loss": 0.1018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03746718168258667,
"step": 4250,
"valid_targets_mean": 3169.9,
"valid_targets_min": 1132
},
{
"epoch": 4.814940577249575,
"grad_norm": 0.4192328688567942,
"learning_rate": 1.0768224769495155e-05,
"loss": 0.0783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028717348352074623,
"step": 4255,
"valid_targets_mean": 2107.4,
"valid_targets_min": 524
},
{
"epoch": 4.820599886813809,
"grad_norm": 0.4462875440845788,
"learning_rate": 1.0718218677313904e-05,
"loss": 0.0726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032722052186727524,
"step": 4260,
"valid_targets_mean": 1705.8,
"valid_targets_min": 516
},
{
"epoch": 4.826259196378042,
"grad_norm": 0.5227401635445773,
"learning_rate": 1.0668286429328015e-05,
"loss": 0.0913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04021327197551727,
"step": 4265,
"valid_targets_mean": 2088.2,
"valid_targets_min": 342
},
{
"epoch": 4.831918505942275,
"grad_norm": 0.37467202581633297,
"learning_rate": 1.0618428422789555e-05,
"loss": 0.0858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035980671644210815,
"step": 4270,
"valid_targets_mean": 3528.1,
"valid_targets_min": 1935
},
{
"epoch": 4.837577815506508,
"grad_norm": 0.5620575705357205,
"learning_rate": 1.0568645054359919e-05,
"loss": 0.0677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029610414057970047,
"step": 4275,
"valid_targets_mean": 1818.2,
"valid_targets_min": 564
},
{
"epoch": 4.8432371250707416,
"grad_norm": 0.35221795133693484,
"learning_rate": 1.051893672010669e-05,
"loss": 0.0779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036343298852443695,
"step": 4280,
"valid_targets_mean": 5238.9,
"valid_targets_min": 3653
},
{
"epoch": 4.848896434634975,
"grad_norm": 0.34385645132118725,
"learning_rate": 1.0469303815500518e-05,
"loss": 0.073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0252225324511528,
"step": 4285,
"valid_targets_mean": 2983.4,
"valid_targets_min": 684
},
{
"epoch": 4.8545557441992075,
"grad_norm": 0.4035843769574735,
"learning_rate": 1.0419746735411922e-05,
"loss": 0.0633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03745335340499878,
"step": 4290,
"valid_targets_mean": 3324.8,
"valid_targets_min": 726
},
{
"epoch": 4.860215053763441,
"grad_norm": 0.3379316891220196,
"learning_rate": 1.037026587410819e-05,
"loss": 0.0873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04062708839774132,
"step": 4295,
"valid_targets_mean": 4154.5,
"valid_targets_min": 3469
},
{
"epoch": 4.8658743633276735,
"grad_norm": 0.5869714625833198,
"learning_rate": 1.032086162525021e-05,
"loss": 0.0974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1502927839756012,
"step": 4300,
"valid_targets_mean": 2561.6,
"valid_targets_min": 1536
},
{
"epoch": 4.871533672891907,
"grad_norm": 0.3806887067815329,
"learning_rate": 1.0271534381889385e-05,
"loss": 0.078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041151951998472214,
"step": 4305,
"valid_targets_mean": 2912.4,
"valid_targets_min": 582
},
{
"epoch": 4.87719298245614,
"grad_norm": 0.3310535788490826,
"learning_rate": 1.0222284536464451e-05,
"loss": 0.0892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026854077354073524,
"step": 4310,
"valid_targets_mean": 3388.5,
"valid_targets_min": 633
},
{
"epoch": 4.882852292020374,
"grad_norm": 0.40632377202265596,
"learning_rate": 1.0173112480798376e-05,
"loss": 0.0988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03150768578052521,
"step": 4315,
"valid_targets_mean": 3263.6,
"valid_targets_min": 1130
},
{
"epoch": 4.888511601584606,
"grad_norm": 0.42612380843339315,
"learning_rate": 1.0124018606095278e-05,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03779520094394684,
"step": 4320,
"valid_targets_mean": 2866.5,
"valid_targets_min": 492
},
{
"epoch": 4.89417091114884,
"grad_norm": 0.6847680115960296,
"learning_rate": 1.0075003302937247e-05,
"loss": 0.0841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05836600810289383,
"step": 4325,
"valid_targets_mean": 2353.8,
"valid_targets_min": 1045
},
{
"epoch": 4.899830220713073,
"grad_norm": 0.3809740597349084,
"learning_rate": 1.0026066961281282e-05,
"loss": 0.0712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025576546788215637,
"step": 4330,
"valid_targets_mean": 3043.9,
"valid_targets_min": 647
},
{
"epoch": 4.905489530277306,
"grad_norm": 0.625831634310936,
"learning_rate": 9.977209970456194e-06,
"loss": 0.1175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0737590566277504,
"step": 4335,
"valid_targets_mean": 2093.0,
"valid_targets_min": 806
},
{
"epoch": 4.911148839841539,
"grad_norm": 0.6263000587819555,
"learning_rate": 9.928432719159475e-06,
"loss": 0.107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041312504559755325,
"step": 4340,
"valid_targets_mean": 1208.8,
"valid_targets_min": 575
},
{
"epoch": 4.916808149405773,
"grad_norm": 0.44496719578733984,
"learning_rate": 9.879735595454232e-06,
"loss": 0.077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03539961576461792,
"step": 4345,
"valid_targets_mean": 3447.5,
"valid_targets_min": 2784
},
{
"epoch": 4.922467458970006,
"grad_norm": 0.37638760798797666,
"learning_rate": 9.831118986766084e-06,
"loss": 0.0768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030857397243380547,
"step": 4350,
"valid_targets_mean": 3721.6,
"valid_targets_min": 2525
},
{
"epoch": 4.928126768534239,
"grad_norm": 0.4266897421917311,
"learning_rate": 9.782583279880096e-06,
"loss": 0.0769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030803639441728592,
"step": 4355,
"valid_targets_mean": 2665.2,
"valid_targets_min": 767
},
{
"epoch": 4.933786078098472,
"grad_norm": 0.46673207366963637,
"learning_rate": 9.734128860937675e-06,
"loss": 0.0688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031016550958156586,
"step": 4360,
"valid_targets_mean": 2277.6,
"valid_targets_min": 870
},
{
"epoch": 4.939445387662705,
"grad_norm": 0.7649765411181526,
"learning_rate": 9.68575611543355e-06,
"loss": 0.0954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05628187209367752,
"step": 4365,
"valid_targets_mean": 1535.8,
"valid_targets_min": 758
},
{
"epoch": 4.945104697226938,
"grad_norm": 0.452703192648749,
"learning_rate": 9.637465428212636e-06,
"loss": 0.068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037448108196258545,
"step": 4370,
"valid_targets_mean": 2024.1,
"valid_targets_min": 797
},
{
"epoch": 4.950764006791172,
"grad_norm": 0.4250155772613219,
"learning_rate": 9.589257183467025e-06,
"loss": 0.0724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034758277237415314,
"step": 4375,
"valid_targets_mean": 3299.5,
"valid_targets_min": 1606
},
{
"epoch": 4.956423316355405,
"grad_norm": 0.5030761530701435,
"learning_rate": 9.541131764732896e-06,
"loss": 0.0743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04057200998067856,
"step": 4380,
"valid_targets_mean": 3055.0,
"valid_targets_min": 678
},
{
"epoch": 4.962082625919638,
"grad_norm": 0.3454890398598417,
"learning_rate": 9.493089554887508e-06,
"loss": 0.0792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037702687084674835,
"step": 4385,
"valid_targets_mean": 4980.6,
"valid_targets_min": 1078
},
{
"epoch": 4.967741935483871,
"grad_norm": 0.3417198049280031,
"learning_rate": 9.445130936146098e-06,
"loss": 0.0696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02648003399372101,
"step": 4390,
"valid_targets_mean": 2680.8,
"valid_targets_min": 706
},
{
"epoch": 4.973401245048104,
"grad_norm": 0.5884179767956441,
"learning_rate": 9.397256290058869e-06,
"loss": 0.0767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048919759690761566,
"step": 4395,
"valid_targets_mean": 1580.4,
"valid_targets_min": 580
},
{
"epoch": 4.979060554612337,
"grad_norm": 0.5496614675946481,
"learning_rate": 9.349465997507974e-06,
"loss": 0.0971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07147332280874252,
"step": 4400,
"valid_targets_mean": 2592.1,
"valid_targets_min": 780
},
{
"epoch": 4.98471986417657,
"grad_norm": 0.3756997485189556,
"learning_rate": 9.301760438704442e-06,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03079824708402157,
"step": 4405,
"valid_targets_mean": 3478.2,
"valid_targets_min": 2861
},
{
"epoch": 4.990379173740804,
"grad_norm": 0.4112393944489124,
"learning_rate": 9.254139993185176e-06,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0403585322201252,
"step": 4410,
"valid_targets_mean": 3846.5,
"valid_targets_min": 2453
},
{
"epoch": 4.996038483305036,
"grad_norm": 0.42208698207818324,
"learning_rate": 9.206605039809955e-06,
"loss": 0.073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04255661368370056,
"step": 4415,
"valid_targets_mean": 3881.8,
"valid_targets_min": 3389
},
{
"epoch": 5.001131861912847,
"grad_norm": 0.7669520907027851,
"learning_rate": 9.159155956758375e-06,
"loss": 0.1219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09069793671369553,
"step": 4420,
"valid_targets_mean": 6935.0,
"valid_targets_min": 5295
},
{
"epoch": 5.006791171477079,
"grad_norm": 0.558900053602927,
"learning_rate": 9.111793121526862e-06,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0958920270204544,
"step": 4425,
"valid_targets_mean": 7672.9,
"valid_targets_min": 5066
},
{
"epoch": 5.012450481041313,
"grad_norm": 0.42971110414210983,
"learning_rate": 9.064516910925698e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0791202113032341,
"step": 4430,
"valid_targets_mean": 7347.6,
"valid_targets_min": 4923
},
{
"epoch": 5.018109790605546,
"grad_norm": 0.424026939483264,
"learning_rate": 9.017327701075965e-06,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07265719771385193,
"step": 4435,
"valid_targets_mean": 5446.8,
"valid_targets_min": 3922
},
{
"epoch": 5.023769100169779,
"grad_norm": 0.3966328657232047,
"learning_rate": 8.970225867406593e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0743541494011879,
"step": 4440,
"valid_targets_mean": 6924.9,
"valid_targets_min": 4797
},
{
"epoch": 5.029428409734012,
"grad_norm": 0.40249258933443416,
"learning_rate": 8.923211784651356e-06,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08096291124820709,
"step": 4445,
"valid_targets_mean": 6443.5,
"valid_targets_min": 3853
},
{
"epoch": 5.035087719298246,
"grad_norm": 0.5019839927447249,
"learning_rate": 8.876285826845918e-06,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0774025097489357,
"step": 4450,
"valid_targets_mean": 5446.5,
"valid_targets_min": 4487
},
{
"epoch": 5.040747028862479,
"grad_norm": 0.41328338470674536,
"learning_rate": 8.82944836732482e-06,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07444000989198685,
"step": 4455,
"valid_targets_mean": 6210.2,
"valid_targets_min": 4137
},
{
"epoch": 5.046406338426712,
"grad_norm": 0.5368670084410287,
"learning_rate": 8.782699778718516e-06,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1226726844906807,
"step": 4460,
"valid_targets_mean": 5404.4,
"valid_targets_min": 698
},
{
"epoch": 5.052065647990945,
"grad_norm": 0.4194795096973056,
"learning_rate": 8.736040432950447e-06,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08990229666233063,
"step": 4465,
"valid_targets_mean": 7197.6,
"valid_targets_min": 4499
},
{
"epoch": 5.057724957555179,
"grad_norm": 0.45155172518626197,
"learning_rate": 8.689470701234037e-06,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10899793356657028,
"step": 4470,
"valid_targets_mean": 5538.4,
"valid_targets_min": 4291
},
{
"epoch": 5.063384267119411,
"grad_norm": 0.3856721196725891,
"learning_rate": 8.642990954069747e-06,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06013498827815056,
"step": 4475,
"valid_targets_mean": 5531.4,
"valid_targets_min": 4050
},
{
"epoch": 5.069043576683645,
"grad_norm": 0.43003600987131757,
"learning_rate": 8.596601561242167e-06,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08636723458766937,
"step": 4480,
"valid_targets_mean": 7526.6,
"valid_targets_min": 5196
},
{
"epoch": 5.074702886247878,
"grad_norm": 0.37505619278492647,
"learning_rate": 8.550302891817015e-06,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0698092132806778,
"step": 4485,
"valid_targets_mean": 6248.9,
"valid_targets_min": 4749
},
{
"epoch": 5.080362195812111,
"grad_norm": 0.4318746906316014,
"learning_rate": 8.50409531413824e-06,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039330024272203445,
"step": 4490,
"valid_targets_mean": 3248.5,
"valid_targets_min": 1908
},
{
"epoch": 5.086021505376344,
"grad_norm": 0.41762584637699307,
"learning_rate": 8.457979195825076e-06,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.070592001080513,
"step": 4495,
"valid_targets_mean": 6225.6,
"valid_targets_min": 4808
},
{
"epoch": 5.0916808149405774,
"grad_norm": 0.4025616969393729,
"learning_rate": 8.411954903769145e-06,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0751720666885376,
"step": 4500,
"valid_targets_mean": 5383.0,
"valid_targets_min": 3774
},
{
"epoch": 5.09734012450481,
"grad_norm": 0.4221341874106493,
"learning_rate": 8.366022804131487e-06,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07378105074167252,
"step": 4505,
"valid_targets_mean": 6291.4,
"valid_targets_min": 5335
},
{
"epoch": 5.102999434069043,
"grad_norm": 0.3829917137612727,
"learning_rate": 8.320183262339686e-06,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07340899109840393,
"step": 4510,
"valid_targets_mean": 7749.1,
"valid_targets_min": 6205
},
{
"epoch": 5.108658743633277,
"grad_norm": 0.3805013608286788,
"learning_rate": 8.274436643084962e-06,
"loss": 0.1382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0707998052239418,
"step": 4515,
"valid_targets_mean": 6882.1,
"valid_targets_min": 4428
},
{
"epoch": 5.11431805319751,
"grad_norm": 0.48028126526368026,
"learning_rate": 8.228783310319248e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07884474098682404,
"step": 4520,
"valid_targets_mean": 5751.8,
"valid_targets_min": 4458
},
{
"epoch": 5.119977362761743,
"grad_norm": 0.3926095512807884,
"learning_rate": 8.183223627252305e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06521456688642502,
"step": 4525,
"valid_targets_mean": 6003.9,
"valid_targets_min": 4458
},
{
"epoch": 5.125636672325976,
"grad_norm": 0.4181977204631873,
"learning_rate": 8.137757956348854e-06,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06609899550676346,
"step": 4530,
"valid_targets_mean": 6033.8,
"valid_targets_min": 4066
},
{
"epoch": 5.13129598189021,
"grad_norm": 0.46323510844564697,
"learning_rate": 8.092386659325644e-06,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08222903311252594,
"step": 4535,
"valid_targets_mean": 6601.0,
"valid_targets_min": 4708
},
{
"epoch": 5.136955291454442,
"grad_norm": 0.4315489667874819,
"learning_rate": 8.047110097148618e-06,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08429074287414551,
"step": 4540,
"valid_targets_mean": 6092.1,
"valid_targets_min": 4789
},
{
"epoch": 5.142614601018676,
"grad_norm": 0.42567220761721475,
"learning_rate": 8.001928630030017e-06,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08571913838386536,
"step": 4545,
"valid_targets_mean": 6474.6,
"valid_targets_min": 4224
},
{
"epoch": 5.148273910582909,
"grad_norm": 0.41413321611049403,
"learning_rate": 7.95684261742554e-06,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08004915714263916,
"step": 4550,
"valid_targets_mean": 6312.4,
"valid_targets_min": 4617
},
{
"epoch": 5.153933220147142,
"grad_norm": 0.4071549037169186,
"learning_rate": 7.911852418031449e-06,
"loss": 0.1495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0771443247795105,
"step": 4555,
"valid_targets_mean": 6333.8,
"valid_targets_min": 4783
},
{
"epoch": 5.159592529711375,
"grad_norm": 0.40644763519175936,
"learning_rate": 7.866958389781736e-06,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07742355763912201,
"step": 4560,
"valid_targets_mean": 7380.1,
"valid_targets_min": 6020
},
{
"epoch": 5.165251839275609,
"grad_norm": 0.4306799765061804,
"learning_rate": 7.822160889845286e-06,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08144442737102509,
"step": 4565,
"valid_targets_mean": 6009.0,
"valid_targets_min": 3049
},
{
"epoch": 5.170911148839841,
"grad_norm": 0.41741532189159075,
"learning_rate": 7.777460274623005e-06,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07007598876953125,
"step": 4570,
"valid_targets_mean": 5973.1,
"valid_targets_min": 4822
},
{
"epoch": 5.176570458404075,
"grad_norm": 0.4294904406202204,
"learning_rate": 7.732856899745003e-06,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07263119518756866,
"step": 4575,
"valid_targets_mean": 5754.9,
"valid_targets_min": 2910
},
{
"epoch": 5.182229767968308,
"grad_norm": 0.44380956966564805,
"learning_rate": 7.688351120067781e-06,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08814549446105957,
"step": 4580,
"valid_targets_mean": 6414.6,
"valid_targets_min": 4791
},
{
"epoch": 5.187889077532541,
"grad_norm": 0.4526826853647187,
"learning_rate": 7.643943289671374e-06,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07937498390674591,
"step": 4585,
"valid_targets_mean": 5675.9,
"valid_targets_min": 3983
},
{
"epoch": 5.193548387096774,
"grad_norm": 0.3578771225498125,
"learning_rate": 7.599633761856542e-06,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06336264312267303,
"step": 4590,
"valid_targets_mean": 6975.5,
"valid_targets_min": 4383
},
{
"epoch": 5.1992076966610075,
"grad_norm": 0.3907734003361043,
"learning_rate": 7.555422889141997e-06,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.073424331843853,
"step": 4595,
"valid_targets_mean": 6417.1,
"valid_targets_min": 3182
},
{
"epoch": 5.204867006225241,
"grad_norm": 0.4311567298480243,
"learning_rate": 7.51131102326154e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0849514901638031,
"step": 4600,
"valid_targets_mean": 6218.6,
"valid_targets_min": 5077
},
{
"epoch": 5.2105263157894735,
"grad_norm": 0.4696685522510483,
"learning_rate": 7.467298515161305e-06,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0753907635807991,
"step": 4605,
"valid_targets_mean": 4774.9,
"valid_targets_min": 3663
},
{
"epoch": 5.216185625353707,
"grad_norm": 0.41679582330020365,
"learning_rate": 7.423385714996942e-06,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07688593864440918,
"step": 4610,
"valid_targets_mean": 6316.8,
"valid_targets_min": 4105
},
{
"epoch": 5.22184493491794,
"grad_norm": 0.4005301809886344,
"learning_rate": 7.379572972130864e-06,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06853274255990982,
"step": 4615,
"valid_targets_mean": 6528.9,
"valid_targets_min": 4537
},
{
"epoch": 5.227504244482173,
"grad_norm": 0.4028892173858166,
"learning_rate": 7.335860635129426e-06,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06940186023712158,
"step": 4620,
"valid_targets_mean": 6416.8,
"valid_targets_min": 2494
},
{
"epoch": 5.233163554046406,
"grad_norm": 0.40156406656775434,
"learning_rate": 7.292249051760169e-06,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0779690071940422,
"step": 4625,
"valid_targets_mean": 6070.9,
"valid_targets_min": 4921
},
{
"epoch": 5.23882286361064,
"grad_norm": 0.4027854588002,
"learning_rate": 7.2487385689890845e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0822412520647049,
"step": 4630,
"valid_targets_mean": 6701.4,
"valid_targets_min": 5285
},
{
"epoch": 5.244482173174872,
"grad_norm": 0.42468145589722883,
"learning_rate": 7.205329532977794e-06,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0705537348985672,
"step": 4635,
"valid_targets_mean": 6273.9,
"valid_targets_min": 4464
},
{
"epoch": 5.250141482739106,
"grad_norm": 0.45132048278659165,
"learning_rate": 7.162022289080837e-06,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06876321882009506,
"step": 4640,
"valid_targets_mean": 5554.8,
"valid_targets_min": 4439
},
{
"epoch": 5.255800792303339,
"grad_norm": 0.41803966931151526,
"learning_rate": 7.1188171818429256e-06,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06165836751461029,
"step": 4645,
"valid_targets_mean": 6043.0,
"valid_targets_min": 4686
},
{
"epoch": 5.261460101867572,
"grad_norm": 0.440878055574104,
"learning_rate": 7.075714554996176e-06,
"loss": 0.129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06370429694652557,
"step": 4650,
"valid_targets_mean": 5912.5,
"valid_targets_min": 3381
},
{
"epoch": 5.267119411431805,
"grad_norm": 0.612073574059755,
"learning_rate": 7.032714751457395e-06,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06927108019590378,
"step": 4655,
"valid_targets_mean": 6495.5,
"valid_targets_min": 5309
},
{
"epoch": 5.272778720996039,
"grad_norm": 0.4251949566082133,
"learning_rate": 6.989818113325333e-06,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07870665192604065,
"step": 4660,
"valid_targets_mean": 6483.9,
"valid_targets_min": 5161
},
{
"epoch": 5.278438030560272,
"grad_norm": 0.4438435905888869,
"learning_rate": 6.947024981878001e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07518930733203888,
"step": 4665,
"valid_targets_mean": 5958.9,
"valid_targets_min": 4666
},
{
"epoch": 5.284097340124505,
"grad_norm": 0.5827403553757994,
"learning_rate": 6.904335697569909e-06,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09826524555683136,
"step": 4670,
"valid_targets_mean": 1691.5,
"valid_targets_min": 1440
},
{
"epoch": 5.289756649688738,
"grad_norm": 0.4333512080117021,
"learning_rate": 6.861750600029373e-06,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06576051563024521,
"step": 4675,
"valid_targets_mean": 5299.1,
"valid_targets_min": 4547
},
{
"epoch": 5.2954159592529715,
"grad_norm": 0.4298304067134876,
"learning_rate": 6.819270028055844e-06,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07609501481056213,
"step": 4680,
"valid_targets_mean": 6003.5,
"valid_targets_min": 5031
},
{
"epoch": 5.301075268817204,
"grad_norm": 0.434080083592628,
"learning_rate": 6.776894319617162e-06,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06977563351392746,
"step": 4685,
"valid_targets_mean": 8169.6,
"valid_targets_min": 5487
},
{
"epoch": 5.3067345783814375,
"grad_norm": 0.4234596055091472,
"learning_rate": 6.73462381184689e-06,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0698070153594017,
"step": 4690,
"valid_targets_mean": 6474.9,
"valid_targets_min": 4253
},
{
"epoch": 5.312393887945671,
"grad_norm": 0.4227309069414161,
"learning_rate": 6.6924588410416604e-06,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08599575608968735,
"step": 4695,
"valid_targets_mean": 7021.0,
"valid_targets_min": 4990
},
{
"epoch": 5.3180531975099035,
"grad_norm": 0.4433300308692838,
"learning_rate": 6.650399742658442e-06,
"loss": 0.1495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08826185762882233,
"step": 4700,
"valid_targets_mean": 6356.0,
"valid_targets_min": 4385
},
{
"epoch": 5.323712507074137,
"grad_norm": 0.38772347681595304,
"learning_rate": 6.608446851311918e-06,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08048726618289948,
"step": 4705,
"valid_targets_mean": 6815.1,
"valid_targets_min": 5164
},
{
"epoch": 5.32937181663837,
"grad_norm": 0.40251172074444747,
"learning_rate": 6.566600500771796e-06,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05604606121778488,
"step": 4710,
"valid_targets_mean": 5588.5,
"valid_targets_min": 4098
},
{
"epoch": 5.335031126202603,
"grad_norm": 0.41678126626964224,
"learning_rate": 6.524861023960185e-06,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07454540580511093,
"step": 4715,
"valid_targets_mean": 6167.6,
"valid_targets_min": 4801
},
{
"epoch": 5.340690435766836,
"grad_norm": 0.45099069972017347,
"learning_rate": 6.483228752948902e-06,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18380106985569,
"step": 4720,
"valid_targets_mean": 6224.9,
"valid_targets_min": 4772
},
{
"epoch": 5.34634974533107,
"grad_norm": 0.44008724009186123,
"learning_rate": 6.441704018956858e-06,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08497292548418045,
"step": 4725,
"valid_targets_mean": 6549.2,
"valid_targets_min": 5025
},
{
"epoch": 5.352009054895303,
"grad_norm": 0.5276958180485326,
"learning_rate": 6.400287152347442e-06,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0843924731016159,
"step": 4730,
"valid_targets_mean": 6680.8,
"valid_targets_min": 4818
},
{
"epoch": 5.357668364459536,
"grad_norm": 0.46757375166774123,
"learning_rate": 6.35897848262584e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0748303085565567,
"step": 4735,
"valid_targets_mean": 5835.1,
"valid_targets_min": 4111
},
{
"epoch": 5.363327674023769,
"grad_norm": 0.42048683370736745,
"learning_rate": 6.317778338436449e-06,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07209735363721848,
"step": 4740,
"valid_targets_mean": 7029.9,
"valid_targets_min": 2275
},
{
"epoch": 5.368986983588003,
"grad_norm": 0.41548903650378316,
"learning_rate": 6.276687047560275e-06,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06418467313051224,
"step": 4745,
"valid_targets_mean": 5621.2,
"valid_targets_min": 4826
},
{
"epoch": 5.374646293152235,
"grad_norm": 0.4009641412548776,
"learning_rate": 6.235704936912288e-06,
"loss": 0.1436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06733281910419464,
"step": 4750,
"valid_targets_mean": 6858.8,
"valid_targets_min": 4710
},
{
"epoch": 5.380305602716469,
"grad_norm": 0.4058686462438823,
"learning_rate": 6.194832332538838e-06,
"loss": 0.1362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10353972017765045,
"step": 4755,
"valid_targets_mean": 7012.5,
"valid_targets_min": 5421
},
{
"epoch": 5.385964912280702,
"grad_norm": 0.4080275617258039,
"learning_rate": 6.154069559615081e-06,
"loss": 0.1408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06577767431735992,
"step": 4760,
"valid_targets_mean": 6967.6,
"valid_targets_min": 4949
},
{
"epoch": 5.391624221844935,
"grad_norm": 0.38798007962489367,
"learning_rate": 6.113416942442358e-06,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07223743200302124,
"step": 4765,
"valid_targets_mean": 6348.5,
"valid_targets_min": 4831
},
{
"epoch": 5.397283531409168,
"grad_norm": 0.4311691528295395,
"learning_rate": 6.072874804445632e-06,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09179031848907471,
"step": 4770,
"valid_targets_mean": 6597.2,
"valid_targets_min": 4018
},
{
"epoch": 5.4029428409734015,
"grad_norm": 0.3467602354311775,
"learning_rate": 6.032443468170912e-06,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051479682326316833,
"step": 4775,
"valid_targets_mean": 6420.9,
"valid_targets_min": 5034
},
{
"epoch": 5.408602150537634,
"grad_norm": 0.41667026215499137,
"learning_rate": 5.992123255282702e-06,
"loss": 0.1414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08383023738861084,
"step": 4780,
"valid_targets_mean": 6962.4,
"valid_targets_min": 5442
},
{
"epoch": 5.4142614601018675,
"grad_norm": 0.4802376377588568,
"learning_rate": 5.951914486561417e-06,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07770697772502899,
"step": 4785,
"valid_targets_mean": 5610.9,
"valid_targets_min": 4609
},
{
"epoch": 5.419920769666101,
"grad_norm": 0.4589664164147789,
"learning_rate": 5.911817481900832e-06,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07419160008430481,
"step": 4790,
"valid_targets_mean": 5038.4,
"valid_targets_min": 2301
},
{
"epoch": 5.425580079230334,
"grad_norm": 0.5730477242441706,
"learning_rate": 5.871832560305573e-06,
"loss": 0.127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0763842836022377,
"step": 4795,
"valid_targets_mean": 1449.8,
"valid_targets_min": 363
},
{
"epoch": 5.431239388794567,
"grad_norm": 0.38431554670090246,
"learning_rate": 5.831960039888533e-06,
"loss": 0.0822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04814344644546509,
"step": 4800,
"valid_targets_mean": 3729.8,
"valid_targets_min": 3074
},
{
"epoch": 5.4368986983588,
"grad_norm": 0.42804624601009617,
"learning_rate": 5.792200237868361e-06,
"loss": 0.0748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04012545943260193,
"step": 4805,
"valid_targets_mean": 2272.8,
"valid_targets_min": 700
},
{
"epoch": 5.442558007923034,
"grad_norm": 0.47429604453716917,
"learning_rate": 5.752553470566957e-06,
"loss": 0.0804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03822815418243408,
"step": 4810,
"valid_targets_mean": 2997.5,
"valid_targets_min": 803
},
{
"epoch": 5.448217317487266,
"grad_norm": 0.47494590604900366,
"learning_rate": 5.713020053406917e-06,
"loss": 0.0738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04123368859291077,
"step": 4815,
"valid_targets_mean": 2655.5,
"valid_targets_min": 920
},
{
"epoch": 5.4538766270515,
"grad_norm": 0.432653492711929,
"learning_rate": 5.673600300909053e-06,
"loss": 0.0787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04253911226987839,
"step": 4820,
"valid_targets_mean": 3263.8,
"valid_targets_min": 806
},
{
"epoch": 5.459535936615733,
"grad_norm": 0.7187022007851978,
"learning_rate": 5.634294526689872e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06496002525091171,
"step": 4825,
"valid_targets_mean": 1644.4,
"valid_targets_min": 718
},
{
"epoch": 5.465195246179966,
"grad_norm": 0.4211215979416941,
"learning_rate": 5.595103043459109e-06,
"loss": 0.0868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043419234454631805,
"step": 4830,
"valid_targets_mean": 3399.4,
"valid_targets_min": 1133
},
{
"epoch": 5.470854555744199,
"grad_norm": 0.4693753835767023,
"learning_rate": 5.556026163017205e-06,
"loss": 0.0849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035194315016269684,
"step": 4835,
"valid_targets_mean": 1808.9,
"valid_targets_min": 859
},
{
"epoch": 5.476513865308433,
"grad_norm": 0.27086846723671243,
"learning_rate": 5.517064196252837e-06,
"loss": 0.1077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023684551939368248,
"step": 4840,
"valid_targets_mean": 5541.4,
"valid_targets_min": 5150
},
{
"epoch": 5.482173174872665,
"grad_norm": 0.48126645790976275,
"learning_rate": 5.478217453140471e-06,
"loss": 0.0683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04665878415107727,
"step": 4845,
"valid_targets_mean": 4000.1,
"valid_targets_min": 502
},
{
"epoch": 5.487832484436899,
"grad_norm": 0.3917605803512901,
"learning_rate": 5.439486242737855e-06,
"loss": 0.0734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043694302439689636,
"step": 4850,
"valid_targets_mean": 3906.9,
"valid_targets_min": 600
},
{
"epoch": 5.493491794001132,
"grad_norm": 0.39241086936632663,
"learning_rate": 5.400870873183583e-06,
"loss": 0.071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03243585675954819,
"step": 4855,
"valid_targets_mean": 2979.5,
"valid_targets_min": 518
},
{
"epoch": 5.499151103565365,
"grad_norm": 0.43406960946047696,
"learning_rate": 5.362371651694647e-06,
"loss": 0.1167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04233259707689285,
"step": 4860,
"valid_targets_mean": 3522.5,
"valid_targets_min": 549
},
{
"epoch": 5.504810413129598,
"grad_norm": 0.3572759598808805,
"learning_rate": 5.323988884563975e-06,
"loss": 0.0659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02906729094684124,
"step": 4865,
"valid_targets_mean": 3878.5,
"valid_targets_min": 3170
},
{
"epoch": 5.5104697226938315,
"grad_norm": 0.5208358787040975,
"learning_rate": 5.2857228771580105e-06,
"loss": 0.0794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04582788050174713,
"step": 4870,
"valid_targets_mean": 1656.0,
"valid_targets_min": 644
},
{
"epoch": 5.516129032258064,
"grad_norm": 0.3326607206725967,
"learning_rate": 5.247573933914285e-06,
"loss": 0.0604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020800217986106873,
"step": 4875,
"valid_targets_mean": 2891.8,
"valid_targets_min": 720
},
{
"epoch": 5.5217883418222975,
"grad_norm": 0.4923417370395899,
"learning_rate": 5.20954235833898e-06,
"loss": 0.08,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030622247606515884,
"step": 4880,
"valid_targets_mean": 1775.6,
"valid_targets_min": 516
},
{
"epoch": 5.527447651386531,
"grad_norm": 0.5285695399568121,
"learning_rate": 5.171628453004512e-06,
"loss": 0.0823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05061523616313934,
"step": 4885,
"valid_targets_mean": 2018.6,
"valid_targets_min": 557
},
{
"epoch": 5.533106960950764,
"grad_norm": 0.5460414179629879,
"learning_rate": 5.133832519547155e-06,
"loss": 0.0849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04757304489612579,
"step": 4890,
"valid_targets_mean": 3398.1,
"valid_targets_min": 1086
},
{
"epoch": 5.538766270514997,
"grad_norm": 0.4886522424962672,
"learning_rate": 5.096154858664608e-06,
"loss": 0.0832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04523239657282829,
"step": 4895,
"valid_targets_mean": 2532.9,
"valid_targets_min": 1008
},
{
"epoch": 5.54442558007923,
"grad_norm": 0.498231032412165,
"learning_rate": 5.058595770113606e-06,
"loss": 0.121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03225970268249512,
"step": 4900,
"valid_targets_mean": 3481.1,
"valid_targets_min": 2756
},
{
"epoch": 5.550084889643464,
"grad_norm": 0.34825050975154626,
"learning_rate": 5.0211555527075664e-06,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03134623169898987,
"step": 4905,
"valid_targets_mean": 4113.5,
"valid_targets_min": 3798
},
{
"epoch": 5.555744199207696,
"grad_norm": 0.8345018317724164,
"learning_rate": 4.9838345043141665e-06,
"loss": 0.0851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07340296357870102,
"step": 4910,
"valid_targets_mean": 1058.6,
"valid_targets_min": 598
},
{
"epoch": 5.56140350877193,
"grad_norm": 0.4594410538877418,
"learning_rate": 4.946632921853009e-06,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030109558254480362,
"step": 4915,
"valid_targets_mean": 2403.5,
"valid_targets_min": 754
},
{
"epoch": 5.567062818336163,
"grad_norm": 0.4270637822659359,
"learning_rate": 4.909551101293238e-06,
"loss": 0.0862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03934195637702942,
"step": 4920,
"valid_targets_mean": 4045.8,
"valid_targets_min": 3390
},
{
"epoch": 5.572722127900396,
"grad_norm": 0.6800143738685122,
"learning_rate": 4.872589337651208e-06,
"loss": 0.1131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13332173228263855,
"step": 4925,
"valid_targets_mean": 2255.9,
"valid_targets_min": 1052
},
{
"epoch": 5.578381437464629,
"grad_norm": 0.5031406060454691,
"learning_rate": 4.835747924988105e-06,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0451483353972435,
"step": 4930,
"valid_targets_mean": 3214.0,
"valid_targets_min": 2176
},
{
"epoch": 5.584040747028863,
"grad_norm": 0.4795250100183131,
"learning_rate": 4.799027156407632e-06,
"loss": 0.0831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038113273680210114,
"step": 4935,
"valid_targets_mean": 2396.0,
"valid_targets_min": 1074
},
{
"epoch": 5.589700056593095,
"grad_norm": 0.4549673328264594,
"learning_rate": 4.7624273240536756e-06,
"loss": 0.0857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04130017012357712,
"step": 4940,
"valid_targets_mean": 3271.8,
"valid_targets_min": 1212
},
{
"epoch": 5.595359366157329,
"grad_norm": 0.48797530904109687,
"learning_rate": 4.725948719107965e-06,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049380846321582794,
"step": 4945,
"valid_targets_mean": 3990.8,
"valid_targets_min": 2258
},
{
"epoch": 5.601018675721562,
"grad_norm": 0.34295461979365804,
"learning_rate": 4.6895916317877624e-06,
"loss": 0.0666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047332584857940674,
"step": 4950,
"valid_targets_mean": 3730.2,
"valid_targets_min": 1466
},
{
"epoch": 5.6066779852857955,
"grad_norm": 0.3693165572830921,
"learning_rate": 4.653356351343577e-06,
"loss": 0.0804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03545898199081421,
"step": 4955,
"valid_targets_mean": 3557.1,
"valid_targets_min": 560
},
{
"epoch": 5.612337294850028,
"grad_norm": 0.45760123311509754,
"learning_rate": 4.617243166056826e-06,
"loss": 0.0831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04132983461022377,
"step": 4960,
"valid_targets_mean": 3222.9,
"valid_targets_min": 1189
},
{
"epoch": 5.6179966044142615,
"grad_norm": 0.38183081000487035,
"learning_rate": 4.581252363237567e-06,
"loss": 0.069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03381497412919998,
"step": 4965,
"valid_targets_mean": 3665.2,
"valid_targets_min": 2257
},
{
"epoch": 5.623655913978495,
"grad_norm": 0.385036821503619,
"learning_rate": 4.545384229222196e-06,
"loss": 0.0679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028356987982988358,
"step": 4970,
"valid_targets_mean": 3314.4,
"valid_targets_min": 886
},
{
"epoch": 5.6293152235427275,
"grad_norm": 0.4014468518014719,
"learning_rate": 4.509639049371193e-06,
"loss": 0.0722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03628263995051384,
"step": 4975,
"valid_targets_mean": 3377.5,
"valid_targets_min": 2409
},
{
"epoch": 5.634974533106961,
"grad_norm": 0.401897256250637,
"learning_rate": 4.474017108066828e-06,
"loss": 0.0668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03104272112250328,
"step": 4980,
"valid_targets_mean": 3241.8,
"valid_targets_min": 820
},
{
"epoch": 5.640633842671194,
"grad_norm": 0.6805433850912309,
"learning_rate": 4.438518688710898e-06,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08667178452014923,
"step": 4985,
"valid_targets_mean": 2264.2,
"valid_targets_min": 813
},
{
"epoch": 5.646293152235427,
"grad_norm": 0.366707828447475,
"learning_rate": 4.403144073722501e-06,
"loss": 0.0626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02789473347365856,
"step": 4990,
"valid_targets_mean": 3651.9,
"valid_targets_min": 2877
},
{
"epoch": 5.65195246179966,
"grad_norm": 0.5065193268802206,
"learning_rate": 4.367893544535757e-06,
"loss": 0.0625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039443302899599075,
"step": 4995,
"valid_targets_mean": 2384.0,
"valid_targets_min": 667
},
{
"epoch": 5.657611771363894,
"grad_norm": 0.38590017909105073,
"learning_rate": 4.332767381597575e-06,
"loss": 0.0615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029201095923781395,
"step": 5000,
"valid_targets_mean": 3488.6,
"valid_targets_min": 2353
},
{
"epoch": 5.663271080928126,
"grad_norm": 0.40972454629192384,
"learning_rate": 4.297765864365453e-06,
"loss": 0.0647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039309754967689514,
"step": 5005,
"valid_targets_mean": 3189.9,
"valid_targets_min": 549
},
{
"epoch": 5.66893039049236,
"grad_norm": 0.42666806283297,
"learning_rate": 4.262889271305204e-06,
"loss": 0.1096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0314299650490284,
"step": 5010,
"valid_targets_mean": 3826.5,
"valid_targets_min": 3340
},
{
"epoch": 5.674589700056593,
"grad_norm": 0.5179962988049834,
"learning_rate": 4.228137879888774e-06,
"loss": 0.0926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05188950523734093,
"step": 5015,
"valid_targets_mean": 2178.2,
"valid_targets_min": 647
},
{
"epoch": 5.680249009620827,
"grad_norm": 0.4970353043681172,
"learning_rate": 4.193511966592041e-06,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04057688266038895,
"step": 5020,
"valid_targets_mean": 1558.9,
"valid_targets_min": 804
},
{
"epoch": 5.685908319185059,
"grad_norm": 0.7646762922675957,
"learning_rate": 4.1590118068925815e-06,
"loss": 0.0911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08557213842868805,
"step": 5025,
"valid_targets_mean": 1855.1,
"valid_targets_min": 702
},
{
"epoch": 5.691567628749293,
"grad_norm": 0.5384667166461213,
"learning_rate": 4.124637675267511e-06,
"loss": 0.1086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05332893133163452,
"step": 5030,
"valid_targets_mean": 2858.1,
"valid_targets_min": 945
},
{
"epoch": 5.697226938313526,
"grad_norm": 0.5288805198191306,
"learning_rate": 4.090389845191278e-06,
"loss": 0.0774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049206458032131195,
"step": 5035,
"valid_targets_mean": 2879.5,
"valid_targets_min": 703
},
{
"epoch": 5.702886247877759,
"grad_norm": 0.5414207861579454,
"learning_rate": 4.056268589133516e-06,
"loss": 0.095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038104280829429626,
"step": 5040,
"valid_targets_mean": 3950.5,
"valid_targets_min": 3051
},
{
"epoch": 5.708545557441992,
"grad_norm": 0.5739872667001847,
"learning_rate": 4.022274178556844e-06,
"loss": 0.0772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05831873416900635,
"step": 5045,
"valid_targets_mean": 1759.8,
"valid_targets_min": 523
},
{
"epoch": 5.7142048670062255,
"grad_norm": 0.3871279428177479,
"learning_rate": 3.988406883914717e-06,
"loss": 0.0696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03543112799525261,
"step": 5050,
"valid_targets_mean": 2138.2,
"valid_targets_min": 468
},
{
"epoch": 5.719864176570458,
"grad_norm": 0.29274510999762493,
"learning_rate": 3.954666974649295e-06,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021055569872260094,
"step": 5055,
"valid_targets_mean": 4428.1,
"valid_targets_min": 885
},
{
"epoch": 5.7255234861346915,
"grad_norm": 0.3924485471902587,
"learning_rate": 3.921054719189272e-06,
"loss": 0.0679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025709647685289383,
"step": 5060,
"valid_targets_mean": 2478.5,
"valid_targets_min": 546
},
{
"epoch": 5.731182795698925,
"grad_norm": 0.3937628507775362,
"learning_rate": 3.887570384947745e-06,
"loss": 0.0657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03667730838060379,
"step": 5065,
"valid_targets_mean": 3910.5,
"valid_targets_min": 981
},
{
"epoch": 5.7368421052631575,
"grad_norm": 0.5433030872476484,
"learning_rate": 3.854214238320109e-06,
"loss": 0.0783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04392950236797333,
"step": 5070,
"valid_targets_mean": 1519.9,
"valid_targets_min": 697
},
{
"epoch": 5.742501414827391,
"grad_norm": 0.43220977807356675,
"learning_rate": 3.8209865446819105e-06,
"loss": 0.0818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03852108120918274,
"step": 5075,
"valid_targets_mean": 3473.4,
"valid_targets_min": 2777
},
{
"epoch": 5.748160724391624,
"grad_norm": 0.44530962837687676,
"learning_rate": 3.7878875683867476e-06,
"loss": 0.0845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042130667716264725,
"step": 5080,
"valid_targets_mean": 3932.4,
"valid_targets_min": 3061
},
{
"epoch": 5.753820033955858,
"grad_norm": 0.3694916026913543,
"learning_rate": 3.7549175727641606e-06,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03624318540096283,
"step": 5085,
"valid_targets_mean": 2882.2,
"valid_targets_min": 868
},
{
"epoch": 5.75947934352009,
"grad_norm": 0.4227025192070278,
"learning_rate": 3.7220768201175615e-06,
"loss": 0.0718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03077586367726326,
"step": 5090,
"valid_targets_mean": 2506.6,
"valid_targets_min": 752
},
{
"epoch": 5.765138653084324,
"grad_norm": 0.41725972794779176,
"learning_rate": 3.689365571722112e-06,
"loss": 0.0798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03431401774287224,
"step": 5095,
"valid_targets_mean": 3418.9,
"valid_targets_min": 1141
},
{
"epoch": 5.770797962648556,
"grad_norm": 0.3500677147973765,
"learning_rate": 3.6567840878226577e-06,
"loss": 0.0592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03257271274924278,
"step": 5100,
"valid_targets_mean": 3901.2,
"valid_targets_min": 3540
},
{
"epoch": 5.77645727221279,
"grad_norm": 0.43941140678159996,
"learning_rate": 3.624332627631679e-06,
"loss": 0.0763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030285216867923737,
"step": 5105,
"valid_targets_mean": 2808.2,
"valid_targets_min": 773
},
{
"epoch": 5.782116581777023,
"grad_norm": 0.42014420275176356,
"learning_rate": 3.5920114493271974e-06,
"loss": 0.0745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025668412446975708,
"step": 5110,
"valid_targets_mean": 3550.5,
"valid_targets_min": 2587
},
{
"epoch": 5.787775891341257,
"grad_norm": 0.4385807667884832,
"learning_rate": 3.5598208100507314e-06,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034961722791194916,
"step": 5115,
"valid_targets_mean": 2700.6,
"valid_targets_min": 773
},
{
"epoch": 5.793435200905489,
"grad_norm": 0.5285363614611225,
"learning_rate": 3.5277609659052712e-06,
"loss": 0.0754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037699900567531586,
"step": 5120,
"valid_targets_mean": 3615.9,
"valid_targets_min": 2962
},
{
"epoch": 5.799094510469723,
"grad_norm": 0.6519064391093398,
"learning_rate": 3.4958321719532106e-06,
"loss": 0.0807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04379285126924515,
"step": 5125,
"valid_targets_mean": 1766.6,
"valid_targets_min": 649
},
{
"epoch": 5.804753820033956,
"grad_norm": 0.6115661117657148,
"learning_rate": 3.4640346822143324e-06,
"loss": 0.0763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0414419025182724,
"step": 5130,
"valid_targets_mean": 1668.4,
"valid_targets_min": 708
},
{
"epoch": 5.810413129598189,
"grad_norm": 0.4643873227865667,
"learning_rate": 3.4323687496637837e-06,
"loss": 0.0834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032500360161066055,
"step": 5135,
"valid_targets_mean": 2129.5,
"valid_targets_min": 617
},
{
"epoch": 5.816072439162422,
"grad_norm": 0.518654839110181,
"learning_rate": 3.4008346262300852e-06,
"loss": 0.0748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03613649681210518,
"step": 5140,
"valid_targets_mean": 2495.0,
"valid_targets_min": 720
},
{
"epoch": 5.8217317487266556,
"grad_norm": 0.6468513014194476,
"learning_rate": 3.3694325627930846e-06,
"loss": 0.0674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04318820685148239,
"step": 5145,
"valid_targets_mean": 1537.8,
"valid_targets_min": 628
},
{
"epoch": 5.827391058290889,
"grad_norm": 0.6398866548133438,
"learning_rate": 3.3381628091819907e-06,
"loss": 0.0877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06686189025640488,
"step": 5150,
"valid_targets_mean": 2155.2,
"valid_targets_min": 821
},
{
"epoch": 5.8330503678551215,
"grad_norm": 0.36439329813722365,
"learning_rate": 3.3070256141733913e-06,
"loss": 0.0668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020443886518478394,
"step": 5155,
"valid_targets_mean": 3628.1,
"valid_targets_min": 2863
},
{
"epoch": 5.838709677419355,
"grad_norm": 0.39380579851082065,
"learning_rate": 3.2760212254892453e-06,
"loss": 0.0663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027335772290825844,
"step": 5160,
"valid_targets_mean": 3585.2,
"valid_targets_min": 1773
},
{
"epoch": 5.8443689869835875,
"grad_norm": 0.514279348342231,
"learning_rate": 3.245149889794932e-06,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04034529626369476,
"step": 5165,
"valid_targets_mean": 2356.6,
"valid_targets_min": 721
},
{
"epoch": 5.850028296547821,
"grad_norm": 0.39588532237902196,
"learning_rate": 3.2144118526972943e-06,
"loss": 0.0609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03888987377285957,
"step": 5170,
"valid_targets_mean": 5092.5,
"valid_targets_min": 4222
},
{
"epoch": 5.855687606112054,
"grad_norm": 0.465672567676084,
"learning_rate": 3.1838073587426676e-06,
"loss": 0.0612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03602100908756256,
"step": 5175,
"valid_targets_mean": 4604.0,
"valid_targets_min": 2020
},
{
"epoch": 5.861346915676288,
"grad_norm": 0.3756373975254779,
"learning_rate": 3.153336651414933e-06,
"loss": 0.079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027616024017333984,
"step": 5180,
"valid_targets_mean": 3097.9,
"valid_targets_min": 739
},
{
"epoch": 5.86700622524052,
"grad_norm": 0.4149497449655576,
"learning_rate": 3.1229999731336137e-06,
"loss": 0.0941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03883051872253418,
"step": 5185,
"valid_targets_mean": 3696.1,
"valid_targets_min": 2945
},
{
"epoch": 5.872665534804754,
"grad_norm": 0.3979753959226805,
"learning_rate": 3.0927975652518994e-06,
"loss": 0.0713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04112917184829712,
"step": 5190,
"valid_targets_mean": 3112.8,
"valid_targets_min": 704
},
{
"epoch": 5.878324844368987,
"grad_norm": 0.4099255400951427,
"learning_rate": 3.062729668054756e-06,
"loss": 0.0797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032986707985401154,
"step": 5195,
"valid_targets_mean": 2490.9,
"valid_targets_min": 774
},
{
"epoch": 5.88398415393322,
"grad_norm": 0.3941404199714783,
"learning_rate": 3.032796520757002e-06,
"loss": 0.0904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026263339444994926,
"step": 5200,
"valid_targets_mean": 2570.2,
"valid_targets_min": 485
},
{
"epoch": 5.889643463497453,
"grad_norm": 0.4427560923548638,
"learning_rate": 3.0029983615014234e-06,
"loss": 0.0683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03036249428987503,
"step": 5205,
"valid_targets_mean": 3087.4,
"valid_targets_min": 1048
},
{
"epoch": 5.895302773061687,
"grad_norm": 0.4229599842758237,
"learning_rate": 2.9733354273568514e-06,
"loss": 0.0739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032209280878305435,
"step": 5210,
"valid_targets_mean": 2753.6,
"valid_targets_min": 722
},
{
"epoch": 5.900962082625919,
"grad_norm": 0.6532864072235072,
"learning_rate": 2.9438079543162914e-06,
"loss": 0.0768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050366684794425964,
"step": 5215,
"valid_targets_mean": 1836.2,
"valid_targets_min": 865
},
{
"epoch": 5.906621392190153,
"grad_norm": 0.5332867595834957,
"learning_rate": 2.9144161772950564e-06,
"loss": 0.104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03690391033887863,
"step": 5220,
"valid_targets_mean": 2377.5,
"valid_targets_min": 675
},
{
"epoch": 5.912280701754386,
"grad_norm": 0.4605237897191458,
"learning_rate": 2.885160330128871e-06,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03459594398736954,
"step": 5225,
"valid_targets_mean": 3323.0,
"valid_targets_min": 782
},
{
"epoch": 5.917940011318619,
"grad_norm": 0.4701984376959242,
"learning_rate": 2.8560406455720333e-06,
"loss": 0.0698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03195595368742943,
"step": 5230,
"valid_targets_mean": 2581.8,
"valid_targets_min": 795
},
{
"epoch": 5.923599320882852,
"grad_norm": 0.4627978786039704,
"learning_rate": 2.8270573552955616e-06,
"loss": 0.072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03759005665779114,
"step": 5235,
"valid_targets_mean": 3264.6,
"valid_targets_min": 2017
},
{
"epoch": 5.929258630447086,
"grad_norm": 0.430552103519957,
"learning_rate": 2.798210689885337e-06,
"loss": 0.0684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029955577105283737,
"step": 5240,
"valid_targets_mean": 2319.6,
"valid_targets_min": 798
},
{
"epoch": 5.934917940011319,
"grad_norm": 0.40555015629365276,
"learning_rate": 2.7695008788402765e-06,
"loss": 0.0606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03208666294813156,
"step": 5245,
"valid_targets_mean": 3299.6,
"valid_targets_min": 860
},
{
"epoch": 5.9405772495755516,
"grad_norm": 0.45207921980647,
"learning_rate": 2.740928150570512e-06,
"loss": 0.0882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03434694558382034,
"step": 5250,
"valid_targets_mean": 3302.4,
"valid_targets_min": 878
},
{
"epoch": 5.946236559139785,
"grad_norm": 0.36093174555240776,
"learning_rate": 2.712492732395575e-06,
"loss": 0.062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026369066908955574,
"step": 5255,
"valid_targets_mean": 3832.2,
"valid_targets_min": 2602
},
{
"epoch": 5.951895868704018,
"grad_norm": 0.526083349405698,
"learning_rate": 2.6841948505425765e-06,
"loss": 0.0701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04250894486904144,
"step": 5260,
"valid_targets_mean": 2736.5,
"valid_targets_min": 945
},
{
"epoch": 5.957555178268251,
"grad_norm": 0.5557462391969753,
"learning_rate": 2.6560347301444035e-06,
"loss": 0.0692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04651749134063721,
"step": 5265,
"valid_targets_mean": 3831.1,
"valid_targets_min": 3128
},
{
"epoch": 5.963214487832484,
"grad_norm": 0.49222443878858035,
"learning_rate": 2.6280125952379567e-06,
"loss": 0.0727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038196124136447906,
"step": 5270,
"valid_targets_mean": 3966.2,
"valid_targets_min": 2529
},
{
"epoch": 5.968873797396718,
"grad_norm": 0.4384145557882011,
"learning_rate": 2.6001286687623382e-06,
"loss": 0.0623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042362622916698456,
"step": 5275,
"valid_targets_mean": 4704.8,
"valid_targets_min": 892
},
{
"epoch": 5.97453310696095,
"grad_norm": 0.33561436487922225,
"learning_rate": 2.5723831725570848e-06,
"loss": 0.068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024302612990140915,
"step": 5280,
"valid_targets_mean": 4471.1,
"valid_targets_min": 1657
},
{
"epoch": 5.980192416525184,
"grad_norm": 0.6312166327590963,
"learning_rate": 2.544776327360419e-06,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10875210165977478,
"step": 5285,
"valid_targets_mean": 1989.8,
"valid_targets_min": 709
},
{
"epoch": 5.985851726089417,
"grad_norm": 0.45996404344118175,
"learning_rate": 2.5173083528074683e-06,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024792591109871864,
"step": 5290,
"valid_targets_mean": 3226.5,
"valid_targets_min": 527
},
{
"epoch": 5.99151103565365,
"grad_norm": 0.4127218758642255,
"learning_rate": 2.489979467428532e-06,
"loss": 0.0742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03901390731334686,
"step": 5295,
"valid_targets_mean": 3531.0,
"valid_targets_min": 2318
},
{
"epoch": 5.997170345217883,
"grad_norm": 0.3788285488600974,
"learning_rate": 2.4627898886473522e-06,
"loss": 0.0656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03326011449098587,
"step": 5300,
"valid_targets_mean": 3520.9,
"valid_targets_min": 2883
},
{
"epoch": 6.002263723825693,
"grad_norm": 0.8276101671544355,
"learning_rate": 2.435739832779358e-06,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07999004423618317,
"step": 5305,
"valid_targets_mean": 5904.0,
"valid_targets_min": 4967
},
{
"epoch": 6.007923033389926,
"grad_norm": 0.7277283379257201,
"learning_rate": 2.408829515029969e-06,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09332052618265152,
"step": 5310,
"valid_targets_mean": 8641.4,
"valid_targets_min": 5164
},
{
"epoch": 6.01358234295416,
"grad_norm": 0.5823805300569702,
"learning_rate": 2.3820591494928635e-06,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07082702219486237,
"step": 5315,
"valid_targets_mean": 6838.2,
"valid_targets_min": 5200
},
{
"epoch": 6.019241652518393,
"grad_norm": 0.5016261384059876,
"learning_rate": 2.3554289491482996e-06,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060256391763687134,
"step": 5320,
"valid_targets_mean": 5411.6,
"valid_targets_min": 3853
},
{
"epoch": 6.024900962082626,
"grad_norm": 0.49029420602885754,
"learning_rate": 2.3289391258613938e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08309821784496307,
"step": 5325,
"valid_targets_mean": 5598.0,
"valid_targets_min": 4669
},
{
"epoch": 6.030560271646859,
"grad_norm": 0.4696599875799638,
"learning_rate": 2.3025898903804467e-06,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07830261439085007,
"step": 5330,
"valid_targets_mean": 5953.0,
"valid_targets_min": 4216
},
{
"epoch": 6.036219581211093,
"grad_norm": 0.4406152488917964,
"learning_rate": 2.276381452335281e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07636751979589462,
"step": 5335,
"valid_targets_mean": 5914.0,
"valid_targets_min": 4589
},
{
"epoch": 6.041878890775325,
"grad_norm": 0.43789300649461604,
"learning_rate": 2.2503140202355488e-06,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07406055927276611,
"step": 5340,
"valid_targets_mean": 6515.4,
"valid_targets_min": 4588
},
{
"epoch": 6.047538200339559,
"grad_norm": 0.39488092916617257,
"learning_rate": 2.2243878014690834e-06,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06888176500797272,
"step": 5345,
"valid_targets_mean": 7015.2,
"valid_targets_min": 4530
},
{
"epoch": 6.053197509903792,
"grad_norm": 0.4131437929720812,
"learning_rate": 2.1986030023002568e-06,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08051659166812897,
"step": 5350,
"valid_targets_mean": 6202.6,
"valid_targets_min": 4837
},
{
"epoch": 6.058856819468025,
"grad_norm": 0.5157470699606653,
"learning_rate": 2.1729598278683264e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04698694124817848,
"step": 5355,
"valid_targets_mean": 1720.9,
"valid_targets_min": 229
},
{
"epoch": 6.064516129032258,
"grad_norm": 0.41192059594925284,
"learning_rate": 2.147458482185807e-06,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07047378271818161,
"step": 5360,
"valid_targets_mean": 5963.8,
"valid_targets_min": 4216
},
{
"epoch": 6.0701754385964914,
"grad_norm": 0.4097676600547405,
"learning_rate": 2.122099168136862e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06870923936367035,
"step": 5365,
"valid_targets_mean": 5973.9,
"valid_targets_min": 4835
},
{
"epoch": 6.075834748160724,
"grad_norm": 0.4826017757756714,
"learning_rate": 2.0968820874756625e-06,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06461106240749359,
"step": 5370,
"valid_targets_mean": 6669.8,
"valid_targets_min": 4995
},
{
"epoch": 6.081494057724957,
"grad_norm": 0.4783505134049246,
"learning_rate": 2.0718074408247955e-06,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08431711792945862,
"step": 5375,
"valid_targets_mean": 5705.5,
"valid_targets_min": 4108
},
{
"epoch": 6.087153367289191,
"grad_norm": 0.4603266617125913,
"learning_rate": 2.0468754276736823e-06,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09027671068906784,
"step": 5380,
"valid_targets_mean": 6594.0,
"valid_targets_min": 4527
},
{
"epoch": 6.092812676853424,
"grad_norm": 0.4668190929700467,
"learning_rate": 2.0220862463769665e-06,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08130667358636856,
"step": 5385,
"valid_targets_mean": 3100.9,
"valid_targets_min": 2104
},
{
"epoch": 6.098471986417657,
"grad_norm": 0.4161670035323307,
"learning_rate": 1.9974400941529493e-06,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06128064543008804,
"step": 5390,
"valid_targets_mean": 5817.8,
"valid_targets_min": 4757
},
{
"epoch": 6.10413129598189,
"grad_norm": 0.49506290970705313,
"learning_rate": 1.972937167082014e-06,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08566483855247498,
"step": 5395,
"valid_targets_mean": 6333.0,
"valid_targets_min": 5056
},
{
"epoch": 6.109790605546124,
"grad_norm": 0.40345628118169874,
"learning_rate": 1.948577660105082e-06,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06584078073501587,
"step": 5400,
"valid_targets_mean": 5956.0,
"valid_targets_min": 2834
},
{
"epoch": 6.115449915110356,
"grad_norm": 0.42809149020646353,
"learning_rate": 1.924361767022038e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10012775659561157,
"step": 5405,
"valid_targets_mean": 6984.6,
"valid_targets_min": 5744
},
{
"epoch": 6.12110922467459,
"grad_norm": 0.3948106402931891,
"learning_rate": 1.9002896804902039e-06,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0651889443397522,
"step": 5410,
"valid_targets_mean": 7290.2,
"valid_targets_min": 5640
},
{
"epoch": 6.126768534238823,
"grad_norm": 0.423531309091551,
"learning_rate": 1.8763615920228084e-06,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0684753954410553,
"step": 5415,
"valid_targets_mean": 7036.0,
"valid_targets_min": 5210
},
{
"epoch": 6.132427843803056,
"grad_norm": 0.4567806851439878,
"learning_rate": 1.8525776919874472e-06,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09491011500358582,
"step": 5420,
"valid_targets_mean": 7138.5,
"valid_targets_min": 5292
},
{
"epoch": 6.138087153367289,
"grad_norm": 0.46052185078926156,
"learning_rate": 1.8289381696045817e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0801386907696724,
"step": 5425,
"valid_targets_mean": 6134.2,
"valid_targets_min": 3531
},
{
"epoch": 6.143746462931523,
"grad_norm": 0.4369176855135763,
"learning_rate": 1.8054432129460386e-06,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08043287694454193,
"step": 5430,
"valid_targets_mean": 5968.2,
"valid_targets_min": 4640
},
{
"epoch": 6.149405772495755,
"grad_norm": 0.41376792180743177,
"learning_rate": 1.7820930089334965e-06,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07278323173522949,
"step": 5435,
"valid_targets_mean": 6249.6,
"valid_targets_min": 4328
},
{
"epoch": 6.155065082059989,
"grad_norm": 0.45569587335080425,
"learning_rate": 1.7588877433370076e-06,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08063621819019318,
"step": 5440,
"valid_targets_mean": 6002.4,
"valid_targets_min": 3123
},
{
"epoch": 6.160724391624222,
"grad_norm": 0.4192478296963226,
"learning_rate": 1.7358276007735276e-06,
"loss": 0.146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07261161506175995,
"step": 5445,
"valid_targets_mean": 6372.2,
"valid_targets_min": 4256
},
{
"epoch": 6.166383701188455,
"grad_norm": 0.44113680036675645,
"learning_rate": 1.71291276470543e-06,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08018209040164948,
"step": 5450,
"valid_targets_mean": 5927.8,
"valid_targets_min": 4753
},
{
"epoch": 6.172043010752688,
"grad_norm": 0.42289106743705024,
"learning_rate": 1.6901434174390652e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07243598997592926,
"step": 5455,
"valid_targets_mean": 6106.1,
"valid_targets_min": 5370
},
{
"epoch": 6.1777023203169215,
"grad_norm": 0.46180892618572433,
"learning_rate": 1.6675197401232869e-06,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08281978964805603,
"step": 5460,
"valid_targets_mean": 6240.6,
"valid_targets_min": 4608
},
{
"epoch": 6.183361629881155,
"grad_norm": 0.44905545436226685,
"learning_rate": 1.6450419127480422e-06,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06940460205078125,
"step": 5465,
"valid_targets_mean": 5733.2,
"valid_targets_min": 3801
},
{
"epoch": 6.1890209394453874,
"grad_norm": 0.42405331723647666,
"learning_rate": 1.6227101141429114e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07862474769353867,
"step": 5470,
"valid_targets_mean": 6430.1,
"valid_targets_min": 4754
},
{
"epoch": 6.194680249009621,
"grad_norm": 0.3636777740153316,
"learning_rate": 1.6005245219756927e-06,
"loss": 0.1292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05749621242284775,
"step": 5475,
"valid_targets_mean": 7375.2,
"valid_targets_min": 6417
},
{
"epoch": 6.200339558573854,
"grad_norm": 0.5059615557907053,
"learning_rate": 1.5784853127510058e-06,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08089186251163483,
"step": 5480,
"valid_targets_mean": 6281.0,
"valid_targets_min": 3468
},
{
"epoch": 6.205998868138087,
"grad_norm": 0.41804768443087675,
"learning_rate": 1.5565926618088578e-06,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07407131791114807,
"step": 5485,
"valid_targets_mean": 6532.4,
"valid_targets_min": 5221
},
{
"epoch": 6.21165817770232,
"grad_norm": 0.4444679373526541,
"learning_rate": 1.5348467433232728e-06,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06167688965797424,
"step": 5490,
"valid_targets_mean": 5552.6,
"valid_targets_min": 4438
},
{
"epoch": 6.217317487266554,
"grad_norm": 0.4344700346800421,
"learning_rate": 1.5132477303009018e-06,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07731674611568451,
"step": 5495,
"valid_targets_mean": 5878.1,
"valid_targets_min": 3915
},
{
"epoch": 6.222976796830786,
"grad_norm": 0.37175162900794195,
"learning_rate": 1.4917957945796313e-06,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056854572147130966,
"step": 5500,
"valid_targets_mean": 7082.6,
"valid_targets_min": 4135
},
{
"epoch": 6.22863610639502,
"grad_norm": 0.4519834892138903,
"learning_rate": 1.4704911068272366e-06,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07420016825199127,
"step": 5505,
"valid_targets_mean": 5936.4,
"valid_targets_min": 3947
},
{
"epoch": 6.234295415959253,
"grad_norm": 0.42474375595243313,
"learning_rate": 1.4493338365400034e-06,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0952538400888443,
"step": 5510,
"valid_targets_mean": 6836.2,
"valid_targets_min": 4865
},
{
"epoch": 6.239954725523486,
"grad_norm": 0.4019485048337539,
"learning_rate": 1.428324152041407e-06,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07246479392051697,
"step": 5515,
"valid_targets_mean": 6539.4,
"valid_targets_min": 4643
},
{
"epoch": 6.245614035087719,
"grad_norm": 0.3932962802175302,
"learning_rate": 1.407462220480742e-06,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07242302596569061,
"step": 5520,
"valid_targets_mean": 6613.6,
"valid_targets_min": 4959
},
{
"epoch": 6.251273344651953,
"grad_norm": 0.6506279406434788,
"learning_rate": 1.3867482078318095e-06,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07954353094100952,
"step": 5525,
"valid_targets_mean": 6044.1,
"valid_targets_min": 4652
},
{
"epoch": 6.256932654216186,
"grad_norm": 0.40380824614409955,
"learning_rate": 1.3661822788916013e-06,
"loss": 0.1293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06269079446792603,
"step": 5530,
"valid_targets_mean": 5893.9,
"valid_targets_min": 4938
},
{
"epoch": 6.262591963780419,
"grad_norm": 0.39519519121780683,
"learning_rate": 1.3457645972789778e-06,
"loss": 0.1245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05853109061717987,
"step": 5535,
"valid_targets_mean": 5849.6,
"valid_targets_min": 4546
},
{
"epoch": 6.268251273344652,
"grad_norm": 0.39750633755202286,
"learning_rate": 1.3254953254333613e-06,
"loss": 0.1285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06598692387342453,
"step": 5540,
"valid_targets_mean": 5751.5,
"valid_targets_min": 3200
},
{
"epoch": 6.2739105829088855,
"grad_norm": 0.44355431281874347,
"learning_rate": 1.305374624613469e-06,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07301096618175507,
"step": 5545,
"valid_targets_mean": 6149.6,
"valid_targets_min": 5010
},
{
"epoch": 6.279569892473118,
"grad_norm": 0.44465882297781856,
"learning_rate": 1.285402654896004e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08430242538452148,
"step": 5550,
"valid_targets_mean": 6551.2,
"valid_targets_min": 4904
},
{
"epoch": 6.2852292020373515,
"grad_norm": 0.5270225139071596,
"learning_rate": 1.265579575174387e-06,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10046619921922684,
"step": 5555,
"valid_targets_mean": 5728.9,
"valid_targets_min": 4812
},
{
"epoch": 6.290888511601585,
"grad_norm": 0.4452621705044153,
"learning_rate": 1.245905543157504e-06,
"loss": 0.1495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059191398322582245,
"step": 5560,
"valid_targets_mean": 5047.9,
"valid_targets_min": 3629
},
{
"epoch": 6.2965478211658175,
"grad_norm": 0.429665256933034,
"learning_rate": 1.2263807153684448e-06,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07235387712717056,
"step": 5565,
"valid_targets_mean": 6260.0,
"valid_targets_min": 4324
},
{
"epoch": 6.302207130730051,
"grad_norm": 0.3831745381517681,
"learning_rate": 1.2070052471432535e-06,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0637582391500473,
"step": 5570,
"valid_targets_mean": 7853.1,
"valid_targets_min": 4920
},
{
"epoch": 6.307866440294284,
"grad_norm": 0.4395856940321014,
"learning_rate": 1.1877792926296893e-06,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07045142352581024,
"step": 5575,
"valid_targets_mean": 6231.0,
"valid_targets_min": 4882
},
{
"epoch": 6.313525749858517,
"grad_norm": 0.4357912902955703,
"learning_rate": 1.1687030047860248e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06981360912322998,
"step": 5580,
"valid_targets_mean": 7472.9,
"valid_targets_min": 3943
},
{
"epoch": 6.31918505942275,
"grad_norm": 0.447350489255607,
"learning_rate": 1.1497765353797963e-06,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07825092226266861,
"step": 5585,
"valid_targets_mean": 6840.2,
"valid_targets_min": 5034
},
{
"epoch": 6.324844368986984,
"grad_norm": 0.42778721008696324,
"learning_rate": 1.1310000349866136e-06,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07604715973138809,
"step": 5590,
"valid_targets_mean": 6458.5,
"valid_targets_min": 4461
},
{
"epoch": 6.330503678551217,
"grad_norm": 0.3928420540685352,
"learning_rate": 1.1123736529889674e-06,
"loss": 0.1388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06796157360076904,
"step": 5595,
"valid_targets_mean": 6645.4,
"valid_targets_min": 5188
},
{
"epoch": 6.33616298811545,
"grad_norm": 0.40726225641199704,
"learning_rate": 1.093897537575026e-06,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07839426398277283,
"step": 5600,
"valid_targets_mean": 6002.9,
"valid_targets_min": 5009
},
{
"epoch": 6.341822297679683,
"grad_norm": 0.5197824268371312,
"learning_rate": 1.075571835737459e-06,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08284924924373627,
"step": 5605,
"valid_targets_mean": 6025.9,
"valid_targets_min": 4551
},
{
"epoch": 6.347481607243917,
"grad_norm": 0.37406341479037775,
"learning_rate": 1.0573966932722902e-06,
"loss": 0.1357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07350446283817291,
"step": 5610,
"valid_targets_mean": 7210.0,
"valid_targets_min": 4492
},
{
"epoch": 6.353140916808149,
"grad_norm": 0.41816122930943833,
"learning_rate": 1.039372254777702e-06,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07028060406446457,
"step": 5615,
"valid_targets_mean": 7051.4,
"valid_targets_min": 4718
},
{
"epoch": 6.358800226372383,
"grad_norm": 0.4298009833839158,
"learning_rate": 1.0214986636529112e-06,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0760362297296524,
"step": 5620,
"valid_targets_mean": 6686.0,
"valid_targets_min": 4827
},
{
"epoch": 6.364459535936616,
"grad_norm": 0.406689242569645,
"learning_rate": 1.003776062097015e-06,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05693672597408295,
"step": 5625,
"valid_targets_mean": 5311.9,
"valid_targets_min": 3828
},
{
"epoch": 6.370118845500849,
"grad_norm": 0.38227984996431297,
"learning_rate": 9.862045911078733e-07,
"loss": 0.1262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061227746307849884,
"step": 5630,
"valid_targets_mean": 7078.9,
"valid_targets_min": 4594
},
{
"epoch": 6.375778155065082,
"grad_norm": 0.44431979959785317,
"learning_rate": 9.687843904809725e-07,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061648838222026825,
"step": 5635,
"valid_targets_mean": 6393.8,
"valid_targets_min": 4509
},
{
"epoch": 6.3814374646293155,
"grad_norm": 0.43153627059991495,
"learning_rate": 9.515155988083125e-07,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08048129826784134,
"step": 5640,
"valid_targets_mean": 7848.9,
"valid_targets_min": 5649
},
{
"epoch": 6.387096774193548,
"grad_norm": 0.4032728817369529,
"learning_rate": 9.343983534773238e-07,
"loss": 0.1326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061408888548612595,
"step": 5645,
"valid_targets_mean": 6623.4,
"valid_targets_min": 4343
},
{
"epoch": 6.3927560837577815,
"grad_norm": 0.42777057592335804,
"learning_rate": 9.174327906697522e-07,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06570357084274292,
"step": 5650,
"valid_targets_mean": 6255.9,
"valid_targets_min": 4660
},
{
"epoch": 6.398415393322015,
"grad_norm": 0.413587497444861,
"learning_rate": 9.006190453605867e-07,
"loss": 0.142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06969091296195984,
"step": 5655,
"valid_targets_mean": 8243.0,
"valid_targets_min": 6281
},
{
"epoch": 6.4040747028862475,
"grad_norm": 0.3967725258563214,
"learning_rate": 8.839572513169869e-07,
"loss": 0.1325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06824289262294769,
"step": 5660,
"valid_targets_mean": 7083.5,
"valid_targets_min": 4657
},
{
"epoch": 6.409734012450481,
"grad_norm": 0.45270305332037425,
"learning_rate": 8.674475410972083e-07,
"loss": 0.1436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08294831961393356,
"step": 5665,
"valid_targets_mean": 6399.8,
"valid_targets_min": 5098
},
{
"epoch": 6.415393322014714,
"grad_norm": 0.48113155918133693,
"learning_rate": 8.510900460495608e-07,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08184739202260971,
"step": 5670,
"valid_targets_mean": 5257.4,
"valid_targets_min": 1879
},
{
"epoch": 6.421052631578947,
"grad_norm": 0.462237732588396,
"learning_rate": 8.348848963113498e-07,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07992422580718994,
"step": 5675,
"valid_targets_mean": 5260.5,
"valid_targets_min": 3619
},
{
"epoch": 6.42671194114318,
"grad_norm": 0.4376210559352717,
"learning_rate": 8.188322208078614e-07,
"loss": 0.1087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049073681235313416,
"step": 5680,
"valid_targets_mean": 3976.1,
"valid_targets_min": 3545
},
{
"epoch": 6.432371250707414,
"grad_norm": 0.4443761443952523,
"learning_rate": 8.02932147251314e-07,
"loss": 0.0764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03434424102306366,
"step": 5685,
"valid_targets_mean": 3099.4,
"valid_targets_min": 1024
},
{
"epoch": 6.438030560271647,
"grad_norm": 0.3292086681702203,
"learning_rate": 7.87184802139851e-07,
"loss": 0.0687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021340861916542053,
"step": 5690,
"valid_targets_mean": 3441.1,
"valid_targets_min": 2927
},
{
"epoch": 6.44368986983588,
"grad_norm": 0.495630018274138,
"learning_rate": 7.715903107565426e-07,
"loss": 0.0866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05481220781803131,
"step": 5695,
"valid_targets_mean": 3442.0,
"valid_targets_min": 2213
},
{
"epoch": 6.449349179400113,
"grad_norm": 0.4498586504819099,
"learning_rate": 7.56148797168379e-07,
"loss": 0.0712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04381895810365677,
"step": 5700,
"valid_targets_mean": 2907.4,
"valid_targets_min": 1134
},
{
"epoch": 6.455008488964347,
"grad_norm": 0.47457148843186153,
"learning_rate": 7.408603842252837e-07,
"loss": 0.0749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045509450137615204,
"step": 5705,
"valid_targets_mean": 2523.4,
"valid_targets_min": 663
},
{
"epoch": 6.460667798528579,
"grad_norm": 0.6923423608886543,
"learning_rate": 7.257251935591436e-07,
"loss": 0.1219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055727388709783554,
"step": 5710,
"valid_targets_mean": 1893.8,
"valid_targets_min": 535
},
{
"epoch": 6.466327108092813,
"grad_norm": 0.4086302890491953,
"learning_rate": 7.107433455828317e-07,
"loss": 0.0738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030361641198396683,
"step": 5715,
"valid_targets_mean": 1971.8,
"valid_targets_min": 811
},
{
"epoch": 6.471986417657046,
"grad_norm": 0.490315949097002,
"learning_rate": 6.959149594892567e-07,
"loss": 0.0882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0521058514714241,
"step": 5720,
"valid_targets_mean": 2785.5,
"valid_targets_min": 2392
},
{
"epoch": 6.477645727221279,
"grad_norm": 0.28307075878357413,
"learning_rate": 6.812401532504109e-07,
"loss": 0.0933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022131290286779404,
"step": 5725,
"valid_targets_mean": 4540.6,
"valid_targets_min": 3285
},
{
"epoch": 6.483305036785512,
"grad_norm": 0.36605418977499043,
"learning_rate": 6.667190436164351e-07,
"loss": 0.0688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03333090618252754,
"step": 5730,
"valid_targets_mean": 2926.8,
"valid_targets_min": 764
},
{
"epoch": 6.4889643463497455,
"grad_norm": 0.3792739889735828,
"learning_rate": 6.523517461146856e-07,
"loss": 0.072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03842036426067352,
"step": 5735,
"valid_targets_mean": 3378.6,
"valid_targets_min": 1290
},
{
"epoch": 6.494623655913978,
"grad_norm": 0.5005953776912583,
"learning_rate": 6.381383750488113e-07,
"loss": 0.0693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03875945508480072,
"step": 5740,
"valid_targets_mean": 2432.4,
"valid_targets_min": 720
},
{
"epoch": 6.5002829654782115,
"grad_norm": 0.3298347107591839,
"learning_rate": 6.240790434978628e-07,
"loss": 0.1099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031254325062036514,
"step": 5745,
"valid_targets_mean": 3896.0,
"valid_targets_min": 2336
},
{
"epoch": 6.505942275042445,
"grad_norm": 0.363089484382129,
"learning_rate": 6.101738633153686e-07,
"loss": 0.0653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03155246376991272,
"step": 5750,
"valid_targets_mean": 2912.5,
"valid_targets_min": 1049
},
{
"epoch": 6.511601584606678,
"grad_norm": 0.3590771499282617,
"learning_rate": 5.964229451284586e-07,
"loss": 0.073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02306312322616577,
"step": 5755,
"valid_targets_mean": 3087.8,
"valid_targets_min": 1086
},
{
"epoch": 6.517260894170911,
"grad_norm": 0.3892052060779421,
"learning_rate": 5.828263983369864e-07,
"loss": 0.0605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03467557579278946,
"step": 5760,
"valid_targets_mean": 3296.5,
"valid_targets_min": 732
},
{
"epoch": 6.522920203735144,
"grad_norm": 0.6316138887211705,
"learning_rate": 5.693843311126523e-07,
"loss": 0.0811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04579807072877884,
"step": 5765,
"valid_targets_mean": 1688.5,
"valid_targets_min": 770
},
{
"epoch": 6.528579513299378,
"grad_norm": 0.42657241895095116,
"learning_rate": 5.560968503981378e-07,
"loss": 0.0757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03341136872768402,
"step": 5770,
"valid_targets_mean": 2574.8,
"valid_targets_min": 592
},
{
"epoch": 6.53423882286361,
"grad_norm": 0.46142186165107835,
"learning_rate": 5.429640619062726e-07,
"loss": 0.0851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04054953530430794,
"step": 5775,
"valid_targets_mean": 3089.1,
"valid_targets_min": 2224
},
{
"epoch": 6.539898132427844,
"grad_norm": 0.4493689812933997,
"learning_rate": 5.299860701191772e-07,
"loss": 0.0827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029141142964363098,
"step": 5780,
"valid_targets_mean": 2364.5,
"valid_targets_min": 511
},
{
"epoch": 6.545557441992077,
"grad_norm": 0.43790299984161335,
"learning_rate": 5.171629782874354e-07,
"loss": 0.1145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04518071562051773,
"step": 5785,
"valid_targets_mean": 3775.5,
"valid_targets_min": 2328
},
{
"epoch": 6.55121675155631,
"grad_norm": 0.42124865037915415,
"learning_rate": 5.044948884292766e-07,
"loss": 0.0643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02882300317287445,
"step": 5790,
"valid_targets_mean": 2867.1,
"valid_targets_min": 669
},
{
"epoch": 6.556876061120543,
"grad_norm": 0.6751482529617706,
"learning_rate": 4.919819013297677e-07,
"loss": 0.0882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0536501370370388,
"step": 5795,
"valid_targets_mean": 1722.5,
"valid_targets_min": 802
},
{
"epoch": 6.562535370684777,
"grad_norm": 0.6476380988588636,
"learning_rate": 4.796241165399939e-07,
"loss": 0.0904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051889095455408096,
"step": 5800,
"valid_targets_mean": 1527.9,
"valid_targets_min": 357
},
{
"epoch": 6.568194680249009,
"grad_norm": 0.442176682737924,
"learning_rate": 4.674216323762881e-07,
"loss": 0.0801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035727713257074356,
"step": 5805,
"valid_targets_mean": 3831.6,
"valid_targets_min": 2808
},
{
"epoch": 6.573853989813243,
"grad_norm": 0.5479385584946559,
"learning_rate": 4.5537454591943584e-07,
"loss": 0.1402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11486173421144485,
"step": 5810,
"valid_targets_mean": 2953.2,
"valid_targets_min": 652
},
{
"epoch": 6.579513299377476,
"grad_norm": 0.41350133265317146,
"learning_rate": 4.434829530139095e-07,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04003699868917465,
"step": 5815,
"valid_targets_mean": 3963.6,
"valid_targets_min": 3573
},
{
"epoch": 6.5851726089417095,
"grad_norm": 0.5482015029259201,
"learning_rate": 4.3174694826709107e-07,
"loss": 0.0839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045565806329250336,
"step": 5820,
"valid_targets_mean": 2137.1,
"valid_targets_min": 822
},
{
"epoch": 6.590831918505942,
"grad_norm": 0.6080484811075969,
"learning_rate": 4.201666250485503e-07,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14063608646392822,
"step": 5825,
"valid_targets_mean": 2582.1,
"valid_targets_min": 965
},
{
"epoch": 6.5964912280701755,
"grad_norm": 0.4073205411029621,
"learning_rate": 4.087420754892635e-07,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03254256024956703,
"step": 5830,
"valid_targets_mean": 4182.0,
"valid_targets_min": 636
},
{
"epoch": 6.602150537634409,
"grad_norm": 0.4394219118655527,
"learning_rate": 3.9747339048091136e-07,
"loss": 0.0726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05536698177456856,
"step": 5835,
"valid_targets_mean": 4735.0,
"valid_targets_min": 2733
},
{
"epoch": 6.6078098471986415,
"grad_norm": 0.43545501648190743,
"learning_rate": 3.863606596751379e-07,
"loss": 0.0746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046722978353500366,
"step": 5840,
"valid_targets_mean": 4307.1,
"valid_targets_min": 2571
},
{
"epoch": 6.613469156762875,
"grad_norm": 0.32601803243775,
"learning_rate": 3.7540397148284837e-07,
"loss": 0.0732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025708980858325958,
"step": 5845,
"valid_targets_mean": 3207.2,
"valid_targets_min": 970
},
{
"epoch": 6.619128466327108,
"grad_norm": 0.3599900965727607,
"learning_rate": 3.6460341307349653e-07,
"loss": 0.0688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027514172717928886,
"step": 5850,
"valid_targets_mean": 2923.8,
"valid_targets_min": 748
},
{
"epoch": 6.624787775891341,
"grad_norm": 0.44324928927827856,
"learning_rate": 3.539590703743967e-07,
"loss": 0.0679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041861265897750854,
"step": 5855,
"valid_targets_mean": 3834.1,
"valid_targets_min": 3568
},
{
"epoch": 6.630447085455574,
"grad_norm": 0.5158990365964071,
"learning_rate": 3.434710280700415e-07,
"loss": 0.0713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039465367794036865,
"step": 5860,
"valid_targets_mean": 2406.8,
"valid_targets_min": 1820
},
{
"epoch": 6.636106395019808,
"grad_norm": 0.4050936034477056,
"learning_rate": 3.331393696014207e-07,
"loss": 0.0597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03890451416373253,
"step": 5865,
"valid_targets_mean": 2587.6,
"valid_targets_min": 772
},
{
"epoch": 6.64176570458404,
"grad_norm": 0.5110258826615129,
"learning_rate": 3.22964177165368e-07,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05033072829246521,
"step": 5870,
"valid_targets_mean": 3260.0,
"valid_targets_min": 1289
},
{
"epoch": 6.647425014148274,
"grad_norm": 0.40885125808704265,
"learning_rate": 3.129455317138952e-07,
"loss": 0.0538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02987043187022209,
"step": 5875,
"valid_targets_mean": 3723.0,
"valid_targets_min": 3122
},
{
"epoch": 6.653084323712507,
"grad_norm": 0.38109335536839384,
"learning_rate": 3.030835129535592e-07,
"loss": 0.0619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03285347670316696,
"step": 5880,
"valid_targets_mean": 3712.5,
"valid_targets_min": 1451
},
{
"epoch": 6.658743633276741,
"grad_norm": 0.420283639227681,
"learning_rate": 2.9337819934481814e-07,
"loss": 0.0609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03552892059087753,
"step": 5885,
"valid_targets_mean": 3632.8,
"valid_targets_min": 792
},
{
"epoch": 6.664402942840973,
"grad_norm": 0.5249883860736148,
"learning_rate": 2.838296681014185e-07,
"loss": 0.077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03367924317717552,
"step": 5890,
"valid_targets_mean": 1992.4,
"valid_targets_min": 795
},
{
"epoch": 6.670062252405207,
"grad_norm": 0.39437654832589936,
"learning_rate": 2.744379951897691e-07,
"loss": 0.0921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034002915024757385,
"step": 5895,
"valid_targets_mean": 3431.4,
"valid_targets_min": 1196
},
{
"epoch": 6.67572156196944,
"grad_norm": 0.5991953850107175,
"learning_rate": 2.65203255328339e-07,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03567385673522949,
"step": 5900,
"valid_targets_mean": 1836.1,
"valid_targets_min": 575
},
{
"epoch": 6.681380871533673,
"grad_norm": 0.7020941398300836,
"learning_rate": 2.561255219870762e-07,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05443864315748215,
"step": 5905,
"valid_targets_mean": 1908.8,
"valid_targets_min": 609
},
{
"epoch": 6.687040181097906,
"grad_norm": 0.5464404537690308,
"learning_rate": 2.472048673868033e-07,
"loss": 0.0861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02943640947341919,
"step": 5910,
"valid_targets_mean": 1497.2,
"valid_targets_min": 542
},
{
"epoch": 6.6926994906621395,
"grad_norm": 0.3661819024596803,
"learning_rate": 2.3844136249865367e-07,
"loss": 0.1018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03263043984770775,
"step": 5915,
"valid_targets_mean": 3701.8,
"valid_targets_min": 2440
},
{
"epoch": 6.698358800226372,
"grad_norm": 0.4550654896101805,
"learning_rate": 2.2983507704351426e-07,
"loss": 0.0753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02765018306672573,
"step": 5920,
"valid_targets_mean": 1648.2,
"valid_targets_min": 629
},
{
"epoch": 6.7040181097906055,
"grad_norm": 0.4137364782748426,
"learning_rate": 2.213860794914524e-07,
"loss": 0.093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038274720311164856,
"step": 5925,
"valid_targets_mean": 3953.0,
"valid_targets_min": 3701
},
{
"epoch": 6.709677419354839,
"grad_norm": 0.5146684136695984,
"learning_rate": 2.1309443706118538e-07,
"loss": 0.0749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03469971567392349,
"step": 5930,
"valid_targets_mean": 1700.9,
"valid_targets_min": 485
},
{
"epoch": 6.7153367289190715,
"grad_norm": 0.49679016274514903,
"learning_rate": 2.049602157195363e-07,
"loss": 0.0752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0654388889670372,
"step": 5935,
"valid_targets_mean": 2381.9,
"valid_targets_min": 605
},
{
"epoch": 6.720996038483305,
"grad_norm": 0.351424709328263,
"learning_rate": 1.9698348018092338e-07,
"loss": 0.0648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025245461612939835,
"step": 5940,
"valid_targets_mean": 2713.5,
"valid_targets_min": 848
},
{
"epoch": 6.726655348047538,
"grad_norm": 0.35432740168743526,
"learning_rate": 1.8916429390682944e-07,
"loss": 0.0647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031980741769075394,
"step": 5945,
"valid_targets_mean": 5106.4,
"valid_targets_min": 4456
},
{
"epoch": 6.732314657611772,
"grad_norm": 0.40381665509366593,
"learning_rate": 1.8150271910530204e-07,
"loss": 0.068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040590934455394745,
"step": 5950,
"valid_targets_mean": 3905.5,
"valid_targets_min": 1864
},
{
"epoch": 6.737973967176004,
"grad_norm": 0.5014073985393658,
"learning_rate": 1.7399881673046736e-07,
"loss": 0.0797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03374318778514862,
"step": 5955,
"valid_targets_mean": 3313.8,
"valid_targets_min": 1361
},
{
"epoch": 6.743633276740238,
"grad_norm": 0.4408577069276251,
"learning_rate": 1.666526464820284e-07,
"loss": 0.0781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040150947868824005,
"step": 5960,
"valid_targets_mean": 3500.1,
"valid_targets_min": 1814
},
{
"epoch": 6.74929258630447,
"grad_norm": 0.5379572135308958,
"learning_rate": 1.594642668048052e-07,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03901442512869835,
"step": 5965,
"valid_targets_mean": 1559.0,
"valid_targets_min": 759
},
{
"epoch": 6.754951895868704,
"grad_norm": 0.3506083866275488,
"learning_rate": 1.5243373488826653e-07,
"loss": 0.0593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029368489980697632,
"step": 5970,
"valid_targets_mean": 3942.6,
"valid_targets_min": 2719
},
{
"epoch": 6.760611205432937,
"grad_norm": 0.5454659716357816,
"learning_rate": 1.4556110666606783e-07,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028036806732416153,
"step": 5975,
"valid_targets_mean": 1133.4,
"valid_targets_min": 664
},
{
"epoch": 6.766270514997171,
"grad_norm": 0.3915993911091825,
"learning_rate": 1.388464368156095e-07,
"loss": 0.0725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023933472111821175,
"step": 5980,
"valid_targets_mean": 2489.8,
"valid_targets_min": 1584
},
{
"epoch": 6.771929824561403,
"grad_norm": 0.38581046462288265,
"learning_rate": 1.322897787576105e-07,
"loss": 0.0589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028114689514040947,
"step": 5985,
"valid_targets_mean": 2685.4,
"valid_targets_min": 1003
},
{
"epoch": 6.777589134125637,
"grad_norm": 0.38659993644399676,
"learning_rate": 1.2589118465566875e-07,
"loss": 0.0734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029353385791182518,
"step": 5990,
"valid_targets_mean": 3180.8,
"valid_targets_min": 560
},
{
"epoch": 6.78324844368987,
"grad_norm": 0.39635633472198784,
"learning_rate": 1.1965070541585912e-07,
"loss": 0.0728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0360221303999424,
"step": 5995,
"valid_targets_mean": 3285.9,
"valid_targets_min": 1049
},
{
"epoch": 6.788907753254103,
"grad_norm": 0.4768199556298617,
"learning_rate": 1.1356839068632053e-07,
"loss": 0.0845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041404206305742264,
"step": 6000,
"valid_targets_mean": 2464.9,
"valid_targets_min": 771
},
{
"epoch": 6.794567062818336,
"grad_norm": 0.4759804528663009,
"learning_rate": 1.0764428885686073e-07,
"loss": 0.0719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03653126209974289,
"step": 6005,
"valid_targets_mean": 2959.5,
"valid_targets_min": 825
},
{
"epoch": 6.8002263723825696,
"grad_norm": 0.5508016189657499,
"learning_rate": 1.0187844705857875e-07,
"loss": 0.0796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04060523957014084,
"step": 6010,
"valid_targets_mean": 2602.1,
"valid_targets_min": 829
},
{
"epoch": 6.805885681946802,
"grad_norm": 0.47780734613760967,
"learning_rate": 9.627091116348076e-08,
"loss": 0.0777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04422842338681221,
"step": 6015,
"valid_targets_mean": 2106.1,
"valid_targets_min": 650
},
{
"epoch": 6.8115449915110355,
"grad_norm": 0.47337810865412044,
"learning_rate": 9.082172578412263e-08,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04251515865325928,
"step": 6020,
"valid_targets_mean": 2946.0,
"valid_targets_min": 729
},
{
"epoch": 6.817204301075269,
"grad_norm": 0.31759103202396305,
"learning_rate": 8.553093427325243e-08,
"loss": 0.0665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023808494210243225,
"step": 6025,
"valid_targets_mean": 3853.5,
"valid_targets_min": 3152
},
{
"epoch": 6.8228636106395015,
"grad_norm": 0.3290538179958601,
"learning_rate": 8.039857872345736e-08,
"loss": 0.066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0240267775952816,
"step": 6030,
"valid_targets_mean": 3448.2,
"valid_targets_min": 2543
},
{
"epoch": 6.828522920203735,
"grad_norm": 0.48063721542746124,
"learning_rate": 7.542469996684843e-08,
"loss": 0.0915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03989311307668686,
"step": 6035,
"valid_targets_mean": 2674.9,
"valid_targets_min": 446
},
{
"epoch": 6.834182229767968,
"grad_norm": 0.4058482123607516,
"learning_rate": 7.06093375747141e-08,
"loss": 0.0608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02851252630352974,
"step": 6040,
"valid_targets_mean": 2807.6,
"valid_targets_min": 681
},
{
"epoch": 6.839841539332202,
"grad_norm": 0.5135647892958799,
"learning_rate": 6.595252985721834e-08,
"loss": 0.0706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049752771854400635,
"step": 6045,
"valid_targets_mean": 5567.5,
"valid_targets_min": 3772
},
{
"epoch": 6.845500848896434,
"grad_norm": 0.36184997124585655,
"learning_rate": 6.145431386309186e-08,
"loss": 0.0685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032238394021987915,
"step": 6050,
"valid_targets_mean": 3662.4,
"valid_targets_min": 484
},
{
"epoch": 6.851160158460668,
"grad_norm": 0.32341004212385127,
"learning_rate": 5.711472537933693e-08,
"loss": 0.0574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02496453747153282,
"step": 6055,
"valid_targets_mean": 3900.0,
"valid_targets_min": 861
},
{
"epoch": 6.856819468024901,
"grad_norm": 0.523808243909321,
"learning_rate": 5.293379893094752e-08,
"loss": 0.0704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05595286563038826,
"step": 6060,
"valid_targets_mean": 4100.8,
"valid_targets_min": 3268
},
{
"epoch": 6.862478777589134,
"grad_norm": 0.42563665626143066,
"learning_rate": 4.891156778062734e-08,
"loss": 0.071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033235713839530945,
"step": 6065,
"valid_targets_mean": 3277.8,
"valid_targets_min": 559
},
{
"epoch": 6.868138087153367,
"grad_norm": 0.4513013591790561,
"learning_rate": 4.5048063928527785e-08,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030779201537370682,
"step": 6070,
"valid_targets_mean": 2986.2,
"valid_targets_min": 689
},
{
"epoch": 6.873797396717601,
"grad_norm": 0.5888522930807201,
"learning_rate": 4.134331811199932e-08,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05735611915588379,
"step": 6075,
"valid_targets_mean": 1831.6,
"valid_targets_min": 616
},
{
"epoch": 6.879456706281833,
"grad_norm": 0.5316339779537674,
"learning_rate": 3.7797359805333836e-08,
"loss": 0.0535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03486653417348862,
"step": 6080,
"valid_targets_mean": 2087.0,
"valid_targets_min": 602
},
{
"epoch": 6.885116015846067,
"grad_norm": 0.39760459368891415,
"learning_rate": 3.441021721954485e-08,
"loss": 0.0871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03535497188568115,
"step": 6085,
"valid_targets_mean": 3992.1,
"valid_targets_min": 3551
},
{
"epoch": 6.8907753254103,
"grad_norm": 0.43388913745160906,
"learning_rate": 3.11819173021366e-08,
"loss": 0.0674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02623586170375347,
"step": 6090,
"valid_targets_mean": 2115.1,
"valid_targets_min": 596
},
{
"epoch": 6.896434634974533,
"grad_norm": 0.38243226683777753,
"learning_rate": 2.8112485736881967e-08,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027614392340183258,
"step": 6095,
"valid_targets_mean": 3488.0,
"valid_targets_min": 799
},
{
"epoch": 6.902093944538766,
"grad_norm": 0.4848799581538806,
"learning_rate": 2.520194694363376e-08,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05016375333070755,
"step": 6100,
"valid_targets_mean": 3078.9,
"valid_targets_min": 706
},
{
"epoch": 6.907753254103,
"grad_norm": 0.5335054810278811,
"learning_rate": 2.2450324078120423e-08,
"loss": 0.1072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03868968039751053,
"step": 6105,
"valid_targets_mean": 1957.6,
"valid_targets_min": 710
},
{
"epoch": 6.913412563667233,
"grad_norm": 0.42779014879456234,
"learning_rate": 1.9857639031759522e-08,
"loss": 0.0786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030187007039785385,
"step": 6110,
"valid_targets_mean": 3112.4,
"valid_targets_min": 647
},
{
"epoch": 6.9190718732314656,
"grad_norm": 0.5708406365969891,
"learning_rate": 1.7423912431489e-08,
"loss": 0.0716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03383772075176239,
"step": 6115,
"valid_targets_mean": 1494.9,
"valid_targets_min": 716
},
{
"epoch": 6.924731182795699,
"grad_norm": 0.4164948214390167,
"learning_rate": 1.51491636396095e-08,
"loss": 0.0675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038247913122177124,
"step": 6120,
"valid_targets_mean": 3669.5,
"valid_targets_min": 3122
},
{
"epoch": 6.930390492359932,
"grad_norm": 0.4980278280391314,
"learning_rate": 1.3033410753608977e-08,
"loss": 0.0678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03384961932897568,
"step": 6125,
"valid_targets_mean": 2399.1,
"valid_targets_min": 832
},
{
"epoch": 6.936049801924165,
"grad_norm": 0.5624363897364986,
"learning_rate": 1.1076670606045004e-08,
"loss": 0.0582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0311758890748024,
"step": 6130,
"valid_targets_mean": 1216.9,
"valid_targets_min": 635
},
{
"epoch": 6.941709111488398,
"grad_norm": 0.40337485535884043,
"learning_rate": 9.278958764391554e-09,
"loss": 0.0824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03224567323923111,
"step": 6135,
"valid_targets_mean": 3078.1,
"valid_targets_min": 756
},
{
"epoch": 6.947368421052632,
"grad_norm": 0.6199863900014508,
"learning_rate": 7.64028953092133e-09,
"loss": 0.0622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03886682540178299,
"step": 6140,
"valid_targets_mean": 2387.1,
"valid_targets_min": 744
},
{
"epoch": 6.953027730616864,
"grad_norm": 0.36540416345205473,
"learning_rate": 6.16067594259695e-09,
"loss": 0.0647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023269277065992355,
"step": 6145,
"valid_targets_mean": 2088.4,
"valid_targets_min": 529
},
{
"epoch": 6.958687040181098,
"grad_norm": 0.5059157441516826,
"learning_rate": 4.840129770957713e-09,
"loss": 0.0742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04765991121530533,
"step": 6150,
"valid_targets_mean": 3932.1,
"valid_targets_min": 2017
},
{
"epoch": 6.964346349745331,
"grad_norm": 0.32224893355652934,
"learning_rate": 3.6786615220352208e-09,
"loss": 0.0639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02520209550857544,
"step": 6155,
"valid_targets_mean": 4790.0,
"valid_targets_min": 516
},
{
"epoch": 6.970005659309564,
"grad_norm": 0.4023448099684757,
"learning_rate": 2.6762804362623353e-09,
"loss": 0.0625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02867652103304863,
"step": 6160,
"valid_targets_mean": 2245.1,
"valid_targets_min": 772
},
{
"epoch": 6.975664968873797,
"grad_norm": 0.470060085059617,
"learning_rate": 1.8329944884021288e-09,
"loss": 0.0663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03312272951006889,
"step": 6165,
"valid_targets_mean": 3851.0,
"valid_targets_min": 2196
},
{
"epoch": 6.981324278438031,
"grad_norm": 0.5501571965826606,
"learning_rate": 1.1488103874923717e-09,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11629301309585571,
"step": 6170,
"valid_targets_mean": 3094.1,
"valid_targets_min": 2759
},
{
"epoch": 6.986983588002264,
"grad_norm": 0.3747210819200156,
"learning_rate": 6.237335767744767e-10,
"loss": 0.0781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026630330830812454,
"step": 6175,
"valid_targets_mean": 3760.2,
"valid_targets_min": 3175
},
{
"epoch": 6.992642897566497,
"grad_norm": 0.4336427114618938,
"learning_rate": 2.577682336690757e-10,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025160185992717743,
"step": 6180,
"valid_targets_mean": 2446.5,
"valid_targets_min": 759
},
{
"epoch": 6.99830220713073,
"grad_norm": 0.5105245398393162,
"learning_rate": 5.091726972938915e-11,
"loss": 0.0728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08412353694438934,
"step": 6185,
"valid_targets_mean": 2332.5,
"valid_targets_min": 927
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03830413520336151,
"step": 6187,
"total_flos": 3.038645528557519e+18,
"train_loss": 0.05716925004446894,
"train_runtime": 84196.6554,
"train_samples_per_second": 1.175,
"train_steps_per_second": 0.073,
"valid_targets_mean": 3729.2,
"valid_targets_min": 1273
}
],
"logging_steps": 5,
"max_steps": 6188,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 3.038645528557519e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}