swesmith-stack-reason / trainer_state.json
penfever's picture
End of training
30d98b5 verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 6712,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.005216484089723527,
"grad_norm": 11.24254837639787,
"learning_rate": 2.3809523809523811e-07,
"loss": 0.6831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.352985143661499,
"step": 5,
"valid_targets_mean": 5016.1,
"valid_targets_min": 3449
},
{
"epoch": 0.010432968179447054,
"grad_norm": 11.232055207273655,
"learning_rate": 5.357142857142857e-07,
"loss": 0.7003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3600406050682068,
"step": 10,
"valid_targets_mean": 4135.8,
"valid_targets_min": 2157
},
{
"epoch": 0.01564945226917058,
"grad_norm": 11.366410871408558,
"learning_rate": 8.333333333333333e-07,
"loss": 0.6785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33216580748558044,
"step": 15,
"valid_targets_mean": 4791.5,
"valid_targets_min": 1156
},
{
"epoch": 0.020865936358894107,
"grad_norm": 10.34808092771311,
"learning_rate": 1.130952380952381e-06,
"loss": 0.6848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3293125033378601,
"step": 20,
"valid_targets_mean": 5037.9,
"valid_targets_min": 2294
},
{
"epoch": 0.02608242044861763,
"grad_norm": 7.6077329183534355,
"learning_rate": 1.4285714285714286e-06,
"loss": 0.6608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3203168511390686,
"step": 25,
"valid_targets_mean": 4165.8,
"valid_targets_min": 1328
},
{
"epoch": 0.03129890453834116,
"grad_norm": 5.405083399889847,
"learning_rate": 1.7261904761904764e-06,
"loss": 0.6115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2907986044883728,
"step": 30,
"valid_targets_mean": 5063.2,
"valid_targets_min": 2066
},
{
"epoch": 0.036515388628064686,
"grad_norm": 3.9727593664560845,
"learning_rate": 2.023809523809524e-06,
"loss": 0.5967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2616725265979767,
"step": 35,
"valid_targets_mean": 5020.9,
"valid_targets_min": 1501
},
{
"epoch": 0.041731872717788214,
"grad_norm": 4.2532153338984795,
"learning_rate": 2.321428571428572e-06,
"loss": 0.5382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24420849978923798,
"step": 40,
"valid_targets_mean": 3708.5,
"valid_targets_min": 1205
},
{
"epoch": 0.046948356807511735,
"grad_norm": 2.934457351095903,
"learning_rate": 2.6190476190476192e-06,
"loss": 0.5187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24222546815872192,
"step": 45,
"valid_targets_mean": 5127.6,
"valid_targets_min": 2067
},
{
"epoch": 0.05216484089723526,
"grad_norm": 1.8853061847111383,
"learning_rate": 2.916666666666667e-06,
"loss": 0.5205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252302885055542,
"step": 50,
"valid_targets_mean": 4483.6,
"valid_targets_min": 2124
},
{
"epoch": 0.05738132498695879,
"grad_norm": 1.4677384311186294,
"learning_rate": 3.2142857142857147e-06,
"loss": 0.4809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18407613039016724,
"step": 55,
"valid_targets_mean": 3567.4,
"valid_targets_min": 1209
},
{
"epoch": 0.06259780907668232,
"grad_norm": 1.120364963485017,
"learning_rate": 3.511904761904762e-06,
"loss": 0.4447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22264821827411652,
"step": 60,
"valid_targets_mean": 3878.1,
"valid_targets_min": 1741
},
{
"epoch": 0.06781429316640585,
"grad_norm": 0.840971856813474,
"learning_rate": 3.80952380952381e-06,
"loss": 0.4575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23368576169013977,
"step": 65,
"valid_targets_mean": 5164.6,
"valid_targets_min": 2130
},
{
"epoch": 0.07303077725612937,
"grad_norm": 0.8384789308765538,
"learning_rate": 4.107142857142857e-06,
"loss": 0.4306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20054024457931519,
"step": 70,
"valid_targets_mean": 5614.9,
"valid_targets_min": 2491
},
{
"epoch": 0.0782472613458529,
"grad_norm": 0.6385587472558049,
"learning_rate": 4.404761904761905e-06,
"loss": 0.4176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22027632594108582,
"step": 75,
"valid_targets_mean": 6077.4,
"valid_targets_min": 2913
},
{
"epoch": 0.08346374543557643,
"grad_norm": 0.6630664582444133,
"learning_rate": 4.702380952380953e-06,
"loss": 0.4129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19254867732524872,
"step": 80,
"valid_targets_mean": 3906.9,
"valid_targets_min": 2090
},
{
"epoch": 0.08868022952529994,
"grad_norm": 0.6786403833983912,
"learning_rate": 5e-06,
"loss": 0.4207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23695020377635956,
"step": 85,
"valid_targets_mean": 5569.6,
"valid_targets_min": 3740
},
{
"epoch": 0.09389671361502347,
"grad_norm": 0.6184877623015653,
"learning_rate": 5.297619047619048e-06,
"loss": 0.4219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19551850855350494,
"step": 90,
"valid_targets_mean": 4397.8,
"valid_targets_min": 2423
},
{
"epoch": 0.099113197704747,
"grad_norm": 0.7103317313757143,
"learning_rate": 5.595238095238096e-06,
"loss": 0.4175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23150977492332458,
"step": 95,
"valid_targets_mean": 4499.1,
"valid_targets_min": 2100
},
{
"epoch": 0.10432968179447052,
"grad_norm": 0.6478165702052965,
"learning_rate": 5.892857142857144e-06,
"loss": 0.3957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18475624918937683,
"step": 100,
"valid_targets_mean": 3931.0,
"valid_targets_min": 1857
},
{
"epoch": 0.10954616588419405,
"grad_norm": 1.592022317536399,
"learning_rate": 6.1904761904761914e-06,
"loss": 0.3929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21138747036457062,
"step": 105,
"valid_targets_mean": 4803.2,
"valid_targets_min": 3210
},
{
"epoch": 0.11476264997391758,
"grad_norm": 0.5508085022135111,
"learning_rate": 6.488095238095239e-06,
"loss": 0.3684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21324364840984344,
"step": 110,
"valid_targets_mean": 5535.6,
"valid_targets_min": 2106
},
{
"epoch": 0.11997913406364111,
"grad_norm": 0.6710255867894759,
"learning_rate": 6.785714285714287e-06,
"loss": 0.3882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21487626433372498,
"step": 115,
"valid_targets_mean": 5593.4,
"valid_targets_min": 3020
},
{
"epoch": 0.12519561815336464,
"grad_norm": 0.6555896961622583,
"learning_rate": 7.083333333333335e-06,
"loss": 0.3719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.200883150100708,
"step": 120,
"valid_targets_mean": 4099.2,
"valid_targets_min": 1168
},
{
"epoch": 0.13041210224308816,
"grad_norm": 0.6368436071225058,
"learning_rate": 7.380952380952382e-06,
"loss": 0.3772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2024303674697876,
"step": 125,
"valid_targets_mean": 4552.5,
"valid_targets_min": 2219
},
{
"epoch": 0.1356285863328117,
"grad_norm": 0.6426147411338267,
"learning_rate": 7.67857142857143e-06,
"loss": 0.3617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19902446866035461,
"step": 130,
"valid_targets_mean": 4261.1,
"valid_targets_min": 1714
},
{
"epoch": 0.14084507042253522,
"grad_norm": 0.5425425596699449,
"learning_rate": 7.976190476190477e-06,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1794453263282776,
"step": 135,
"valid_targets_mean": 4941.1,
"valid_targets_min": 2717
},
{
"epoch": 0.14606155451225875,
"grad_norm": 0.6099519495344266,
"learning_rate": 8.273809523809523e-06,
"loss": 0.3636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20556297898292542,
"step": 140,
"valid_targets_mean": 5149.0,
"valid_targets_min": 2683
},
{
"epoch": 0.15127803860198227,
"grad_norm": 0.5616784883743269,
"learning_rate": 8.571428571428571e-06,
"loss": 0.3737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20041660964488983,
"step": 145,
"valid_targets_mean": 4993.5,
"valid_targets_min": 2369
},
{
"epoch": 0.1564945226917058,
"grad_norm": 0.573865959626073,
"learning_rate": 8.869047619047619e-06,
"loss": 0.3732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1961544007062912,
"step": 150,
"valid_targets_mean": 6082.9,
"valid_targets_min": 3402
},
{
"epoch": 0.16171100678142933,
"grad_norm": 0.6318893370099948,
"learning_rate": 9.166666666666666e-06,
"loss": 0.3748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1895100474357605,
"step": 155,
"valid_targets_mean": 5077.5,
"valid_targets_min": 2645
},
{
"epoch": 0.16692749087115286,
"grad_norm": 0.62541969323896,
"learning_rate": 9.464285714285714e-06,
"loss": 0.3582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16339033842086792,
"step": 160,
"valid_targets_mean": 4114.4,
"valid_targets_min": 1777
},
{
"epoch": 0.17214397496087636,
"grad_norm": 0.5606657840484052,
"learning_rate": 9.761904761904762e-06,
"loss": 0.3576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15099817514419556,
"step": 165,
"valid_targets_mean": 5019.4,
"valid_targets_min": 2033
},
{
"epoch": 0.17736045905059988,
"grad_norm": 0.5365733878219655,
"learning_rate": 1.005952380952381e-05,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16473634541034698,
"step": 170,
"valid_targets_mean": 5306.1,
"valid_targets_min": 1850
},
{
"epoch": 0.1825769431403234,
"grad_norm": 0.7029064378668989,
"learning_rate": 1.0357142857142859e-05,
"loss": 0.3407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17407193779945374,
"step": 175,
"valid_targets_mean": 4721.5,
"valid_targets_min": 1269
},
{
"epoch": 0.18779342723004694,
"grad_norm": 0.48456037806978225,
"learning_rate": 1.0654761904761905e-05,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16871285438537598,
"step": 180,
"valid_targets_mean": 5911.6,
"valid_targets_min": 3213
},
{
"epoch": 0.19300991131977047,
"grad_norm": 0.585313639557234,
"learning_rate": 1.0952380952380955e-05,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16843539476394653,
"step": 185,
"valid_targets_mean": 4861.0,
"valid_targets_min": 1564
},
{
"epoch": 0.198226395409494,
"grad_norm": 0.6211861060913116,
"learning_rate": 1.125e-05,
"loss": 0.3413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20040014386177063,
"step": 190,
"valid_targets_mean": 5177.6,
"valid_targets_min": 845
},
{
"epoch": 0.20344287949921752,
"grad_norm": 0.5808811625651205,
"learning_rate": 1.1547619047619047e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14674122631549835,
"step": 195,
"valid_targets_mean": 4242.0,
"valid_targets_min": 1649
},
{
"epoch": 0.20865936358894105,
"grad_norm": 0.6379936783242135,
"learning_rate": 1.1845238095238096e-05,
"loss": 0.3501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1750584840774536,
"step": 200,
"valid_targets_mean": 5140.6,
"valid_targets_min": 2976
},
{
"epoch": 0.21387584767866458,
"grad_norm": 0.6471244895039363,
"learning_rate": 1.2142857142857142e-05,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21840491890907288,
"step": 205,
"valid_targets_mean": 4205.1,
"valid_targets_min": 1637
},
{
"epoch": 0.2190923317683881,
"grad_norm": 0.6649540245139282,
"learning_rate": 1.2440476190476192e-05,
"loss": 0.3544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17277714610099792,
"step": 210,
"valid_targets_mean": 3557.8,
"valid_targets_min": 974
},
{
"epoch": 0.22430881585811163,
"grad_norm": 0.5805068966151554,
"learning_rate": 1.2738095238095238e-05,
"loss": 0.3353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1522510051727295,
"step": 215,
"valid_targets_mean": 5786.1,
"valid_targets_min": 4208
},
{
"epoch": 0.22952529994783516,
"grad_norm": 0.5651854016863527,
"learning_rate": 1.3035714285714287e-05,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1737382411956787,
"step": 220,
"valid_targets_mean": 5721.5,
"valid_targets_min": 4956
},
{
"epoch": 0.2347417840375587,
"grad_norm": 0.5575886336701769,
"learning_rate": 1.3333333333333333e-05,
"loss": 0.3339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1307171881198883,
"step": 225,
"valid_targets_mean": 4515.4,
"valid_targets_min": 2175
},
{
"epoch": 0.23995826812728221,
"grad_norm": 0.5292908481239273,
"learning_rate": 1.3630952380952383e-05,
"loss": 0.3447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17313320934772491,
"step": 230,
"valid_targets_mean": 6369.9,
"valid_targets_min": 2012
},
{
"epoch": 0.24517475221700574,
"grad_norm": 0.6057809728782292,
"learning_rate": 1.3928571428571429e-05,
"loss": 0.3379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14974744617938995,
"step": 235,
"valid_targets_mean": 3524.4,
"valid_targets_min": 1512
},
{
"epoch": 0.25039123630672927,
"grad_norm": 0.5217173574795259,
"learning_rate": 1.4226190476190478e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1415945291519165,
"step": 240,
"valid_targets_mean": 4837.8,
"valid_targets_min": 1942
},
{
"epoch": 0.2556077203964528,
"grad_norm": 0.5804691857168636,
"learning_rate": 1.4523809523809524e-05,
"loss": 0.3362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14725586771965027,
"step": 245,
"valid_targets_mean": 4438.8,
"valid_targets_min": 2127
},
{
"epoch": 0.2608242044861763,
"grad_norm": 0.47455922996119354,
"learning_rate": 1.4821428571428574e-05,
"loss": 0.3158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1384584605693817,
"step": 250,
"valid_targets_mean": 6362.5,
"valid_targets_min": 4182
},
{
"epoch": 0.26604068857589985,
"grad_norm": 0.5283181886582033,
"learning_rate": 1.511904761904762e-05,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14814651012420654,
"step": 255,
"valid_targets_mean": 5219.5,
"valid_targets_min": 1846
},
{
"epoch": 0.2712571726656234,
"grad_norm": 0.5121560567291197,
"learning_rate": 1.5416666666666668e-05,
"loss": 0.3339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15080620348453522,
"step": 260,
"valid_targets_mean": 5809.4,
"valid_targets_min": 1283
},
{
"epoch": 0.2764736567553469,
"grad_norm": 0.5935465658304162,
"learning_rate": 1.5714285714285715e-05,
"loss": 0.3154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1419353485107422,
"step": 265,
"valid_targets_mean": 5533.5,
"valid_targets_min": 1370
},
{
"epoch": 0.28169014084507044,
"grad_norm": 0.5083365742176544,
"learning_rate": 1.6011904761904763e-05,
"loss": 0.3314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14203351736068726,
"step": 270,
"valid_targets_mean": 4847.2,
"valid_targets_min": 1625
},
{
"epoch": 0.28690662493479396,
"grad_norm": 0.710129632830787,
"learning_rate": 1.630952380952381e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13648484647274017,
"step": 275,
"valid_targets_mean": 5074.6,
"valid_targets_min": 1206
},
{
"epoch": 0.2921231090245175,
"grad_norm": 0.6543408417526709,
"learning_rate": 1.660714285714286e-05,
"loss": 0.3253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14508678019046783,
"step": 280,
"valid_targets_mean": 5268.5,
"valid_targets_min": 2041
},
{
"epoch": 0.297339593114241,
"grad_norm": 0.6418915878980699,
"learning_rate": 1.6904761904761906e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18109339475631714,
"step": 285,
"valid_targets_mean": 4462.6,
"valid_targets_min": 2442
},
{
"epoch": 0.30255607720396455,
"grad_norm": 0.6194921336607193,
"learning_rate": 1.7202380952380954e-05,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1862541139125824,
"step": 290,
"valid_targets_mean": 4875.8,
"valid_targets_min": 1394
},
{
"epoch": 0.3077725612936881,
"grad_norm": 0.5319603288677237,
"learning_rate": 1.7500000000000002e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17491722106933594,
"step": 295,
"valid_targets_mean": 6071.2,
"valid_targets_min": 3280
},
{
"epoch": 0.3129890453834116,
"grad_norm": 0.6186814249083511,
"learning_rate": 1.779761904761905e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18440985679626465,
"step": 300,
"valid_targets_mean": 5409.8,
"valid_targets_min": 2536
},
{
"epoch": 0.31820552947313513,
"grad_norm": 0.5355216263580986,
"learning_rate": 1.8095238095238097e-05,
"loss": 0.3151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1482452005147934,
"step": 305,
"valid_targets_mean": 5292.5,
"valid_targets_min": 1908
},
{
"epoch": 0.32342201356285866,
"grad_norm": 0.6241421491249363,
"learning_rate": 1.8392857142857142e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17003270983695984,
"step": 310,
"valid_targets_mean": 3620.0,
"valid_targets_min": 2145
},
{
"epoch": 0.3286384976525822,
"grad_norm": 0.5381406797781704,
"learning_rate": 1.8690476190476193e-05,
"loss": 0.321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20382024347782135,
"step": 315,
"valid_targets_mean": 6635.0,
"valid_targets_min": 1875
},
{
"epoch": 0.3338549817423057,
"grad_norm": 0.5140255577789234,
"learning_rate": 1.8988095238095237e-05,
"loss": 0.3141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13623102009296417,
"step": 320,
"valid_targets_mean": 5313.2,
"valid_targets_min": 3440
},
{
"epoch": 0.33907146583202924,
"grad_norm": 0.5490101147993109,
"learning_rate": 1.928571428571429e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1648813635110855,
"step": 325,
"valid_targets_mean": 5498.0,
"valid_targets_min": 2695
},
{
"epoch": 0.3442879499217527,
"grad_norm": 0.5244338139150616,
"learning_rate": 1.9583333333333333e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14053672552108765,
"step": 330,
"valid_targets_mean": 4315.6,
"valid_targets_min": 1711
},
{
"epoch": 0.34950443401147624,
"grad_norm": 0.5313860431206892,
"learning_rate": 1.9880952380952384e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14705346524715424,
"step": 335,
"valid_targets_mean": 5682.1,
"valid_targets_min": 2366
},
{
"epoch": 0.35472091810119977,
"grad_norm": 0.5517836053206827,
"learning_rate": 2.0178571428571428e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14730581641197205,
"step": 340,
"valid_targets_mean": 4762.9,
"valid_targets_min": 648
},
{
"epoch": 0.3599374021909233,
"grad_norm": 0.5873148919465628,
"learning_rate": 2.0476190476190476e-05,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14816001057624817,
"step": 345,
"valid_targets_mean": 4330.0,
"valid_targets_min": 1916
},
{
"epoch": 0.3651538862806468,
"grad_norm": 0.5868340714087114,
"learning_rate": 2.0773809523809527e-05,
"loss": 0.3276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15234585106372833,
"step": 350,
"valid_targets_mean": 4120.2,
"valid_targets_min": 2846
},
{
"epoch": 0.37037037037037035,
"grad_norm": 0.5889924742292431,
"learning_rate": 2.1071428571428575e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1578396111726761,
"step": 355,
"valid_targets_mean": 3943.8,
"valid_targets_min": 1624
},
{
"epoch": 0.3755868544600939,
"grad_norm": 0.5327053695279573,
"learning_rate": 2.136904761904762e-05,
"loss": 0.318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13582128286361694,
"step": 360,
"valid_targets_mean": 4614.1,
"valid_targets_min": 1073
},
{
"epoch": 0.3808033385498174,
"grad_norm": 0.5987827349693853,
"learning_rate": 2.1666666666666667e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16083483397960663,
"step": 365,
"valid_targets_mean": 5879.5,
"valid_targets_min": 3184
},
{
"epoch": 0.38601982263954093,
"grad_norm": 0.5399690497041971,
"learning_rate": 2.1964285714285718e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14316409826278687,
"step": 370,
"valid_targets_mean": 5359.6,
"valid_targets_min": 2062
},
{
"epoch": 0.39123630672926446,
"grad_norm": 0.45995926795020464,
"learning_rate": 2.2261904761904766e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12717297673225403,
"step": 375,
"valid_targets_mean": 5594.1,
"valid_targets_min": 2426
},
{
"epoch": 0.396452790818988,
"grad_norm": 0.579643544005563,
"learning_rate": 2.255952380952381e-05,
"loss": 0.3179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15679344534873962,
"step": 380,
"valid_targets_mean": 4358.9,
"valid_targets_min": 1152
},
{
"epoch": 0.4016692749087115,
"grad_norm": 0.5444834444148753,
"learning_rate": 2.2857142857142858e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1315690577030182,
"step": 385,
"valid_targets_mean": 4194.0,
"valid_targets_min": 2077
},
{
"epoch": 0.40688575899843504,
"grad_norm": 0.5608144517538177,
"learning_rate": 2.315476190476191e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16721805930137634,
"step": 390,
"valid_targets_mean": 5650.0,
"valid_targets_min": 3618
},
{
"epoch": 0.41210224308815857,
"grad_norm": 0.6559864927637044,
"learning_rate": 2.3452380952380957e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18273624777793884,
"step": 395,
"valid_targets_mean": 4517.8,
"valid_targets_min": 1583
},
{
"epoch": 0.4173187271778821,
"grad_norm": 0.6378535909126191,
"learning_rate": 2.375e-05,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16496604681015015,
"step": 400,
"valid_targets_mean": 5223.9,
"valid_targets_min": 1318
},
{
"epoch": 0.4225352112676056,
"grad_norm": 0.6781104998447693,
"learning_rate": 2.404761904761905e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17576375603675842,
"step": 405,
"valid_targets_mean": 3318.2,
"valid_targets_min": 578
},
{
"epoch": 0.42775169535732915,
"grad_norm": 0.5784644184137221,
"learning_rate": 2.4345238095238093e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16208800673484802,
"step": 410,
"valid_targets_mean": 5647.1,
"valid_targets_min": 3608
},
{
"epoch": 0.4329681794470527,
"grad_norm": 0.6573520288389244,
"learning_rate": 2.4642857142857145e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17460080981254578,
"step": 415,
"valid_targets_mean": 4403.0,
"valid_targets_min": 2081
},
{
"epoch": 0.4381846635367762,
"grad_norm": 0.5476098640503447,
"learning_rate": 2.4940476190476192e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1501733809709549,
"step": 420,
"valid_targets_mean": 4802.5,
"valid_targets_min": 2261
},
{
"epoch": 0.44340114762649974,
"grad_norm": 0.5511914866318157,
"learning_rate": 2.523809523809524e-05,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14066597819328308,
"step": 425,
"valid_targets_mean": 6033.6,
"valid_targets_min": 3444
},
{
"epoch": 0.44861763171622326,
"grad_norm": 0.5825093311949527,
"learning_rate": 2.5535714285714284e-05,
"loss": 0.2871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14601226150989532,
"step": 430,
"valid_targets_mean": 5004.1,
"valid_targets_min": 1981
},
{
"epoch": 0.4538341158059468,
"grad_norm": 0.6225010243591146,
"learning_rate": 2.5833333333333336e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14383742213249207,
"step": 435,
"valid_targets_mean": 5421.5,
"valid_targets_min": 2777
},
{
"epoch": 0.4590505998956703,
"grad_norm": 0.7252997694301736,
"learning_rate": 2.6130952380952383e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17696425318717957,
"step": 440,
"valid_targets_mean": 5086.2,
"valid_targets_min": 2096
},
{
"epoch": 0.46426708398539385,
"grad_norm": 0.6002954989597811,
"learning_rate": 2.642857142857143e-05,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1518591344356537,
"step": 445,
"valid_targets_mean": 4727.5,
"valid_targets_min": 2695
},
{
"epoch": 0.4694835680751174,
"grad_norm": 0.6363078433064229,
"learning_rate": 2.6726190476190475e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14227741956710815,
"step": 450,
"valid_targets_mean": 3842.5,
"valid_targets_min": 1852
},
{
"epoch": 0.4747000521648409,
"grad_norm": 0.6475283887341605,
"learning_rate": 2.7023809523809527e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1538422852754593,
"step": 455,
"valid_targets_mean": 4200.5,
"valid_targets_min": 474
},
{
"epoch": 0.47991653625456443,
"grad_norm": 0.6316203448975509,
"learning_rate": 2.7321428571428574e-05,
"loss": 0.2871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12457837909460068,
"step": 460,
"valid_targets_mean": 4195.6,
"valid_targets_min": 1664
},
{
"epoch": 0.48513302034428796,
"grad_norm": 0.5453336168892163,
"learning_rate": 2.7619047619047622e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14784672856330872,
"step": 465,
"valid_targets_mean": 5087.2,
"valid_targets_min": 1948
},
{
"epoch": 0.4903495044340115,
"grad_norm": 0.5319864811856899,
"learning_rate": 2.7916666666666666e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14754140377044678,
"step": 470,
"valid_targets_mean": 6058.4,
"valid_targets_min": 4615
},
{
"epoch": 0.495565988523735,
"grad_norm": 0.5747818680084603,
"learning_rate": 2.8214285714285718e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15875563025474548,
"step": 475,
"valid_targets_mean": 5760.1,
"valid_targets_min": 2787
},
{
"epoch": 0.5007824726134585,
"grad_norm": 0.537330584769206,
"learning_rate": 2.8511904761904765e-05,
"loss": 0.2992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13198646903038025,
"step": 480,
"valid_targets_mean": 5275.2,
"valid_targets_min": 3038
},
{
"epoch": 0.5059989567031821,
"grad_norm": 0.570047820911184,
"learning_rate": 2.8809523809523813e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14526161551475525,
"step": 485,
"valid_targets_mean": 4437.0,
"valid_targets_min": 2076
},
{
"epoch": 0.5112154407929056,
"grad_norm": 0.5424253004654361,
"learning_rate": 2.9107142857142857e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13815993070602417,
"step": 490,
"valid_targets_mean": 4431.6,
"valid_targets_min": 1877
},
{
"epoch": 0.5164319248826291,
"grad_norm": 0.6056196332833156,
"learning_rate": 2.940476190476191e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13893744349479675,
"step": 495,
"valid_targets_mean": 5731.2,
"valid_targets_min": 2686
},
{
"epoch": 0.5216484089723527,
"grad_norm": 0.656594344651998,
"learning_rate": 2.9702380952380956e-05,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16237576305866241,
"step": 500,
"valid_targets_mean": 4444.4,
"valid_targets_min": 1285
},
{
"epoch": 0.5268648930620762,
"grad_norm": 0.6575613660501014,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17889975011348724,
"step": 505,
"valid_targets_mean": 4299.6,
"valid_targets_min": 1091
},
{
"epoch": 0.5320813771517997,
"grad_norm": 0.5479096145334218,
"learning_rate": 3.029761904761905e-05,
"loss": 0.3017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14003689587116241,
"step": 510,
"valid_targets_mean": 4393.6,
"valid_targets_min": 1357
},
{
"epoch": 0.5372978612415232,
"grad_norm": 0.5360140658558523,
"learning_rate": 3.059523809523809e-05,
"loss": 0.2981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12671706080436707,
"step": 515,
"valid_targets_mean": 4213.6,
"valid_targets_min": 644
},
{
"epoch": 0.5425143453312468,
"grad_norm": 0.5819274109832838,
"learning_rate": 3.089285714285715e-05,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15547394752502441,
"step": 520,
"valid_targets_mean": 5292.5,
"valid_targets_min": 2411
},
{
"epoch": 0.5477308294209703,
"grad_norm": 0.6271478607759707,
"learning_rate": 3.1190476190476195e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13740107417106628,
"step": 525,
"valid_targets_mean": 3955.8,
"valid_targets_min": 1794
},
{
"epoch": 0.5529473135106938,
"grad_norm": 0.6144076854065791,
"learning_rate": 3.148809523809524e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16323667764663696,
"step": 530,
"valid_targets_mean": 4617.8,
"valid_targets_min": 1360
},
{
"epoch": 0.5581637976004173,
"grad_norm": 0.5755859874184027,
"learning_rate": 3.1785714285714284e-05,
"loss": 0.2746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16000992059707642,
"step": 535,
"valid_targets_mean": 4906.9,
"valid_targets_min": 1472
},
{
"epoch": 0.5633802816901409,
"grad_norm": 0.5841607584218472,
"learning_rate": 3.208333333333334e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1828911006450653,
"step": 540,
"valid_targets_mean": 4911.2,
"valid_targets_min": 1598
},
{
"epoch": 0.5685967657798644,
"grad_norm": 0.6225126753513331,
"learning_rate": 3.2380952380952386e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13055923581123352,
"step": 545,
"valid_targets_mean": 3726.4,
"valid_targets_min": 1582
},
{
"epoch": 0.5738132498695879,
"grad_norm": 0.6692567934262729,
"learning_rate": 3.2678571428571434e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15656331181526184,
"step": 550,
"valid_targets_mean": 4944.5,
"valid_targets_min": 2628
},
{
"epoch": 0.5790297339593115,
"grad_norm": 0.5229234196483743,
"learning_rate": 3.2976190476190475e-05,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11388491094112396,
"step": 555,
"valid_targets_mean": 4577.4,
"valid_targets_min": 2796
},
{
"epoch": 0.584246218049035,
"grad_norm": 0.6005262130280019,
"learning_rate": 3.327380952380953e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1324496865272522,
"step": 560,
"valid_targets_mean": 4016.9,
"valid_targets_min": 1753
},
{
"epoch": 0.5894627021387585,
"grad_norm": 0.5582592039832068,
"learning_rate": 3.357142857142858e-05,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16673031449317932,
"step": 565,
"valid_targets_mean": 4915.5,
"valid_targets_min": 3237
},
{
"epoch": 0.594679186228482,
"grad_norm": 0.5260273166710314,
"learning_rate": 3.386904761904762e-05,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1317315697669983,
"step": 570,
"valid_targets_mean": 5027.9,
"valid_targets_min": 1969
},
{
"epoch": 0.5998956703182056,
"grad_norm": 0.5868369090440616,
"learning_rate": 3.4166666666666666e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18660710752010345,
"step": 575,
"valid_targets_mean": 5281.8,
"valid_targets_min": 3504
},
{
"epoch": 0.6051121544079291,
"grad_norm": 0.9504039681858983,
"learning_rate": 3.446428571428572e-05,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1338704526424408,
"step": 580,
"valid_targets_mean": 3767.8,
"valid_targets_min": 1589
},
{
"epoch": 0.6103286384976526,
"grad_norm": 0.5713320017873411,
"learning_rate": 3.476190476190477e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1240009069442749,
"step": 585,
"valid_targets_mean": 3634.8,
"valid_targets_min": 802
},
{
"epoch": 0.6155451225873761,
"grad_norm": 0.5766203236737801,
"learning_rate": 3.505952380952381e-05,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1292295604944229,
"step": 590,
"valid_targets_mean": 4069.0,
"valid_targets_min": 1502
},
{
"epoch": 0.6207616066770997,
"grad_norm": 0.509485527289052,
"learning_rate": 3.535714285714286e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13671892881393433,
"step": 595,
"valid_targets_mean": 4888.6,
"valid_targets_min": 1856
},
{
"epoch": 0.6259780907668232,
"grad_norm": 0.5632636770642139,
"learning_rate": 3.565476190476191e-05,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1881425380706787,
"step": 600,
"valid_targets_mean": 5378.8,
"valid_targets_min": 1564
},
{
"epoch": 0.6311945748565467,
"grad_norm": 0.551815417531546,
"learning_rate": 3.595238095238096e-05,
"loss": 0.278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12198884785175323,
"step": 605,
"valid_targets_mean": 4786.9,
"valid_targets_min": 1645
},
{
"epoch": 0.6364110589462703,
"grad_norm": 0.6064211172693338,
"learning_rate": 3.625e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13710130751132965,
"step": 610,
"valid_targets_mean": 3977.6,
"valid_targets_min": 1062
},
{
"epoch": 0.6416275430359938,
"grad_norm": 2.843437049352432,
"learning_rate": 3.654761904761905e-05,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14728930592536926,
"step": 615,
"valid_targets_mean": 5308.1,
"valid_targets_min": 2902
},
{
"epoch": 0.6468440271257173,
"grad_norm": 0.5212278169545214,
"learning_rate": 3.6845238095238096e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11422304809093475,
"step": 620,
"valid_targets_mean": 4256.2,
"valid_targets_min": 1306
},
{
"epoch": 0.6520605112154408,
"grad_norm": 0.6069012446608004,
"learning_rate": 3.714285714285715e-05,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11972630023956299,
"step": 625,
"valid_targets_mean": 3628.0,
"valid_targets_min": 1473
},
{
"epoch": 0.6572769953051644,
"grad_norm": 0.5524190052154624,
"learning_rate": 3.744047619047619e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14479461312294006,
"step": 630,
"valid_targets_mean": 5443.0,
"valid_targets_min": 1800
},
{
"epoch": 0.6624934793948879,
"grad_norm": 0.5939914890338424,
"learning_rate": 3.773809523809524e-05,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1578492522239685,
"step": 635,
"valid_targets_mean": 4863.4,
"valid_targets_min": 1855
},
{
"epoch": 0.6677099634846114,
"grad_norm": 0.5991744292599832,
"learning_rate": 3.803571428571429e-05,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15006765723228455,
"step": 640,
"valid_targets_mean": 4413.6,
"valid_targets_min": 1766
},
{
"epoch": 0.672926447574335,
"grad_norm": 0.5457954762595464,
"learning_rate": 3.833333333333334e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14794906973838806,
"step": 645,
"valid_targets_mean": 6368.5,
"valid_targets_min": 4418
},
{
"epoch": 0.6781429316640585,
"grad_norm": 0.5704049215370746,
"learning_rate": 3.863095238095238e-05,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14829003810882568,
"step": 650,
"valid_targets_mean": 4605.2,
"valid_targets_min": 3205
},
{
"epoch": 0.6833594157537819,
"grad_norm": 0.6576815095015953,
"learning_rate": 3.892857142857143e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12923435866832733,
"step": 655,
"valid_targets_mean": 5369.6,
"valid_targets_min": 3794
},
{
"epoch": 0.6885758998435054,
"grad_norm": 0.4740614886361887,
"learning_rate": 3.922619047619048e-05,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11359081417322159,
"step": 660,
"valid_targets_mean": 6124.8,
"valid_targets_min": 2690
},
{
"epoch": 0.693792383933229,
"grad_norm": 0.5956200241918845,
"learning_rate": 3.9523809523809526e-05,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1414283812046051,
"step": 665,
"valid_targets_mean": 4818.5,
"valid_targets_min": 2155
},
{
"epoch": 0.6990088680229525,
"grad_norm": 0.5490856058705245,
"learning_rate": 3.982142857142857e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13476689159870148,
"step": 670,
"valid_targets_mean": 4888.8,
"valid_targets_min": 2899
},
{
"epoch": 0.704225352112676,
"grad_norm": 0.5550928220084757,
"learning_rate": 3.999998918212333e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.149751678109169,
"step": 675,
"valid_targets_mean": 4782.4,
"valid_targets_min": 1897
},
{
"epoch": 0.7094418362023995,
"grad_norm": 0.5885239420736949,
"learning_rate": 3.999986748114514e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13731074333190918,
"step": 680,
"valid_targets_mean": 3692.5,
"valid_targets_min": 1406
},
{
"epoch": 0.7146583202921231,
"grad_norm": 0.60321378124438,
"learning_rate": 3.99996105576685e-05,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13662073016166687,
"step": 685,
"valid_targets_mean": 3336.6,
"valid_targets_min": 1719
},
{
"epoch": 0.7198748043818466,
"grad_norm": 0.5236148500487113,
"learning_rate": 3.999921841343052e-05,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13473102450370789,
"step": 690,
"valid_targets_mean": 5899.0,
"valid_targets_min": 1893
},
{
"epoch": 0.7250912884715701,
"grad_norm": 0.5216261505238765,
"learning_rate": 3.999869105108254e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.149178609251976,
"step": 695,
"valid_targets_mean": 6292.6,
"valid_targets_min": 2097
},
{
"epoch": 0.7303077725612936,
"grad_norm": 0.5072205193470503,
"learning_rate": 3.9998028474190154e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1225869357585907,
"step": 700,
"valid_targets_mean": 4711.9,
"valid_targets_min": 1274
},
{
"epoch": 0.7355242566510172,
"grad_norm": 0.5870083608117771,
"learning_rate": 3.999723068723316e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16150489449501038,
"step": 705,
"valid_targets_mean": 3687.8,
"valid_targets_min": 1444
},
{
"epoch": 0.7407407407407407,
"grad_norm": 0.5716499953461907,
"learning_rate": 3.9996297695605534e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14318493008613586,
"step": 710,
"valid_targets_mean": 4756.6,
"valid_targets_min": 2589
},
{
"epoch": 0.7459572248304642,
"grad_norm": 0.5518834028265162,
"learning_rate": 3.999522950561537e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15709498524665833,
"step": 715,
"valid_targets_mean": 5477.6,
"valid_targets_min": 2652
},
{
"epoch": 0.7511737089201878,
"grad_norm": 0.5468921565229283,
"learning_rate": 3.999402612448491e-05,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13745816051959991,
"step": 720,
"valid_targets_mean": 5289.8,
"valid_targets_min": 1577
},
{
"epoch": 0.7563901930099113,
"grad_norm": 0.5341399634224744,
"learning_rate": 3.99926875603504e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11996178328990936,
"step": 725,
"valid_targets_mean": 4295.9,
"valid_targets_min": 1978
},
{
"epoch": 0.7616066770996348,
"grad_norm": 0.5370344491067444,
"learning_rate": 3.9991213822262105e-05,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12039448320865631,
"step": 730,
"valid_targets_mean": 4307.6,
"valid_targets_min": 1036
},
{
"epoch": 0.7668231611893583,
"grad_norm": 0.5654025265803629,
"learning_rate": 3.9989604920184215e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16871072351932526,
"step": 735,
"valid_targets_mean": 4641.4,
"valid_targets_min": 2175
},
{
"epoch": 0.7720396452790819,
"grad_norm": 0.5259197078408168,
"learning_rate": 3.99878608649948e-05,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13495999574661255,
"step": 740,
"valid_targets_mean": 4812.6,
"valid_targets_min": 2191
},
{
"epoch": 0.7772561293688054,
"grad_norm": 1.1255799489662346,
"learning_rate": 3.9985981668485694e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14621102809906006,
"step": 745,
"valid_targets_mean": 5571.9,
"valid_targets_min": 2454
},
{
"epoch": 0.7824726134585289,
"grad_norm": 0.6841805332983792,
"learning_rate": 3.9983967343362476e-05,
"loss": 0.2813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1594194769859314,
"step": 750,
"valid_targets_mean": 4458.8,
"valid_targets_min": 2398
},
{
"epoch": 0.7876890975482524,
"grad_norm": 0.5688763680479169,
"learning_rate": 3.998181790324434e-05,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11155922710895538,
"step": 755,
"valid_targets_mean": 5125.8,
"valid_targets_min": 1669
},
{
"epoch": 0.792905581637976,
"grad_norm": 0.5663799770218837,
"learning_rate": 3.997953336266402e-05,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13671280443668365,
"step": 760,
"valid_targets_mean": 4331.0,
"valid_targets_min": 1698
},
{
"epoch": 0.7981220657276995,
"grad_norm": 0.4994161989543307,
"learning_rate": 3.997711373706768e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13220706582069397,
"step": 765,
"valid_targets_mean": 4664.6,
"valid_targets_min": 2156
},
{
"epoch": 0.803338549817423,
"grad_norm": 0.5643131809161603,
"learning_rate": 3.997455904281481e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13809676468372345,
"step": 770,
"valid_targets_mean": 4958.5,
"valid_targets_min": 2016
},
{
"epoch": 0.8085550339071466,
"grad_norm": 0.5300737652935752,
"learning_rate": 3.997186929717814e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.130964994430542,
"step": 775,
"valid_targets_mean": 5666.2,
"valid_targets_min": 2116
},
{
"epoch": 0.8137715179968701,
"grad_norm": 0.8166695055830062,
"learning_rate": 3.996904451834349e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1320631504058838,
"step": 780,
"valid_targets_mean": 5200.8,
"valid_targets_min": 885
},
{
"epoch": 0.8189880020865936,
"grad_norm": 0.543142258456127,
"learning_rate": 3.9966084725409675e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1417725682258606,
"step": 785,
"valid_targets_mean": 5192.5,
"valid_targets_min": 2511
},
{
"epoch": 0.8242044861763171,
"grad_norm": 0.5210956540849055,
"learning_rate": 3.996298993838836e-05,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15136831998825073,
"step": 790,
"valid_targets_mean": 5622.9,
"valid_targets_min": 1956
},
{
"epoch": 0.8294209702660407,
"grad_norm": 0.47514344367102546,
"learning_rate": 3.995976017820392e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12267716228961945,
"step": 795,
"valid_targets_mean": 6080.2,
"valid_targets_min": 1678
},
{
"epoch": 0.8346374543557642,
"grad_norm": 0.5198837968552323,
"learning_rate": 3.995639546669331e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12230321764945984,
"step": 800,
"valid_targets_mean": 5335.1,
"valid_targets_min": 2366
},
{
"epoch": 0.8398539384454877,
"grad_norm": 0.5782590386242095,
"learning_rate": 3.995289582660593e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12575706839561462,
"step": 805,
"valid_targets_mean": 4269.2,
"valid_targets_min": 1913
},
{
"epoch": 0.8450704225352113,
"grad_norm": 0.7226163816777547,
"learning_rate": 3.9949261281603415e-05,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16310575604438782,
"step": 810,
"valid_targets_mean": 4868.8,
"valid_targets_min": 2549
},
{
"epoch": 0.8502869066249348,
"grad_norm": 0.5820788067610744,
"learning_rate": 3.9945491856259556e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16203533113002777,
"step": 815,
"valid_targets_mean": 4391.1,
"valid_targets_min": 2389
},
{
"epoch": 0.8555033907146583,
"grad_norm": 0.4808444611294702,
"learning_rate": 3.994158757606009e-05,
"loss": 0.2689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12435003370046616,
"step": 820,
"valid_targets_mean": 6628.9,
"valid_targets_min": 1219
},
{
"epoch": 0.8607198748043818,
"grad_norm": 0.5317205644416775,
"learning_rate": 3.993754846740249e-05,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1366286277770996,
"step": 825,
"valid_targets_mean": 5113.5,
"valid_targets_min": 2620
},
{
"epoch": 0.8659363588941054,
"grad_norm": 0.514616285975049,
"learning_rate": 3.9933374557595875e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14324252307415009,
"step": 830,
"valid_targets_mean": 5052.0,
"valid_targets_min": 1822
},
{
"epoch": 0.8711528429838289,
"grad_norm": 0.5563820422337162,
"learning_rate": 3.992906587486076e-05,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14511628448963165,
"step": 835,
"valid_targets_mean": 5581.1,
"valid_targets_min": 1457
},
{
"epoch": 0.8763693270735524,
"grad_norm": 0.5721077702569866,
"learning_rate": 3.992462244832886e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15223796665668488,
"step": 840,
"valid_targets_mean": 5086.6,
"valid_targets_min": 952
},
{
"epoch": 0.881585811163276,
"grad_norm": 0.5725237613771451,
"learning_rate": 3.9920044308042956e-05,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10571226477622986,
"step": 845,
"valid_targets_mean": 3588.8,
"valid_targets_min": 1842
},
{
"epoch": 0.8868022952529995,
"grad_norm": 0.51365646064338,
"learning_rate": 3.991533148495662e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13923339545726776,
"step": 850,
"valid_targets_mean": 5327.6,
"valid_targets_min": 1084
},
{
"epoch": 0.892018779342723,
"grad_norm": 0.5828963561508581,
"learning_rate": 3.991048401093405e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13550780713558197,
"step": 855,
"valid_targets_mean": 4516.8,
"valid_targets_min": 1461
},
{
"epoch": 0.8972352634324465,
"grad_norm": 0.6966096284074984,
"learning_rate": 3.990550191874985e-05,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1444419026374817,
"step": 860,
"valid_targets_mean": 3679.0,
"valid_targets_min": 854
},
{
"epoch": 0.9024517475221701,
"grad_norm": 0.5184778153693645,
"learning_rate": 3.990038524208878e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1318383663892746,
"step": 865,
"valid_targets_mean": 4986.8,
"valid_targets_min": 1791
},
{
"epoch": 0.9076682316118936,
"grad_norm": 0.5331023362961945,
"learning_rate": 3.9895134015545565e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11663781106472015,
"step": 870,
"valid_targets_mean": 3661.8,
"valid_targets_min": 1949
},
{
"epoch": 0.9128847157016171,
"grad_norm": 0.5407143848415595,
"learning_rate": 3.988974827462464e-05,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13874134421348572,
"step": 875,
"valid_targets_mean": 5499.4,
"valid_targets_min": 2758
},
{
"epoch": 0.9181011997913406,
"grad_norm": 0.6194812388582897,
"learning_rate": 3.98842280557399e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12969379127025604,
"step": 880,
"valid_targets_mean": 3967.9,
"valid_targets_min": 1261
},
{
"epoch": 0.9233176838810642,
"grad_norm": 0.5699586459948414,
"learning_rate": 3.98785733962145e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12774772942066193,
"step": 885,
"valid_targets_mean": 5061.0,
"valid_targets_min": 1507
},
{
"epoch": 0.9285341679707877,
"grad_norm": 0.5607102394615596,
"learning_rate": 3.9872784334280555e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1534000188112259,
"step": 890,
"valid_targets_mean": 4859.0,
"valid_targets_min": 998
},
{
"epoch": 0.9337506520605112,
"grad_norm": 0.5331536557365746,
"learning_rate": 3.9866860909078876e-05,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13779212534427643,
"step": 895,
"valid_targets_mean": 5181.9,
"valid_targets_min": 2671
},
{
"epoch": 0.9389671361502347,
"grad_norm": 0.5238806901596113,
"learning_rate": 3.9860803160658756e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17478299140930176,
"step": 900,
"valid_targets_mean": 5491.2,
"valid_targets_min": 2754
},
{
"epoch": 0.9441836202399583,
"grad_norm": 0.5398420703049978,
"learning_rate": 3.985461112997766e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11654013395309448,
"step": 905,
"valid_targets_mean": 4031.8,
"valid_targets_min": 1793
},
{
"epoch": 0.9494001043296818,
"grad_norm": 0.49304635275161546,
"learning_rate": 3.9848284858900955e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.137330561876297,
"step": 910,
"valid_targets_mean": 5403.9,
"valid_targets_min": 2683
},
{
"epoch": 0.9546165884194053,
"grad_norm": 0.5686775162126456,
"learning_rate": 3.984182439020164e-05,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12234842777252197,
"step": 915,
"valid_targets_mean": 4553.5,
"valid_targets_min": 1963
},
{
"epoch": 0.9598330725091289,
"grad_norm": 0.615897132103767,
"learning_rate": 3.9835229767560034e-05,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13465642929077148,
"step": 920,
"valid_targets_mean": 3425.9,
"valid_targets_min": 1124
},
{
"epoch": 0.9650495565988524,
"grad_norm": 0.5417221970747348,
"learning_rate": 3.982850103556351e-05,
"loss": 0.2703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15093615651130676,
"step": 925,
"valid_targets_mean": 5625.1,
"valid_targets_min": 3329
},
{
"epoch": 0.9702660406885759,
"grad_norm": 0.5082091887909534,
"learning_rate": 3.982163823970615e-05,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1644631326198578,
"step": 930,
"valid_targets_mean": 4725.9,
"valid_targets_min": 1249
},
{
"epoch": 0.9754825247782994,
"grad_norm": 0.5020653386918221,
"learning_rate": 3.98146414263885e-05,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16657038033008575,
"step": 935,
"valid_targets_mean": 5279.6,
"valid_targets_min": 1039
},
{
"epoch": 0.980699008868023,
"grad_norm": 0.6491733294026691,
"learning_rate": 3.980751064291719e-05,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11266623437404633,
"step": 940,
"valid_targets_mean": 5246.4,
"valid_targets_min": 2342
},
{
"epoch": 0.9859154929577465,
"grad_norm": 0.586745643603928,
"learning_rate": 3.980024593750466e-05,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1562008559703827,
"step": 945,
"valid_targets_mean": 4508.4,
"valid_targets_min": 2638
},
{
"epoch": 0.99113197704747,
"grad_norm": 0.5976427152991887,
"learning_rate": 3.979284735926882e-05,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15834422409534454,
"step": 950,
"valid_targets_mean": 4706.4,
"valid_targets_min": 2701
},
{
"epoch": 0.9963484611371936,
"grad_norm": 0.552931359694199,
"learning_rate": 3.978531495823271e-05,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1401374489068985,
"step": 955,
"valid_targets_mean": 5464.8,
"valid_targets_min": 1975
},
{
"epoch": 1.0010432968179448,
"grad_norm": 0.5555627129782201,
"learning_rate": 3.977764878532418e-05,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11594857275485992,
"step": 960,
"valid_targets_mean": 5819.6,
"valid_targets_min": 2150
},
{
"epoch": 1.0062597809076683,
"grad_norm": 0.621737305129113,
"learning_rate": 3.976984889237551e-05,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1225830540060997,
"step": 965,
"valid_targets_mean": 3963.1,
"valid_targets_min": 530
},
{
"epoch": 1.0114762649973918,
"grad_norm": 0.609624728818975,
"learning_rate": 3.9761915332123113e-05,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14671842753887177,
"step": 970,
"valid_targets_mean": 5083.1,
"valid_targets_min": 1630
},
{
"epoch": 1.0166927490871154,
"grad_norm": 0.49609282046376096,
"learning_rate": 3.975384815820713e-05,
"loss": 0.2667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12384708225727081,
"step": 975,
"valid_targets_mean": 5693.2,
"valid_targets_min": 2773
},
{
"epoch": 1.021909233176839,
"grad_norm": 0.6954457613343509,
"learning_rate": 3.974564742517109e-05,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12282181531190872,
"step": 980,
"valid_targets_mean": 3497.1,
"valid_targets_min": 1946
},
{
"epoch": 1.0271257172665624,
"grad_norm": 0.6348864007116859,
"learning_rate": 3.973731318846155e-05,
"loss": 0.2576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1495770364999771,
"step": 985,
"valid_targets_mean": 4063.0,
"valid_targets_min": 1679
},
{
"epoch": 1.032342201356286,
"grad_norm": 0.482982401425952,
"learning_rate": 3.97288455044277e-05,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1389351636171341,
"step": 990,
"valid_targets_mean": 7056.1,
"valid_targets_min": 2762
},
{
"epoch": 1.0375586854460095,
"grad_norm": 0.6245759540283572,
"learning_rate": 3.972024443032098e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15486538410186768,
"step": 995,
"valid_targets_mean": 5081.5,
"valid_targets_min": 2001
},
{
"epoch": 1.042775169535733,
"grad_norm": 0.5572267300723684,
"learning_rate": 3.971151002429471e-05,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11726558208465576,
"step": 1000,
"valid_targets_mean": 3408.6,
"valid_targets_min": 1378
},
{
"epoch": 1.0479916536254565,
"grad_norm": 0.6297986573579426,
"learning_rate": 3.97026423454037e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11347624659538269,
"step": 1005,
"valid_targets_mean": 4425.0,
"valid_targets_min": 1233
},
{
"epoch": 1.05320813771518,
"grad_norm": 1.0334220724567058,
"learning_rate": 3.969364145360383e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1397000104188919,
"step": 1010,
"valid_targets_mean": 5443.9,
"valid_targets_min": 2683
},
{
"epoch": 1.0584246218049036,
"grad_norm": 0.5487545829063336,
"learning_rate": 3.9684507409751655e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12293633818626404,
"step": 1015,
"valid_targets_mean": 4722.2,
"valid_targets_min": 538
},
{
"epoch": 1.063641105894627,
"grad_norm": 0.5225719855265429,
"learning_rate": 3.967524027560401e-05,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12677009403705597,
"step": 1020,
"valid_targets_mean": 5619.6,
"valid_targets_min": 3686
},
{
"epoch": 1.0688575899843507,
"grad_norm": 0.864013546733522,
"learning_rate": 3.966584011381753e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1692778766155243,
"step": 1025,
"valid_targets_mean": 6027.2,
"valid_targets_min": 1870
},
{
"epoch": 1.074074074074074,
"grad_norm": 0.5121362893536919,
"learning_rate": 3.965630698794833e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09930215775966644,
"step": 1030,
"valid_targets_mean": 4419.8,
"valid_targets_min": 699
},
{
"epoch": 1.0792905581637977,
"grad_norm": 0.6385093892320182,
"learning_rate": 3.964664096245149e-05,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14801526069641113,
"step": 1035,
"valid_targets_mean": 5311.0,
"valid_targets_min": 2371
},
{
"epoch": 1.084507042253521,
"grad_norm": 0.5519490683028426,
"learning_rate": 3.9636842102680635e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13327637314796448,
"step": 1040,
"valid_targets_mean": 4245.5,
"valid_targets_min": 521
},
{
"epoch": 1.0897235263432448,
"grad_norm": 0.5813596168647382,
"learning_rate": 3.962691047488754e-05,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15237219631671906,
"step": 1045,
"valid_targets_mean": 4386.4,
"valid_targets_min": 2232
},
{
"epoch": 1.094940010432968,
"grad_norm": 0.6065188708681333,
"learning_rate": 3.9616846146221606e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14218102395534515,
"step": 1050,
"valid_targets_mean": 3918.5,
"valid_targets_min": 908
},
{
"epoch": 1.1001564945226918,
"grad_norm": 0.6071274238740759,
"learning_rate": 3.960664918472947e-05,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1331966370344162,
"step": 1055,
"valid_targets_mean": 4948.6,
"valid_targets_min": 1431
},
{
"epoch": 1.1053729786124151,
"grad_norm": 0.5810232005672644,
"learning_rate": 3.959631965935453e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1407533884048462,
"step": 1060,
"valid_targets_mean": 4580.9,
"valid_targets_min": 1066
},
{
"epoch": 1.1105894627021389,
"grad_norm": 0.5631301298626795,
"learning_rate": 3.958585763993646e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10973257571458817,
"step": 1065,
"valid_targets_mean": 5161.8,
"valid_targets_min": 2310
},
{
"epoch": 1.1158059467918622,
"grad_norm": 0.5202732767439506,
"learning_rate": 3.9575263197210736e-05,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10115311294794083,
"step": 1070,
"valid_targets_mean": 5175.4,
"valid_targets_min": 2177
},
{
"epoch": 1.1210224308815857,
"grad_norm": 0.5882733680606071,
"learning_rate": 3.9564536402808194e-05,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12298896908760071,
"step": 1075,
"valid_targets_mean": 4286.4,
"valid_targets_min": 2060
},
{
"epoch": 1.1262389149713092,
"grad_norm": 0.5995795533171111,
"learning_rate": 3.955367732925451e-05,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12658976018428802,
"step": 1080,
"valid_targets_mean": 4708.6,
"valid_targets_min": 2377
},
{
"epoch": 1.131455399061033,
"grad_norm": 0.6038080285810509,
"learning_rate": 3.954268604996972e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14354118704795837,
"step": 1085,
"valid_targets_mean": 4013.9,
"valid_targets_min": 1598
},
{
"epoch": 1.1366718831507563,
"grad_norm": 0.5477620531002403,
"learning_rate": 3.953156263926773e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15162897109985352,
"step": 1090,
"valid_targets_mean": 6166.2,
"valid_targets_min": 4399
},
{
"epoch": 1.14188836724048,
"grad_norm": 0.7334723583908891,
"learning_rate": 3.952030717235581e-05,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14085112512111664,
"step": 1095,
"valid_targets_mean": 4769.4,
"valid_targets_min": 1678
},
{
"epoch": 1.1471048513302033,
"grad_norm": 0.5306348893521031,
"learning_rate": 3.950891972533408e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13832436501979828,
"step": 1100,
"valid_targets_mean": 6099.9,
"valid_targets_min": 3870
},
{
"epoch": 1.1523213354199269,
"grad_norm": 0.5449133161144042,
"learning_rate": 3.9497400375195e-05,
"loss": 0.2686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13858945667743683,
"step": 1105,
"valid_targets_mean": 5039.5,
"valid_targets_min": 1281
},
{
"epoch": 1.1575378195096504,
"grad_norm": 0.7632046290203769,
"learning_rate": 3.948574919982286e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11112897843122482,
"step": 1110,
"valid_targets_mean": 3455.1,
"valid_targets_min": 1829
},
{
"epoch": 1.162754303599374,
"grad_norm": 0.49851988432836863,
"learning_rate": 3.947396627799322e-05,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11539632827043533,
"step": 1115,
"valid_targets_mean": 5286.5,
"valid_targets_min": 1511
},
{
"epoch": 1.1679707876890975,
"grad_norm": 0.5024471509769345,
"learning_rate": 3.946205168937243e-05,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13856856524944305,
"step": 1120,
"valid_targets_mean": 4765.1,
"valid_targets_min": 1964
},
{
"epoch": 1.173187271778821,
"grad_norm": 0.5432749443314605,
"learning_rate": 3.945000551451703e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1260114163160324,
"step": 1125,
"valid_targets_mean": 4719.8,
"valid_targets_min": 3216
},
{
"epoch": 1.1784037558685445,
"grad_norm": 0.5347251152463858,
"learning_rate": 3.9437827834873265e-05,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13661740720272064,
"step": 1130,
"valid_targets_mean": 5735.2,
"valid_targets_min": 2569
},
{
"epoch": 1.183620239958268,
"grad_norm": 0.5849586970257857,
"learning_rate": 3.942551873277649e-05,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13512352108955383,
"step": 1135,
"valid_targets_mean": 3875.9,
"valid_targets_min": 1736
},
{
"epoch": 1.1888367240479916,
"grad_norm": 0.706188938231076,
"learning_rate": 3.941307829145063e-05,
"loss": 0.2667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1348978728055954,
"step": 1140,
"valid_targets_mean": 3433.6,
"valid_targets_min": 1074
},
{
"epoch": 1.194053208137715,
"grad_norm": 0.5819976508163556,
"learning_rate": 3.9400506595007624e-05,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12072448432445526,
"step": 1145,
"valid_targets_mean": 5552.4,
"valid_targets_min": 746
},
{
"epoch": 1.1992696922274386,
"grad_norm": 0.521212706251135,
"learning_rate": 3.938780372844685e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12627771496772766,
"step": 1150,
"valid_targets_mean": 4875.2,
"valid_targets_min": 2060
},
{
"epoch": 1.2044861763171621,
"grad_norm": 0.4991058739569063,
"learning_rate": 3.9374969777654535e-05,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11231563240289688,
"step": 1155,
"valid_targets_mean": 4992.5,
"valid_targets_min": 1974
},
{
"epoch": 1.2097026604068857,
"grad_norm": 0.5866190042090614,
"learning_rate": 3.93620048294032e-05,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11389137804508209,
"step": 1160,
"valid_targets_mean": 6012.9,
"valid_targets_min": 2817
},
{
"epoch": 1.2149191444966092,
"grad_norm": 0.4629469681351049,
"learning_rate": 3.9348908971351065e-05,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12433037161827087,
"step": 1165,
"valid_targets_mean": 4916.2,
"valid_targets_min": 2756
},
{
"epoch": 1.2201356285863327,
"grad_norm": 0.509878580010751,
"learning_rate": 3.933568229204145e-05,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10058669745922089,
"step": 1170,
"valid_targets_mean": 4582.0,
"valid_targets_min": 2072
},
{
"epoch": 1.2253521126760563,
"grad_norm": 0.5073486803677913,
"learning_rate": 3.9322324880902177e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14870202541351318,
"step": 1175,
"valid_targets_mean": 6096.4,
"valid_targets_min": 2270
},
{
"epoch": 1.2305685967657798,
"grad_norm": 0.6612168228167724,
"learning_rate": 3.930883682824496e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15461964905261993,
"step": 1180,
"valid_targets_mean": 4362.9,
"valid_targets_min": 3061
},
{
"epoch": 1.2357850808555033,
"grad_norm": 0.6620573437399087,
"learning_rate": 3.929521822526483e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15261363983154297,
"step": 1185,
"valid_targets_mean": 4584.1,
"valid_targets_min": 2628
},
{
"epoch": 1.2410015649452268,
"grad_norm": 0.4756252268617344,
"learning_rate": 3.928146916403946e-05,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12918442487716675,
"step": 1190,
"valid_targets_mean": 5145.9,
"valid_targets_min": 2544
},
{
"epoch": 1.2462180490349504,
"grad_norm": 0.5674756284095253,
"learning_rate": 3.926758973752859e-05,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11604364216327667,
"step": 1195,
"valid_targets_mean": 3338.5,
"valid_targets_min": 1460
},
{
"epoch": 1.251434533124674,
"grad_norm": 0.6470503790424013,
"learning_rate": 3.925358003957338e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12425130605697632,
"step": 1200,
"valid_targets_mean": 3237.9,
"valid_targets_min": 1388
},
{
"epoch": 1.2566510172143974,
"grad_norm": 0.5160599914067892,
"learning_rate": 3.923944016489578e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11762993782758713,
"step": 1205,
"valid_targets_mean": 4643.5,
"valid_targets_min": 1558
},
{
"epoch": 1.261867501304121,
"grad_norm": 0.6457663474938289,
"learning_rate": 3.9225170209097865e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1162123754620552,
"step": 1210,
"valid_targets_mean": 5133.0,
"valid_targets_min": 1571
},
{
"epoch": 1.2670839853938445,
"grad_norm": 0.5568943712279375,
"learning_rate": 3.921077026866125e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14134006202220917,
"step": 1215,
"valid_targets_mean": 4286.0,
"valid_targets_min": 1389
},
{
"epoch": 1.272300469483568,
"grad_norm": 0.517359055890604,
"learning_rate": 3.919624044094636e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11771930754184723,
"step": 1220,
"valid_targets_mean": 4357.6,
"valid_targets_min": 1490
},
{
"epoch": 1.2775169535732915,
"grad_norm": 0.5454382018602275,
"learning_rate": 3.918158082419184e-05,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11294469237327576,
"step": 1225,
"valid_targets_mean": 3347.9,
"valid_targets_min": 1687
},
{
"epoch": 1.282733437663015,
"grad_norm": 0.6268629083676116,
"learning_rate": 3.916679151751383e-05,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13156986236572266,
"step": 1230,
"valid_targets_mean": 5386.9,
"valid_targets_min": 2398
},
{
"epoch": 1.2879499217527386,
"grad_norm": 0.5152482932661713,
"learning_rate": 3.9151872620905356e-05,
"loss": 0.2652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12673966586589813,
"step": 1235,
"valid_targets_mean": 5135.2,
"valid_targets_min": 2135
},
{
"epoch": 1.2931664058424621,
"grad_norm": 0.5279356047844522,
"learning_rate": 3.913682423523561e-05,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16639316082000732,
"step": 1240,
"valid_targets_mean": 5856.9,
"valid_targets_min": 2179
},
{
"epoch": 1.2983828899321856,
"grad_norm": 0.5152996791191741,
"learning_rate": 3.912164646224927e-05,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12303348630666733,
"step": 1245,
"valid_targets_mean": 5895.6,
"valid_targets_min": 3347
},
{
"epoch": 1.3035993740219092,
"grad_norm": 0.5491144223145925,
"learning_rate": 3.910633940456585e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11502029746770859,
"step": 1250,
"valid_targets_mean": 4442.5,
"valid_targets_min": 1243
},
{
"epoch": 1.3088158581116327,
"grad_norm": 0.48581532743409384,
"learning_rate": 3.909090316567896e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10068874061107635,
"step": 1255,
"valid_targets_mean": 4060.6,
"valid_targets_min": 1660
},
{
"epoch": 1.3140323422013562,
"grad_norm": 0.5354120459678681,
"learning_rate": 3.9075337849955614e-05,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09602093696594238,
"step": 1260,
"valid_targets_mean": 3535.4,
"valid_targets_min": 1612
},
{
"epoch": 1.3192488262910798,
"grad_norm": 0.6410666645859446,
"learning_rate": 3.905964356263558e-05,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13208051025867462,
"step": 1265,
"valid_targets_mean": 4003.4,
"valid_targets_min": 1629
},
{
"epoch": 1.3244653103808033,
"grad_norm": 0.5129454984326265,
"learning_rate": 3.9043820409830585e-05,
"loss": 0.25,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11679510772228241,
"step": 1270,
"valid_targets_mean": 5320.9,
"valid_targets_min": 2200
},
{
"epoch": 1.3296817944705268,
"grad_norm": 0.5156628308288126,
"learning_rate": 3.9027868498523645e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10929737985134125,
"step": 1275,
"valid_targets_mean": 4530.8,
"valid_targets_min": 1509
},
{
"epoch": 1.3348982785602503,
"grad_norm": 0.46219046923829427,
"learning_rate": 3.901178793656836e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10228785872459412,
"step": 1280,
"valid_targets_mean": 5299.5,
"valid_targets_min": 2905
},
{
"epoch": 1.3401147626499739,
"grad_norm": 0.5341016427474178,
"learning_rate": 3.899557883268811e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09990217536687851,
"step": 1285,
"valid_targets_mean": 4161.8,
"valid_targets_min": 1101
},
{
"epoch": 1.3453312467396974,
"grad_norm": 0.5979056549754926,
"learning_rate": 3.897924129647542e-05,
"loss": 0.25,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.149190291762352,
"step": 1290,
"valid_targets_mean": 4748.6,
"valid_targets_min": 1896
},
{
"epoch": 1.350547730829421,
"grad_norm": 0.4679255872634688,
"learning_rate": 3.896277543839114e-05,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07849105447530746,
"step": 1295,
"valid_targets_mean": 4052.5,
"valid_targets_min": 1020
},
{
"epoch": 1.3557642149191445,
"grad_norm": 0.48873872918678035,
"learning_rate": 3.894618136976372e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12221433222293854,
"step": 1300,
"valid_targets_mean": 6071.9,
"valid_targets_min": 3029
},
{
"epoch": 1.360980699008868,
"grad_norm": 0.5021611507848466,
"learning_rate": 3.89294592027885e-05,
"loss": 0.2523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11469393223524094,
"step": 1305,
"valid_targets_mean": 5044.8,
"valid_targets_min": 1538
},
{
"epoch": 1.3661971830985915,
"grad_norm": 0.6851521282855704,
"learning_rate": 3.891260905052685e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12349982559680939,
"step": 1310,
"valid_targets_mean": 4046.6,
"valid_targets_min": 571
},
{
"epoch": 1.371413667188315,
"grad_norm": 0.4857351004667739,
"learning_rate": 3.8895631026905546e-05,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11351583153009415,
"step": 1315,
"valid_targets_mean": 4832.2,
"valid_targets_min": 474
},
{
"epoch": 1.3766301512780386,
"grad_norm": 0.48743716553823263,
"learning_rate": 3.887852524671587e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13305367529392242,
"step": 1320,
"valid_targets_mean": 4628.4,
"valid_targets_min": 3069
},
{
"epoch": 1.381846635367762,
"grad_norm": 0.5121653531868553,
"learning_rate": 3.886129182561291e-05,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13066956400871277,
"step": 1325,
"valid_targets_mean": 5233.6,
"valid_targets_min": 2904
},
{
"epoch": 1.3870631194574856,
"grad_norm": 0.5334399942963226,
"learning_rate": 3.8843930880114745e-05,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13521258533000946,
"step": 1330,
"valid_targets_mean": 4983.1,
"valid_targets_min": 2285
},
{
"epoch": 1.3922796035472091,
"grad_norm": 0.5364662379844092,
"learning_rate": 3.882644252760168e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09757325053215027,
"step": 1335,
"valid_targets_mean": 5430.8,
"valid_targets_min": 1906
},
{
"epoch": 1.3974960876369327,
"grad_norm": 0.5647185520715633,
"learning_rate": 3.8808826886315426e-05,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16115015745162964,
"step": 1340,
"valid_targets_mean": 5568.1,
"valid_targets_min": 3457
},
{
"epoch": 1.4027125717266562,
"grad_norm": 0.5014826960092932,
"learning_rate": 3.8791084075358344e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11483775824308395,
"step": 1345,
"valid_targets_mean": 4442.0,
"valid_targets_min": 2289
},
{
"epoch": 1.4079290558163797,
"grad_norm": 0.5704838065984214,
"learning_rate": 3.8773214214692564e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11861691623926163,
"step": 1350,
"valid_targets_mean": 4343.2,
"valid_targets_min": 1774
},
{
"epoch": 1.4131455399061033,
"grad_norm": 0.761018845309024,
"learning_rate": 3.8755217425139264e-05,
"loss": 0.2523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13714927434921265,
"step": 1355,
"valid_targets_mean": 5168.2,
"valid_targets_min": 3425
},
{
"epoch": 1.4183620239958268,
"grad_norm": 1.0936619935803085,
"learning_rate": 3.8737093828377785e-05,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14459095895290375,
"step": 1360,
"valid_targets_mean": 6778.4,
"valid_targets_min": 3605
},
{
"epoch": 1.4235785080855503,
"grad_norm": 0.7122909792884763,
"learning_rate": 3.8718843546944844e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13594117760658264,
"step": 1365,
"valid_targets_mean": 3794.0,
"valid_targets_min": 2609
},
{
"epoch": 1.4287949921752738,
"grad_norm": 0.6457112430833799,
"learning_rate": 3.870046670423369e-05,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17264269292354584,
"step": 1370,
"valid_targets_mean": 5524.8,
"valid_targets_min": 2106
},
{
"epoch": 1.4340114762649974,
"grad_norm": 0.5822348000748305,
"learning_rate": 3.868196342449327e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16046279668807983,
"step": 1375,
"valid_targets_mean": 5263.5,
"valid_targets_min": 2182
},
{
"epoch": 1.439227960354721,
"grad_norm": 0.5455896041089222,
"learning_rate": 3.8663333832827415e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12363915145397186,
"step": 1380,
"valid_targets_mean": 4780.6,
"valid_targets_min": 1889
},
{
"epoch": 1.4444444444444444,
"grad_norm": 0.5204598568724569,
"learning_rate": 3.864457805519395e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11119193583726883,
"step": 1385,
"valid_targets_mean": 4275.2,
"valid_targets_min": 1765
},
{
"epoch": 1.449660928534168,
"grad_norm": 0.5157545561785613,
"learning_rate": 3.862569621840385e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10522519052028656,
"step": 1390,
"valid_targets_mean": 4213.8,
"valid_targets_min": 1582
},
{
"epoch": 1.4548774126238915,
"grad_norm": 0.6264579348760222,
"learning_rate": 3.860668845012044e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15325672924518585,
"step": 1395,
"valid_targets_mean": 3898.5,
"valid_targets_min": 537
},
{
"epoch": 1.460093896713615,
"grad_norm": 0.5585909276055782,
"learning_rate": 3.8587554878858466e-05,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11405700445175171,
"step": 1400,
"valid_targets_mean": 3959.1,
"valid_targets_min": 2054
},
{
"epoch": 1.4653103808033385,
"grad_norm": 0.49813932042181147,
"learning_rate": 3.8568295633983244e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09434691071510315,
"step": 1405,
"valid_targets_mean": 3593.0,
"valid_targets_min": 1552
},
{
"epoch": 1.470526864893062,
"grad_norm": 0.6041663662890155,
"learning_rate": 3.85489108457098e-05,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1227974146604538,
"step": 1410,
"valid_targets_mean": 5324.5,
"valid_targets_min": 3171
},
{
"epoch": 1.4757433489827856,
"grad_norm": 0.5406878285872566,
"learning_rate": 3.8529400645101984e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16151192784309387,
"step": 1415,
"valid_targets_mean": 6263.1,
"valid_targets_min": 2764
},
{
"epoch": 1.4809598330725091,
"grad_norm": 0.5238933209978773,
"learning_rate": 3.850976516407157e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12694543600082397,
"step": 1420,
"valid_targets_mean": 4904.8,
"valid_targets_min": 3051
},
{
"epoch": 1.4861763171622326,
"grad_norm": 0.49515325116736575,
"learning_rate": 3.8490004535377356e-05,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13720092177391052,
"step": 1425,
"valid_targets_mean": 4950.0,
"valid_targets_min": 1835
},
{
"epoch": 1.4913928012519562,
"grad_norm": 0.5409120061465099,
"learning_rate": 3.8470118892624345e-05,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12328615039587021,
"step": 1430,
"valid_targets_mean": 4782.9,
"valid_targets_min": 1710
},
{
"epoch": 1.4966092853416797,
"grad_norm": 0.5345646077783061,
"learning_rate": 3.8450108370262714e-05,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18213754892349243,
"step": 1435,
"valid_targets_mean": 5736.0,
"valid_targets_min": 2259
},
{
"epoch": 1.5018257694314032,
"grad_norm": 0.5103518853898554,
"learning_rate": 3.8429973103587016e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1235252320766449,
"step": 1440,
"valid_targets_mean": 4339.1,
"valid_targets_min": 1166
},
{
"epoch": 1.5070422535211268,
"grad_norm": 0.4747786716627152,
"learning_rate": 3.840971322873519e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10930084437131882,
"step": 1445,
"valid_targets_mean": 5637.6,
"valid_targets_min": 2409
},
{
"epoch": 1.5122587376108503,
"grad_norm": 0.5150860304783956,
"learning_rate": 3.838932888268771e-05,
"loss": 0.2523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14165997505187988,
"step": 1450,
"valid_targets_mean": 5255.9,
"valid_targets_min": 1939
},
{
"epoch": 1.5174752217005738,
"grad_norm": 0.5198511487212314,
"learning_rate": 3.836882020326658e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14433275163173676,
"step": 1455,
"valid_targets_mean": 5713.9,
"valid_targets_min": 2514
},
{
"epoch": 1.5226917057902973,
"grad_norm": 0.671332298083507,
"learning_rate": 3.834818732913448e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14078345894813538,
"step": 1460,
"valid_targets_mean": 3379.2,
"valid_targets_min": 2012
},
{
"epoch": 1.5279081898800209,
"grad_norm": 0.49013989594302837,
"learning_rate": 3.8327430399793754e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11260563135147095,
"step": 1465,
"valid_targets_mean": 5242.4,
"valid_targets_min": 2071
},
{
"epoch": 1.5331246739697444,
"grad_norm": 0.5364799216625429,
"learning_rate": 3.8306549555585536e-05,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09743601083755493,
"step": 1470,
"valid_targets_mean": 2970.5,
"valid_targets_min": 627
},
{
"epoch": 1.538341158059468,
"grad_norm": 0.5204043919051834,
"learning_rate": 3.828554493768876e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11134983599185944,
"step": 1475,
"valid_targets_mean": 4600.8,
"valid_targets_min": 1666
},
{
"epoch": 1.5435576421491914,
"grad_norm": 0.533126954524228,
"learning_rate": 3.826441668811921e-05,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12382099032402039,
"step": 1480,
"valid_targets_mean": 4916.2,
"valid_targets_min": 2308
},
{
"epoch": 1.548774126238915,
"grad_norm": 0.629159424717442,
"learning_rate": 3.8243164949728565e-05,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1136583536863327,
"step": 1485,
"valid_targets_mean": 4257.9,
"valid_targets_min": 1824
},
{
"epoch": 1.5539906103286385,
"grad_norm": 0.5576499245867822,
"learning_rate": 3.8221789866203434e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16036765277385712,
"step": 1490,
"valid_targets_mean": 5219.4,
"valid_targets_min": 2558
},
{
"epoch": 1.559207094418362,
"grad_norm": 0.5011305426689374,
"learning_rate": 3.820029158206438e-05,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10513623058795929,
"step": 1495,
"valid_targets_mean": 5296.9,
"valid_targets_min": 1128
},
{
"epoch": 1.5644235785080856,
"grad_norm": 0.5810044246720123,
"learning_rate": 3.817867024266497e-05,
"loss": 0.2613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13431760668754578,
"step": 1500,
"valid_targets_mean": 4602.8,
"valid_targets_min": 1710
},
{
"epoch": 1.569640062597809,
"grad_norm": 0.4619545433317578,
"learning_rate": 3.8156925994190735e-05,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09452519565820694,
"step": 1505,
"valid_targets_mean": 5179.8,
"valid_targets_min": 2189
},
{
"epoch": 1.5748565466875326,
"grad_norm": 0.5751374560743624,
"learning_rate": 3.813505898365822e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09860014170408249,
"step": 1510,
"valid_targets_mean": 3707.4,
"valid_targets_min": 1501
},
{
"epoch": 1.5800730307772561,
"grad_norm": 0.5174007955451221,
"learning_rate": 3.8113069358914024e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11332970857620239,
"step": 1515,
"valid_targets_mean": 5254.5,
"valid_targets_min": 1860
},
{
"epoch": 1.5852895148669797,
"grad_norm": 0.6377777694857345,
"learning_rate": 3.80909572686337e-05,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12425677478313446,
"step": 1520,
"valid_targets_mean": 5519.5,
"valid_targets_min": 878
},
{
"epoch": 1.5905059989567032,
"grad_norm": 0.531286078112967,
"learning_rate": 3.806872286232086e-05,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10937950015068054,
"step": 1525,
"valid_targets_mean": 5120.5,
"valid_targets_min": 1810
},
{
"epoch": 1.5957224830464267,
"grad_norm": 0.5064919099325197,
"learning_rate": 3.80463662903061e-05,
"loss": 0.2737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10155424475669861,
"step": 1530,
"valid_targets_mean": 5331.2,
"valid_targets_min": 1440
},
{
"epoch": 1.6009389671361502,
"grad_norm": 0.5171512298024863,
"learning_rate": 3.802388770374598e-05,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11525417864322662,
"step": 1535,
"valid_targets_mean": 4886.1,
"valid_targets_min": 2724
},
{
"epoch": 1.6061554512258738,
"grad_norm": 0.5843884031448716,
"learning_rate": 3.8001287254622064e-05,
"loss": 0.2595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11978837847709656,
"step": 1540,
"valid_targets_mean": 3578.6,
"valid_targets_min": 1241
},
{
"epoch": 1.6113719353155973,
"grad_norm": 0.5172038207495926,
"learning_rate": 3.797856509573981e-05,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11195925623178482,
"step": 1545,
"valid_targets_mean": 3779.6,
"valid_targets_min": 208
},
{
"epoch": 1.6165884194053208,
"grad_norm": 0.47122341882486524,
"learning_rate": 3.795572138072759e-05,
"loss": 0.2523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12011150270700455,
"step": 1550,
"valid_targets_mean": 6209.4,
"valid_targets_min": 1410
},
{
"epoch": 1.6218049034950444,
"grad_norm": 0.48927193258845336,
"learning_rate": 3.793275626403564e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1319829821586609,
"step": 1555,
"valid_targets_mean": 5578.1,
"valid_targets_min": 2057
},
{
"epoch": 1.6270213875847679,
"grad_norm": 0.48409051046392965,
"learning_rate": 3.790966990093503e-05,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10502097010612488,
"step": 1560,
"valid_targets_mean": 5231.0,
"valid_targets_min": 3204
},
{
"epoch": 1.6322378716744914,
"grad_norm": 0.5544493076567448,
"learning_rate": 3.788646244751654e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12199460715055466,
"step": 1565,
"valid_targets_mean": 4882.4,
"valid_targets_min": 3027
},
{
"epoch": 1.637454355764215,
"grad_norm": 0.5645954649757362,
"learning_rate": 3.7863134060689734e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11990859359502792,
"step": 1570,
"valid_targets_mean": 3640.4,
"valid_targets_min": 1349
},
{
"epoch": 1.6426708398539385,
"grad_norm": 0.45622175926885516,
"learning_rate": 3.783968489818179e-05,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09329172968864441,
"step": 1575,
"valid_targets_mean": 5609.4,
"valid_targets_min": 967
},
{
"epoch": 1.647887323943662,
"grad_norm": 0.5746045595380861,
"learning_rate": 3.781611511853646e-05,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15213215351104736,
"step": 1580,
"valid_targets_mean": 4927.5,
"valid_targets_min": 2514
},
{
"epoch": 1.6531038080333855,
"grad_norm": 0.4756606852258843,
"learning_rate": 3.779242488111304e-05,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09551073610782623,
"step": 1585,
"valid_targets_mean": 4230.0,
"valid_targets_min": 1646
},
{
"epoch": 1.658320292123109,
"grad_norm": 0.50567057762336,
"learning_rate": 3.776861434608524e-05,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12129361927509308,
"step": 1590,
"valid_targets_mean": 4804.4,
"valid_targets_min": 2404
},
{
"epoch": 1.6635367762128326,
"grad_norm": 0.5017088642180424,
"learning_rate": 3.774468367444012e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12084630131721497,
"step": 1595,
"valid_targets_mean": 4832.0,
"valid_targets_min": 2261
},
{
"epoch": 1.668753260302556,
"grad_norm": 0.5067963445162644,
"learning_rate": 3.7720633027977034e-05,
"loss": 0.2537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10921032726764679,
"step": 1600,
"valid_targets_mean": 4878.5,
"valid_targets_min": 1522
},
{
"epoch": 1.6739697443922796,
"grad_norm": 0.5670844609525346,
"learning_rate": 3.7696462569306467e-05,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11840958148241043,
"step": 1605,
"valid_targets_mean": 3607.9,
"valid_targets_min": 2357
},
{
"epoch": 1.6791862284820032,
"grad_norm": 0.47359585402114174,
"learning_rate": 3.7672172461849e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10673607885837555,
"step": 1610,
"valid_targets_mean": 5604.9,
"valid_targets_min": 1862
},
{
"epoch": 1.6844027125717267,
"grad_norm": 0.48428867641956413,
"learning_rate": 3.7647762869834164e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12657439708709717,
"step": 1615,
"valid_targets_mean": 4580.1,
"valid_targets_min": 1450
},
{
"epoch": 1.6896191966614502,
"grad_norm": 0.5013336800445145,
"learning_rate": 3.7623233958299364e-05,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08720278739929199,
"step": 1620,
"valid_targets_mean": 3723.0,
"valid_targets_min": 1383
},
{
"epoch": 1.6948356807511737,
"grad_norm": 0.5933134524932153,
"learning_rate": 3.7598585893088726e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14190977811813354,
"step": 1625,
"valid_targets_mean": 4540.6,
"valid_targets_min": 1762
},
{
"epoch": 1.7000521648408973,
"grad_norm": 1.2127607017517221,
"learning_rate": 3.7573818840852004e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1074744164943695,
"step": 1630,
"valid_targets_mean": 4648.8,
"valid_targets_min": 2365
},
{
"epoch": 1.7052686489306208,
"grad_norm": 0.4752655984423174,
"learning_rate": 3.754893296904344e-05,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0906633660197258,
"step": 1635,
"valid_targets_mean": 4332.1,
"valid_targets_min": 1967
},
{
"epoch": 1.7104851330203443,
"grad_norm": 0.48332414158338666,
"learning_rate": 3.752392844592064e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12134155631065369,
"step": 1640,
"valid_targets_mean": 4402.6,
"valid_targets_min": 1857
},
{
"epoch": 1.7157016171100679,
"grad_norm": 0.5528011425591683,
"learning_rate": 3.7498805440543436e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13630694150924683,
"step": 1645,
"valid_targets_mean": 4838.1,
"valid_targets_min": 2858
},
{
"epoch": 1.7209181011997914,
"grad_norm": 0.539257716336949,
"learning_rate": 3.747356412277272e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12012304365634918,
"step": 1650,
"valid_targets_mean": 5222.1,
"valid_targets_min": 1210
},
{
"epoch": 1.726134585289515,
"grad_norm": 0.4985928915472987,
"learning_rate": 3.744820466326933e-05,
"loss": 0.2495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12551480531692505,
"step": 1655,
"valid_targets_mean": 4609.0,
"valid_targets_min": 1461
},
{
"epoch": 1.7313510693792384,
"grad_norm": 0.48441783157096807,
"learning_rate": 3.7422727233492876e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15556228160858154,
"step": 1660,
"valid_targets_mean": 5658.8,
"valid_targets_min": 1767
},
{
"epoch": 1.736567553468962,
"grad_norm": 0.532508856659577,
"learning_rate": 3.739713200570058e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10466257482767105,
"step": 1665,
"valid_targets_mean": 4985.1,
"valid_targets_min": 1046
},
{
"epoch": 1.7417840375586855,
"grad_norm": 0.5450230060599003,
"learning_rate": 3.737141915294612e-05,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10845594108104706,
"step": 1670,
"valid_targets_mean": 4706.2,
"valid_targets_min": 1168
},
{
"epoch": 1.747000521648409,
"grad_norm": 0.591198881980741,
"learning_rate": 3.734558884907847e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1261470913887024,
"step": 1675,
"valid_targets_mean": 4374.8,
"valid_targets_min": 1659
},
{
"epoch": 1.7522170057381325,
"grad_norm": 0.4954991221034555,
"learning_rate": 3.7319641268740684e-05,
"loss": 0.2348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12304702401161194,
"step": 1680,
"valid_targets_mean": 5559.2,
"valid_targets_min": 3116
},
{
"epoch": 1.757433489827856,
"grad_norm": 0.4523983100902319,
"learning_rate": 3.729357658736877e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10654617100954056,
"step": 1685,
"valid_targets_mean": 5304.4,
"valid_targets_min": 2748
},
{
"epoch": 1.7626499739175796,
"grad_norm": 0.4781303041020441,
"learning_rate": 3.7267394981190456e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13260826468467712,
"step": 1690,
"valid_targets_mean": 5369.8,
"valid_targets_min": 2116
},
{
"epoch": 1.7678664580073031,
"grad_norm": 0.4665938814513094,
"learning_rate": 3.724109662722402e-05,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11321903765201569,
"step": 1695,
"valid_targets_mean": 5622.1,
"valid_targets_min": 3314
},
{
"epoch": 1.7730829420970267,
"grad_norm": 0.563972673121229,
"learning_rate": 3.72146817032771e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12348375469446182,
"step": 1700,
"valid_targets_mean": 4625.1,
"valid_targets_min": 916
},
{
"epoch": 1.77829942618675,
"grad_norm": 0.49684534538885133,
"learning_rate": 3.718815038794549e-05,
"loss": 0.2689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11572001874446869,
"step": 1705,
"valid_targets_mean": 4280.5,
"valid_targets_min": 617
},
{
"epoch": 1.7835159102764737,
"grad_norm": 0.539515924089831,
"learning_rate": 3.71615028606119e-05,
"loss": 0.2393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1124250739812851,
"step": 1710,
"valid_targets_mean": 4333.1,
"valid_targets_min": 1636
},
{
"epoch": 1.788732394366197,
"grad_norm": 0.5258087357470302,
"learning_rate": 3.713473930144479e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1382165402173996,
"step": 1715,
"valid_targets_mean": 4965.2,
"valid_targets_min": 1416
},
{
"epoch": 1.7939488784559208,
"grad_norm": 0.5235070365330642,
"learning_rate": 3.710785989139713e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12338519096374512,
"step": 1720,
"valid_targets_mean": 4041.2,
"valid_targets_min": 1908
},
{
"epoch": 1.799165362545644,
"grad_norm": 0.5419756293085212,
"learning_rate": 3.7080864812205176e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12302734702825546,
"step": 1725,
"valid_targets_mean": 4363.4,
"valid_targets_min": 719
},
{
"epoch": 1.8043818466353678,
"grad_norm": 0.4802544830790868,
"learning_rate": 3.705375424638723e-05,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.124026820063591,
"step": 1730,
"valid_targets_mean": 4707.2,
"valid_targets_min": 2589
},
{
"epoch": 1.8095983307250911,
"grad_norm": 0.48677623141738435,
"learning_rate": 3.702652837724244e-05,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13875910639762878,
"step": 1735,
"valid_targets_mean": 5555.6,
"valid_targets_min": 3939
},
{
"epoch": 1.8148148148148149,
"grad_norm": 0.9516607300521612,
"learning_rate": 3.6999187388849517e-05,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442538946866989,
"step": 1740,
"valid_targets_mean": 4964.8,
"valid_targets_min": 977
},
{
"epoch": 1.8200312989045382,
"grad_norm": 0.5283790292684337,
"learning_rate": 3.697173146606553e-05,
"loss": 0.2605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10957943648099899,
"step": 1745,
"valid_targets_mean": 3189.6,
"valid_targets_min": 628
},
{
"epoch": 1.825247782994262,
"grad_norm": 0.5387767109946204,
"learning_rate": 3.694416079452463e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11930787563323975,
"step": 1750,
"valid_targets_mean": 4071.8,
"valid_targets_min": 578
},
{
"epoch": 1.8304642670839852,
"grad_norm": 0.5581490472860003,
"learning_rate": 3.6916475560636806e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12916062772274017,
"step": 1755,
"valid_targets_mean": 4486.4,
"valid_targets_min": 1629
},
{
"epoch": 1.835680751173709,
"grad_norm": 0.5536821065094885,
"learning_rate": 3.688867595158663e-05,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14876341819763184,
"step": 1760,
"valid_targets_mean": 4862.4,
"valid_targets_min": 1730
},
{
"epoch": 1.8408972352634323,
"grad_norm": 0.5843970090001455,
"learning_rate": 3.686076215533198e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16234152019023895,
"step": 1765,
"valid_targets_mean": 5925.6,
"valid_targets_min": 3125
},
{
"epoch": 1.846113719353156,
"grad_norm": 0.6527702228685233,
"learning_rate": 3.683273436060275e-05,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1514151692390442,
"step": 1770,
"valid_targets_mean": 3472.9,
"valid_targets_min": 997
},
{
"epoch": 1.8513302034428794,
"grad_norm": 0.46388789877785,
"learning_rate": 3.680459275689964e-05,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.136823832988739,
"step": 1775,
"valid_targets_mean": 5753.6,
"valid_targets_min": 1458
},
{
"epoch": 1.856546687532603,
"grad_norm": 0.5332179778953855,
"learning_rate": 3.677633753449278e-05,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11068500578403473,
"step": 1780,
"valid_targets_mean": 5434.1,
"valid_targets_min": 3823
},
{
"epoch": 1.8617631716223264,
"grad_norm": 1.1242798095109956,
"learning_rate": 3.674796888442056e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11812400817871094,
"step": 1785,
"valid_targets_mean": 4917.5,
"valid_targets_min": 2439
},
{
"epoch": 1.8669796557120502,
"grad_norm": 0.5522589864356385,
"learning_rate": 3.671948699848822e-05,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11022226512432098,
"step": 1790,
"valid_targets_mean": 3553.0,
"valid_targets_min": 2518
},
{
"epoch": 1.8721961398017735,
"grad_norm": 0.5586953345582154,
"learning_rate": 3.6690892069266624e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12100788950920105,
"step": 1795,
"valid_targets_mean": 4217.9,
"valid_targets_min": 2319
},
{
"epoch": 1.8774126238914972,
"grad_norm": 0.6245335282858276,
"learning_rate": 3.666218429009094e-05,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11601720750331879,
"step": 1800,
"valid_targets_mean": 4822.2,
"valid_targets_min": 1259
},
{
"epoch": 1.8826291079812205,
"grad_norm": 0.4361533309646699,
"learning_rate": 3.6633363855059336e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11116553843021393,
"step": 1805,
"valid_targets_mean": 6440.9,
"valid_targets_min": 2174
},
{
"epoch": 1.8878455920709443,
"grad_norm": 0.49914721297729236,
"learning_rate": 3.6604430959031676e-05,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15305811166763306,
"step": 1810,
"valid_targets_mean": 4380.8,
"valid_targets_min": 1366
},
{
"epoch": 1.8930620761606676,
"grad_norm": 0.5437652077862022,
"learning_rate": 3.6575385797628166e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13775449991226196,
"step": 1815,
"valid_targets_mean": 5084.4,
"valid_targets_min": 2826
},
{
"epoch": 1.8982785602503913,
"grad_norm": 0.5165100386805054,
"learning_rate": 3.654622856722808e-05,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13797417283058167,
"step": 1820,
"valid_targets_mean": 4657.2,
"valid_targets_min": 1428
},
{
"epoch": 1.9034950443401146,
"grad_norm": 0.8637494671339646,
"learning_rate": 3.651695946496839e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09824159741401672,
"step": 1825,
"valid_targets_mean": 5041.9,
"valid_targets_min": 3198
},
{
"epoch": 1.9087115284298384,
"grad_norm": 0.45619472777373626,
"learning_rate": 3.6487578688742485e-05,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09745252877473831,
"step": 1830,
"valid_targets_mean": 4831.0,
"valid_targets_min": 648
},
{
"epoch": 1.9139280125195617,
"grad_norm": 0.46659452122338013,
"learning_rate": 3.6458086437198764e-05,
"loss": 0.2343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11686418205499649,
"step": 1835,
"valid_targets_mean": 5696.5,
"valid_targets_min": 1816
},
{
"epoch": 1.9191444966092854,
"grad_norm": 0.5734880079061442,
"learning_rate": 3.642848290973934e-05,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1568131148815155,
"step": 1840,
"valid_targets_mean": 4659.0,
"valid_targets_min": 1469
},
{
"epoch": 1.9243609806990087,
"grad_norm": 0.4718312237043105,
"learning_rate": 3.6398768306518706e-05,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10714077949523926,
"step": 1845,
"valid_targets_mean": 5023.5,
"valid_targets_min": 2130
},
{
"epoch": 1.9295774647887325,
"grad_norm": 0.5573780363946851,
"learning_rate": 3.636894282844233e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1489737182855606,
"step": 1850,
"valid_targets_mean": 3690.5,
"valid_targets_min": 3023
},
{
"epoch": 1.9347939488784558,
"grad_norm": 0.4695102238444236,
"learning_rate": 3.6339006677165316e-05,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11228922009468079,
"step": 1855,
"valid_targets_mean": 5067.9,
"valid_targets_min": 1794
},
{
"epoch": 1.9400104329681795,
"grad_norm": 0.509184552401322,
"learning_rate": 3.630896005509108e-05,
"loss": 0.2429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12257759273052216,
"step": 1860,
"valid_targets_mean": 5672.6,
"valid_targets_min": 3567
},
{
"epoch": 1.9452269170579028,
"grad_norm": 0.5624899738669874,
"learning_rate": 3.6278803165369926e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10627146065235138,
"step": 1865,
"valid_targets_mean": 3758.6,
"valid_targets_min": 1298
},
{
"epoch": 1.9504434011476266,
"grad_norm": 0.5845320960330752,
"learning_rate": 3.6248536211897715e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1219656765460968,
"step": 1870,
"valid_targets_mean": 4353.5,
"valid_targets_min": 1778
},
{
"epoch": 1.95565988523735,
"grad_norm": 0.5898029464379284,
"learning_rate": 3.621815939931444e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11879602074623108,
"step": 1875,
"valid_targets_mean": 3925.4,
"valid_targets_min": 1267
},
{
"epoch": 1.9608763693270737,
"grad_norm": 0.47207322347001124,
"learning_rate": 3.6187672933002904e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12292701750993729,
"step": 1880,
"valid_targets_mean": 5703.8,
"valid_targets_min": 3091
},
{
"epoch": 1.966092853416797,
"grad_norm": 0.49751207176942625,
"learning_rate": 3.6157077019087254e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12327823042869568,
"step": 1885,
"valid_targets_mean": 4978.5,
"valid_targets_min": 1778
},
{
"epoch": 1.9713093375065207,
"grad_norm": 0.5215491471402459,
"learning_rate": 3.612637186443169e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13275089859962463,
"step": 1890,
"valid_targets_mean": 4872.0,
"valid_targets_min": 869
},
{
"epoch": 1.976525821596244,
"grad_norm": 0.5480006277598584,
"learning_rate": 3.609555767663895e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11053438484668732,
"step": 1895,
"valid_targets_mean": 6055.5,
"valid_targets_min": 2435
},
{
"epoch": 1.9817423056859678,
"grad_norm": 0.9008272684690406,
"learning_rate": 3.6064634664048996e-05,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14233778417110443,
"step": 1900,
"valid_targets_mean": 3512.8,
"valid_targets_min": 1351
},
{
"epoch": 1.986958789775691,
"grad_norm": 0.6617795177051474,
"learning_rate": 3.603360303573757e-05,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1280476152896881,
"step": 1905,
"valid_targets_mean": 4181.1,
"valid_targets_min": 1982
},
{
"epoch": 1.9921752738654148,
"grad_norm": 0.5497708615752375,
"learning_rate": 3.600246300151476e-05,
"loss": 0.2405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11217804253101349,
"step": 1910,
"valid_targets_mean": 4834.0,
"valid_targets_min": 1885
},
{
"epoch": 1.9973917579551381,
"grad_norm": 0.5549717938139402,
"learning_rate": 3.597121477192364e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14330707490444183,
"step": 1915,
"valid_targets_mean": 5543.5,
"valid_targets_min": 1502
},
{
"epoch": 2.0020865936358896,
"grad_norm": 0.5269936041252705,
"learning_rate": 3.593985855823878e-05,
"loss": 0.2472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10810284316539764,
"step": 1920,
"valid_targets_mean": 5318.8,
"valid_targets_min": 4030
},
{
"epoch": 2.007303077725613,
"grad_norm": 0.5974233968850137,
"learning_rate": 3.590839457246487e-05,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1327662169933319,
"step": 1925,
"valid_targets_mean": 4653.5,
"valid_targets_min": 1209
},
{
"epoch": 2.0125195618153366,
"grad_norm": 0.569055358921142,
"learning_rate": 3.587682302733527e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15174917876720428,
"step": 1930,
"valid_targets_mean": 5089.8,
"valid_targets_min": 2551
},
{
"epoch": 2.01773604590506,
"grad_norm": 0.6071785094734595,
"learning_rate": 3.584514413631054e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1039377972483635,
"step": 1935,
"valid_targets_mean": 4698.2,
"valid_targets_min": 3511
},
{
"epoch": 2.0229525299947837,
"grad_norm": 0.7649753469176215,
"learning_rate": 3.581335811357703e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1236136332154274,
"step": 1940,
"valid_targets_mean": 5705.1,
"valid_targets_min": 2985
},
{
"epoch": 2.028169014084507,
"grad_norm": 0.55394336882652,
"learning_rate": 3.578146517404546e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11663387715816498,
"step": 1945,
"valid_targets_mean": 4723.4,
"valid_targets_min": 1671
},
{
"epoch": 2.0333854981742308,
"grad_norm": 0.5082030698850123,
"learning_rate": 3.574946553334938e-05,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10076865553855896,
"step": 1950,
"valid_targets_mean": 4673.2,
"valid_targets_min": 2717
},
{
"epoch": 2.038601982263954,
"grad_norm": 0.5567379435319525,
"learning_rate": 3.571735940784381e-05,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1046312004327774,
"step": 1955,
"valid_targets_mean": 4137.0,
"valid_targets_min": 1847
},
{
"epoch": 2.043818466353678,
"grad_norm": 0.48985358034713516,
"learning_rate": 3.5685147014603705e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08953490853309631,
"step": 1960,
"valid_targets_mean": 5168.4,
"valid_targets_min": 3013
},
{
"epoch": 2.049034950443401,
"grad_norm": 0.571831332261129,
"learning_rate": 3.5652828571422536e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10120147466659546,
"step": 1965,
"valid_targets_mean": 4631.1,
"valid_targets_min": 1478
},
{
"epoch": 2.054251434533125,
"grad_norm": 0.7529034629375903,
"learning_rate": 3.5620404296810766e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09623203426599503,
"step": 1970,
"valid_targets_mean": 4019.8,
"valid_targets_min": 1673
},
{
"epoch": 2.059467918622848,
"grad_norm": 0.5687919001896762,
"learning_rate": 3.558787440999442e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11071816086769104,
"step": 1975,
"valid_targets_mean": 5494.5,
"valid_targets_min": 2436
},
{
"epoch": 2.064684402712572,
"grad_norm": 0.5368577826880351,
"learning_rate": 3.55552391309136e-05,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1275230348110199,
"step": 1980,
"valid_targets_mean": 6043.0,
"valid_targets_min": 2155
},
{
"epoch": 2.0699008868022952,
"grad_norm": 0.5409911221432354,
"learning_rate": 3.5522498680220954e-05,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11893551796674728,
"step": 1985,
"valid_targets_mean": 5916.8,
"valid_targets_min": 2004
},
{
"epoch": 2.075117370892019,
"grad_norm": 0.50408544253174,
"learning_rate": 3.5489653279280225e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09793812036514282,
"step": 1990,
"valid_targets_mean": 5182.1,
"valid_targets_min": 2615
},
{
"epoch": 2.0803338549817423,
"grad_norm": 0.6171549014287283,
"learning_rate": 3.545670315016475e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13135838508605957,
"step": 1995,
"valid_targets_mean": 4706.6,
"valid_targets_min": 1718
},
{
"epoch": 2.085550339071466,
"grad_norm": 0.46573730964278404,
"learning_rate": 3.5423648515655934e-05,
"loss": 0.211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09348612278699875,
"step": 2000,
"valid_targets_mean": 5483.9,
"valid_targets_min": 3057
},
{
"epoch": 2.0907668231611893,
"grad_norm": 0.5522490520394556,
"learning_rate": 3.539048959924178e-05,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1360378861427307,
"step": 2005,
"valid_targets_mean": 4643.5,
"valid_targets_min": 1534
},
{
"epoch": 2.095983307250913,
"grad_norm": 0.5474360037399448,
"learning_rate": 3.535722662511535e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12546919286251068,
"step": 2010,
"valid_targets_mean": 4983.0,
"valid_targets_min": 1833
},
{
"epoch": 2.1011997913406364,
"grad_norm": 0.524017047747236,
"learning_rate": 3.532385981817326e-05,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09845712780952454,
"step": 2015,
"valid_targets_mean": 4596.1,
"valid_targets_min": 1390
},
{
"epoch": 2.10641627543036,
"grad_norm": 0.493032897409189,
"learning_rate": 3.5290389404014136e-05,
"loss": 0.2406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09936146438121796,
"step": 2020,
"valid_targets_mean": 5361.8,
"valid_targets_min": 2427
},
{
"epoch": 2.1116327595200834,
"grad_norm": 0.48009492015893784,
"learning_rate": 3.5256815608937155e-05,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08758233487606049,
"step": 2025,
"valid_targets_mean": 4458.4,
"valid_targets_min": 1363
},
{
"epoch": 2.116849243609807,
"grad_norm": 0.5338485179025612,
"learning_rate": 3.522313865994043e-05,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09387579560279846,
"step": 2030,
"valid_targets_mean": 4182.8,
"valid_targets_min": 671
},
{
"epoch": 2.1220657276995305,
"grad_norm": 0.7751541416535409,
"learning_rate": 3.518935878471952e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12653851509094238,
"step": 2035,
"valid_targets_mean": 3748.4,
"valid_targets_min": 1312
},
{
"epoch": 2.127282211789254,
"grad_norm": 0.5172812414306709,
"learning_rate": 3.515547621166591e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11102648824453354,
"step": 2040,
"valid_targets_mean": 5220.8,
"valid_targets_min": 2812
},
{
"epoch": 2.1324986958789776,
"grad_norm": 0.5421914141921881,
"learning_rate": 3.5121491169865425e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11301957070827484,
"step": 2045,
"valid_targets_mean": 5223.4,
"valid_targets_min": 2652
},
{
"epoch": 2.1377151799687013,
"grad_norm": 0.5487760380319388,
"learning_rate": 3.508740388909669e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0976884514093399,
"step": 2050,
"valid_targets_mean": 4488.4,
"valid_targets_min": 1460
},
{
"epoch": 2.1429316640584246,
"grad_norm": 0.5405842722582158,
"learning_rate": 3.505321459982961e-05,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12626048922538757,
"step": 2055,
"valid_targets_mean": 5094.5,
"valid_targets_min": 2013
},
{
"epoch": 2.148148148148148,
"grad_norm": 0.5246815278254859,
"learning_rate": 3.501892353322376e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09376654028892517,
"step": 2060,
"valid_targets_mean": 4093.5,
"valid_targets_min": 1208
},
{
"epoch": 2.1533646322378717,
"grad_norm": 0.4251847589281074,
"learning_rate": 3.498453092112687e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08616240322589874,
"step": 2065,
"valid_targets_mean": 4603.5,
"valid_targets_min": 2121
},
{
"epoch": 2.1585811163275954,
"grad_norm": 0.47383850020780094,
"learning_rate": 3.495003699607322e-05,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1174222081899643,
"step": 2070,
"valid_targets_mean": 6127.4,
"valid_targets_min": 2805
},
{
"epoch": 2.1637976004173187,
"grad_norm": 0.47843260960694084,
"learning_rate": 3.49154419912821e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10661450028419495,
"step": 2075,
"valid_targets_mean": 4927.1,
"valid_targets_min": 1689
},
{
"epoch": 2.169014084507042,
"grad_norm": 0.4899763108410606,
"learning_rate": 3.48807461406562e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10473626852035522,
"step": 2080,
"valid_targets_mean": 5954.0,
"valid_targets_min": 1628
},
{
"epoch": 2.174230568596766,
"grad_norm": 0.5388649564403426,
"learning_rate": 3.484594967878007e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11704675853252411,
"step": 2085,
"valid_targets_mean": 5408.0,
"valid_targets_min": 3345
},
{
"epoch": 2.1794470526864895,
"grad_norm": 0.5038235678306854,
"learning_rate": 3.481105284091847e-05,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12047860026359558,
"step": 2090,
"valid_targets_mean": 4923.1,
"valid_targets_min": 2056
},
{
"epoch": 2.184663536776213,
"grad_norm": 0.5218145944948759,
"learning_rate": 3.4776055863014864e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10921941697597504,
"step": 2095,
"valid_targets_mean": 4686.8,
"valid_targets_min": 1503
},
{
"epoch": 2.189880020865936,
"grad_norm": 0.5464581574239525,
"learning_rate": 3.474095898168975e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.132952481508255,
"step": 2100,
"valid_targets_mean": 4852.8,
"valid_targets_min": 2843
},
{
"epoch": 2.19509650495566,
"grad_norm": 0.4939978105645992,
"learning_rate": 3.470576243423911e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08919451385736465,
"step": 2105,
"valid_targets_mean": 4851.6,
"valid_targets_min": 1716
},
{
"epoch": 2.2003129890453836,
"grad_norm": 0.5339982334715729,
"learning_rate": 3.467046645863276e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12849083542823792,
"step": 2110,
"valid_targets_mean": 5342.1,
"valid_targets_min": 2569
},
{
"epoch": 2.205529473135107,
"grad_norm": 0.50197354954302,
"learning_rate": 3.463507129351279e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11599946022033691,
"step": 2115,
"valid_targets_mean": 4914.8,
"valid_targets_min": 1776
},
{
"epoch": 2.2107459572248302,
"grad_norm": 0.5788077914862068,
"learning_rate": 3.459957717819191e-05,
"loss": 0.2334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12925925850868225,
"step": 2120,
"valid_targets_mean": 3880.0,
"valid_targets_min": 1375
},
{
"epoch": 2.215962441314554,
"grad_norm": 0.46285027634666653,
"learning_rate": 3.4563984352651874e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07943163812160492,
"step": 2125,
"valid_targets_mean": 4488.4,
"valid_targets_min": 1208
},
{
"epoch": 2.2211789254042777,
"grad_norm": 0.642471074334573,
"learning_rate": 3.45282930575418e-05,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09657199680805206,
"step": 2130,
"valid_targets_mean": 3349.5,
"valid_targets_min": 1582
},
{
"epoch": 2.226395409494001,
"grad_norm": 0.570788848317248,
"learning_rate": 3.449250353417661e-05,
"loss": 0.244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13143855333328247,
"step": 2135,
"valid_targets_mean": 4533.5,
"valid_targets_min": 1976
},
{
"epoch": 2.2316118935837244,
"grad_norm": 0.46714669131619335,
"learning_rate": 3.445661602453533e-05,
"loss": 0.2361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1163138896226883,
"step": 2140,
"valid_targets_mean": 6082.4,
"valid_targets_min": 3087
},
{
"epoch": 2.236828377673448,
"grad_norm": 0.5587627949228191,
"learning_rate": 3.44206307712595e-05,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10658030956983566,
"step": 2145,
"valid_targets_mean": 5567.4,
"valid_targets_min": 1752
},
{
"epoch": 2.2420448617631714,
"grad_norm": 0.5303710463405483,
"learning_rate": 3.4384548017651544e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12135177850723267,
"step": 2150,
"valid_targets_mean": 4302.0,
"valid_targets_min": 1581
},
{
"epoch": 2.247261345852895,
"grad_norm": 0.5375666300344333,
"learning_rate": 3.4348368007673065e-05,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10137631744146347,
"step": 2155,
"valid_targets_mean": 4868.8,
"valid_targets_min": 2466
},
{
"epoch": 2.2524778299426185,
"grad_norm": 0.4744381052708486,
"learning_rate": 3.4312090985943266e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12538987398147583,
"step": 2160,
"valid_targets_mean": 6205.9,
"valid_targets_min": 3568
},
{
"epoch": 2.257694314032342,
"grad_norm": 0.5048698772755993,
"learning_rate": 3.4275717197737234e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13870665431022644,
"step": 2165,
"valid_targets_mean": 6170.1,
"valid_targets_min": 4471
},
{
"epoch": 2.262910798122066,
"grad_norm": 0.5539634836266141,
"learning_rate": 3.423924688898433e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11574719846248627,
"step": 2170,
"valid_targets_mean": 3427.8,
"valid_targets_min": 952
},
{
"epoch": 2.2681272822117893,
"grad_norm": 0.5553833706907942,
"learning_rate": 3.420268030626651e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15152722597122192,
"step": 2175,
"valid_targets_mean": 5756.5,
"valid_targets_min": 3664
},
{
"epoch": 2.2733437663015126,
"grad_norm": 0.5095935579851769,
"learning_rate": 3.416601769681663e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11749089509248734,
"step": 2180,
"valid_targets_mean": 5107.2,
"valid_targets_min": 2944
},
{
"epoch": 2.2785602503912363,
"grad_norm": 0.5234036773875547,
"learning_rate": 3.412925930851683e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09326408058404922,
"step": 2185,
"valid_targets_mean": 4192.4,
"valid_targets_min": 637
},
{
"epoch": 2.28377673448096,
"grad_norm": 0.4626305179647282,
"learning_rate": 3.40924053898968e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11077827215194702,
"step": 2190,
"valid_targets_mean": 5611.8,
"valid_targets_min": 2071
},
{
"epoch": 2.2889932185706834,
"grad_norm": 0.4695916370734793,
"learning_rate": 3.405545619013214e-05,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09071405231952667,
"step": 2195,
"valid_targets_mean": 4260.8,
"valid_targets_min": 1449
},
{
"epoch": 2.2942097026604067,
"grad_norm": 0.4893098076374061,
"learning_rate": 3.401841195904267e-05,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09764277935028076,
"step": 2200,
"valid_targets_mean": 5340.1,
"valid_targets_min": 1390
},
{
"epoch": 2.2994261867501304,
"grad_norm": 0.4998943508577529,
"learning_rate": 3.398127294709072e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11398491263389587,
"step": 2205,
"valid_targets_mean": 5257.5,
"valid_targets_min": 2999
},
{
"epoch": 2.3046426708398537,
"grad_norm": 0.6434654135986683,
"learning_rate": 3.3944039405379444e-05,
"loss": 0.2385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1256795972585678,
"step": 2210,
"valid_targets_mean": 4567.8,
"valid_targets_min": 1197
},
{
"epoch": 2.3098591549295775,
"grad_norm": 0.4832895047866086,
"learning_rate": 3.390671158565115e-05,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10829693078994751,
"step": 2215,
"valid_targets_mean": 5266.4,
"valid_targets_min": 1833
},
{
"epoch": 2.315075639019301,
"grad_norm": 0.5197732499257903,
"learning_rate": 3.386928974028555e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11667078733444214,
"step": 2220,
"valid_targets_mean": 4708.9,
"valid_targets_min": 2253
},
{
"epoch": 2.3202921231090246,
"grad_norm": 0.7416911718593487,
"learning_rate": 3.3831774122298106e-05,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13515786826610565,
"step": 2225,
"valid_targets_mean": 4782.2,
"valid_targets_min": 2366
},
{
"epoch": 2.325508607198748,
"grad_norm": 0.5510764958479842,
"learning_rate": 3.3794164985338266e-05,
"loss": 0.2213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10666011273860931,
"step": 2230,
"valid_targets_mean": 4350.9,
"valid_targets_min": 1540
},
{
"epoch": 2.3307250912884716,
"grad_norm": 0.5423326354389533,
"learning_rate": 3.37564625836878e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10791268199682236,
"step": 2235,
"valid_targets_mean": 4865.4,
"valid_targets_min": 2019
},
{
"epoch": 2.335941575378195,
"grad_norm": 0.4972937429968323,
"learning_rate": 3.3718667172259026e-05,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08703801780939102,
"step": 2240,
"valid_targets_mean": 2945.8,
"valid_targets_min": 952
},
{
"epoch": 2.3411580594679187,
"grad_norm": 0.5383237315751074,
"learning_rate": 3.368077900659315e-05,
"loss": 0.2285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1342734694480896,
"step": 2245,
"valid_targets_mean": 5155.4,
"valid_targets_min": 2019
},
{
"epoch": 2.346374543557642,
"grad_norm": 0.514318390379442,
"learning_rate": 3.364279834285848e-05,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09559551626443863,
"step": 2250,
"valid_targets_mean": 5152.1,
"valid_targets_min": 976
},
{
"epoch": 2.3515910276473657,
"grad_norm": 0.4910773560407386,
"learning_rate": 3.360472543784875e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10180678218603134,
"step": 2255,
"valid_targets_mean": 4525.9,
"valid_targets_min": 1009
},
{
"epoch": 2.356807511737089,
"grad_norm": 0.5174129329847302,
"learning_rate": 3.356656054898132e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10733669251203537,
"step": 2260,
"valid_targets_mean": 5592.4,
"valid_targets_min": 1074
},
{
"epoch": 2.3620239958268128,
"grad_norm": 0.5954295865676773,
"learning_rate": 3.352830393429547e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09375312924385071,
"step": 2265,
"valid_targets_mean": 3314.8,
"valid_targets_min": 1484
},
{
"epoch": 2.367240479916536,
"grad_norm": 0.5076393805523123,
"learning_rate": 3.3489955852450675e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10176807641983032,
"step": 2270,
"valid_targets_mean": 5248.9,
"valid_targets_min": 1404
},
{
"epoch": 2.37245696400626,
"grad_norm": 0.5436901139551851,
"learning_rate": 3.3451516562724834e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11518465727567673,
"step": 2275,
"valid_targets_mean": 4245.1,
"valid_targets_min": 1524
},
{
"epoch": 2.377673448095983,
"grad_norm": 0.6268421209222852,
"learning_rate": 3.341298632501249e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09579107910394669,
"step": 2280,
"valid_targets_mean": 3428.9,
"valid_targets_min": 1678
},
{
"epoch": 2.382889932185707,
"grad_norm": 0.5315792277064773,
"learning_rate": 3.3374365399823134e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11502724140882492,
"step": 2285,
"valid_targets_mean": 6031.4,
"valid_targets_min": 2479
},
{
"epoch": 2.38810641627543,
"grad_norm": 0.49735017544368204,
"learning_rate": 3.3335654048279395e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09845283627510071,
"step": 2290,
"valid_targets_mean": 4845.5,
"valid_targets_min": 2411
},
{
"epoch": 2.393322900365154,
"grad_norm": 0.5469215023981283,
"learning_rate": 3.329685253211528e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11125972121953964,
"step": 2295,
"valid_targets_mean": 4891.2,
"valid_targets_min": 1818
},
{
"epoch": 2.3985393844548772,
"grad_norm": 0.5596864924707663,
"learning_rate": 3.325796111367444e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09879964590072632,
"step": 2300,
"valid_targets_mean": 4206.2,
"valid_targets_min": 1500
},
{
"epoch": 2.403755868544601,
"grad_norm": 0.653380795920544,
"learning_rate": 3.321898005590835e-05,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12416934967041016,
"step": 2305,
"valid_targets_mean": 6310.6,
"valid_targets_min": 1974
},
{
"epoch": 2.4089723526343243,
"grad_norm": 0.5247996620010477,
"learning_rate": 3.317990962237454e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10957548022270203,
"step": 2310,
"valid_targets_mean": 4463.8,
"valid_targets_min": 1607
},
{
"epoch": 2.414188836724048,
"grad_norm": 0.5196272325888798,
"learning_rate": 3.314075007723487e-05,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08740301430225372,
"step": 2315,
"valid_targets_mean": 4568.4,
"valid_targets_min": 832
},
{
"epoch": 2.4194053208137714,
"grad_norm": 0.5008644373074299,
"learning_rate": 3.3101501685253657e-05,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11096716672182083,
"step": 2320,
"valid_targets_mean": 5336.0,
"valid_targets_min": 4362
},
{
"epoch": 2.424621804903495,
"grad_norm": 0.428977239056974,
"learning_rate": 3.306216471179594e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08757981657981873,
"step": 2325,
"valid_targets_mean": 5136.8,
"valid_targets_min": 2698
},
{
"epoch": 2.4298382889932184,
"grad_norm": 0.5202747625384637,
"learning_rate": 3.3022739422825686e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13886937499046326,
"step": 2330,
"valid_targets_mean": 5362.8,
"valid_targets_min": 2061
},
{
"epoch": 2.435054773082942,
"grad_norm": 0.6250715487666877,
"learning_rate": 3.2983226084903944e-05,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1500546783208847,
"step": 2335,
"valid_targets_mean": 4644.6,
"valid_targets_min": 2649
},
{
"epoch": 2.4402712571726655,
"grad_norm": 0.5557503693150626,
"learning_rate": 3.294362496518711e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09636768698692322,
"step": 2340,
"valid_targets_mean": 3254.9,
"valid_targets_min": 2193
},
{
"epoch": 2.445487741262389,
"grad_norm": 0.5881862964624829,
"learning_rate": 3.290393633142507e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11908422410488129,
"step": 2345,
"valid_targets_mean": 3358.6,
"valid_targets_min": 1389
},
{
"epoch": 2.4507042253521125,
"grad_norm": 0.6091244420286501,
"learning_rate": 3.286416045195943e-05,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11243793368339539,
"step": 2350,
"valid_targets_mean": 4268.9,
"valid_targets_min": 1955
},
{
"epoch": 2.4559207094418363,
"grad_norm": 0.48418326756678837,
"learning_rate": 3.282429759572164e-05,
"loss": 0.2264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10682648420333862,
"step": 2355,
"valid_targets_mean": 4991.8,
"valid_targets_min": 2411
},
{
"epoch": 2.4611371935315596,
"grad_norm": 0.6154620221091804,
"learning_rate": 3.2784348032231245e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14139145612716675,
"step": 2360,
"valid_targets_mean": 4965.9,
"valid_targets_min": 2315
},
{
"epoch": 2.4663536776212833,
"grad_norm": 0.5385970318526734,
"learning_rate": 3.274431203159402e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14069698750972748,
"step": 2365,
"valid_targets_mean": 4361.8,
"valid_targets_min": 1566
},
{
"epoch": 2.4715701617110066,
"grad_norm": 0.5238156534717102,
"learning_rate": 3.270418986450017e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14405012130737305,
"step": 2370,
"valid_targets_mean": 4839.0,
"valid_targets_min": 2308
},
{
"epoch": 2.4767866458007304,
"grad_norm": 0.5200091388870949,
"learning_rate": 3.266398180222247e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11240924149751663,
"step": 2375,
"valid_targets_mean": 5034.5,
"valid_targets_min": 2717
},
{
"epoch": 2.4820031298904537,
"grad_norm": 0.4730142225715713,
"learning_rate": 3.262368811661446e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10924851894378662,
"step": 2380,
"valid_targets_mean": 5697.5,
"valid_targets_min": 3468
},
{
"epoch": 2.4872196139801774,
"grad_norm": 0.46335257394324575,
"learning_rate": 3.2583309080108576e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1245822086930275,
"step": 2385,
"valid_targets_mean": 6104.1,
"valid_targets_min": 2641
},
{
"epoch": 2.4924360980699007,
"grad_norm": 0.6316903304176071,
"learning_rate": 3.254284496571434e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12317271530628204,
"step": 2390,
"valid_targets_mean": 3770.5,
"valid_targets_min": 1728
},
{
"epoch": 2.4976525821596245,
"grad_norm": 0.5103735358120499,
"learning_rate": 3.25022960470165e-05,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11588916182518005,
"step": 2395,
"valid_targets_mean": 4118.6,
"valid_targets_min": 1346
},
{
"epoch": 2.502869066249348,
"grad_norm": 0.4871119144422768,
"learning_rate": 3.246166259817318e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13652253150939941,
"step": 2400,
"valid_targets_mean": 5047.4,
"valid_targets_min": 1612
},
{
"epoch": 2.5080855503390715,
"grad_norm": 0.4861440062729529,
"learning_rate": 3.242094489391402e-05,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10882267355918884,
"step": 2405,
"valid_targets_mean": 5876.6,
"valid_targets_min": 3946
},
{
"epoch": 2.513302034428795,
"grad_norm": 0.46289868704399717,
"learning_rate": 3.238014320953832e-05,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1044938936829567,
"step": 2410,
"valid_targets_mean": 4208.9,
"valid_targets_min": 1687
},
{
"epoch": 2.5185185185185186,
"grad_norm": 0.5602170615460815,
"learning_rate": 3.233925782091322e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12824594974517822,
"step": 2415,
"valid_targets_mean": 5145.0,
"valid_targets_min": 2146
},
{
"epoch": 2.523735002608242,
"grad_norm": 0.5057079123729123,
"learning_rate": 3.229828900447174e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10087256878614426,
"step": 2420,
"valid_targets_mean": 3804.2,
"valid_targets_min": 1705
},
{
"epoch": 2.5289514866979657,
"grad_norm": 0.4891221057987663,
"learning_rate": 3.2257237037211026e-05,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10101897269487381,
"step": 2425,
"valid_targets_mean": 4812.5,
"valid_targets_min": 1906
},
{
"epoch": 2.534167970787689,
"grad_norm": 0.4800832908969296,
"learning_rate": 3.221610219669038e-05,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09936263412237167,
"step": 2430,
"valid_targets_mean": 5023.1,
"valid_targets_min": 2494
},
{
"epoch": 2.5393844548774127,
"grad_norm": 0.5214332602895505,
"learning_rate": 3.2174884761029456e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11070659756660461,
"step": 2435,
"valid_targets_mean": 3862.4,
"valid_targets_min": 1360
},
{
"epoch": 2.544600938967136,
"grad_norm": 0.4380816528769799,
"learning_rate": 3.2133585008906307e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1011088639497757,
"step": 2440,
"valid_targets_mean": 5430.8,
"valid_targets_min": 1446
},
{
"epoch": 2.5498174230568598,
"grad_norm": 0.46027248912239865,
"learning_rate": 3.209220321955559e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10920900106430054,
"step": 2445,
"valid_targets_mean": 5854.5,
"valid_targets_min": 2768
},
{
"epoch": 2.555033907146583,
"grad_norm": 0.48906639298459353,
"learning_rate": 3.205073967276659e-05,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10530338436365128,
"step": 2450,
"valid_targets_mean": 4083.2,
"valid_targets_min": 1128
},
{
"epoch": 2.560250391236307,
"grad_norm": 0.5144930723935189,
"learning_rate": 3.20091946488814e-05,
"loss": 0.2208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0825672447681427,
"step": 2455,
"valid_targets_mean": 3818.4,
"valid_targets_min": 1026
},
{
"epoch": 2.56546687532603,
"grad_norm": 0.4803660050648124,
"learning_rate": 3.196756842879297e-05,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10335831344127655,
"step": 2460,
"valid_targets_mean": 5047.2,
"valid_targets_min": 2337
},
{
"epoch": 2.570683359415754,
"grad_norm": 0.5012910750754004,
"learning_rate": 3.1925861293943234e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11575934290885925,
"step": 2465,
"valid_targets_mean": 5853.1,
"valid_targets_min": 2189
},
{
"epoch": 2.575899843505477,
"grad_norm": 0.4688930376633368,
"learning_rate": 3.1884073526321216e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14094386994838715,
"step": 2470,
"valid_targets_mean": 5949.8,
"valid_targets_min": 3518
},
{
"epoch": 2.581116327595201,
"grad_norm": 0.5088090240154572,
"learning_rate": 3.18422054084611e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09743362665176392,
"step": 2475,
"valid_targets_mean": 4409.0,
"valid_targets_min": 1524
},
{
"epoch": 2.5863328116849242,
"grad_norm": 0.4703303047324992,
"learning_rate": 3.180025722344034e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10678398609161377,
"step": 2480,
"valid_targets_mean": 4728.4,
"valid_targets_min": 1598
},
{
"epoch": 2.591549295774648,
"grad_norm": 0.47593412985692757,
"learning_rate": 3.175822925487774e-05,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10073505342006683,
"step": 2485,
"valid_targets_mean": 4718.8,
"valid_targets_min": 3346
},
{
"epoch": 2.5967657798643713,
"grad_norm": 0.4920218712524974,
"learning_rate": 3.171612178693151e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11507917940616608,
"step": 2490,
"valid_targets_mean": 4916.9,
"valid_targets_min": 1860
},
{
"epoch": 2.601982263954095,
"grad_norm": 0.4704795417511032,
"learning_rate": 3.1673935104297414e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1106872484087944,
"step": 2495,
"valid_targets_mean": 4785.4,
"valid_targets_min": 2302
},
{
"epoch": 2.6071987480438183,
"grad_norm": 0.5091338737668465,
"learning_rate": 3.163166949220675e-05,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10870622843503952,
"step": 2500,
"valid_targets_mean": 4724.8,
"valid_targets_min": 2701
},
{
"epoch": 2.612415232133542,
"grad_norm": 0.5760031101096204,
"learning_rate": 3.158932523642451e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11305932700634003,
"step": 2505,
"valid_targets_mean": 3259.8,
"valid_targets_min": 1670
},
{
"epoch": 2.6176317162232654,
"grad_norm": 0.5586883651231902,
"learning_rate": 3.1546902623247385e-05,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11771593242883682,
"step": 2510,
"valid_targets_mean": 4426.1,
"valid_targets_min": 1614
},
{
"epoch": 2.622848200312989,
"grad_norm": 0.44460060389704,
"learning_rate": 3.1504401939501866e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09268401563167572,
"step": 2515,
"valid_targets_mean": 5090.4,
"valid_targets_min": 1438
},
{
"epoch": 2.6280646844027125,
"grad_norm": 0.5286504269687488,
"learning_rate": 3.146182347254228e-05,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09826931357383728,
"step": 2520,
"valid_targets_mean": 3926.9,
"valid_targets_min": 1849
},
{
"epoch": 2.633281168492436,
"grad_norm": 0.5472063222952046,
"learning_rate": 3.141916751024889e-05,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11021539568901062,
"step": 2525,
"valid_targets_mean": 3473.4,
"valid_targets_min": 1142
},
{
"epoch": 2.6384976525821595,
"grad_norm": 0.5300711810657301,
"learning_rate": 3.137643434102588e-05,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10026170313358307,
"step": 2530,
"valid_targets_mean": 4814.9,
"valid_targets_min": 2288
},
{
"epoch": 2.6437141366718833,
"grad_norm": 1.174712487837169,
"learning_rate": 3.1333624253799464e-05,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12371222674846649,
"step": 2535,
"valid_targets_mean": 4467.4,
"valid_targets_min": 2724
},
{
"epoch": 2.6489306207616066,
"grad_norm": 0.4546709608823972,
"learning_rate": 3.1290737538015904e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10781063139438629,
"step": 2540,
"valid_targets_mean": 5799.5,
"valid_targets_min": 2347
},
{
"epoch": 2.6541471048513303,
"grad_norm": 0.5291702687360377,
"learning_rate": 3.1247774483639575e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1144791916012764,
"step": 2545,
"valid_targets_mean": 5432.8,
"valid_targets_min": 2682
},
{
"epoch": 2.6593635889410536,
"grad_norm": 0.5852435107991737,
"learning_rate": 3.120473538115096e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1168883740901947,
"step": 2550,
"valid_targets_mean": 3021.1,
"valid_targets_min": 1301
},
{
"epoch": 2.6645800730307774,
"grad_norm": 0.47127956576865276,
"learning_rate": 3.116162052154476e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11396898329257965,
"step": 2555,
"valid_targets_mean": 6150.8,
"valid_targets_min": 2352
},
{
"epoch": 2.6697965571205007,
"grad_norm": 0.5677104907261632,
"learning_rate": 3.111843019632784e-05,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1140974909067154,
"step": 2560,
"valid_targets_mean": 4371.8,
"valid_targets_min": 797
},
{
"epoch": 2.6750130412102244,
"grad_norm": 0.5135047232303005,
"learning_rate": 3.1075164697517326e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14363232254981995,
"step": 2565,
"valid_targets_mean": 4825.5,
"valid_targets_min": 1654
},
{
"epoch": 2.6802295252999477,
"grad_norm": 0.4614751924595173,
"learning_rate": 3.10318243176386e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12825116515159607,
"step": 2570,
"valid_targets_mean": 6663.1,
"valid_targets_min": 4549
},
{
"epoch": 2.6854460093896715,
"grad_norm": 0.4447211391455603,
"learning_rate": 3.0988409349723317e-05,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09917019307613373,
"step": 2575,
"valid_targets_mean": 4940.4,
"valid_targets_min": 1874
},
{
"epoch": 2.690662493479395,
"grad_norm": 0.5923061285468841,
"learning_rate": 3.094492008730746e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12513403594493866,
"step": 2580,
"valid_targets_mean": 4263.1,
"valid_targets_min": 1205
},
{
"epoch": 2.6958789775691185,
"grad_norm": 0.47124178649015935,
"learning_rate": 3.09013568244293e-05,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13531747460365295,
"step": 2585,
"valid_targets_mean": 5632.5,
"valid_targets_min": 3831
},
{
"epoch": 2.701095461658842,
"grad_norm": 0.5403423623876756,
"learning_rate": 3.085771985562745e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12237776815891266,
"step": 2590,
"valid_targets_mean": 3775.8,
"valid_targets_min": 965
},
{
"epoch": 2.7063119457485656,
"grad_norm": 0.5155907110817727,
"learning_rate": 3.081400947593887e-05,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13526003062725067,
"step": 2595,
"valid_targets_mean": 5696.9,
"valid_targets_min": 2821
},
{
"epoch": 2.711528429838289,
"grad_norm": 0.44091513916610836,
"learning_rate": 3.077022598089685e-05,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11125567555427551,
"step": 2600,
"valid_targets_mean": 5083.6,
"valid_targets_min": 2907
},
{
"epoch": 2.7167449139280127,
"grad_norm": 0.4431674084041847,
"learning_rate": 3.072636966652904e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09183455258607864,
"step": 2605,
"valid_targets_mean": 5000.2,
"valid_targets_min": 1051
},
{
"epoch": 2.721961398017736,
"grad_norm": 0.5143712648136293,
"learning_rate": 3.0682440829355416e-05,
"loss": 0.1993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.095421701669693,
"step": 2610,
"valid_targets_mean": 5004.0,
"valid_targets_min": 1716
},
{
"epoch": 2.7271778821074597,
"grad_norm": 0.651128340932718,
"learning_rate": 3.06384397663863e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12816166877746582,
"step": 2615,
"valid_targets_mean": 4944.4,
"valid_targets_min": 2675
},
{
"epoch": 2.732394366197183,
"grad_norm": 0.5121680237262853,
"learning_rate": 3.059436677512035e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09256739914417267,
"step": 2620,
"valid_targets_mean": 5635.0,
"valid_targets_min": 1654
},
{
"epoch": 2.7376108502869068,
"grad_norm": 0.5253930631743816,
"learning_rate": 3.055022215354254e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0999249666929245,
"step": 2625,
"valid_targets_mean": 4448.1,
"valid_targets_min": 1759
},
{
"epoch": 2.74282733437663,
"grad_norm": 0.4665503122808902,
"learning_rate": 3.0506006200122154e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0951077789068222,
"step": 2630,
"valid_targets_mean": 6096.5,
"valid_targets_min": 2287
},
{
"epoch": 2.748043818466354,
"grad_norm": 0.5540067912846297,
"learning_rate": 3.0461719213810756e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10958708822727203,
"step": 2635,
"valid_targets_mean": 4392.0,
"valid_targets_min": 1177
},
{
"epoch": 2.753260302556077,
"grad_norm": 0.5403656845643583,
"learning_rate": 3.0417361494040167e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09634451568126678,
"step": 2640,
"valid_targets_mean": 4302.9,
"valid_targets_min": 2000
},
{
"epoch": 2.758476786645801,
"grad_norm": 0.48890425105030777,
"learning_rate": 3.037293334072047e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09244073927402496,
"step": 2645,
"valid_targets_mean": 4441.4,
"valid_targets_min": 1241
},
{
"epoch": 2.763693270735524,
"grad_norm": 0.8071588301611544,
"learning_rate": 3.0328435054237944e-05,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12001083046197891,
"step": 2650,
"valid_targets_mean": 5670.4,
"valid_targets_min": 3512
},
{
"epoch": 2.768909754825248,
"grad_norm": 0.5166100506124706,
"learning_rate": 3.0283866935453057e-05,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09812520444393158,
"step": 2655,
"valid_targets_mean": 4672.1,
"valid_targets_min": 2182
},
{
"epoch": 2.7741262389149712,
"grad_norm": 0.5431485751253808,
"learning_rate": 3.023922928569843e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08231854438781738,
"step": 2660,
"valid_targets_mean": 4050.5,
"valid_targets_min": 1195
},
{
"epoch": 2.779342723004695,
"grad_norm": 0.548024674822343,
"learning_rate": 3.019452240677678e-05,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10818839073181152,
"step": 2665,
"valid_targets_mean": 5073.2,
"valid_targets_min": 2784
},
{
"epoch": 2.7845592070944183,
"grad_norm": 0.45219125259119536,
"learning_rate": 3.0149746600958908e-05,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09542427957057953,
"step": 2670,
"valid_targets_mean": 5374.5,
"valid_targets_min": 2643
},
{
"epoch": 2.789775691184142,
"grad_norm": 0.5237070659230012,
"learning_rate": 3.0104902170981633e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12666651606559753,
"step": 2675,
"valid_targets_mean": 5108.5,
"valid_targets_min": 2881
},
{
"epoch": 2.7949921752738653,
"grad_norm": 0.5623383881117362,
"learning_rate": 3.005998942004576e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11492735147476196,
"step": 2680,
"valid_targets_mean": 4912.5,
"valid_targets_min": 1576
},
{
"epoch": 2.800208659363589,
"grad_norm": 0.4967970451357785,
"learning_rate": 3.0015008651814023e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10141061246395111,
"step": 2685,
"valid_targets_mean": 5782.2,
"valid_targets_min": 4685
},
{
"epoch": 2.8054251434533124,
"grad_norm": 0.5569297331417894,
"learning_rate": 2.9969960170409033e-05,
"loss": 0.2061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09066125750541687,
"step": 2690,
"valid_targets_mean": 3822.2,
"valid_targets_min": 1107
},
{
"epoch": 2.810641627543036,
"grad_norm": 0.506000102515865,
"learning_rate": 2.9924844280411208e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08468958735466003,
"step": 2695,
"valid_targets_mean": 4311.0,
"valid_targets_min": 1357
},
{
"epoch": 2.8158581116327595,
"grad_norm": 0.5017771195620422,
"learning_rate": 2.987966128685674e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10154730081558228,
"step": 2700,
"valid_targets_mean": 5108.1,
"valid_targets_min": 1460
},
{
"epoch": 2.821074595722483,
"grad_norm": 0.5476798734262958,
"learning_rate": 2.9834411495235526e-05,
"loss": 0.2133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12037491798400879,
"step": 2705,
"valid_targets_mean": 5233.4,
"valid_targets_min": 2800
},
{
"epoch": 2.8262910798122065,
"grad_norm": 0.44932035235145384,
"learning_rate": 2.9789095211489082e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09355040639638901,
"step": 2710,
"valid_targets_mean": 5838.6,
"valid_targets_min": 3760
},
{
"epoch": 2.8315075639019303,
"grad_norm": 0.47333389883380045,
"learning_rate": 2.9743712742008486e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10253272950649261,
"step": 2715,
"valid_targets_mean": 4421.9,
"valid_targets_min": 2890
},
{
"epoch": 2.8367240479916536,
"grad_norm": 0.5375950820349465,
"learning_rate": 2.9698264393632326e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1102854460477829,
"step": 2720,
"valid_targets_mean": 4968.8,
"valid_targets_min": 2680
},
{
"epoch": 2.8419405320813773,
"grad_norm": 0.5232020100718042,
"learning_rate": 2.9652750473644597e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11462263762950897,
"step": 2725,
"valid_targets_mean": 4508.1,
"valid_targets_min": 797
},
{
"epoch": 2.8471570161711006,
"grad_norm": 0.5091367498962615,
"learning_rate": 2.9607171289772635e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.079213947057724,
"step": 2730,
"valid_targets_mean": 3589.6,
"valid_targets_min": 1720
},
{
"epoch": 2.8523735002608244,
"grad_norm": 0.5643515615874065,
"learning_rate": 2.9561527150185035e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1061231940984726,
"step": 2735,
"valid_targets_mean": 3623.8,
"valid_targets_min": 2571
},
{
"epoch": 2.8575899843505477,
"grad_norm": 0.5613579427983747,
"learning_rate": 2.9515818363489582e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11006490886211395,
"step": 2740,
"valid_targets_mean": 3667.1,
"valid_targets_min": 1005
},
{
"epoch": 2.8628064684402714,
"grad_norm": 0.5135290693677292,
"learning_rate": 2.9470045238731127e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08775778114795685,
"step": 2745,
"valid_targets_mean": 3874.0,
"valid_targets_min": 1796
},
{
"epoch": 2.8680229525299947,
"grad_norm": 0.5463293762668832,
"learning_rate": 2.9424208085389544e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09706106781959534,
"step": 2750,
"valid_targets_mean": 3911.5,
"valid_targets_min": 1673
},
{
"epoch": 2.873239436619718,
"grad_norm": 0.5183834834422304,
"learning_rate": 2.9378307213377603e-05,
"loss": 0.2115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08352254331111908,
"step": 2755,
"valid_targets_mean": 4454.4,
"valid_targets_min": 2804
},
{
"epoch": 2.878455920709442,
"grad_norm": 0.5770424551148836,
"learning_rate": 2.93323429330389e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09712273627519608,
"step": 2760,
"valid_targets_mean": 3493.5,
"valid_targets_min": 852
},
{
"epoch": 2.8836724047991655,
"grad_norm": 0.570092751100507,
"learning_rate": 2.9286315555145718e-05,
"loss": 0.1896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09480474889278412,
"step": 2765,
"valid_targets_mean": 3264.5,
"valid_targets_min": 1352
},
{
"epoch": 2.888888888888889,
"grad_norm": 0.5805090100880006,
"learning_rate": 2.924022539089698e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10904529690742493,
"step": 2770,
"valid_targets_mean": 3947.9,
"valid_targets_min": 1133
},
{
"epoch": 2.894105372978612,
"grad_norm": 0.5143467986188817,
"learning_rate": 2.9194072751916106e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10561254620552063,
"step": 2775,
"valid_targets_mean": 4174.1,
"valid_targets_min": 1432
},
{
"epoch": 2.899321857068336,
"grad_norm": 0.5183144103803144,
"learning_rate": 2.914785795024893e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11688891053199768,
"step": 2780,
"valid_targets_mean": 4901.1,
"valid_targets_min": 1730
},
{
"epoch": 2.9045383411580596,
"grad_norm": 0.46116198229098343,
"learning_rate": 2.9101581298361563e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09363597631454468,
"step": 2785,
"valid_targets_mean": 5823.0,
"valid_targets_min": 2244
},
{
"epoch": 2.909754825247783,
"grad_norm": 0.48816280745048407,
"learning_rate": 2.90552431091383e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10668014734983444,
"step": 2790,
"valid_targets_mean": 5915.4,
"valid_targets_min": 3217
},
{
"epoch": 2.9149713093375063,
"grad_norm": 0.5517023076313732,
"learning_rate": 2.9008843695879508e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08863114565610886,
"step": 2795,
"valid_targets_mean": 3674.1,
"valid_targets_min": 2100
},
{
"epoch": 2.92018779342723,
"grad_norm": 0.5499560039327777,
"learning_rate": 2.896238337229949e-05,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09519973397254944,
"step": 2800,
"valid_targets_mean": 3128.8,
"valid_targets_min": 1972
},
{
"epoch": 2.9254042775169538,
"grad_norm": 0.5069525819334271,
"learning_rate": 2.891586245252439e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09028097987174988,
"step": 2805,
"valid_targets_mean": 3955.2,
"valid_targets_min": 1256
},
{
"epoch": 2.930620761606677,
"grad_norm": 0.5284167009175657,
"learning_rate": 2.886928125109003e-05,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09937043488025665,
"step": 2810,
"valid_targets_mean": 3209.9,
"valid_targets_min": 1695
},
{
"epoch": 2.9358372456964004,
"grad_norm": 0.514428610600362,
"learning_rate": 2.882264008293982e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09932732582092285,
"step": 2815,
"valid_targets_mean": 4201.6,
"valid_targets_min": 3051
},
{
"epoch": 2.941053729786124,
"grad_norm": 0.47964295600940404,
"learning_rate": 2.8775939263422615e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09465121477842331,
"step": 2820,
"valid_targets_mean": 4782.0,
"valid_targets_min": 721
},
{
"epoch": 2.946270213875848,
"grad_norm": 0.486121904797812,
"learning_rate": 2.872917910829059e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08913619071245193,
"step": 2825,
"valid_targets_mean": 5105.4,
"valid_targets_min": 1089
},
{
"epoch": 2.951486697965571,
"grad_norm": 0.5131169786296125,
"learning_rate": 2.8682359933697075e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11593284457921982,
"step": 2830,
"valid_targets_mean": 6001.1,
"valid_targets_min": 4034
},
{
"epoch": 2.9567031820552945,
"grad_norm": 0.459211391733568,
"learning_rate": 2.863548205619447e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09318007528781891,
"step": 2835,
"valid_targets_mean": 6029.0,
"valid_targets_min": 3253
},
{
"epoch": 2.9619196661450182,
"grad_norm": 0.4458782331734817,
"learning_rate": 2.8588545792732056e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09560025483369827,
"step": 2840,
"valid_targets_mean": 6000.8,
"valid_targets_min": 2719
},
{
"epoch": 2.967136150234742,
"grad_norm": 0.5232106421625217,
"learning_rate": 2.8541551460653875e-05,
"loss": 0.2126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10834867507219315,
"step": 2845,
"valid_targets_mean": 4287.6,
"valid_targets_min": 1332
},
{
"epoch": 2.9723526343244653,
"grad_norm": 0.4928528121504029,
"learning_rate": 2.8494499377696586e-05,
"loss": 0.2012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10745708644390106,
"step": 2850,
"valid_targets_mean": 4780.6,
"valid_targets_min": 2086
},
{
"epoch": 2.9775691184141886,
"grad_norm": 0.5418304544270003,
"learning_rate": 2.8447389861987295e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11443772912025452,
"step": 2855,
"valid_targets_mean": 5209.1,
"valid_targets_min": 2074
},
{
"epoch": 2.9827856025039123,
"grad_norm": 0.5349528695072473,
"learning_rate": 2.8400223232041456e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0880689024925232,
"step": 2860,
"valid_targets_mean": 3408.2,
"valid_targets_min": 521
},
{
"epoch": 2.988002086593636,
"grad_norm": 0.521180920734931,
"learning_rate": 2.835299980676064e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09700939059257507,
"step": 2865,
"valid_targets_mean": 4068.4,
"valid_targets_min": 1601
},
{
"epoch": 2.9932185706833594,
"grad_norm": 0.5841605140570019,
"learning_rate": 2.8305719905430442e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09895017743110657,
"step": 2870,
"valid_targets_mean": 3847.4,
"valid_targets_min": 1880
},
{
"epoch": 2.9984350547730827,
"grad_norm": 0.5340999977183173,
"learning_rate": 2.8258383847718306e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0996866226196289,
"step": 2875,
"valid_targets_mean": 4587.4,
"valid_targets_min": 728
},
{
"epoch": 3.0041731872717787,
"grad_norm": 0.5432573380933222,
"learning_rate": 2.821099195367135e-05,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10880480706691742,
"step": 2880,
"valid_targets_mean": 4063.4,
"valid_targets_min": 1935
},
{
"epoch": 3.0093896713615025,
"grad_norm": 0.5098029143065635,
"learning_rate": 2.8163544543714216e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1081823781132698,
"step": 2885,
"valid_targets_mean": 5142.0,
"valid_targets_min": 3182
},
{
"epoch": 3.014606155451226,
"grad_norm": 0.5895808146199872,
"learning_rate": 2.811604193864689e-05,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10698902606964111,
"step": 2890,
"valid_targets_mean": 4254.1,
"valid_targets_min": 2355
},
{
"epoch": 3.0198226395409495,
"grad_norm": 0.5650383200847922,
"learning_rate": 2.806848445964255e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11510180681943893,
"step": 2895,
"valid_targets_mean": 5211.9,
"valid_targets_min": 1209
},
{
"epoch": 3.025039123630673,
"grad_norm": 0.5046127729418071,
"learning_rate": 2.8020872428245382e-05,
"loss": 0.2083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10055027157068253,
"step": 2900,
"valid_targets_mean": 4550.6,
"valid_targets_min": 2221
},
{
"epoch": 3.0302556077203966,
"grad_norm": 0.5143888700198478,
"learning_rate": 2.797320616636841e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08974705636501312,
"step": 2905,
"valid_targets_mean": 4972.5,
"valid_targets_min": 1387
},
{
"epoch": 3.03547209181012,
"grad_norm": 0.5639627901417625,
"learning_rate": 2.792548599629132e-05,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1048688143491745,
"step": 2910,
"valid_targets_mean": 3778.1,
"valid_targets_min": 1697
},
{
"epoch": 3.0406885758998436,
"grad_norm": 0.4911563103950299,
"learning_rate": 2.787771224065829e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10737472772598267,
"step": 2915,
"valid_targets_mean": 5409.1,
"valid_targets_min": 1856
},
{
"epoch": 3.045905059989567,
"grad_norm": 0.5109420202460491,
"learning_rate": 2.782988522247578e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07555101811885834,
"step": 2920,
"valid_targets_mean": 3609.0,
"valid_targets_min": 1389
},
{
"epoch": 3.0511215440792907,
"grad_norm": 0.5698280895875829,
"learning_rate": 2.7782005265110375e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1072496846318245,
"step": 2925,
"valid_targets_mean": 4099.1,
"valid_targets_min": 1709
},
{
"epoch": 3.056338028169014,
"grad_norm": 0.5686178883209573,
"learning_rate": 2.7734072692286604e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.098935566842556,
"step": 2930,
"valid_targets_mean": 4887.2,
"valid_targets_min": 2229
},
{
"epoch": 3.0615545122587378,
"grad_norm": 0.46177160728507305,
"learning_rate": 2.768608782808472e-05,
"loss": 0.211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11339068412780762,
"step": 2935,
"valid_targets_mean": 4938.5,
"valid_targets_min": 2697
},
{
"epoch": 3.066770996348461,
"grad_norm": 0.6115771579825644,
"learning_rate": 2.763805099693854e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11126293987035751,
"step": 2940,
"valid_targets_mean": 5077.1,
"valid_targets_min": 2709
},
{
"epoch": 3.071987480438185,
"grad_norm": 0.49981838433460235,
"learning_rate": 2.7589962523633218e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10545983910560608,
"step": 2945,
"valid_targets_mean": 5120.2,
"valid_targets_min": 4024
},
{
"epoch": 3.077203964527908,
"grad_norm": 0.5155139995422544,
"learning_rate": 2.75418227333031e-05,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09514853358268738,
"step": 2950,
"valid_targets_mean": 4197.0,
"valid_targets_min": 1432
},
{
"epoch": 3.082420448617632,
"grad_norm": 0.5631463806969298,
"learning_rate": 2.749363195142947e-05,
"loss": 0.2114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11387265473604202,
"step": 2955,
"valid_targets_mean": 3833.0,
"valid_targets_min": 1200
},
{
"epoch": 3.087636932707355,
"grad_norm": 0.4798516487742818,
"learning_rate": 2.744539050383838e-05,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08828402310609818,
"step": 2960,
"valid_targets_mean": 5108.2,
"valid_targets_min": 3763
},
{
"epoch": 3.092853416797079,
"grad_norm": 0.49935619585933316,
"learning_rate": 2.7397098716698463e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0784873217344284,
"step": 2965,
"valid_targets_mean": 3645.4,
"valid_targets_min": 1248
},
{
"epoch": 3.0980699008868022,
"grad_norm": 0.5740236186286182,
"learning_rate": 2.7348756916518663e-05,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11879893392324448,
"step": 2970,
"valid_targets_mean": 4630.5,
"valid_targets_min": 2337
},
{
"epoch": 3.103286384976526,
"grad_norm": 0.49720043396949304,
"learning_rate": 2.7300365430146117e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09360023587942123,
"step": 2975,
"valid_targets_mean": 4715.8,
"valid_targets_min": 2100
},
{
"epoch": 3.1085028690662493,
"grad_norm": 0.5748390414549844,
"learning_rate": 2.7251924584763867e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08847415447235107,
"step": 2980,
"valid_targets_mean": 5378.0,
"valid_targets_min": 1436
},
{
"epoch": 3.113719353155973,
"grad_norm": 0.6128159668745522,
"learning_rate": 2.7203434707888684e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10356289148330688,
"step": 2985,
"valid_targets_mean": 4386.2,
"valid_targets_min": 1504
},
{
"epoch": 3.1189358372456963,
"grad_norm": 0.4623396861624209,
"learning_rate": 2.7154896127368872e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08556468784809113,
"step": 2990,
"valid_targets_mean": 4330.9,
"valid_targets_min": 1170
},
{
"epoch": 3.12415232133542,
"grad_norm": 0.47632641128775954,
"learning_rate": 2.7106309171381995e-05,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09726077318191528,
"step": 2995,
"valid_targets_mean": 5095.5,
"valid_targets_min": 2772
},
{
"epoch": 3.1293688054251434,
"grad_norm": 0.4358985904565822,
"learning_rate": 2.705767416843272e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08343064039945602,
"step": 3000,
"valid_targets_mean": 5686.4,
"valid_targets_min": 2232
},
{
"epoch": 3.134585289514867,
"grad_norm": 0.4662300187644352,
"learning_rate": 2.700899144735055e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09762425720691681,
"step": 3005,
"valid_targets_mean": 7094.2,
"valid_targets_min": 4216
},
{
"epoch": 3.1398017736045905,
"grad_norm": 0.572864701842524,
"learning_rate": 2.696026133728763e-05,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11816585063934326,
"step": 3010,
"valid_targets_mean": 4220.5,
"valid_targets_min": 1831
},
{
"epoch": 3.145018257694314,
"grad_norm": 0.6564931432141663,
"learning_rate": 2.69114841677165e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14300262928009033,
"step": 3015,
"valid_targets_mean": 4046.2,
"valid_targets_min": 2195
},
{
"epoch": 3.1502347417840375,
"grad_norm": 0.5445913204399667,
"learning_rate": 2.6862660268427885e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08168022334575653,
"step": 3020,
"valid_targets_mean": 3510.5,
"valid_targets_min": 1256
},
{
"epoch": 3.1554512258737613,
"grad_norm": 0.43119649018053213,
"learning_rate": 2.6813789969528454e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09258949756622314,
"step": 3025,
"valid_targets_mean": 5464.4,
"valid_targets_min": 1446
},
{
"epoch": 3.1606677099634846,
"grad_norm": 0.4836818452699736,
"learning_rate": 2.6764873601438588e-05,
"loss": 0.2161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09587261825799942,
"step": 3030,
"valid_targets_mean": 4636.5,
"valid_targets_min": 3153
},
{
"epoch": 3.1658841940532083,
"grad_norm": 0.5586001035995521,
"learning_rate": 2.6715911494890163e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10193102061748505,
"step": 3035,
"valid_targets_mean": 4426.2,
"valid_targets_min": 1840
},
{
"epoch": 3.1711006781429316,
"grad_norm": 0.5283576654998282,
"learning_rate": 2.6666903980924284e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0847351923584938,
"step": 3040,
"valid_targets_mean": 3890.5,
"valid_targets_min": 1195
},
{
"epoch": 3.1763171622326554,
"grad_norm": 0.5676964469700314,
"learning_rate": 2.6617851390889074e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09379324316978455,
"step": 3045,
"valid_targets_mean": 4143.2,
"valid_targets_min": 1282
},
{
"epoch": 3.1815336463223787,
"grad_norm": 0.4716476728022729,
"learning_rate": 2.6568754056437412e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09522826969623566,
"step": 3050,
"valid_targets_mean": 5153.1,
"valid_targets_min": 1109
},
{
"epoch": 3.1867501304121024,
"grad_norm": 0.5416779765838748,
"learning_rate": 2.6519612309524727e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1138598769903183,
"step": 3055,
"valid_targets_mean": 5099.8,
"valid_targets_min": 1988
},
{
"epoch": 3.1919666145018257,
"grad_norm": 0.46628157941186205,
"learning_rate": 2.6470426482406688e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09998682886362076,
"step": 3060,
"valid_targets_mean": 5174.2,
"valid_targets_min": 2479
},
{
"epoch": 3.1971830985915495,
"grad_norm": 0.47981739400067036,
"learning_rate": 2.6421196907637036e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12754079699516296,
"step": 3065,
"valid_targets_mean": 5541.4,
"valid_targets_min": 1640
},
{
"epoch": 3.202399582681273,
"grad_norm": 0.4885126359821133,
"learning_rate": 2.6371923918065273e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10627619922161102,
"step": 3070,
"valid_targets_mean": 5309.2,
"valid_targets_min": 2826
},
{
"epoch": 3.2076160667709965,
"grad_norm": 0.48230793079709744,
"learning_rate": 2.6322607846834444e-05,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09124992787837982,
"step": 3075,
"valid_targets_mean": 5459.0,
"valid_targets_min": 1847
},
{
"epoch": 3.21283255086072,
"grad_norm": 0.4840767198131845,
"learning_rate": 2.6273249027378878e-05,
"loss": 0.1968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11224304139614105,
"step": 3080,
"valid_targets_mean": 6000.8,
"valid_targets_min": 2293
},
{
"epoch": 3.2180490349504436,
"grad_norm": 0.5298237383686266,
"learning_rate": 2.6223847793421938e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12696264684200287,
"step": 3085,
"valid_targets_mean": 5593.4,
"valid_targets_min": 1575
},
{
"epoch": 3.223265519040167,
"grad_norm": 0.5203116045231617,
"learning_rate": 2.6174404478973746e-05,
"loss": 0.2055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1275153011083603,
"step": 3090,
"valid_targets_mean": 5331.2,
"valid_targets_min": 1190
},
{
"epoch": 3.2284820031298906,
"grad_norm": 0.5828601869235734,
"learning_rate": 2.612491941832894e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0915302038192749,
"step": 3095,
"valid_targets_mean": 4977.4,
"valid_targets_min": 2578
},
{
"epoch": 3.233698487219614,
"grad_norm": 0.5398544671737381,
"learning_rate": 2.6075392946064417e-05,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10789971053600311,
"step": 3100,
"valid_targets_mean": 3956.2,
"valid_targets_min": 2939
},
{
"epoch": 3.2389149713093377,
"grad_norm": 0.4403664580551399,
"learning_rate": 2.6025825397037057e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08687441051006317,
"step": 3105,
"valid_targets_mean": 5205.9,
"valid_targets_min": 2809
},
{
"epoch": 3.244131455399061,
"grad_norm": 0.7045669258986819,
"learning_rate": 2.5976217106381477e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10237893462181091,
"step": 3110,
"valid_targets_mean": 4216.4,
"valid_targets_min": 2507
},
{
"epoch": 3.2493479394887848,
"grad_norm": 0.7939478704963069,
"learning_rate": 2.5926568409507754e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10826735943555832,
"step": 3115,
"valid_targets_mean": 3386.1,
"valid_targets_min": 2024
},
{
"epoch": 3.254564423578508,
"grad_norm": 0.4631710792328562,
"learning_rate": 2.587687964209914e-05,
"loss": 0.2002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09974386543035507,
"step": 3120,
"valid_targets_mean": 6154.4,
"valid_targets_min": 3831
},
{
"epoch": 3.2597809076682314,
"grad_norm": 0.6167658223322712,
"learning_rate": 2.5827151140109836e-05,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10356143116950989,
"step": 3125,
"valid_targets_mean": 3086.8,
"valid_targets_min": 628
},
{
"epoch": 3.264997391757955,
"grad_norm": 0.4803738947300794,
"learning_rate": 2.5777383239762676e-05,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0884963721036911,
"step": 3130,
"valid_targets_mean": 4174.9,
"valid_targets_min": 1509
},
{
"epoch": 3.270213875847679,
"grad_norm": 0.4983305286310679,
"learning_rate": 2.5727576277546888e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10087882727384567,
"step": 3135,
"valid_targets_mean": 5994.5,
"valid_targets_min": 2589
},
{
"epoch": 3.275430359937402,
"grad_norm": 0.5292682881012424,
"learning_rate": 2.5677730590215792e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08946658670902252,
"step": 3140,
"valid_targets_mean": 4218.1,
"valid_targets_min": 2399
},
{
"epoch": 3.2806468440271255,
"grad_norm": 0.5432813000606039,
"learning_rate": 2.5627846514784553e-05,
"loss": 0.2126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10207852721214294,
"step": 3145,
"valid_targets_mean": 4425.6,
"valid_targets_min": 1771
},
{
"epoch": 3.2858633281168492,
"grad_norm": 0.4739180329442054,
"learning_rate": 2.5577924388527847e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08045230805873871,
"step": 3150,
"valid_targets_mean": 4412.9,
"valid_targets_min": 1902
},
{
"epoch": 3.291079812206573,
"grad_norm": 0.5129124350976356,
"learning_rate": 2.552796454897766e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10335686802864075,
"step": 3155,
"valid_targets_mean": 4059.5,
"valid_targets_min": 1269
},
{
"epoch": 3.2962962962962963,
"grad_norm": 0.5048649484725314,
"learning_rate": 2.5477967333920942e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08793478459119797,
"step": 3160,
"valid_targets_mean": 4847.5,
"valid_targets_min": 2248
},
{
"epoch": 3.3015127803860196,
"grad_norm": 0.5096565360116999,
"learning_rate": 2.5427933081397357e-05,
"loss": 0.1968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09852844476699829,
"step": 3165,
"valid_targets_mean": 6222.0,
"valid_targets_min": 2832
},
{
"epoch": 3.3067292644757433,
"grad_norm": 0.5524222903071977,
"learning_rate": 2.5377862129696966e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09711448103189468,
"step": 3170,
"valid_targets_mean": 3722.2,
"valid_targets_min": 807
},
{
"epoch": 3.311945748565467,
"grad_norm": 0.5010581256335986,
"learning_rate": 2.5327754817357974e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11068551242351532,
"step": 3175,
"valid_targets_mean": 4448.4,
"valid_targets_min": 642
},
{
"epoch": 3.3171622326551904,
"grad_norm": 0.5784075536421294,
"learning_rate": 2.527761148316443e-05,
"loss": 0.2112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11487346887588501,
"step": 3180,
"valid_targets_mean": 4466.1,
"valid_targets_min": 2013
},
{
"epoch": 3.3223787167449137,
"grad_norm": 0.426680182728146,
"learning_rate": 2.522743246614392e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10178497433662415,
"step": 3185,
"valid_targets_mean": 7223.5,
"valid_targets_min": 3311
},
{
"epoch": 3.3275952008346374,
"grad_norm": 0.49811839249156864,
"learning_rate": 2.5177218105565306e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1128610149025917,
"step": 3190,
"valid_targets_mean": 6292.2,
"valid_targets_min": 3554
},
{
"epoch": 3.332811684924361,
"grad_norm": 0.5078621835027752,
"learning_rate": 2.5126968740936386e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08550669997930527,
"step": 3195,
"valid_targets_mean": 4097.4,
"valid_targets_min": 513
},
{
"epoch": 3.3380281690140845,
"grad_norm": 0.45696188434632573,
"learning_rate": 2.5076684712001655e-05,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10041764378547668,
"step": 3200,
"valid_targets_mean": 5978.9,
"valid_targets_min": 4028
},
{
"epoch": 3.343244653103808,
"grad_norm": 0.5543164563658722,
"learning_rate": 2.5026366358739963e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09462873637676239,
"step": 3205,
"valid_targets_mean": 3540.6,
"valid_targets_min": 1551
},
{
"epoch": 3.3484611371935316,
"grad_norm": 0.48975883173543067,
"learning_rate": 2.4976014021362236e-05,
"loss": 0.2017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09664043039083481,
"step": 3210,
"valid_targets_mean": 5091.4,
"valid_targets_min": 1972
},
{
"epoch": 3.3536776212832553,
"grad_norm": 0.513525253001271,
"learning_rate": 2.492562804030918e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09498007595539093,
"step": 3215,
"valid_targets_mean": 4646.6,
"valid_targets_min": 2783
},
{
"epoch": 3.3588941053729786,
"grad_norm": 0.45078436201229916,
"learning_rate": 2.487520875624895e-05,
"loss": 0.1993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08881426602602005,
"step": 3220,
"valid_targets_mean": 5305.9,
"valid_targets_min": 1930
},
{
"epoch": 3.364110589462702,
"grad_norm": 0.5572321448921217,
"learning_rate": 2.48247565100749e-05,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10880579054355621,
"step": 3225,
"valid_targets_mean": 4563.0,
"valid_targets_min": 2926
},
{
"epoch": 3.3693270735524257,
"grad_norm": 0.45553103261946104,
"learning_rate": 2.4774271642903213e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09201472997665405,
"step": 3230,
"valid_targets_mean": 5588.8,
"valid_targets_min": 3122
},
{
"epoch": 3.3745435576421494,
"grad_norm": 0.5351435584039045,
"learning_rate": 2.4723754496070652e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12355613708496094,
"step": 3235,
"valid_targets_mean": 5921.0,
"valid_targets_min": 1685
},
{
"epoch": 3.3797600417318727,
"grad_norm": 0.525343936043067,
"learning_rate": 2.4673205411132218e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08146161586046219,
"step": 3240,
"valid_targets_mean": 4078.1,
"valid_targets_min": 1735
},
{
"epoch": 3.384976525821596,
"grad_norm": 0.5969585175703439,
"learning_rate": 2.462262472985886e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11669494211673737,
"step": 3245,
"valid_targets_mean": 4652.0,
"valid_targets_min": 2152
},
{
"epoch": 3.3901930099113198,
"grad_norm": 0.4904811094853748,
"learning_rate": 2.457201279423514e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09706364572048187,
"step": 3250,
"valid_targets_mean": 5183.4,
"valid_targets_min": 997
},
{
"epoch": 3.3954094940010435,
"grad_norm": 0.48524335395336343,
"learning_rate": 2.4521369946456954e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07379470020532608,
"step": 3255,
"valid_targets_mean": 4762.6,
"valid_targets_min": 2958
},
{
"epoch": 3.400625978090767,
"grad_norm": 0.5190341323172759,
"learning_rate": 2.447069652892918e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09849357604980469,
"step": 3260,
"valid_targets_mean": 4050.6,
"valid_targets_min": 1211
},
{
"epoch": 3.40584246218049,
"grad_norm": 0.5384524430842462,
"learning_rate": 2.4419992884263404e-05,
"loss": 0.2143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10016826540231705,
"step": 3265,
"valid_targets_mean": 3539.6,
"valid_targets_min": 1561
},
{
"epoch": 3.411058946270214,
"grad_norm": 0.4839432642617593,
"learning_rate": 2.436925935527557e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09900754690170288,
"step": 3270,
"valid_targets_mean": 5767.1,
"valid_targets_min": 2299
},
{
"epoch": 3.4162754303599376,
"grad_norm": 0.5696481657445573,
"learning_rate": 2.4318496284983676e-05,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10886025428771973,
"step": 3275,
"valid_targets_mean": 3911.4,
"valid_targets_min": 869
},
{
"epoch": 3.421491914449661,
"grad_norm": 0.5366826232420506,
"learning_rate": 2.4267704016605453e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08289587497711182,
"step": 3280,
"valid_targets_mean": 3652.1,
"valid_targets_min": 1364
},
{
"epoch": 3.4267083985393842,
"grad_norm": 0.44760621004310186,
"learning_rate": 2.421688289355606e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08253911137580872,
"step": 3285,
"valid_targets_mean": 5076.9,
"valid_targets_min": 1472
},
{
"epoch": 3.431924882629108,
"grad_norm": 0.4659646608854954,
"learning_rate": 2.4166033259445723e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09929650276899338,
"step": 3290,
"valid_targets_mean": 5470.1,
"valid_targets_min": 1714
},
{
"epoch": 3.4371413667188317,
"grad_norm": 0.4944754452218446,
"learning_rate": 2.4115155458077453e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1077100932598114,
"step": 3295,
"valid_targets_mean": 6142.6,
"valid_targets_min": 4037
},
{
"epoch": 3.442357850808555,
"grad_norm": 0.522019943595844,
"learning_rate": 2.4064249833444702e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10570424795150757,
"step": 3300,
"valid_targets_mean": 4540.2,
"valid_targets_min": 2456
},
{
"epoch": 3.4475743348982784,
"grad_norm": 0.522378360073098,
"learning_rate": 2.401331672972904e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11249788105487823,
"step": 3305,
"valid_targets_mean": 4124.2,
"valid_targets_min": 1964
},
{
"epoch": 3.452790818988002,
"grad_norm": 0.42580018646073436,
"learning_rate": 2.3962356491297814e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07327315956354141,
"step": 3310,
"valid_targets_mean": 5672.4,
"valid_targets_min": 4383
},
{
"epoch": 3.458007303077726,
"grad_norm": 0.4679885478899873,
"learning_rate": 2.391136946270186e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10529530048370361,
"step": 3315,
"valid_targets_mean": 5588.2,
"valid_targets_min": 1455
},
{
"epoch": 3.463223787167449,
"grad_norm": 0.5281070345011083,
"learning_rate": 2.3860355988673122e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09942032396793365,
"step": 3320,
"valid_targets_mean": 5508.9,
"valid_targets_min": 1571
},
{
"epoch": 3.4684402712571725,
"grad_norm": 0.5745443529023152,
"learning_rate": 2.380931641412236e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11996541917324066,
"step": 3325,
"valid_targets_mean": 5269.0,
"valid_targets_min": 2910
},
{
"epoch": 3.473656755346896,
"grad_norm": 0.5576721588744232,
"learning_rate": 2.3758251084136794e-05,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10790915787220001,
"step": 3330,
"valid_targets_mean": 4009.0,
"valid_targets_min": 1859
},
{
"epoch": 3.4788732394366195,
"grad_norm": 0.4679862459416396,
"learning_rate": 2.3707160343977792e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10469825565814972,
"step": 3335,
"valid_targets_mean": 5888.2,
"valid_targets_min": 2404
},
{
"epoch": 3.4840897235263433,
"grad_norm": 0.49135430552405057,
"learning_rate": 2.3656044539078523e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10415101796388626,
"step": 3340,
"valid_targets_mean": 5754.0,
"valid_targets_min": 3117
},
{
"epoch": 3.4893062076160666,
"grad_norm": 0.49652290425608847,
"learning_rate": 2.3604904015041617e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1110752671957016,
"step": 3345,
"valid_targets_mean": 5765.8,
"valid_targets_min": 4411
},
{
"epoch": 3.4945226917057903,
"grad_norm": 0.5481521868558625,
"learning_rate": 2.3553739117636835e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11676967144012451,
"step": 3350,
"valid_targets_mean": 5643.6,
"valid_targets_min": 1626
},
{
"epoch": 3.4997391757955136,
"grad_norm": 0.5427911383944662,
"learning_rate": 2.3502550192798726e-05,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13177376985549927,
"step": 3355,
"valid_targets_mean": 4822.4,
"valid_targets_min": 1401
},
{
"epoch": 3.5049556598852374,
"grad_norm": 0.5260980866358562,
"learning_rate": 2.345133758662431e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10232182592153549,
"step": 3360,
"valid_targets_mean": 4270.2,
"valid_targets_min": 1748
},
{
"epoch": 3.5101721439749607,
"grad_norm": 0.46855511810503486,
"learning_rate": 2.3400101645370702e-05,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11119550466537476,
"step": 3365,
"valid_targets_mean": 5504.2,
"valid_targets_min": 2764
},
{
"epoch": 3.5153886280646844,
"grad_norm": 0.5238851262161284,
"learning_rate": 2.3348842715452803e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11851681768894196,
"step": 3370,
"valid_targets_mean": 5526.2,
"valid_targets_min": 3314
},
{
"epoch": 3.520605112154408,
"grad_norm": 0.5351641663094854,
"learning_rate": 2.3297561143440932e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10816239565610886,
"step": 3375,
"valid_targets_mean": 5042.5,
"valid_targets_min": 2194
},
{
"epoch": 3.5258215962441315,
"grad_norm": 0.5418076404930998,
"learning_rate": 2.3246257276058507e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10289973020553589,
"step": 3380,
"valid_targets_mean": 4962.2,
"valid_targets_min": 1250
},
{
"epoch": 3.531038080333855,
"grad_norm": 0.5835177880403055,
"learning_rate": 2.3194931460179677e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11193951964378357,
"step": 3385,
"valid_targets_mean": 4545.5,
"valid_targets_min": 1285
},
{
"epoch": 3.5362545644235786,
"grad_norm": 0.4409714869921065,
"learning_rate": 2.314358404282699e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09257347881793976,
"step": 3390,
"valid_targets_mean": 5921.9,
"valid_targets_min": 4133
},
{
"epoch": 3.5414710485133023,
"grad_norm": 0.48479378902625975,
"learning_rate": 2.309221537116906e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10169748961925507,
"step": 3395,
"valid_targets_mean": 5093.8,
"valid_targets_min": 2127
},
{
"epoch": 3.5466875326030256,
"grad_norm": 0.4999342137491525,
"learning_rate": 2.3040825792518188e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10100770741701126,
"step": 3400,
"valid_targets_mean": 5618.4,
"valid_targets_min": 4602
},
{
"epoch": 3.551904016692749,
"grad_norm": 0.5798992641647128,
"learning_rate": 2.298941565432804e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10427383333444595,
"step": 3405,
"valid_targets_mean": 4501.9,
"valid_targets_min": 2200
},
{
"epoch": 3.5571205007824727,
"grad_norm": 0.514151979940359,
"learning_rate": 2.2937985304191285e-05,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09981776773929596,
"step": 3410,
"valid_targets_mean": 5144.2,
"valid_targets_min": 2434
},
{
"epoch": 3.5623369848721964,
"grad_norm": 0.49224599352391807,
"learning_rate": 2.2886535089837247e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11161879450082779,
"step": 3415,
"valid_targets_mean": 7394.0,
"valid_targets_min": 2984
},
{
"epoch": 3.5675534689619197,
"grad_norm": 0.5112976626672822,
"learning_rate": 2.2835065359129564e-05,
"loss": 0.1965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08873531967401505,
"step": 3420,
"valid_targets_mean": 4770.6,
"valid_targets_min": 3574
},
{
"epoch": 3.572769953051643,
"grad_norm": 0.5368546255179795,
"learning_rate": 2.278357646006381e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08348749577999115,
"step": 3425,
"valid_targets_mean": 4058.6,
"valid_targets_min": 885
},
{
"epoch": 3.5779864371413668,
"grad_norm": 0.5130542955157593,
"learning_rate": 2.273206874076518e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10261701047420502,
"step": 3430,
"valid_targets_mean": 5305.4,
"valid_targets_min": 3152
},
{
"epoch": 3.5832029212310905,
"grad_norm": 0.4841718810074,
"learning_rate": 2.26805425494861e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09375569969415665,
"step": 3435,
"valid_targets_mean": 5293.2,
"valid_targets_min": 2908
},
{
"epoch": 3.588419405320814,
"grad_norm": 0.5169121108069523,
"learning_rate": 2.26289982346039e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09104648232460022,
"step": 3440,
"valid_targets_mean": 4429.5,
"valid_targets_min": 1439
},
{
"epoch": 3.593635889410537,
"grad_norm": 0.49322986983878714,
"learning_rate": 2.2577436144618438e-05,
"loss": 0.1996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09873166680335999,
"step": 3445,
"valid_targets_mean": 4847.2,
"valid_targets_min": 1858
},
{
"epoch": 3.598852373500261,
"grad_norm": 0.524507361163139,
"learning_rate": 2.2525856628149754e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10959742963314056,
"step": 3450,
"valid_targets_mean": 5337.8,
"valid_targets_min": 1515
},
{
"epoch": 3.604068857589984,
"grad_norm": 0.5038836279165287,
"learning_rate": 2.2474260033935718e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09655040502548218,
"step": 3455,
"valid_targets_mean": 5096.9,
"valid_targets_min": 935
},
{
"epoch": 3.609285341679708,
"grad_norm": 0.5434625017319136,
"learning_rate": 2.2422646710829653e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11120036989450455,
"step": 3460,
"valid_targets_mean": 4631.4,
"valid_targets_min": 1669
},
{
"epoch": 3.6145018257694312,
"grad_norm": 0.4643557437705012,
"learning_rate": 2.2371017007798005e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1015571653842926,
"step": 3465,
"valid_targets_mean": 5713.1,
"valid_targets_min": 2234
},
{
"epoch": 3.619718309859155,
"grad_norm": 0.5438936323798786,
"learning_rate": 2.231937127391795e-05,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1269652396440506,
"step": 3470,
"valid_targets_mean": 4342.6,
"valid_targets_min": 2144
},
{
"epoch": 3.6249347939488783,
"grad_norm": 0.5261720551564346,
"learning_rate": 2.226770985837507e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10666371881961823,
"step": 3475,
"valid_targets_mean": 4991.1,
"valid_targets_min": 1505
},
{
"epoch": 3.630151278038602,
"grad_norm": 0.48971826448674355,
"learning_rate": 2.2216033110460952e-05,
"loss": 0.2105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11108003556728363,
"step": 3480,
"valid_targets_mean": 5494.9,
"valid_targets_min": 2406
},
{
"epoch": 3.6353677621283254,
"grad_norm": 0.6310033254541642,
"learning_rate": 2.216434137957087e-05,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14492467045783997,
"step": 3485,
"valid_targets_mean": 4256.5,
"valid_targets_min": 2999
},
{
"epoch": 3.640584246218049,
"grad_norm": 0.4509439637081253,
"learning_rate": 2.2112635015201383e-05,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10062622278928757,
"step": 3490,
"valid_targets_mean": 4395.6,
"valid_targets_min": 2232
},
{
"epoch": 3.6458007303077724,
"grad_norm": 0.5309888811229617,
"learning_rate": 2.2060914366948004e-05,
"loss": 0.211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13531291484832764,
"step": 3495,
"valid_targets_mean": 4848.5,
"valid_targets_min": 1243
},
{
"epoch": 3.651017214397496,
"grad_norm": 0.49378897883013445,
"learning_rate": 2.2009179784502802e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10192813724279404,
"step": 3500,
"valid_targets_mean": 4548.9,
"valid_targets_min": 1422
},
{
"epoch": 3.6562336984872195,
"grad_norm": 0.4496118679496516,
"learning_rate": 2.1957431617652074e-05,
"loss": 0.2094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09512370079755783,
"step": 3505,
"valid_targets_mean": 5200.8,
"valid_targets_min": 1777
},
{
"epoch": 3.661450182576943,
"grad_norm": 0.4627518225433372,
"learning_rate": 2.1905670216273967e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10607169568538666,
"step": 3510,
"valid_targets_mean": 5725.0,
"valid_targets_min": 2263
},
{
"epoch": 3.6666666666666665,
"grad_norm": 0.6142333426220774,
"learning_rate": 2.185389593033609e-05,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10711097717285156,
"step": 3515,
"valid_targets_mean": 3951.2,
"valid_targets_min": 2040
},
{
"epoch": 3.6718831507563903,
"grad_norm": 0.4564859698569454,
"learning_rate": 2.1802109109893184e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10178106278181076,
"step": 3520,
"valid_targets_mean": 5606.4,
"valid_targets_min": 1631
},
{
"epoch": 3.6770996348461136,
"grad_norm": 0.4578707908340693,
"learning_rate": 2.1750310105084725e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11136416345834732,
"step": 3525,
"valid_targets_mean": 7570.0,
"valid_targets_min": 2331
},
{
"epoch": 3.6823161189358373,
"grad_norm": 0.4530824968720263,
"learning_rate": 2.1698499266132585e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08735674619674683,
"step": 3530,
"valid_targets_mean": 4930.5,
"valid_targets_min": 2301
},
{
"epoch": 3.6875326030255606,
"grad_norm": 0.45806092476342786,
"learning_rate": 2.164667694333863e-05,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08106125891208649,
"step": 3535,
"valid_targets_mean": 4889.6,
"valid_targets_min": 2107
},
{
"epoch": 3.6927490871152844,
"grad_norm": 0.5918590421269798,
"learning_rate": 2.159484348708239e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11161507666110992,
"step": 3540,
"valid_targets_mean": 4062.0,
"valid_targets_min": 1044
},
{
"epoch": 3.6979655712050077,
"grad_norm": 0.509743862744301,
"learning_rate": 2.1542999247818653e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12011369317770004,
"step": 3545,
"valid_targets_mean": 5757.8,
"valid_targets_min": 2037
},
{
"epoch": 3.7031820552947314,
"grad_norm": 0.4753458839491459,
"learning_rate": 2.149114457607512e-05,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11911623179912567,
"step": 3550,
"valid_targets_mean": 5659.5,
"valid_targets_min": 3885
},
{
"epoch": 3.7083985393844547,
"grad_norm": 0.5342061703088573,
"learning_rate": 2.1439279822450034e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08299921452999115,
"step": 3555,
"valid_targets_mean": 3785.2,
"valid_targets_min": 897
},
{
"epoch": 3.7136150234741785,
"grad_norm": 0.4727141206820206,
"learning_rate": 2.1387405337609787e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11511692404747009,
"step": 3560,
"valid_targets_mean": 5902.4,
"valid_targets_min": 3456
},
{
"epoch": 3.718831507563902,
"grad_norm": 0.4698992789174544,
"learning_rate": 2.1335521472286578e-05,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09991538524627686,
"step": 3565,
"valid_targets_mean": 5482.8,
"valid_targets_min": 2860
},
{
"epoch": 3.7240479916536255,
"grad_norm": 0.44549155893660347,
"learning_rate": 2.1283628577276034e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09587128460407257,
"step": 3570,
"valid_targets_mean": 6596.9,
"valid_targets_min": 5190
},
{
"epoch": 3.729264475743349,
"grad_norm": 0.5225931871767929,
"learning_rate": 2.1231727003434816e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11135206371545792,
"step": 3575,
"valid_targets_mean": 4997.1,
"valid_targets_min": 3775
},
{
"epoch": 3.7344809598330726,
"grad_norm": 0.5052943373674356,
"learning_rate": 2.1179817101678272e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11900711059570312,
"step": 3580,
"valid_targets_mean": 4403.1,
"valid_targets_min": 2023
},
{
"epoch": 3.739697443922796,
"grad_norm": 0.47991849736021147,
"learning_rate": 2.1127899222978064e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10209795087575912,
"step": 3585,
"valid_targets_mean": 5810.5,
"valid_targets_min": 1632
},
{
"epoch": 3.7449139280125197,
"grad_norm": 0.4664445962766321,
"learning_rate": 2.107597371835979e-05,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09806659072637558,
"step": 3590,
"valid_targets_mean": 4265.9,
"valid_targets_min": 1091
},
{
"epoch": 3.750130412102243,
"grad_norm": 0.5482988875290883,
"learning_rate": 2.1024040938900586e-05,
"loss": 0.206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11896420270204544,
"step": 3595,
"valid_targets_mean": 5041.1,
"valid_targets_min": 1875
},
{
"epoch": 3.7553468961919667,
"grad_norm": 0.5046703560081168,
"learning_rate": 2.097210123572679e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10202568769454956,
"step": 3600,
"valid_targets_mean": 4581.6,
"valid_targets_min": 2032
},
{
"epoch": 3.76056338028169,
"grad_norm": 0.5134332654087025,
"learning_rate": 2.092015496001155e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09612300992012024,
"step": 3605,
"valid_targets_mean": 4159.4,
"valid_targets_min": 1893
},
{
"epoch": 3.7657798643714138,
"grad_norm": 0.49986159400195557,
"learning_rate": 2.0868202462972458e-05,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09765844792127609,
"step": 3610,
"valid_targets_mean": 4365.2,
"valid_targets_min": 2086
},
{
"epoch": 3.770996348461137,
"grad_norm": 0.49759426834449094,
"learning_rate": 2.0816244095869157e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10434122383594513,
"step": 3615,
"valid_targets_mean": 4772.0,
"valid_targets_min": 2390
},
{
"epoch": 3.776212832550861,
"grad_norm": 0.48191796442862084,
"learning_rate": 2.0764280210001e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09581761062145233,
"step": 3620,
"valid_targets_mean": 4700.4,
"valid_targets_min": 1854
},
{
"epoch": 3.781429316640584,
"grad_norm": 0.45651214224663467,
"learning_rate": 2.0712311156704624e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11849430203437805,
"step": 3625,
"valid_targets_mean": 6474.9,
"valid_targets_min": 2325
},
{
"epoch": 3.786645800730308,
"grad_norm": 0.5128768250151106,
"learning_rate": 2.066033728735162e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10043670237064362,
"step": 3630,
"valid_targets_mean": 4569.6,
"valid_targets_min": 2703
},
{
"epoch": 3.791862284820031,
"grad_norm": 0.5205659397746013,
"learning_rate": 2.0608358953346146e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12045201659202576,
"step": 3635,
"valid_targets_mean": 4408.4,
"valid_targets_min": 1794
},
{
"epoch": 3.797078768909755,
"grad_norm": 0.44524938384432866,
"learning_rate": 2.0556376506122535e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09781882166862488,
"step": 3640,
"valid_targets_mean": 5613.9,
"valid_targets_min": 2932
},
{
"epoch": 3.8022952529994782,
"grad_norm": 0.5628102931009461,
"learning_rate": 2.0504390297142935e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11225159466266632,
"step": 3645,
"valid_targets_mean": 5291.5,
"valid_targets_min": 3199
},
{
"epoch": 3.807511737089202,
"grad_norm": 0.48068417775523864,
"learning_rate": 2.0452400677894936e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11818863451480865,
"step": 3650,
"valid_targets_mean": 6005.4,
"valid_targets_min": 1832
},
{
"epoch": 3.8127282211789253,
"grad_norm": 0.4802884620146345,
"learning_rate": 2.0400407999889165e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08356926590204239,
"step": 3655,
"valid_targets_mean": 4897.5,
"valid_targets_min": 1323
},
{
"epoch": 3.817944705268649,
"grad_norm": 0.4996117329409353,
"learning_rate": 2.0348412614656952e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10854753106832504,
"step": 3660,
"valid_targets_mean": 5317.0,
"valid_targets_min": 2965
},
{
"epoch": 3.8231611893583723,
"grad_norm": 0.4822390374810917,
"learning_rate": 2.0296414873747915e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10188714414834976,
"step": 3665,
"valid_targets_mean": 5403.4,
"valid_targets_min": 2299
},
{
"epoch": 3.828377673448096,
"grad_norm": 0.508619515441862,
"learning_rate": 2.0244415128727612e-05,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09003810584545135,
"step": 3670,
"valid_targets_mean": 4603.9,
"valid_targets_min": 2767
},
{
"epoch": 3.8335941575378194,
"grad_norm": 0.46912333306432125,
"learning_rate": 2.0192413731175146e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09568269550800323,
"step": 3675,
"valid_targets_mean": 5408.6,
"valid_targets_min": 1774
},
{
"epoch": 3.838810641627543,
"grad_norm": 0.5460759203899835,
"learning_rate": 2.0140411032680775e-05,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1019095927476883,
"step": 3680,
"valid_targets_mean": 4524.6,
"valid_targets_min": 1596
},
{
"epoch": 3.8440271257172665,
"grad_norm": 0.4974781466356231,
"learning_rate": 2.008840738484359e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10185645520687103,
"step": 3685,
"valid_targets_mean": 4695.8,
"valid_targets_min": 2022
},
{
"epoch": 3.84924360980699,
"grad_norm": 0.5521100717903332,
"learning_rate": 2.0036403139269067e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09987007081508636,
"step": 3690,
"valid_targets_mean": 4702.2,
"valid_targets_min": 1670
},
{
"epoch": 3.8544600938967135,
"grad_norm": 0.5097492757774731,
"learning_rate": 1.998439864756674e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11091513931751251,
"step": 3695,
"valid_targets_mean": 5430.6,
"valid_targets_min": 3621
},
{
"epoch": 3.8596765779864373,
"grad_norm": 0.5149786258022108,
"learning_rate": 1.993239426134781e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12105295807123184,
"step": 3700,
"valid_targets_mean": 5099.6,
"valid_targets_min": 2804
},
{
"epoch": 3.8648930620761606,
"grad_norm": 0.5485933673253874,
"learning_rate": 1.988039033222275e-05,
"loss": 0.2159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11051084101200104,
"step": 3705,
"valid_targets_mean": 4257.6,
"valid_targets_min": 2166
},
{
"epoch": 3.8701095461658843,
"grad_norm": 0.5637753025367358,
"learning_rate": 1.982838721179896e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10755988210439682,
"step": 3710,
"valid_targets_mean": 4024.9,
"valid_targets_min": 987
},
{
"epoch": 3.8753260302556076,
"grad_norm": 0.8170415462558644,
"learning_rate": 1.9776385251678352e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11058570444583893,
"step": 3715,
"valid_targets_mean": 4973.9,
"valid_targets_min": 2001
},
{
"epoch": 3.8805425143453314,
"grad_norm": 0.4929423575864892,
"learning_rate": 1.9724384803455013e-05,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10546065121889114,
"step": 3720,
"valid_targets_mean": 4542.1,
"valid_targets_min": 1234
},
{
"epoch": 3.8857589984350547,
"grad_norm": 0.5979911719291678,
"learning_rate": 1.9672386218712794e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09815919399261475,
"step": 3725,
"valid_targets_mean": 4957.8,
"valid_targets_min": 2453
},
{
"epoch": 3.8909754825247784,
"grad_norm": 0.5153570159758912,
"learning_rate": 1.962038984902295e-05,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10997527837753296,
"step": 3730,
"valid_targets_mean": 4998.4,
"valid_targets_min": 1986
},
{
"epoch": 3.8961919666145017,
"grad_norm": 0.5593692235819094,
"learning_rate": 1.9568396045941766e-05,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10075406730175018,
"step": 3735,
"valid_targets_mean": 3630.2,
"valid_targets_min": 1345
},
{
"epoch": 3.9014084507042255,
"grad_norm": 0.49266099775399863,
"learning_rate": 1.951640516100817e-05,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10078372061252594,
"step": 3740,
"valid_targets_mean": 4820.2,
"valid_targets_min": 1153
},
{
"epoch": 3.906624934793949,
"grad_norm": 0.6120689199450674,
"learning_rate": 1.9464417545741352e-05,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13580328226089478,
"step": 3745,
"valid_targets_mean": 4586.2,
"valid_targets_min": 1724
},
{
"epoch": 3.9118414188836725,
"grad_norm": 0.5385939169738648,
"learning_rate": 1.941243355163841e-05,
"loss": 0.2013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11604689061641693,
"step": 3750,
"valid_targets_mean": 5049.1,
"valid_targets_min": 1586
},
{
"epoch": 3.917057902973396,
"grad_norm": 0.4701296001393863,
"learning_rate": 1.936045353017195e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10644729435443878,
"step": 3755,
"valid_targets_mean": 4908.4,
"valid_targets_min": 2287
},
{
"epoch": 3.9222743870631196,
"grad_norm": 0.5300256155038029,
"learning_rate": 1.9308477832787724e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08712330460548401,
"step": 3760,
"valid_targets_mean": 4941.6,
"valid_targets_min": 1214
},
{
"epoch": 3.927490871152843,
"grad_norm": 0.5473484318788164,
"learning_rate": 1.9256506810902226e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11402727663516998,
"step": 3765,
"valid_targets_mean": 4187.4,
"valid_targets_min": 869
},
{
"epoch": 3.9327073552425666,
"grad_norm": 0.48275177236367606,
"learning_rate": 1.9204540815900368e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10041767358779907,
"step": 3770,
"valid_targets_mean": 5450.4,
"valid_targets_min": 1852
},
{
"epoch": 3.93792383933229,
"grad_norm": 0.5194319283174178,
"learning_rate": 1.915258019913306e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10384313762187958,
"step": 3775,
"valid_targets_mean": 4937.1,
"valid_targets_min": 2276
},
{
"epoch": 3.9431403234220137,
"grad_norm": 0.5102834439544414,
"learning_rate": 1.9100625311914855e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11289326846599579,
"step": 3780,
"valid_targets_mean": 5011.9,
"valid_targets_min": 2077
},
{
"epoch": 3.948356807511737,
"grad_norm": 0.5188674050207436,
"learning_rate": 1.9048676505521552e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1049310639500618,
"step": 3785,
"valid_targets_mean": 4873.9,
"valid_targets_min": 2730
},
{
"epoch": 3.9535732916014608,
"grad_norm": 0.4969938713059937,
"learning_rate": 1.8996734131187867e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1003921777009964,
"step": 3790,
"valid_targets_mean": 4873.9,
"valid_targets_min": 809
},
{
"epoch": 3.958789775691184,
"grad_norm": 0.5311902182679525,
"learning_rate": 1.894479854010499e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10483424365520477,
"step": 3795,
"valid_targets_mean": 4369.6,
"valid_targets_min": 1711
},
{
"epoch": 3.964006259780908,
"grad_norm": 0.5333966811645783,
"learning_rate": 1.8892870083418272e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09669163823127747,
"step": 3800,
"valid_targets_mean": 3691.0,
"valid_targets_min": 1875
},
{
"epoch": 3.969222743870631,
"grad_norm": 0.4544249740651942,
"learning_rate": 1.8840949112224823e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10293082892894745,
"step": 3805,
"valid_targets_mean": 5624.8,
"valid_targets_min": 1428
},
{
"epoch": 3.974439227960355,
"grad_norm": 0.5444361564882776,
"learning_rate": 1.8789035977571145e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10902902483940125,
"step": 3810,
"valid_targets_mean": 4516.5,
"valid_targets_min": 702
},
{
"epoch": 3.979655712050078,
"grad_norm": 0.5111837101240407,
"learning_rate": 1.873713103045076e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09919290989637375,
"step": 3815,
"valid_targets_mean": 4874.5,
"valid_targets_min": 2037
},
{
"epoch": 3.984872196139802,
"grad_norm": 0.5541412732399372,
"learning_rate": 1.8685234621801803e-05,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1078808456659317,
"step": 3820,
"valid_targets_mean": 3935.0,
"valid_targets_min": 530
},
{
"epoch": 3.9900886802295252,
"grad_norm": 0.5213068337768594,
"learning_rate": 1.863334710250471e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11251041293144226,
"step": 3825,
"valid_targets_mean": 4976.2,
"valid_targets_min": 2908
},
{
"epoch": 3.995305164319249,
"grad_norm": 0.6187092625734034,
"learning_rate": 1.858146882337981e-05,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10999973118305206,
"step": 3830,
"valid_targets_mean": 3286.1,
"valid_targets_min": 1397
},
{
"epoch": 4.0,
"grad_norm": 0.5917940970126754,
"learning_rate": 1.852960013518495e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1782897263765335,
"step": 3835,
"valid_targets_mean": 5665.9,
"valid_targets_min": 3034
},
{
"epoch": 4.005216484089724,
"grad_norm": 0.46607771414324617,
"learning_rate": 1.8477741388613132e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09920147061347961,
"step": 3840,
"valid_targets_mean": 6056.2,
"valid_targets_min": 2699
},
{
"epoch": 4.010432968179447,
"grad_norm": 0.4768192176770827,
"learning_rate": 1.8425892934290152e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07980208843946457,
"step": 3845,
"valid_targets_mean": 4985.4,
"valid_targets_min": 1433
},
{
"epoch": 4.01564945226917,
"grad_norm": 0.6027113819965128,
"learning_rate": 1.8374055122772195e-05,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11384853720664978,
"step": 3850,
"valid_targets_mean": 4757.9,
"valid_targets_min": 2591
},
{
"epoch": 4.020865936358894,
"grad_norm": 0.6170472555517669,
"learning_rate": 1.8322228304543515e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10987308621406555,
"step": 3855,
"valid_targets_mean": 4566.6,
"valid_targets_min": 1568
},
{
"epoch": 4.026082420448618,
"grad_norm": 0.5361888807617837,
"learning_rate": 1.827041283001403e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10329025983810425,
"step": 3860,
"valid_targets_mean": 6410.9,
"valid_targets_min": 2809
},
{
"epoch": 4.031298904538341,
"grad_norm": 0.5138123234586494,
"learning_rate": 1.8218609049516943e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10162970423698425,
"step": 3865,
"valid_targets_mean": 4866.2,
"valid_targets_min": 2589
},
{
"epoch": 4.0365153886280645,
"grad_norm": 0.629738341072631,
"learning_rate": 1.816681731330641e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09866997599601746,
"step": 3870,
"valid_targets_mean": 3714.9,
"valid_targets_min": 1792
},
{
"epoch": 4.041731872717788,
"grad_norm": 0.5076510284900337,
"learning_rate": 1.811503797155516e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08396624028682709,
"step": 3875,
"valid_targets_mean": 4964.0,
"valid_targets_min": 2687
},
{
"epoch": 4.046948356807512,
"grad_norm": 0.5604202388209889,
"learning_rate": 1.8063271374352097e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07950867712497711,
"step": 3880,
"valid_targets_mean": 4328.1,
"valid_targets_min": 2683
},
{
"epoch": 4.052164840897235,
"grad_norm": 0.5195318213554949,
"learning_rate": 1.8011517871699978e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09295456111431122,
"step": 3885,
"valid_targets_mean": 4763.0,
"valid_targets_min": 2191
},
{
"epoch": 4.057381324986959,
"grad_norm": 0.49574508785301097,
"learning_rate": 1.7959777813513015e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08722072839736938,
"step": 3890,
"valid_targets_mean": 5509.4,
"valid_targets_min": 2389
},
{
"epoch": 4.062597809076682,
"grad_norm": 0.555672291436396,
"learning_rate": 1.7908051549614527e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10567817091941833,
"step": 3895,
"valid_targets_mean": 4166.8,
"valid_targets_min": 850
},
{
"epoch": 4.067814293166406,
"grad_norm": 0.576453985393876,
"learning_rate": 1.7856339429734557e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10580688714981079,
"step": 3900,
"valid_targets_mean": 4304.9,
"valid_targets_min": 648
},
{
"epoch": 4.073030777256129,
"grad_norm": 0.48395931003632825,
"learning_rate": 1.780464180350753e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08282601833343506,
"step": 3905,
"valid_targets_mean": 5238.0,
"valid_targets_min": 1478
},
{
"epoch": 4.078247261345853,
"grad_norm": 0.4822897854810889,
"learning_rate": 1.7752959020469868e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09229675680398941,
"step": 3910,
"valid_targets_mean": 5155.9,
"valid_targets_min": 2004
},
{
"epoch": 4.083463745435576,
"grad_norm": 0.6181703509272917,
"learning_rate": 1.7701291430057653e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10611573606729507,
"step": 3915,
"valid_targets_mean": 3013.1,
"valid_targets_min": 578
},
{
"epoch": 4.0886802295253,
"grad_norm": 0.49745890025257705,
"learning_rate": 1.7649639381604207e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08665668964385986,
"step": 3920,
"valid_targets_mean": 5601.6,
"valid_targets_min": 2905
},
{
"epoch": 4.093896713615023,
"grad_norm": 0.5178774003263724,
"learning_rate": 1.759800322433781e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1114279106259346,
"step": 3925,
"valid_targets_mean": 5073.0,
"valid_targets_min": 1884
},
{
"epoch": 4.099113197704747,
"grad_norm": 0.48501226491558996,
"learning_rate": 1.7546383307379284e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09173507988452911,
"step": 3930,
"valid_targets_mean": 5578.1,
"valid_targets_min": 1780
},
{
"epoch": 4.1043296817944706,
"grad_norm": 0.609147488412618,
"learning_rate": 1.7494779979739645e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10356195271015167,
"step": 3935,
"valid_targets_mean": 4226.8,
"valid_targets_min": 1939
},
{
"epoch": 4.109546165884194,
"grad_norm": 0.5526486664927994,
"learning_rate": 1.7443193590317756e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08991257846355438,
"step": 3940,
"valid_targets_mean": 3742.1,
"valid_targets_min": 2015
},
{
"epoch": 4.114762649973917,
"grad_norm": 0.520797455000569,
"learning_rate": 1.7391624487897947e-05,
"loss": 0.1847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0994281992316246,
"step": 3945,
"valid_targets_mean": 4919.4,
"valid_targets_min": 1876
},
{
"epoch": 4.119979134063641,
"grad_norm": 0.5815937259094293,
"learning_rate": 1.734007302114768e-05,
"loss": 0.1896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07230329513549805,
"step": 3950,
"valid_targets_mean": 3220.5,
"valid_targets_min": 1525
},
{
"epoch": 4.125195618153365,
"grad_norm": 0.498745760416118,
"learning_rate": 1.728853953861516e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10175873339176178,
"step": 3955,
"valid_targets_mean": 5411.1,
"valid_targets_min": 3212
},
{
"epoch": 4.130412102243088,
"grad_norm": 0.48426613600890606,
"learning_rate": 1.723702438872701e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07348211109638214,
"step": 3960,
"valid_targets_mean": 4504.8,
"valid_targets_min": 1674
},
{
"epoch": 4.135628586332811,
"grad_norm": 0.4949250093153264,
"learning_rate": 1.718552791978591e-05,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08084411919116974,
"step": 3965,
"valid_targets_mean": 4177.2,
"valid_targets_min": 1305
},
{
"epoch": 4.140845070422535,
"grad_norm": 0.5462401892454734,
"learning_rate": 1.713405047996822e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08703359961509705,
"step": 3970,
"valid_targets_mean": 4648.9,
"valid_targets_min": 3039
},
{
"epoch": 4.146061554512259,
"grad_norm": 0.5596781224211703,
"learning_rate": 1.7082592417321647e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0826859325170517,
"step": 3975,
"valid_targets_mean": 4734.5,
"valid_targets_min": 1646
},
{
"epoch": 4.1512780386019825,
"grad_norm": 0.5208769324737493,
"learning_rate": 1.7031154079762885e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10567048192024231,
"step": 3980,
"valid_targets_mean": 6375.9,
"valid_targets_min": 3444
},
{
"epoch": 4.156494522691705,
"grad_norm": 0.46231862393023193,
"learning_rate": 1.6979735815075263e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08094746619462967,
"step": 3985,
"valid_targets_mean": 5711.2,
"valid_targets_min": 2724
},
{
"epoch": 4.161711006781429,
"grad_norm": 0.47782347604207814,
"learning_rate": 1.6928337970906406e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10498857498168945,
"step": 3990,
"valid_targets_mean": 6370.1,
"valid_targets_min": 3429
},
{
"epoch": 4.166927490871153,
"grad_norm": 0.533700092920349,
"learning_rate": 1.687696089476585e-05,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09806228429079056,
"step": 3995,
"valid_targets_mean": 4882.9,
"valid_targets_min": 2680
},
{
"epoch": 4.172143974960877,
"grad_norm": 0.5973811736413226,
"learning_rate": 1.6825604934022734e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10948151350021362,
"step": 4000,
"valid_targets_mean": 4622.4,
"valid_targets_min": 757
},
{
"epoch": 4.1773604590505995,
"grad_norm": 0.5839781166361364,
"learning_rate": 1.6774270435903423e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09380412101745605,
"step": 4005,
"valid_targets_mean": 4379.6,
"valid_targets_min": 2864
},
{
"epoch": 4.182576943140323,
"grad_norm": 0.4932464057306441,
"learning_rate": 1.6722957747489172e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08225096017122269,
"step": 4010,
"valid_targets_mean": 5334.0,
"valid_targets_min": 1478
},
{
"epoch": 4.187793427230047,
"grad_norm": 0.5860383161281291,
"learning_rate": 1.6671667215713784e-05,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13215795159339905,
"step": 4015,
"valid_targets_mean": 5308.4,
"valid_targets_min": 2775
},
{
"epoch": 4.193009911319771,
"grad_norm": 0.5247016468745013,
"learning_rate": 1.6620399187361226e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09403416514396667,
"step": 4020,
"valid_targets_mean": 4737.9,
"valid_targets_min": 1846
},
{
"epoch": 4.198226395409494,
"grad_norm": 0.5463858968727039,
"learning_rate": 1.656915400906336e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12462165206670761,
"step": 4025,
"valid_targets_mean": 5254.2,
"valid_targets_min": 2690
},
{
"epoch": 4.203442879499217,
"grad_norm": 0.5437506670021418,
"learning_rate": 1.6517932027297525e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10087625682353973,
"step": 4030,
"valid_targets_mean": 5404.0,
"valid_targets_min": 2414
},
{
"epoch": 4.208659363588941,
"grad_norm": 0.4920007300056477,
"learning_rate": 1.6466733588384233e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0758361667394638,
"step": 4035,
"valid_targets_mean": 4849.0,
"valid_targets_min": 2562
},
{
"epoch": 4.213875847678665,
"grad_norm": 0.5334617341832782,
"learning_rate": 1.6415559038484827e-05,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09430640190839767,
"step": 4040,
"valid_targets_mean": 4943.1,
"valid_targets_min": 1510
},
{
"epoch": 4.219092331768388,
"grad_norm": 0.5275723874222573,
"learning_rate": 1.6364408723599116e-05,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09793593734502792,
"step": 4045,
"valid_targets_mean": 4466.1,
"valid_targets_min": 1009
},
{
"epoch": 4.2243088158581115,
"grad_norm": 0.5463254998017771,
"learning_rate": 1.6313282989563062e-05,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09902290999889374,
"step": 4050,
"valid_targets_mean": 5299.5,
"valid_targets_min": 2944
},
{
"epoch": 4.229525299947835,
"grad_norm": 0.5464292051087032,
"learning_rate": 1.626218218204643e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08867479115724564,
"step": 4055,
"valid_targets_mean": 4553.4,
"valid_targets_min": 1264
},
{
"epoch": 4.234741784037559,
"grad_norm": 0.5750184592559107,
"learning_rate": 1.6211106646550455e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08512931317090988,
"step": 4060,
"valid_targets_mean": 4165.4,
"valid_targets_min": 993
},
{
"epoch": 4.239958268127282,
"grad_norm": 0.482544491305686,
"learning_rate": 1.616005672840551e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0946473479270935,
"step": 4065,
"valid_targets_mean": 6244.1,
"valid_targets_min": 3696
},
{
"epoch": 4.245174752217006,
"grad_norm": 0.6441334590686112,
"learning_rate": 1.6109032772768736e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12765106558799744,
"step": 4070,
"valid_targets_mean": 4555.0,
"valid_targets_min": 2488
},
{
"epoch": 4.250391236306729,
"grad_norm": 0.5467731898668896,
"learning_rate": 1.6058035124621766e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09254036843776703,
"step": 4075,
"valid_targets_mean": 4768.2,
"valid_targets_min": 1312
},
{
"epoch": 4.255607720396453,
"grad_norm": 0.5335943285352456,
"learning_rate": 1.6007064128768354e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09836730360984802,
"step": 4080,
"valid_targets_mean": 4161.2,
"valid_targets_min": 2358
},
{
"epoch": 4.260824204486176,
"grad_norm": 0.505854543811336,
"learning_rate": 1.5956120129832054e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09282954782247543,
"step": 4085,
"valid_targets_mean": 5335.9,
"valid_targets_min": 2540
},
{
"epoch": 4.2660406885759,
"grad_norm": 0.5168993888236286,
"learning_rate": 1.5905203472253892e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10466302931308746,
"step": 4090,
"valid_targets_mean": 5806.4,
"valid_targets_min": 1544
},
{
"epoch": 4.271257172665623,
"grad_norm": 0.5570781330788017,
"learning_rate": 1.5854314500290025e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08315970003604889,
"step": 4095,
"valid_targets_mean": 3761.0,
"valid_targets_min": 2307
},
{
"epoch": 4.276473656755347,
"grad_norm": 0.5180539101793878,
"learning_rate": 1.580345355800944e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10318869352340698,
"step": 4100,
"valid_targets_mean": 6067.6,
"valid_targets_min": 3533
},
{
"epoch": 4.28169014084507,
"grad_norm": 0.4759566364417453,
"learning_rate": 1.5752620989291592e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08804687112569809,
"step": 4105,
"valid_targets_mean": 5481.1,
"valid_targets_min": 2230
},
{
"epoch": 4.286906624934794,
"grad_norm": 0.6145751936823841,
"learning_rate": 1.5701817137824108e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08851298689842224,
"step": 4110,
"valid_targets_mean": 3818.9,
"valid_targets_min": 1279
},
{
"epoch": 4.2921231090245175,
"grad_norm": 0.52579025932417,
"learning_rate": 1.5651042347100452e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11087971180677414,
"step": 4115,
"valid_targets_mean": 4957.0,
"valid_targets_min": 2571
},
{
"epoch": 4.297339593114241,
"grad_norm": 0.5076438247402,
"learning_rate": 1.5600296960417597e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08762188255786896,
"step": 4120,
"valid_targets_mean": 4572.0,
"valid_targets_min": 2468
},
{
"epoch": 4.302556077203964,
"grad_norm": 0.5232042525437712,
"learning_rate": 1.5549581320873715e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10302773863077164,
"step": 4125,
"valid_targets_mean": 5525.5,
"valid_targets_min": 3418
},
{
"epoch": 4.307772561293688,
"grad_norm": 0.5084431660923632,
"learning_rate": 1.549889577136586e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0906180590391159,
"step": 4130,
"valid_targets_mean": 4597.6,
"valid_targets_min": 2371
},
{
"epoch": 4.312989045383412,
"grad_norm": 0.5164682116047572,
"learning_rate": 1.5448240654587622e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08768324553966522,
"step": 4135,
"valid_targets_mean": 5027.8,
"valid_targets_min": 1861
},
{
"epoch": 4.318205529473135,
"grad_norm": 0.4705826792702526,
"learning_rate": 1.5397616313026853e-05,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0866117849946022,
"step": 4140,
"valid_targets_mean": 5228.9,
"valid_targets_min": 4108
},
{
"epoch": 4.323422013562858,
"grad_norm": 0.5119602922505897,
"learning_rate": 1.5347023088963315e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10736275464296341,
"step": 4145,
"valid_targets_mean": 4940.8,
"valid_targets_min": 2638
},
{
"epoch": 4.328638497652582,
"grad_norm": 0.5780230067512474,
"learning_rate": 1.5296461324466384e-05,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11072811484336853,
"step": 4150,
"valid_targets_mean": 3822.2,
"valid_targets_min": 1490
},
{
"epoch": 4.333854981742306,
"grad_norm": 0.45976859901606687,
"learning_rate": 1.5245931361392727e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09216370433568954,
"step": 4155,
"valid_targets_mean": 5424.5,
"valid_targets_min": 2679
},
{
"epoch": 4.3390714658320295,
"grad_norm": 0.4822877754433266,
"learning_rate": 1.5195433541384009e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09953758120536804,
"step": 4160,
"valid_targets_mean": 6368.4,
"valid_targets_min": 3936
},
{
"epoch": 4.344287949921752,
"grad_norm": 0.5462791770593632,
"learning_rate": 1.514496820586456e-05,
"loss": 0.198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11608624458312988,
"step": 4165,
"valid_targets_mean": 4398.8,
"valid_targets_min": 809
},
{
"epoch": 4.349504434011476,
"grad_norm": 0.5280279895369452,
"learning_rate": 1.5094535696039067e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08779674768447876,
"step": 4170,
"valid_targets_mean": 4909.9,
"valid_targets_min": 1002
},
{
"epoch": 4.3547209181012,
"grad_norm": 0.497296131238902,
"learning_rate": 1.50441363528903e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08548164367675781,
"step": 4175,
"valid_targets_mean": 4348.1,
"valid_targets_min": 1040
},
{
"epoch": 4.359937402190924,
"grad_norm": 0.571056849057062,
"learning_rate": 1.4993770517176764e-05,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09022928774356842,
"step": 4180,
"valid_targets_mean": 4375.6,
"valid_targets_min": 1328
},
{
"epoch": 4.3651538862806465,
"grad_norm": 0.552954874618173,
"learning_rate": 1.4943438529430428e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11038275063037872,
"step": 4185,
"valid_targets_mean": 5781.0,
"valid_targets_min": 2714
},
{
"epoch": 4.37037037037037,
"grad_norm": 0.5709690624150761,
"learning_rate": 1.4893140729954402e-05,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07892560213804245,
"step": 4190,
"valid_targets_mean": 3561.4,
"valid_targets_min": 1302
},
{
"epoch": 4.375586854460094,
"grad_norm": 0.46304764562125006,
"learning_rate": 1.4842877458820644e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07885998487472534,
"step": 4195,
"valid_targets_mean": 5008.0,
"valid_targets_min": 2734
},
{
"epoch": 4.380803338549818,
"grad_norm": 0.5489716863526718,
"learning_rate": 1.4792649055867668e-05,
"loss": 0.206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12214149534702301,
"step": 4200,
"valid_targets_mean": 5317.6,
"valid_targets_min": 3488
},
{
"epoch": 4.386019822639541,
"grad_norm": 0.5936222854237478,
"learning_rate": 1.474245586069822e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10609170794487,
"step": 4205,
"valid_targets_mean": 3679.5,
"valid_targets_min": 1860
},
{
"epoch": 4.391236306729264,
"grad_norm": 0.8794519825330008,
"learning_rate": 1.4692298212677018e-05,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08555130660533905,
"step": 4210,
"valid_targets_mean": 4084.1,
"valid_targets_min": 858
},
{
"epoch": 4.396452790818988,
"grad_norm": 0.5014053800504651,
"learning_rate": 1.464217645092843e-05,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10078731179237366,
"step": 4215,
"valid_targets_mean": 5622.2,
"valid_targets_min": 2675
},
{
"epoch": 4.401669274908712,
"grad_norm": 0.45310896431300557,
"learning_rate": 1.4592090914334206e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08208087086677551,
"step": 4220,
"valid_targets_mean": 5558.6,
"valid_targets_min": 2868
},
{
"epoch": 4.406885758998435,
"grad_norm": 0.49986230812739674,
"learning_rate": 1.4542041941531136e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10097955167293549,
"step": 4225,
"valid_targets_mean": 5447.5,
"valid_targets_min": 2116
},
{
"epoch": 4.4121022430881585,
"grad_norm": 0.5059809184345644,
"learning_rate": 1.4492029870908835e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09783491492271423,
"step": 4230,
"valid_targets_mean": 5252.1,
"valid_targets_min": 4056
},
{
"epoch": 4.417318727177882,
"grad_norm": 0.520314079146309,
"learning_rate": 1.4442055040607402e-05,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0887046605348587,
"step": 4235,
"valid_targets_mean": 4721.4,
"valid_targets_min": 2066
},
{
"epoch": 4.422535211267606,
"grad_norm": 0.6181759123091992,
"learning_rate": 1.4392117788515138e-05,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08616556227207184,
"step": 4240,
"valid_targets_mean": 3734.6,
"valid_targets_min": 869
},
{
"epoch": 4.427751695357329,
"grad_norm": 0.4976989934186071,
"learning_rate": 1.4342218452266284e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08760233223438263,
"step": 4245,
"valid_targets_mean": 3873.8,
"valid_targets_min": 614
},
{
"epoch": 4.432968179447053,
"grad_norm": 0.5501596884251593,
"learning_rate": 1.4292357369238726e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09641134738922119,
"step": 4250,
"valid_targets_mean": 5268.8,
"valid_targets_min": 1951
},
{
"epoch": 4.438184663536776,
"grad_norm": 0.48594084697619444,
"learning_rate": 1.42425348765517e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08059099316596985,
"step": 4255,
"valid_targets_mean": 5099.4,
"valid_targets_min": 1572
},
{
"epoch": 4.4434011476265,
"grad_norm": 0.48163357483780256,
"learning_rate": 1.4192751311063541e-05,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07465652376413345,
"step": 4260,
"valid_targets_mean": 4928.2,
"valid_targets_min": 1986
},
{
"epoch": 4.448617631716223,
"grad_norm": 0.5582075282557117,
"learning_rate": 1.4143007009369388e-05,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08925212919712067,
"step": 4265,
"valid_targets_mean": 4252.5,
"valid_targets_min": 2466
},
{
"epoch": 4.453834115805947,
"grad_norm": 0.49782397194604244,
"learning_rate": 1.4093302307798906e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08925595879554749,
"step": 4270,
"valid_targets_mean": 4721.1,
"valid_targets_min": 2373
},
{
"epoch": 4.45905059989567,
"grad_norm": 0.5009132428350149,
"learning_rate": 1.4043637542414007e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08160844445228577,
"step": 4275,
"valid_targets_mean": 3924.8,
"valid_targets_min": 1261
},
{
"epoch": 4.464267083985394,
"grad_norm": 0.5628054062789214,
"learning_rate": 1.399401304900661e-05,
"loss": 0.1847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09798973798751831,
"step": 4280,
"valid_targets_mean": 3923.4,
"valid_targets_min": 964
},
{
"epoch": 4.469483568075117,
"grad_norm": 0.585729577018991,
"learning_rate": 1.3944429163096332e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08872173726558685,
"step": 4285,
"valid_targets_mean": 3880.2,
"valid_targets_min": 1583
},
{
"epoch": 4.474700052164841,
"grad_norm": 0.5760467170898765,
"learning_rate": 1.3894886219928247e-05,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09322041273117065,
"step": 4290,
"valid_targets_mean": 3371.4,
"valid_targets_min": 1312
},
{
"epoch": 4.4799165362545645,
"grad_norm": 0.5291247471161196,
"learning_rate": 1.3845384554470596e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08454497158527374,
"step": 4295,
"valid_targets_mean": 4669.1,
"valid_targets_min": 2090
},
{
"epoch": 4.485133020344288,
"grad_norm": 0.5617399480952876,
"learning_rate": 1.3795924501412542e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09035874158143997,
"step": 4300,
"valid_targets_mean": 4323.1,
"valid_targets_min": 1451
},
{
"epoch": 4.490349504434011,
"grad_norm": 0.5485745370649264,
"learning_rate": 1.3746506395161901e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09074965864419937,
"step": 4305,
"valid_targets_mean": 4551.8,
"valid_targets_min": 1200
},
{
"epoch": 4.495565988523735,
"grad_norm": 0.5405262796801544,
"learning_rate": 1.3697130569842874e-05,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10740135610103607,
"step": 4310,
"valid_targets_mean": 5237.6,
"valid_targets_min": 1602
},
{
"epoch": 4.500782472613459,
"grad_norm": 0.5557849275633413,
"learning_rate": 1.3647797359293797e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09277792274951935,
"step": 4315,
"valid_targets_mean": 3707.9,
"valid_targets_min": 1389
},
{
"epoch": 4.505998956703182,
"grad_norm": 0.48870583625018515,
"learning_rate": 1.359850709706489e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09530732780694962,
"step": 4320,
"valid_targets_mean": 5565.2,
"valid_targets_min": 4395
},
{
"epoch": 4.511215440792905,
"grad_norm": 0.5622484777803662,
"learning_rate": 1.354926011641596e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08089743554592133,
"step": 4325,
"valid_targets_mean": 3019.0,
"valid_targets_min": 1126
},
{
"epoch": 4.516431924882629,
"grad_norm": 0.5542477243808857,
"learning_rate": 1.3500056750314215e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09326313436031342,
"step": 4330,
"valid_targets_mean": 3765.6,
"valid_targets_min": 2014
},
{
"epoch": 4.521648408972353,
"grad_norm": 0.5233146742760183,
"learning_rate": 1.345089733143196e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10327020287513733,
"step": 4335,
"valid_targets_mean": 4620.4,
"valid_targets_min": 2016
},
{
"epoch": 4.5268648930620765,
"grad_norm": 0.4698810059913912,
"learning_rate": 1.3401782192144372e-05,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06537723541259766,
"step": 4340,
"valid_targets_mean": 4914.2,
"valid_targets_min": 952
},
{
"epoch": 4.532081377151799,
"grad_norm": 0.4813674546712752,
"learning_rate": 1.3352711664527242e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08028852939605713,
"step": 4345,
"valid_targets_mean": 4774.6,
"valid_targets_min": 1768
},
{
"epoch": 4.537297861241523,
"grad_norm": 0.55463033366809,
"learning_rate": 1.3303686080354739e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0880127102136612,
"step": 4350,
"valid_targets_mean": 3802.6,
"valid_targets_min": 1248
},
{
"epoch": 4.542514345331247,
"grad_norm": 0.5472619983465714,
"learning_rate": 1.3254705771097154e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10948982834815979,
"step": 4355,
"valid_targets_mean": 4689.6,
"valid_targets_min": 2202
},
{
"epoch": 4.547730829420971,
"grad_norm": 0.5603369394501863,
"learning_rate": 1.3205771067918675e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07711246609687805,
"step": 4360,
"valid_targets_mean": 4079.0,
"valid_targets_min": 1105
},
{
"epoch": 4.5529473135106935,
"grad_norm": 0.5492810122172286,
"learning_rate": 1.3156882301675133e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08386009186506271,
"step": 4365,
"valid_targets_mean": 3945.0,
"valid_targets_min": 1135
},
{
"epoch": 4.558163797600417,
"grad_norm": 0.4715280247213639,
"learning_rate": 1.3108039802911776e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08024720102548599,
"step": 4370,
"valid_targets_mean": 5053.8,
"valid_targets_min": 2785
},
{
"epoch": 4.563380281690141,
"grad_norm": 0.5877837255800695,
"learning_rate": 1.3059243901861024e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09088737517595291,
"step": 4375,
"valid_targets_mean": 3530.5,
"valid_targets_min": 1410
},
{
"epoch": 4.568596765779865,
"grad_norm": 0.5176398815331197,
"learning_rate": 1.3010494928440248e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09199392050504684,
"step": 4380,
"valid_targets_mean": 4320.6,
"valid_targets_min": 2250
},
{
"epoch": 4.573813249869588,
"grad_norm": 0.4934780148015792,
"learning_rate": 1.2961793212249527e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08720052242279053,
"step": 4385,
"valid_targets_mean": 4446.1,
"valid_targets_min": 2146
},
{
"epoch": 4.579029733959311,
"grad_norm": 0.4754133828329036,
"learning_rate": 1.2913139082569434e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07586514949798584,
"step": 4390,
"valid_targets_mean": 4668.9,
"valid_targets_min": 1697
},
{
"epoch": 4.584246218049035,
"grad_norm": 0.49030213981053966,
"learning_rate": 1.2864532868358799e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08727875351905823,
"step": 4395,
"valid_targets_mean": 6398.2,
"valid_targets_min": 2712
},
{
"epoch": 4.589462702138759,
"grad_norm": 0.4978857129207338,
"learning_rate": 1.2815974898252482e-05,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09104059636592865,
"step": 4400,
"valid_targets_mean": 5123.6,
"valid_targets_min": 420
},
{
"epoch": 4.594679186228482,
"grad_norm": 0.5064315260591452,
"learning_rate": 1.2767465500559162e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10585306584835052,
"step": 4405,
"valid_targets_mean": 5692.2,
"valid_targets_min": 1967
},
{
"epoch": 4.5998956703182055,
"grad_norm": 0.5367081628888567,
"learning_rate": 1.271900500325911e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09236375987529755,
"step": 4410,
"valid_targets_mean": 4742.2,
"valid_targets_min": 1586
},
{
"epoch": 4.605112154407929,
"grad_norm": 0.5758230696012199,
"learning_rate": 1.2670593734001972e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09824080020189285,
"step": 4415,
"valid_targets_mean": 4728.8,
"valid_targets_min": 3753
},
{
"epoch": 4.610328638497653,
"grad_norm": 0.4734993971322568,
"learning_rate": 1.2622232020104568e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09226129949092865,
"step": 4420,
"valid_targets_mean": 5586.2,
"valid_targets_min": 2757
},
{
"epoch": 4.615545122587376,
"grad_norm": 0.4959936805670171,
"learning_rate": 1.2573920188548634e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10080541670322418,
"step": 4425,
"valid_targets_mean": 5626.9,
"valid_targets_min": 3439
},
{
"epoch": 4.6207616066771,
"grad_norm": 0.5551311601238801,
"learning_rate": 1.2525658565978668e-05,
"loss": 0.1993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11569254845380783,
"step": 4430,
"valid_targets_mean": 5708.4,
"valid_targets_min": 2079
},
{
"epoch": 4.625978090766823,
"grad_norm": 0.665499653435843,
"learning_rate": 1.2477447478699696e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10402677953243256,
"step": 4435,
"valid_targets_mean": 3055.1,
"valid_targets_min": 1490
},
{
"epoch": 4.631194574856547,
"grad_norm": 0.6135164109299587,
"learning_rate": 1.2429287252675062e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08897197991609573,
"step": 4440,
"valid_targets_mean": 4009.1,
"valid_targets_min": 1195
},
{
"epoch": 4.63641105894627,
"grad_norm": 0.6150723224583431,
"learning_rate": 1.2381178213524223e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09846167266368866,
"step": 4445,
"valid_targets_mean": 3743.9,
"valid_targets_min": 2535
},
{
"epoch": 4.641627543035994,
"grad_norm": 0.4603297482,
"learning_rate": 1.2333120686520568e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07244417071342468,
"step": 4450,
"valid_targets_mean": 4653.0,
"valid_targets_min": 1433
},
{
"epoch": 4.646844027125717,
"grad_norm": 0.5421584576747219,
"learning_rate": 1.2285114996589181e-05,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09737575054168701,
"step": 4455,
"valid_targets_mean": 4780.5,
"valid_targets_min": 1596
},
{
"epoch": 4.652060511215441,
"grad_norm": 0.5306503819722574,
"learning_rate": 1.2237161468304681e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1015390157699585,
"step": 4460,
"valid_targets_mean": 4998.6,
"valid_targets_min": 2885
},
{
"epoch": 4.657276995305164,
"grad_norm": 0.48783463584651493,
"learning_rate": 1.218926042588902e-05,
"loss": 0.1851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07946668565273285,
"step": 4465,
"valid_targets_mean": 4776.6,
"valid_targets_min": 1922
},
{
"epoch": 4.662493479394888,
"grad_norm": 0.5305581567223895,
"learning_rate": 1.2141412193209274e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09118214249610901,
"step": 4470,
"valid_targets_mean": 4462.5,
"valid_targets_min": 3245
},
{
"epoch": 4.6677099634846115,
"grad_norm": 0.4768961351208789,
"learning_rate": 1.2093617093775458e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08062206208705902,
"step": 4475,
"valid_targets_mean": 5484.6,
"valid_targets_min": 1214
},
{
"epoch": 4.672926447574335,
"grad_norm": 0.5063335449476011,
"learning_rate": 1.2045875450738352e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07570169866085052,
"step": 4480,
"valid_targets_mean": 4700.0,
"valid_targets_min": 1504
},
{
"epoch": 4.678142931664058,
"grad_norm": 0.4568648722852648,
"learning_rate": 1.199818758688731e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07844646275043488,
"step": 4485,
"valid_targets_mean": 4799.9,
"valid_targets_min": 1221
},
{
"epoch": 4.683359415753782,
"grad_norm": 0.5085681390429685,
"learning_rate": 1.1950553824648077e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11995210498571396,
"step": 4490,
"valid_targets_mean": 5328.2,
"valid_targets_min": 2971
},
{
"epoch": 4.688575899843506,
"grad_norm": 0.5129356193317287,
"learning_rate": 1.1902974486080599e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07197125256061554,
"step": 4495,
"valid_targets_mean": 3731.9,
"valid_targets_min": 2461
},
{
"epoch": 4.6937923839332285,
"grad_norm": 0.5253442583183974,
"learning_rate": 1.1855449892876858e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09587593376636505,
"step": 4500,
"valid_targets_mean": 5387.5,
"valid_targets_min": 3194
},
{
"epoch": 4.699008868022952,
"grad_norm": 0.5519442551812616,
"learning_rate": 1.1807980366358699e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12228633463382721,
"step": 4505,
"valid_targets_mean": 5418.8,
"valid_targets_min": 2167
},
{
"epoch": 4.704225352112676,
"grad_norm": 0.537327606366864,
"learning_rate": 1.1760566227475642e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08802211284637451,
"step": 4510,
"valid_targets_mean": 4752.1,
"valid_targets_min": 1858
},
{
"epoch": 4.7094418362024,
"grad_norm": 0.5001814385756308,
"learning_rate": 1.1713207796802739e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07559408247470856,
"step": 4515,
"valid_targets_mean": 4547.1,
"valid_targets_min": 2084
},
{
"epoch": 4.7146583202921235,
"grad_norm": 0.6139574218469945,
"learning_rate": 1.166590539453837e-05,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0800754651427269,
"step": 4520,
"valid_targets_mean": 2884.9,
"valid_targets_min": 1128
},
{
"epoch": 4.719874804381846,
"grad_norm": 0.44098987196857486,
"learning_rate": 1.1618659340502104e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07793943583965302,
"step": 4525,
"valid_targets_mean": 5205.0,
"valid_targets_min": 3386
},
{
"epoch": 4.72509128847157,
"grad_norm": 0.5328520356066797,
"learning_rate": 1.157146995413252e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09932157397270203,
"step": 4530,
"valid_targets_mean": 5007.4,
"valid_targets_min": 3180
},
{
"epoch": 4.730307772561294,
"grad_norm": 0.5714349312818425,
"learning_rate": 1.152433755448509e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11112132668495178,
"step": 4535,
"valid_targets_mean": 4135.0,
"valid_targets_min": 845
},
{
"epoch": 4.735524256651017,
"grad_norm": 0.6077934906569697,
"learning_rate": 1.1477262460229945e-05,
"loss": 0.1896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10875889658927917,
"step": 4540,
"valid_targets_mean": 4602.1,
"valid_targets_min": 2684
},
{
"epoch": 4.7407407407407405,
"grad_norm": 0.49634424152814044,
"learning_rate": 1.143024498964981e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08921676874160767,
"step": 4545,
"valid_targets_mean": 4846.4,
"valid_targets_min": 1671
},
{
"epoch": 4.745957224830464,
"grad_norm": 0.5484808828375776,
"learning_rate": 1.1383285460637766e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08307075500488281,
"step": 4550,
"valid_targets_mean": 4329.8,
"valid_targets_min": 2076
},
{
"epoch": 4.751173708920188,
"grad_norm": 0.5699100757156194,
"learning_rate": 1.1336384190695172e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0887555330991745,
"step": 4555,
"valid_targets_mean": 4386.0,
"valid_targets_min": 2263
},
{
"epoch": 4.756390193009912,
"grad_norm": 0.6162552932737473,
"learning_rate": 1.1289541496929466e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1148238554596901,
"step": 4560,
"valid_targets_mean": 4499.8,
"valid_targets_min": 1708
},
{
"epoch": 4.761606677099635,
"grad_norm": 0.5482788011589695,
"learning_rate": 1.1242757696052044e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12479747831821442,
"step": 4565,
"valid_targets_mean": 5401.1,
"valid_targets_min": 2918
},
{
"epoch": 4.766823161189358,
"grad_norm": 0.5888332418366768,
"learning_rate": 1.1196033104376141e-05,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09170383214950562,
"step": 4570,
"valid_targets_mean": 3555.5,
"valid_targets_min": 1731
},
{
"epoch": 4.772039645279082,
"grad_norm": 0.5317249435508927,
"learning_rate": 1.1149368037814644e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10484310239553452,
"step": 4575,
"valid_targets_mean": 4555.9,
"valid_targets_min": 2096
},
{
"epoch": 4.777256129368805,
"grad_norm": 0.4799591252187416,
"learning_rate": 1.1102762811877974e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08517284691333771,
"step": 4580,
"valid_targets_mean": 5683.2,
"valid_targets_min": 992
},
{
"epoch": 4.782472613458529,
"grad_norm": 0.5368871499454133,
"learning_rate": 1.1056217741672e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09460750967264175,
"step": 4585,
"valid_targets_mean": 4530.9,
"valid_targets_min": 1460
},
{
"epoch": 4.7876890975482524,
"grad_norm": 0.6264850463625782,
"learning_rate": 1.1009733141895823e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1226273775100708,
"step": 4590,
"valid_targets_mean": 3832.9,
"valid_targets_min": 1265
},
{
"epoch": 4.792905581637976,
"grad_norm": 0.5854870439324866,
"learning_rate": 1.0963309326839708e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09034893661737442,
"step": 4595,
"valid_targets_mean": 4724.6,
"valid_targets_min": 1686
},
{
"epoch": 4.7981220657277,
"grad_norm": 0.5325653015133102,
"learning_rate": 1.0916946610382966e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0999528169631958,
"step": 4600,
"valid_targets_mean": 4824.1,
"valid_targets_min": 1005
},
{
"epoch": 4.803338549817423,
"grad_norm": 1.1082587355140117,
"learning_rate": 1.0870645305991772e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09996119141578674,
"step": 4605,
"valid_targets_mean": 3833.6,
"valid_targets_min": 2319
},
{
"epoch": 4.808555033907147,
"grad_norm": 0.5691295113560585,
"learning_rate": 1.0824405726717119e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10683897137641907,
"step": 4610,
"valid_targets_mean": 5273.0,
"valid_targets_min": 2815
},
{
"epoch": 4.81377151799687,
"grad_norm": 0.4870388968066102,
"learning_rate": 1.0778228185192639e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10072125494480133,
"step": 4615,
"valid_targets_mean": 5368.4,
"valid_targets_min": 2944
},
{
"epoch": 4.818988002086593,
"grad_norm": 0.4751385993259293,
"learning_rate": 1.0732112993632539e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10202068090438843,
"step": 4620,
"valid_targets_mean": 6273.8,
"valid_targets_min": 3310
},
{
"epoch": 4.824204486176317,
"grad_norm": 0.5417469989722015,
"learning_rate": 1.0686060463829451e-05,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09483262896537781,
"step": 4625,
"valid_targets_mean": 4831.4,
"valid_targets_min": 3176
},
{
"epoch": 4.829420970266041,
"grad_norm": 0.5340135754400219,
"learning_rate": 1.0640070907152342e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08007314801216125,
"step": 4630,
"valid_targets_mean": 4769.1,
"valid_targets_min": 3676
},
{
"epoch": 4.834637454355764,
"grad_norm": 0.535400223422294,
"learning_rate": 1.0594144634544405e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10891067236661911,
"step": 4635,
"valid_targets_mean": 5453.6,
"valid_targets_min": 2466
},
{
"epoch": 4.839853938445488,
"grad_norm": 0.5421802927843254,
"learning_rate": 1.0548281956520978e-05,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10159303992986679,
"step": 4640,
"valid_targets_mean": 4223.2,
"valid_targets_min": 1504
},
{
"epoch": 4.845070422535211,
"grad_norm": 0.4817463581579997,
"learning_rate": 1.0502483183167395e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09178589284420013,
"step": 4645,
"valid_targets_mean": 5853.9,
"valid_targets_min": 3404
},
{
"epoch": 4.850286906624935,
"grad_norm": 0.4579589936355861,
"learning_rate": 1.0456748624136951e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.089797243475914,
"step": 4650,
"valid_targets_mean": 5684.2,
"valid_targets_min": 1831
},
{
"epoch": 4.8555033907146585,
"grad_norm": 0.5325226015959841,
"learning_rate": 1.0411078588648756e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10591491311788559,
"step": 4655,
"valid_targets_mean": 4545.8,
"valid_targets_min": 1281
},
{
"epoch": 4.860719874804381,
"grad_norm": 0.5359785835739626,
"learning_rate": 1.0365473385485662e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11070498824119568,
"step": 4660,
"valid_targets_mean": 5118.9,
"valid_targets_min": 2572
},
{
"epoch": 4.865936358894105,
"grad_norm": 0.4681140800466057,
"learning_rate": 1.0319933322992206e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06727112829685211,
"step": 4665,
"valid_targets_mean": 6828.0,
"valid_targets_min": 3398
},
{
"epoch": 4.871152842983829,
"grad_norm": 0.544596415614375,
"learning_rate": 1.0274458709072459e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10550592839717865,
"step": 4670,
"valid_targets_mean": 4509.0,
"valid_targets_min": 1603
},
{
"epoch": 4.876369327073553,
"grad_norm": 0.5211494915877919,
"learning_rate": 1.022904985118803e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08883964270353317,
"step": 4675,
"valid_targets_mean": 4939.5,
"valid_targets_min": 2072
},
{
"epoch": 4.881585811163276,
"grad_norm": 0.5366796706123248,
"learning_rate": 1.0183707056355883e-05,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08497545123100281,
"step": 4680,
"valid_targets_mean": 4657.1,
"valid_targets_min": 2882
},
{
"epoch": 4.886802295252999,
"grad_norm": 0.5538098669256223,
"learning_rate": 1.0138430631146372e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09791304171085358,
"step": 4685,
"valid_targets_mean": 4562.9,
"valid_targets_min": 1733
},
{
"epoch": 4.892018779342723,
"grad_norm": 0.5122227553184248,
"learning_rate": 1.009322088168108e-05,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08409063518047333,
"step": 4690,
"valid_targets_mean": 4454.1,
"valid_targets_min": 2488
},
{
"epoch": 4.897235263432447,
"grad_norm": 0.47515776141982186,
"learning_rate": 1.0048078113630806e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09185665845870972,
"step": 4695,
"valid_targets_mean": 5278.4,
"valid_targets_min": 2265
},
{
"epoch": 4.90245174752217,
"grad_norm": 0.4708229178412286,
"learning_rate": 1.0003002632213455e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08610205352306366,
"step": 4700,
"valid_targets_mean": 5702.5,
"valid_targets_min": 1669
},
{
"epoch": 4.907668231611893,
"grad_norm": 0.5456843140599923,
"learning_rate": 9.95799474219202e-06,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08927833288908005,
"step": 4705,
"valid_targets_mean": 3771.5,
"valid_targets_min": 699
},
{
"epoch": 4.912884715701617,
"grad_norm": 0.5304864811688249,
"learning_rate": 9.913054747872473e-06,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08944433927536011,
"step": 4710,
"valid_targets_mean": 3983.1,
"valid_targets_min": 1205
},
{
"epoch": 4.918101199791341,
"grad_norm": 0.5120679513132991,
"learning_rate": 9.868182953101754e-06,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09833677113056183,
"step": 4715,
"valid_targets_mean": 4892.6,
"valid_targets_min": 1868
},
{
"epoch": 4.923317683881065,
"grad_norm": 0.4740197796982808,
"learning_rate": 9.823379661265677e-06,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09384319186210632,
"step": 4720,
"valid_targets_mean": 5562.9,
"valid_targets_min": 1211
},
{
"epoch": 4.9285341679707875,
"grad_norm": 0.5754044617169406,
"learning_rate": 9.778645175286904e-06,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09790576994419098,
"step": 4725,
"valid_targets_mean": 3851.1,
"valid_targets_min": 2615
},
{
"epoch": 4.933750652060511,
"grad_norm": 0.5467350049580387,
"learning_rate": 9.733979797622874e-06,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08118186891078949,
"step": 4730,
"valid_targets_mean": 4144.5,
"valid_targets_min": 2603
},
{
"epoch": 4.938967136150235,
"grad_norm": 0.5391696977368485,
"learning_rate": 9.689383830263808e-06,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09587861597537994,
"step": 4735,
"valid_targets_mean": 4530.6,
"valid_targets_min": 1367
},
{
"epoch": 4.944183620239958,
"grad_norm": 0.5053495433942577,
"learning_rate": 9.6448575747306e-06,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09295158088207245,
"step": 4740,
"valid_targets_mean": 5147.0,
"valid_targets_min": 2828
},
{
"epoch": 4.949400104329682,
"grad_norm": 0.5045776281748604,
"learning_rate": 9.60040133207281e-06,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10613466799259186,
"step": 4745,
"valid_targets_mean": 5857.0,
"valid_targets_min": 1833
},
{
"epoch": 4.954616588419405,
"grad_norm": 0.6058619681222275,
"learning_rate": 9.556015402866661e-06,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09133664518594742,
"step": 4750,
"valid_targets_mean": 4276.0,
"valid_targets_min": 1717
},
{
"epoch": 4.959833072509129,
"grad_norm": 0.4959626512225186,
"learning_rate": 9.511700087212934e-06,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07980967313051224,
"step": 4755,
"valid_targets_mean": 5189.9,
"valid_targets_min": 1708
},
{
"epoch": 4.965049556598853,
"grad_norm": 0.48580137728306516,
"learning_rate": 9.467455684735015e-06,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09308650344610214,
"step": 4760,
"valid_targets_mean": 5298.2,
"valid_targets_min": 2556
},
{
"epoch": 4.970266040688576,
"grad_norm": 0.5535867237148877,
"learning_rate": 9.423282494576804e-06,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10663655400276184,
"step": 4765,
"valid_targets_mean": 3930.9,
"valid_targets_min": 1183
},
{
"epoch": 4.975482524778299,
"grad_norm": 0.4835117585178872,
"learning_rate": 9.379180815400753e-06,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08318492770195007,
"step": 4770,
"valid_targets_mean": 4649.0,
"valid_targets_min": 1607
},
{
"epoch": 4.980699008868023,
"grad_norm": 0.5328360355929028,
"learning_rate": 9.33515094538579e-06,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11444680392742157,
"step": 4775,
"valid_targets_mean": 4569.6,
"valid_targets_min": 2494
},
{
"epoch": 4.985915492957746,
"grad_norm": 2.34205486469549,
"learning_rate": 9.291193182225341e-06,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09870575368404388,
"step": 4780,
"valid_targets_mean": 4542.0,
"valid_targets_min": 2048
},
{
"epoch": 4.99113197704747,
"grad_norm": 0.5444826085311868,
"learning_rate": 9.247307823125296e-06,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09969726204872131,
"step": 4785,
"valid_targets_mean": 4778.9,
"valid_targets_min": 2030
},
{
"epoch": 4.9963484611371936,
"grad_norm": 0.4600774725768868,
"learning_rate": 9.203495164802027e-06,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08270413428544998,
"step": 4790,
"valid_targets_mean": 4215.5,
"valid_targets_min": 1426
},
{
"epoch": 5.001043296817945,
"grad_norm": 0.5767089850528268,
"learning_rate": 9.159755503480345e-06,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09802889823913574,
"step": 4795,
"valid_targets_mean": 3765.0,
"valid_targets_min": 2046
},
{
"epoch": 5.006259780907668,
"grad_norm": 0.5088779515908076,
"learning_rate": 9.116089134891532e-06,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08812258392572403,
"step": 4800,
"valid_targets_mean": 4855.0,
"valid_targets_min": 904
},
{
"epoch": 5.011476264997392,
"grad_norm": 0.5579258578134513,
"learning_rate": 9.072496354271307e-06,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10268765687942505,
"step": 4805,
"valid_targets_mean": 5290.8,
"valid_targets_min": 2498
},
{
"epoch": 5.016692749087115,
"grad_norm": 0.49026031524788816,
"learning_rate": 9.028977456357872e-06,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08821749687194824,
"step": 4810,
"valid_targets_mean": 4934.0,
"valid_targets_min": 2634
},
{
"epoch": 5.021909233176839,
"grad_norm": 0.5755929497427029,
"learning_rate": 8.985532735389873e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09229262173175812,
"step": 4815,
"valid_targets_mean": 4120.2,
"valid_targets_min": 2454
},
{
"epoch": 5.027125717266562,
"grad_norm": 0.4788832049075145,
"learning_rate": 8.942162485104436e-06,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10502435266971588,
"step": 4820,
"valid_targets_mean": 7206.6,
"valid_targets_min": 3051
},
{
"epoch": 5.032342201356286,
"grad_norm": 0.5452723647928759,
"learning_rate": 8.898866998735195e-06,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07429133355617523,
"step": 4825,
"valid_targets_mean": 5484.9,
"valid_targets_min": 1170
},
{
"epoch": 5.037558685446009,
"grad_norm": 0.4701185100292731,
"learning_rate": 8.85564656901028e-06,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07872854173183441,
"step": 4830,
"valid_targets_mean": 6550.2,
"valid_targets_min": 2823
},
{
"epoch": 5.042775169535733,
"grad_norm": 0.5136050624625815,
"learning_rate": 8.81250148815035e-06,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09415871649980545,
"step": 4835,
"valid_targets_mean": 5931.8,
"valid_targets_min": 3171
},
{
"epoch": 5.0479916536254565,
"grad_norm": 0.52701581256359,
"learning_rate": 8.769432047866608e-06,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09285668283700943,
"step": 4840,
"valid_targets_mean": 5262.5,
"valid_targets_min": 2397
},
{
"epoch": 5.05320813771518,
"grad_norm": 0.49187753178141813,
"learning_rate": 8.72643853935887e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07486429065465927,
"step": 4845,
"valid_targets_mean": 5657.0,
"valid_targets_min": 2807
},
{
"epoch": 5.058424621804903,
"grad_norm": 0.5222415808875729,
"learning_rate": 8.683521253313527e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0767851322889328,
"step": 4850,
"valid_targets_mean": 5430.5,
"valid_targets_min": 1363
},
{
"epoch": 5.063641105894627,
"grad_norm": 0.5849510322338102,
"learning_rate": 8.640680479901648e-06,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1165381669998169,
"step": 4855,
"valid_targets_mean": 5751.6,
"valid_targets_min": 1450
},
{
"epoch": 5.068857589984351,
"grad_norm": 0.552824844759434,
"learning_rate": 8.597916508776958e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08179624378681183,
"step": 4860,
"valid_targets_mean": 4421.5,
"valid_targets_min": 2044
},
{
"epoch": 5.074074074074074,
"grad_norm": 0.5852806584482265,
"learning_rate": 8.55522962907394e-06,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09368069469928741,
"step": 4865,
"valid_targets_mean": 4771.2,
"valid_targets_min": 2303
},
{
"epoch": 5.079290558163797,
"grad_norm": 0.5656026175754425,
"learning_rate": 8.512620129405816e-06,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08062414079904556,
"step": 4870,
"valid_targets_mean": 4366.1,
"valid_targets_min": 1651
},
{
"epoch": 5.084507042253521,
"grad_norm": 0.6056679184030501,
"learning_rate": 8.470088297862669e-06,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.093223437666893,
"step": 4875,
"valid_targets_mean": 4162.6,
"valid_targets_min": 1806
},
{
"epoch": 5.089723526343245,
"grad_norm": 0.46297603218535177,
"learning_rate": 8.427634422009399e-06,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06911472976207733,
"step": 4880,
"valid_targets_mean": 4408.1,
"valid_targets_min": 182
},
{
"epoch": 5.0949400104329685,
"grad_norm": 0.480165349242614,
"learning_rate": 8.385258788883889e-06,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.080543652176857,
"step": 4885,
"valid_targets_mean": 5390.2,
"valid_targets_min": 2339
},
{
"epoch": 5.100156494522691,
"grad_norm": 0.6187632230317968,
"learning_rate": 8.342961684994975e-06,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09540046751499176,
"step": 4890,
"valid_targets_mean": 4305.9,
"valid_targets_min": 571
},
{
"epoch": 5.105372978612415,
"grad_norm": 0.5014931985409201,
"learning_rate": 8.300743396320566e-06,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09194246679544449,
"step": 4895,
"valid_targets_mean": 5965.2,
"valid_targets_min": 4203
},
{
"epoch": 5.110589462702139,
"grad_norm": 0.4761619942669461,
"learning_rate": 8.25860420830567e-06,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08677559345960617,
"step": 4900,
"valid_targets_mean": 6193.1,
"valid_targets_min": 2616
},
{
"epoch": 5.115805946791863,
"grad_norm": 0.5438438081832728,
"learning_rate": 8.216544405860482e-06,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07954394817352295,
"step": 4905,
"valid_targets_mean": 4145.0,
"valid_targets_min": 1802
},
{
"epoch": 5.1210224308815855,
"grad_norm": 0.5844190463597226,
"learning_rate": 8.17456427335848e-06,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0916503518819809,
"step": 4910,
"valid_targets_mean": 4599.1,
"valid_targets_min": 3185
},
{
"epoch": 5.126238914971309,
"grad_norm": 0.4767795377130653,
"learning_rate": 8.132664094634452e-06,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07637080550193787,
"step": 4915,
"valid_targets_mean": 5424.6,
"valid_targets_min": 1951
},
{
"epoch": 5.131455399061033,
"grad_norm": 0.5719534354285207,
"learning_rate": 8.090844152982628e-06,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0903482586145401,
"step": 4920,
"valid_targets_mean": 4490.8,
"valid_targets_min": 3336
},
{
"epoch": 5.136671883150757,
"grad_norm": 0.594228113828102,
"learning_rate": 8.049104731154722e-06,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10992646217346191,
"step": 4925,
"valid_targets_mean": 4066.6,
"valid_targets_min": 1850
},
{
"epoch": 5.14188836724048,
"grad_norm": 0.5393641346325978,
"learning_rate": 8.007446111358066e-06,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10360969603061676,
"step": 4930,
"valid_targets_mean": 5236.2,
"valid_targets_min": 1630
},
{
"epoch": 5.147104851330203,
"grad_norm": 0.8629098322126454,
"learning_rate": 7.965868575253632e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08919937908649445,
"step": 4935,
"valid_targets_mean": 5563.1,
"valid_targets_min": 3712
},
{
"epoch": 5.152321335419927,
"grad_norm": 0.5271937265549865,
"learning_rate": 7.92437240395422e-06,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07373526692390442,
"step": 4940,
"valid_targets_mean": 4110.0,
"valid_targets_min": 2084
},
{
"epoch": 5.157537819509651,
"grad_norm": 0.5319044522991199,
"learning_rate": 7.882957878022472e-06,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10028360038995743,
"step": 4945,
"valid_targets_mean": 4937.0,
"valid_targets_min": 1926
},
{
"epoch": 5.162754303599374,
"grad_norm": 0.5770944750107858,
"learning_rate": 7.841625277469043e-06,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09501786530017853,
"step": 4950,
"valid_targets_mean": 4708.1,
"valid_targets_min": 1991
},
{
"epoch": 5.1679707876890975,
"grad_norm": 0.5449691133821197,
"learning_rate": 7.800374881750644e-06,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09172935783863068,
"step": 4955,
"valid_targets_mean": 4663.4,
"valid_targets_min": 1223
},
{
"epoch": 5.173187271778821,
"grad_norm": 0.5307143737733113,
"learning_rate": 7.759206969768216e-06,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07758703082799911,
"step": 4960,
"valid_targets_mean": 4877.8,
"valid_targets_min": 1460
},
{
"epoch": 5.178403755868545,
"grad_norm": 0.5757575845426983,
"learning_rate": 7.718121819864983e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0805349200963974,
"step": 4965,
"valid_targets_mean": 4184.6,
"valid_targets_min": 1156
},
{
"epoch": 5.183620239958268,
"grad_norm": 0.5721969021340418,
"learning_rate": 7.677119709824635e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07684718072414398,
"step": 4970,
"valid_targets_mean": 4147.8,
"valid_targets_min": 1616
},
{
"epoch": 5.188836724047992,
"grad_norm": 0.5078691963548261,
"learning_rate": 7.636200916869387e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08875864744186401,
"step": 4975,
"valid_targets_mean": 5011.4,
"valid_targets_min": 1036
},
{
"epoch": 5.194053208137715,
"grad_norm": 0.5524157308543848,
"learning_rate": 7.595365717658143e-06,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.083509162068367,
"step": 4980,
"valid_targets_mean": 4123.9,
"valid_targets_min": 1454
},
{
"epoch": 5.199269692227439,
"grad_norm": 0.51400023936975,
"learning_rate": 7.554614388284609e-06,
"loss": 0.1851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08999491482973099,
"step": 4985,
"valid_targets_mean": 4854.6,
"valid_targets_min": 2395
},
{
"epoch": 5.204486176317162,
"grad_norm": 0.5864600154596398,
"learning_rate": 7.513947204275453e-06,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09562638401985168,
"step": 4990,
"valid_targets_mean": 4584.2,
"valid_targets_min": 2267
},
{
"epoch": 5.209702660406886,
"grad_norm": 0.5532188252087719,
"learning_rate": 7.473364440588404e-06,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0839436799287796,
"step": 4995,
"valid_targets_mean": 4932.2,
"valid_targets_min": 1548
},
{
"epoch": 5.214919144496609,
"grad_norm": 0.6299330322378309,
"learning_rate": 7.432866371610403e-06,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08354543149471283,
"step": 5000,
"valid_targets_mean": 4348.8,
"valid_targets_min": 1748
},
{
"epoch": 5.220135628586333,
"grad_norm": 0.4959684289084111,
"learning_rate": 7.392453271155786e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08260548859834671,
"step": 5005,
"valid_targets_mean": 5807.4,
"valid_targets_min": 1669
},
{
"epoch": 5.225352112676056,
"grad_norm": 0.5620999384066929,
"learning_rate": 7.352125412464368e-06,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0748911052942276,
"step": 5010,
"valid_targets_mean": 4590.0,
"valid_targets_min": 1848
},
{
"epoch": 5.23056859676578,
"grad_norm": 0.5581675018957084,
"learning_rate": 7.311883068199659e-06,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0873471274971962,
"step": 5015,
"valid_targets_mean": 4160.9,
"valid_targets_min": 1793
},
{
"epoch": 5.2357850808555035,
"grad_norm": 0.5052128067171061,
"learning_rate": 7.271726510446968e-06,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08994010090827942,
"step": 5020,
"valid_targets_mean": 5267.4,
"valid_targets_min": 3135
},
{
"epoch": 5.241001564945227,
"grad_norm": 0.4877172138308242,
"learning_rate": 7.231656010711609e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08713434636592865,
"step": 5025,
"valid_targets_mean": 5588.8,
"valid_targets_min": 3191
},
{
"epoch": 5.24621804903495,
"grad_norm": 0.5816293543459301,
"learning_rate": 7.191671839917025e-06,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09546761214733124,
"step": 5030,
"valid_targets_mean": 4677.6,
"valid_targets_min": 3102
},
{
"epoch": 5.251434533124674,
"grad_norm": 0.5452525730299029,
"learning_rate": 7.15177426840298e-06,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09644042700529099,
"step": 5035,
"valid_targets_mean": 5553.9,
"valid_targets_min": 2409
},
{
"epoch": 5.256651017214398,
"grad_norm": 0.5146838047889054,
"learning_rate": 7.111963565923723e-06,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08240243792533875,
"step": 5040,
"valid_targets_mean": 5156.4,
"valid_targets_min": 2389
},
{
"epoch": 5.261867501304121,
"grad_norm": 0.5502902856949233,
"learning_rate": 7.07224000164618e-06,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10105292499065399,
"step": 5045,
"valid_targets_mean": 4615.9,
"valid_targets_min": 2221
},
{
"epoch": 5.267083985393844,
"grad_norm": 0.5516918505283356,
"learning_rate": 7.032603844148098e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09628251194953918,
"step": 5050,
"valid_targets_mean": 5681.5,
"valid_targets_min": 3383
},
{
"epoch": 5.272300469483568,
"grad_norm": 0.5388756000981851,
"learning_rate": 6.993055361416281e-06,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09925254434347153,
"step": 5055,
"valid_targets_mean": 4482.9,
"valid_targets_min": 3670
},
{
"epoch": 5.277516953573292,
"grad_norm": 0.5006488169663625,
"learning_rate": 6.953594820844725e-06,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08879800140857697,
"step": 5060,
"valid_targets_mean": 6420.1,
"valid_targets_min": 3558
},
{
"epoch": 5.2827334376630155,
"grad_norm": 0.5560127327398505,
"learning_rate": 6.914222489232834e-06,
"loss": 0.1602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0899522602558136,
"step": 5065,
"valid_targets_mean": 5202.9,
"valid_targets_min": 3176
},
{
"epoch": 5.287949921752738,
"grad_norm": 0.6756236046106081,
"learning_rate": 6.874938632783639e-06,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08966085314750671,
"step": 5070,
"valid_targets_mean": 3571.6,
"valid_targets_min": 627
},
{
"epoch": 5.293166405842462,
"grad_norm": 0.5422017060339238,
"learning_rate": 6.835743517101947e-06,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08440357446670532,
"step": 5075,
"valid_targets_mean": 4761.0,
"valid_targets_min": 1624
},
{
"epoch": 5.298382889932186,
"grad_norm": 0.5591333270753611,
"learning_rate": 6.796637407192608e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07776360213756561,
"step": 5080,
"valid_targets_mean": 4593.9,
"valid_targets_min": 2015
},
{
"epoch": 5.30359937402191,
"grad_norm": 0.6151205137047357,
"learning_rate": 6.7576205674586405e-06,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0986764132976532,
"step": 5085,
"valid_targets_mean": 3976.8,
"valid_targets_min": 1415
},
{
"epoch": 5.3088158581116325,
"grad_norm": 0.5539153347512382,
"learning_rate": 6.718693261699542e-06,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08884495496749878,
"step": 5090,
"valid_targets_mean": 4511.4,
"valid_targets_min": 2240
},
{
"epoch": 5.314032342201356,
"grad_norm": 0.5839635887811082,
"learning_rate": 6.679855753109419e-06,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0866798609495163,
"step": 5095,
"valid_targets_mean": 3695.5,
"valid_targets_min": 1185
},
{
"epoch": 5.31924882629108,
"grad_norm": 0.524703444091149,
"learning_rate": 6.64110830427527e-06,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07154019176959991,
"step": 5100,
"valid_targets_mean": 4561.2,
"valid_targets_min": 2558
},
{
"epoch": 5.324465310380804,
"grad_norm": 0.5815298167263548,
"learning_rate": 6.602451177175162e-06,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08907519280910492,
"step": 5105,
"valid_targets_mean": 3357.4,
"valid_targets_min": 2213
},
{
"epoch": 5.329681794470527,
"grad_norm": 0.4817977233073812,
"learning_rate": 6.563884633176505e-06,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08714839071035385,
"step": 5110,
"valid_targets_mean": 5580.0,
"valid_targets_min": 2439
},
{
"epoch": 5.33489827856025,
"grad_norm": 0.5242439779801624,
"learning_rate": 6.5254089330342366e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07945850491523743,
"step": 5115,
"valid_targets_mean": 4681.1,
"valid_targets_min": 3074
},
{
"epoch": 5.340114762649974,
"grad_norm": 0.5615047976477149,
"learning_rate": 6.487024336889107e-06,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09414586424827576,
"step": 5120,
"valid_targets_mean": 5437.2,
"valid_targets_min": 2212
},
{
"epoch": 5.345331246739698,
"grad_norm": 0.5258908501065038,
"learning_rate": 6.448731104265871e-06,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10087031126022339,
"step": 5125,
"valid_targets_mean": 5349.8,
"valid_targets_min": 2886
},
{
"epoch": 5.350547730829421,
"grad_norm": 0.5321933147958745,
"learning_rate": 6.410529494071596e-06,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09096763283014297,
"step": 5130,
"valid_targets_mean": 5575.4,
"valid_targets_min": 1571
},
{
"epoch": 5.3557642149191445,
"grad_norm": 0.47426003796053384,
"learning_rate": 6.372419764593825e-06,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08991380780935287,
"step": 5135,
"valid_targets_mean": 6106.4,
"valid_targets_min": 3744
},
{
"epoch": 5.360980699008868,
"grad_norm": 0.5301388683550673,
"learning_rate": 6.334402173498926e-06,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07810938358306885,
"step": 5140,
"valid_targets_mean": 4348.8,
"valid_targets_min": 2076
},
{
"epoch": 5.366197183098592,
"grad_norm": 0.5374279733696077,
"learning_rate": 6.296476977830272e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08754917979240417,
"step": 5145,
"valid_targets_mean": 5014.2,
"valid_targets_min": 2862
},
{
"epoch": 5.371413667188315,
"grad_norm": 0.7206731702211141,
"learning_rate": 6.2586444340065625e-06,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0999416708946228,
"step": 5150,
"valid_targets_mean": 4403.9,
"valid_targets_min": 1066
},
{
"epoch": 5.376630151278039,
"grad_norm": 0.47298145612120657,
"learning_rate": 6.22090479782004e-06,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07644212245941162,
"step": 5155,
"valid_targets_mean": 4559.2,
"valid_targets_min": 1091
},
{
"epoch": 5.381846635367762,
"grad_norm": 0.6183890277166507,
"learning_rate": 6.18325832443478e-06,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09842634201049805,
"step": 5160,
"valid_targets_mean": 4859.1,
"valid_targets_min": 3053
},
{
"epoch": 5.387063119457486,
"grad_norm": 0.5809269936749796,
"learning_rate": 6.145705268384996e-06,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08372758328914642,
"step": 5165,
"valid_targets_mean": 4085.4,
"valid_targets_min": 1622
},
{
"epoch": 5.392279603547209,
"grad_norm": 0.4953269082886467,
"learning_rate": 6.108245883573258e-06,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08300064504146576,
"step": 5170,
"valid_targets_mean": 5048.5,
"valid_targets_min": 2023
},
{
"epoch": 5.397496087636933,
"grad_norm": 0.5175745081691734,
"learning_rate": 6.070880423268839e-06,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08488012105226517,
"step": 5175,
"valid_targets_mean": 5152.5,
"valid_targets_min": 3232
},
{
"epoch": 5.402712571726656,
"grad_norm": 0.5076264348082026,
"learning_rate": 6.033609140105949e-06,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07731913775205612,
"step": 5180,
"valid_targets_mean": 4969.0,
"valid_targets_min": 1591
},
{
"epoch": 5.40792905581638,
"grad_norm": 0.5404816837020461,
"learning_rate": 5.996432286082061e-06,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09518995881080627,
"step": 5185,
"valid_targets_mean": 5947.1,
"valid_targets_min": 2923
},
{
"epoch": 5.413145539906103,
"grad_norm": 0.5159738238694263,
"learning_rate": 5.9593501125561885e-06,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07734167575836182,
"step": 5190,
"valid_targets_mean": 5073.8,
"valid_targets_min": 3352
},
{
"epoch": 5.418362023995827,
"grad_norm": 0.5684634602268366,
"learning_rate": 5.922362870247214e-06,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10236285626888275,
"step": 5195,
"valid_targets_mean": 4632.4,
"valid_targets_min": 2124
},
{
"epoch": 5.4235785080855505,
"grad_norm": 0.5373820991292663,
"learning_rate": 5.885470809232143e-06,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07851923257112503,
"step": 5200,
"valid_targets_mean": 4475.5,
"valid_targets_min": 1766
},
{
"epoch": 5.428794992175274,
"grad_norm": 0.5458806892088824,
"learning_rate": 5.8486741789444804e-06,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0888456404209137,
"step": 5205,
"valid_targets_mean": 4564.1,
"valid_targets_min": 1108
},
{
"epoch": 5.434011476264997,
"grad_norm": 0.5479391419138662,
"learning_rate": 5.8119732281724715e-06,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09237441420555115,
"step": 5210,
"valid_targets_mean": 5527.6,
"valid_targets_min": 2991
},
{
"epoch": 5.439227960354721,
"grad_norm": 0.5194660932458187,
"learning_rate": 5.775368205057488e-06,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07880048453807831,
"step": 5215,
"valid_targets_mean": 4676.0,
"valid_targets_min": 2155
},
{
"epoch": 5.444444444444445,
"grad_norm": 0.5598013074244899,
"learning_rate": 5.738859357092297e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08336806297302246,
"step": 5220,
"valid_targets_mean": 4326.5,
"valid_targets_min": 1821
},
{
"epoch": 5.449660928534168,
"grad_norm": 0.5747509440158713,
"learning_rate": 5.7024469311194095e-06,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0965658500790596,
"step": 5225,
"valid_targets_mean": 3991.5,
"valid_targets_min": 1306
},
{
"epoch": 5.454877412623891,
"grad_norm": 0.5983423632567207,
"learning_rate": 5.66613117332943e-06,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11357493698596954,
"step": 5230,
"valid_targets_mean": 5065.5,
"valid_targets_min": 3065
},
{
"epoch": 5.460093896713615,
"grad_norm": 0.5468847755310513,
"learning_rate": 5.629912329259355e-06,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09041740000247955,
"step": 5235,
"valid_targets_mean": 4774.6,
"valid_targets_min": 1518
},
{
"epoch": 5.465310380803339,
"grad_norm": 0.5117526048335445,
"learning_rate": 5.593790643790935e-06,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09142474830150604,
"step": 5240,
"valid_targets_mean": 5328.4,
"valid_targets_min": 3105
},
{
"epoch": 5.470526864893062,
"grad_norm": 0.5251513808853013,
"learning_rate": 5.557766361149013e-06,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08423709869384766,
"step": 5245,
"valid_targets_mean": 4627.4,
"valid_targets_min": 2463
},
{
"epoch": 5.475743348982785,
"grad_norm": 0.5367593742044022,
"learning_rate": 5.521839724899887e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08371119946241379,
"step": 5250,
"valid_targets_mean": 4551.9,
"valid_targets_min": 474
},
{
"epoch": 5.480959833072509,
"grad_norm": 0.5999861887031098,
"learning_rate": 5.48601097794963e-06,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08510912209749222,
"step": 5255,
"valid_targets_mean": 3554.6,
"valid_targets_min": 1257
},
{
"epoch": 5.486176317162233,
"grad_norm": 0.5291638823924313,
"learning_rate": 5.450280362542495e-06,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08900319039821625,
"step": 5260,
"valid_targets_mean": 5461.8,
"valid_targets_min": 1675
},
{
"epoch": 5.491392801251957,
"grad_norm": 0.5538581823082644,
"learning_rate": 5.414648120259225e-06,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0811634510755539,
"step": 5265,
"valid_targets_mean": 4332.2,
"valid_targets_min": 2098
},
{
"epoch": 5.4966092853416795,
"grad_norm": 0.6247487880807111,
"learning_rate": 5.379114492015467e-06,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1094445213675499,
"step": 5270,
"valid_targets_mean": 4459.2,
"valid_targets_min": 2641
},
{
"epoch": 5.501825769431403,
"grad_norm": 0.5155655112469832,
"learning_rate": 5.343679718060104e-06,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06469831615686417,
"step": 5275,
"valid_targets_mean": 4931.0,
"valid_targets_min": 3162
},
{
"epoch": 5.507042253521127,
"grad_norm": 0.5920115869396942,
"learning_rate": 5.308344037973672e-06,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08934450894594193,
"step": 5280,
"valid_targets_mean": 4298.9,
"valid_targets_min": 1184
},
{
"epoch": 5.51225873761085,
"grad_norm": 0.5119002875008457,
"learning_rate": 5.2731076906666786e-06,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08615301549434662,
"step": 5285,
"valid_targets_mean": 4840.4,
"valid_targets_min": 1406
},
{
"epoch": 5.517475221700574,
"grad_norm": 0.5262229363816199,
"learning_rate": 5.237970914378068e-06,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09570074081420898,
"step": 5290,
"valid_targets_mean": 5322.9,
"valid_targets_min": 3350
},
{
"epoch": 5.522691705790297,
"grad_norm": 0.5538227803274636,
"learning_rate": 5.202933946673532e-06,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08771003782749176,
"step": 5295,
"valid_targets_mean": 4497.5,
"valid_targets_min": 2001
},
{
"epoch": 5.527908189880021,
"grad_norm": 0.5502507076068306,
"learning_rate": 5.1679970244439695e-06,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07107767462730408,
"step": 5300,
"valid_targets_mean": 3696.2,
"valid_targets_min": 2225
},
{
"epoch": 5.533124673969745,
"grad_norm": 0.5512386550175091,
"learning_rate": 5.13316038390383e-06,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0939207673072815,
"step": 5305,
"valid_targets_mean": 5463.0,
"valid_targets_min": 3574
},
{
"epoch": 5.538341158059468,
"grad_norm": 0.5278227929504776,
"learning_rate": 5.098424260589565e-06,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10499151796102524,
"step": 5310,
"valid_targets_mean": 5881.4,
"valid_targets_min": 3680
},
{
"epoch": 5.5435576421491914,
"grad_norm": 0.5519375612123985,
"learning_rate": 5.063788889357995e-06,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09371333569288254,
"step": 5315,
"valid_targets_mean": 5093.1,
"valid_targets_min": 1624
},
{
"epoch": 5.548774126238915,
"grad_norm": 0.5716503917543002,
"learning_rate": 5.029254504384733e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10242068767547607,
"step": 5320,
"valid_targets_mean": 4717.9,
"valid_targets_min": 2413
},
{
"epoch": 5.553990610328638,
"grad_norm": 0.5874419944817311,
"learning_rate": 4.9948213391626325e-06,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10250916332006454,
"step": 5325,
"valid_targets_mean": 4346.5,
"valid_targets_min": 2439
},
{
"epoch": 5.559207094418362,
"grad_norm": 0.5504381846725983,
"learning_rate": 4.960489626500153e-06,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07717075943946838,
"step": 5330,
"valid_targets_mean": 4242.8,
"valid_targets_min": 897
},
{
"epoch": 5.5644235785080856,
"grad_norm": 0.5146939011973244,
"learning_rate": 4.926259598519851e-06,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06690868735313416,
"step": 5335,
"valid_targets_mean": 4106.6,
"valid_targets_min": 1369
},
{
"epoch": 5.569640062597809,
"grad_norm": 0.5505646821539498,
"learning_rate": 4.892131486656733e-06,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08535034954547882,
"step": 5340,
"valid_targets_mean": 5032.8,
"valid_targets_min": 1013
},
{
"epoch": 5.574856546687533,
"grad_norm": 0.529809183401811,
"learning_rate": 4.858105521656768e-06,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08789815753698349,
"step": 5345,
"valid_targets_mean": 5742.9,
"valid_targets_min": 3928
},
{
"epoch": 5.580073030777256,
"grad_norm": 0.5370726178638763,
"learning_rate": 4.824181933575272e-06,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10115206241607666,
"step": 5350,
"valid_targets_mean": 5713.5,
"valid_targets_min": 1421
},
{
"epoch": 5.58528951486698,
"grad_norm": 0.5569605856751727,
"learning_rate": 4.790360951775392e-06,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09263263642787933,
"step": 5355,
"valid_targets_mean": 5239.4,
"valid_targets_min": 2056
},
{
"epoch": 5.590505998956703,
"grad_norm": 0.5455568305099259,
"learning_rate": 4.756642804926517e-06,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09849033504724503,
"step": 5360,
"valid_targets_mean": 5447.1,
"valid_targets_min": 967
},
{
"epoch": 5.595722483046426,
"grad_norm": 0.6272566838215045,
"learning_rate": 4.7230277210027685e-06,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09728604555130005,
"step": 5365,
"valid_targets_mean": 3810.0,
"valid_targets_min": 2077
},
{
"epoch": 5.60093896713615,
"grad_norm": 0.4949180746326753,
"learning_rate": 4.689515927281427e-06,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07689865678548813,
"step": 5370,
"valid_targets_mean": 5535.0,
"valid_targets_min": 1205
},
{
"epoch": 5.606155451225874,
"grad_norm": 0.521391228466892,
"learning_rate": 4.6561076503414235e-06,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07850983738899231,
"step": 5375,
"valid_targets_mean": 4991.0,
"valid_targets_min": 2411
},
{
"epoch": 5.6113719353155975,
"grad_norm": 0.5047705118028566,
"learning_rate": 4.622803116061789e-06,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08694680035114288,
"step": 5380,
"valid_targets_mean": 5849.4,
"valid_targets_min": 3531
},
{
"epoch": 5.616588419405321,
"grad_norm": 0.535962737554241,
"learning_rate": 4.589602549620127e-06,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09452635049819946,
"step": 5385,
"valid_targets_mean": 5429.2,
"valid_targets_min": 3055
},
{
"epoch": 5.621804903495044,
"grad_norm": 0.5852505700527569,
"learning_rate": 4.556506175491097e-06,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08648938685655594,
"step": 5390,
"valid_targets_mean": 4766.6,
"valid_targets_min": 2003
},
{
"epoch": 5.627021387584768,
"grad_norm": 0.5898102688979189,
"learning_rate": 4.523514217444918e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11465403437614441,
"step": 5395,
"valid_targets_mean": 5365.4,
"valid_targets_min": 1202
},
{
"epoch": 5.632237871674492,
"grad_norm": 0.5229012788505973,
"learning_rate": 4.490626898545805e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07465511560440063,
"step": 5400,
"valid_targets_mean": 4374.1,
"valid_targets_min": 1664
},
{
"epoch": 5.6374543557642145,
"grad_norm": 0.5409442222602789,
"learning_rate": 4.4578444411505005e-06,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08053886890411377,
"step": 5405,
"valid_targets_mean": 5253.8,
"valid_targets_min": 2479
},
{
"epoch": 5.642670839853938,
"grad_norm": 0.5285523050183011,
"learning_rate": 4.425167066906777e-06,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07296570390462875,
"step": 5410,
"valid_targets_mean": 4937.6,
"valid_targets_min": 3123
},
{
"epoch": 5.647887323943662,
"grad_norm": 0.5416239529994494,
"learning_rate": 4.392594996751891e-06,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09565962851047516,
"step": 5415,
"valid_targets_mean": 5340.2,
"valid_targets_min": 3983
},
{
"epoch": 5.653103808033386,
"grad_norm": 0.5311968413285663,
"learning_rate": 4.360128450911154e-06,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0871681272983551,
"step": 5420,
"valid_targets_mean": 5207.1,
"valid_targets_min": 617
},
{
"epoch": 5.6583202921231095,
"grad_norm": 0.507054671436209,
"learning_rate": 4.3277676488963775e-06,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08645960688591003,
"step": 5425,
"valid_targets_mean": 5039.8,
"valid_targets_min": 1143
},
{
"epoch": 5.663536776212832,
"grad_norm": 0.568306365639052,
"learning_rate": 4.295512809504447e-06,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08979377150535583,
"step": 5430,
"valid_targets_mean": 5396.4,
"valid_targets_min": 1649
},
{
"epoch": 5.668753260302556,
"grad_norm": 0.5130604318115416,
"learning_rate": 4.263364150815803e-06,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06490998715162277,
"step": 5435,
"valid_targets_mean": 3744.5,
"valid_targets_min": 1432
},
{
"epoch": 5.67396974439228,
"grad_norm": 0.5692022571266344,
"learning_rate": 4.231321890192981e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10590483248233795,
"step": 5440,
"valid_targets_mean": 4565.5,
"valid_targets_min": 1410
},
{
"epoch": 5.679186228482003,
"grad_norm": 0.5957273632676808,
"learning_rate": 4.19938624427914e-06,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08738480508327484,
"step": 5445,
"valid_targets_mean": 4124.2,
"valid_targets_min": 2426
},
{
"epoch": 5.6844027125717265,
"grad_norm": 0.5059513068357104,
"learning_rate": 4.167557428996611e-06,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09112801402807236,
"step": 5450,
"valid_targets_mean": 4731.6,
"valid_targets_min": 2194
},
{
"epoch": 5.68961919666145,
"grad_norm": 0.5693590655270471,
"learning_rate": 4.135835659545406e-06,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09921035915613174,
"step": 5455,
"valid_targets_mean": 4494.1,
"valid_targets_min": 1559
},
{
"epoch": 5.694835680751174,
"grad_norm": 0.5024039878747486,
"learning_rate": 4.104221150401806e-06,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10560700297355652,
"step": 5460,
"valid_targets_mean": 6348.4,
"valid_targets_min": 1947
},
{
"epoch": 5.700052164840898,
"grad_norm": 0.4650548652863463,
"learning_rate": 4.072714115316863e-06,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06292714923620224,
"step": 5465,
"valid_targets_mean": 5174.2,
"valid_targets_min": 1897
},
{
"epoch": 5.705268648930621,
"grad_norm": 0.4486459885321795,
"learning_rate": 4.041314767314983e-06,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07271754741668701,
"step": 5470,
"valid_targets_mean": 5976.1,
"valid_targets_min": 2077
},
{
"epoch": 5.710485133020344,
"grad_norm": 0.5938653009407587,
"learning_rate": 4.010023318692502e-06,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09291598200798035,
"step": 5475,
"valid_targets_mean": 3675.5,
"valid_targets_min": 1525
},
{
"epoch": 5.715701617110068,
"grad_norm": 0.5328052077536234,
"learning_rate": 3.978839981016203e-06,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10603446513414383,
"step": 5480,
"valid_targets_mean": 5534.8,
"valid_targets_min": 1353
},
{
"epoch": 5.720918101199791,
"grad_norm": 0.5222740838976995,
"learning_rate": 3.947764965121934e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07417292892932892,
"step": 5485,
"valid_targets_mean": 4324.2,
"valid_targets_min": 1883
},
{
"epoch": 5.726134585289515,
"grad_norm": 0.5901115757033547,
"learning_rate": 3.916798481113144e-06,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09025438129901886,
"step": 5490,
"valid_targets_mean": 3641.8,
"valid_targets_min": 1759
},
{
"epoch": 5.731351069379238,
"grad_norm": 0.5857376932555667,
"learning_rate": 3.885940738359492e-06,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0782744288444519,
"step": 5495,
"valid_targets_mean": 3576.2,
"valid_targets_min": 1538
},
{
"epoch": 5.736567553468962,
"grad_norm": 0.47645456542263637,
"learning_rate": 3.855191945495405e-06,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0868457555770874,
"step": 5500,
"valid_targets_mean": 5765.2,
"valid_targets_min": 1375
},
{
"epoch": 5.741784037558686,
"grad_norm": 0.5236361251793296,
"learning_rate": 3.824552310418703e-06,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06546823680400848,
"step": 5505,
"valid_targets_mean": 5086.6,
"valid_targets_min": 2965
},
{
"epoch": 5.747000521648409,
"grad_norm": 0.5091732574059794,
"learning_rate": 3.794022040289147e-06,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07745197415351868,
"step": 5510,
"valid_targets_mean": 5054.1,
"valid_targets_min": 2306
},
{
"epoch": 5.7522170057381325,
"grad_norm": 0.46441623103319934,
"learning_rate": 3.763601341527088e-06,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07298596203327179,
"step": 5515,
"valid_targets_mean": 5433.0,
"valid_targets_min": 1438
},
{
"epoch": 5.757433489827856,
"grad_norm": 0.49641591292243104,
"learning_rate": 3.733290419812019e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08252263814210892,
"step": 5520,
"valid_targets_mean": 5315.5,
"valid_targets_min": 1678
},
{
"epoch": 5.762649973917579,
"grad_norm": 0.6789379381663515,
"learning_rate": 3.7030894800812365e-06,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10934539139270782,
"step": 5525,
"valid_targets_mean": 4483.8,
"valid_targets_min": 1772
},
{
"epoch": 5.767866458007303,
"grad_norm": 0.5423814329508395,
"learning_rate": 3.672998726528414e-06,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11362475156784058,
"step": 5530,
"valid_targets_mean": 5748.1,
"valid_targets_min": 2177
},
{
"epoch": 5.773082942097027,
"grad_norm": 0.5489625563953952,
"learning_rate": 3.6430183626022574e-06,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09776196628808975,
"step": 5535,
"valid_targets_mean": 6000.1,
"valid_targets_min": 3982
},
{
"epoch": 5.77829942618675,
"grad_norm": 0.6233184110121164,
"learning_rate": 3.613148591005071e-06,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08113294094800949,
"step": 5540,
"valid_targets_mean": 4493.1,
"valid_targets_min": 1197
},
{
"epoch": 5.783515910276473,
"grad_norm": 0.4822987640375631,
"learning_rate": 3.5833896136914705e-06,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07164439558982849,
"step": 5545,
"valid_targets_mean": 5387.6,
"valid_targets_min": 2047
},
{
"epoch": 5.788732394366197,
"grad_norm": 0.4749912986402253,
"learning_rate": 3.553741631866938e-06,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09115122258663177,
"step": 5550,
"valid_targets_mean": 6122.4,
"valid_targets_min": 2286
},
{
"epoch": 5.793948878455921,
"grad_norm": 0.5946909865400563,
"learning_rate": 3.524204845986523e-06,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08981865644454956,
"step": 5555,
"valid_targets_mean": 4332.4,
"valid_targets_min": 1866
},
{
"epoch": 5.7991653625456445,
"grad_norm": 0.4981777296421743,
"learning_rate": 3.494779455753443e-06,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07500408589839935,
"step": 5560,
"valid_targets_mean": 4568.4,
"valid_targets_min": 2141
},
{
"epoch": 5.804381846635367,
"grad_norm": 0.6142734821840982,
"learning_rate": 3.4654656601177482e-06,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10738922655582428,
"step": 5565,
"valid_targets_mean": 3865.8,
"valid_targets_min": 1623
},
{
"epoch": 5.809598330725091,
"grad_norm": 0.6888133941635042,
"learning_rate": 3.4362636572749984e-06,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09062996506690979,
"step": 5570,
"valid_targets_mean": 4535.8,
"valid_targets_min": 1079
},
{
"epoch": 5.814814814814815,
"grad_norm": 0.5144938987206906,
"learning_rate": 3.4071736446648805e-06,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08362233638763428,
"step": 5575,
"valid_targets_mean": 5688.2,
"valid_targets_min": 1588
},
{
"epoch": 5.820031298904539,
"grad_norm": 0.55001093740802,
"learning_rate": 3.3781958189699183e-06,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10185902565717697,
"step": 5580,
"valid_targets_mean": 5194.5,
"valid_targets_min": 2848
},
{
"epoch": 5.8252477829942615,
"grad_norm": 0.5048679008418444,
"learning_rate": 3.3493303761141016e-06,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08554618060588837,
"step": 5585,
"valid_targets_mean": 6494.1,
"valid_targets_min": 2608
},
{
"epoch": 5.830464267083985,
"grad_norm": 0.5470595580590045,
"learning_rate": 3.320577511261589e-06,
"loss": 0.1866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09496854245662689,
"step": 5590,
"valid_targets_mean": 5576.2,
"valid_targets_min": 3507
},
{
"epoch": 5.835680751173709,
"grad_norm": 0.52994182216623,
"learning_rate": 3.291937418815376e-06,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08456946909427643,
"step": 5595,
"valid_targets_mean": 3731.2,
"valid_targets_min": 1021
},
{
"epoch": 5.840897235263433,
"grad_norm": 0.5798170124783152,
"learning_rate": 3.2634102924159982e-06,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10535246133804321,
"step": 5600,
"valid_targets_mean": 4603.9,
"valid_targets_min": 1345
},
{
"epoch": 5.846113719353156,
"grad_norm": 0.5136604632732348,
"learning_rate": 3.2349963249401894e-06,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08853639662265778,
"step": 5605,
"valid_targets_mean": 5272.5,
"valid_targets_min": 2097
},
{
"epoch": 5.851330203442879,
"grad_norm": 0.5423322037998392,
"learning_rate": 3.2066957084996163e-06,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1070578321814537,
"step": 5610,
"valid_targets_mean": 5331.8,
"valid_targets_min": 3613
},
{
"epoch": 5.856546687532603,
"grad_norm": 0.5064494433132412,
"learning_rate": 3.178508634439539e-06,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07132753729820251,
"step": 5615,
"valid_targets_mean": 4434.9,
"valid_targets_min": 1705
},
{
"epoch": 5.861763171622327,
"grad_norm": 0.5051160365914387,
"learning_rate": 3.150435293337557e-06,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07303132116794586,
"step": 5620,
"valid_targets_mean": 4491.8,
"valid_targets_min": 1976
},
{
"epoch": 5.86697965571205,
"grad_norm": 0.5606453533642057,
"learning_rate": 3.1224758750022934e-06,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06995655596256256,
"step": 5625,
"valid_targets_mean": 4081.4,
"valid_targets_min": 1896
},
{
"epoch": 5.8721961398017735,
"grad_norm": 0.5653178986022215,
"learning_rate": 3.0946305684721145e-06,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09811203926801682,
"step": 5630,
"valid_targets_mean": 5245.2,
"valid_targets_min": 1947
},
{
"epoch": 5.877412623891497,
"grad_norm": 0.5252545759785076,
"learning_rate": 3.066899562013872e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07529449462890625,
"step": 5635,
"valid_targets_mean": 3975.2,
"valid_targets_min": 1194
},
{
"epoch": 5.882629107981221,
"grad_norm": 0.5433632880437022,
"learning_rate": 3.0392830431216037e-06,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07809676975011826,
"step": 5640,
"valid_targets_mean": 4935.0,
"valid_targets_min": 1503
},
{
"epoch": 5.887845592070944,
"grad_norm": 0.5289957385883606,
"learning_rate": 3.01178119851528e-06,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08336209505796432,
"step": 5645,
"valid_targets_mean": 4886.6,
"valid_targets_min": 1800
},
{
"epoch": 5.893062076160668,
"grad_norm": 0.5575156548605359,
"learning_rate": 2.9843942141395365e-06,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0846119076013565,
"step": 5650,
"valid_targets_mean": 3872.9,
"valid_targets_min": 1389
},
{
"epoch": 5.898278560250391,
"grad_norm": 0.5878385442301363,
"learning_rate": 2.9571222751624317e-06,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09252753853797913,
"step": 5655,
"valid_targets_mean": 4209.4,
"valid_targets_min": 2028
},
{
"epoch": 5.903495044340115,
"grad_norm": 0.551111216455573,
"learning_rate": 2.9299655659741622e-06,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09265060722827911,
"step": 5660,
"valid_targets_mean": 4456.5,
"valid_targets_min": 1219
},
{
"epoch": 5.908711528429838,
"grad_norm": 0.5820990540633043,
"learning_rate": 2.9029242701858606e-06,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08701181411743164,
"step": 5665,
"valid_targets_mean": 4254.0,
"valid_targets_min": 2724
},
{
"epoch": 5.913928012519562,
"grad_norm": 0.5226092777050476,
"learning_rate": 2.8759985706283068e-06,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08515148609876633,
"step": 5670,
"valid_targets_mean": 4590.4,
"valid_targets_min": 2366
},
{
"epoch": 5.919144496609285,
"grad_norm": 0.5971219829568228,
"learning_rate": 2.8491886493507313e-06,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10314597189426422,
"step": 5675,
"valid_targets_mean": 4606.9,
"valid_targets_min": 1281
},
{
"epoch": 5.924360980699009,
"grad_norm": 0.5665002869239318,
"learning_rate": 2.8224946876195593e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08449500799179077,
"step": 5680,
"valid_targets_mean": 4555.5,
"valid_targets_min": 1272
},
{
"epoch": 5.929577464788732,
"grad_norm": 0.6007551768138341,
"learning_rate": 2.795916865917201e-06,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.100425586104393,
"step": 5685,
"valid_targets_mean": 4430.6,
"valid_targets_min": 1239
},
{
"epoch": 5.934793948878456,
"grad_norm": 0.5553678028748384,
"learning_rate": 2.7694553639408163e-06,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09645190834999084,
"step": 5690,
"valid_targets_mean": 5136.9,
"valid_targets_min": 2097
},
{
"epoch": 5.9400104329681795,
"grad_norm": 0.5350257692219152,
"learning_rate": 2.7431103606011113e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07542605698108673,
"step": 5695,
"valid_targets_mean": 4592.1,
"valid_targets_min": 2235
},
{
"epoch": 5.945226917057903,
"grad_norm": 0.5370749848123485,
"learning_rate": 2.71688203402112e-06,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10020209103822708,
"step": 5700,
"valid_targets_mean": 4956.2,
"valid_targets_min": 2666
},
{
"epoch": 5.950443401147626,
"grad_norm": 0.5616035739838323,
"learning_rate": 2.690770561535019e-06,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1056441217660904,
"step": 5705,
"valid_targets_mean": 5587.0,
"valid_targets_min": 3696
},
{
"epoch": 5.95565988523735,
"grad_norm": 0.505396409620737,
"learning_rate": 2.664776119686896e-06,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06738579273223877,
"step": 5710,
"valid_targets_mean": 4772.8,
"valid_targets_min": 1612
},
{
"epoch": 5.960876369327074,
"grad_norm": 0.558148133432388,
"learning_rate": 2.6388988842295947e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08058644086122513,
"step": 5715,
"valid_targets_mean": 3943.5,
"valid_targets_min": 1629
},
{
"epoch": 5.966092853416797,
"grad_norm": 0.49142281395227094,
"learning_rate": 2.6131390301234927e-06,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08975610136985779,
"step": 5720,
"valid_targets_mean": 6229.9,
"valid_targets_min": 3962
},
{
"epoch": 5.97130933750652,
"grad_norm": 0.5127563839312393,
"learning_rate": 2.587496731535326e-06,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08209004998207092,
"step": 5725,
"valid_targets_mean": 5349.5,
"valid_targets_min": 3091
},
{
"epoch": 5.976525821596244,
"grad_norm": 0.5870781435714937,
"learning_rate": 2.561972161837041e-06,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09318692982196808,
"step": 5730,
"valid_targets_mean": 4410.8,
"valid_targets_min": 2042
},
{
"epoch": 5.981742305685968,
"grad_norm": 0.5331167201677213,
"learning_rate": 2.536565493604575e-06,
"loss": 0.1869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11014723777770996,
"step": 5735,
"valid_targets_mean": 6198.2,
"valid_targets_min": 4202
},
{
"epoch": 5.9869587897756915,
"grad_norm": 0.5217330036417076,
"learning_rate": 2.511276898616737e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09141227602958679,
"step": 5740,
"valid_targets_mean": 5061.2,
"valid_targets_min": 1855
},
{
"epoch": 5.992175273865414,
"grad_norm": 0.7628287327814164,
"learning_rate": 2.4861065478539925e-06,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09051162749528885,
"step": 5745,
"valid_targets_mean": 4572.0,
"valid_targets_min": 2408
},
{
"epoch": 5.997391757955138,
"grad_norm": 0.5412099702884833,
"learning_rate": 2.4610546114973666e-06,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08535590022802353,
"step": 5750,
"valid_targets_mean": 4914.4,
"valid_targets_min": 2299
},
{
"epoch": 6.002086593635889,
"grad_norm": 0.5666885471819875,
"learning_rate": 2.4361212589272488e-06,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09032214432954788,
"step": 5755,
"valid_targets_mean": 3914.6,
"valid_targets_min": 1557
},
{
"epoch": 6.007303077725613,
"grad_norm": 0.6348974302582981,
"learning_rate": 2.41130665872227e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09823325276374817,
"step": 5760,
"valid_targets_mean": 3898.2,
"valid_targets_min": 2288
},
{
"epoch": 6.012519561815337,
"grad_norm": 0.5197451846846918,
"learning_rate": 2.3866109786581484e-06,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08300504088401794,
"step": 5765,
"valid_targets_mean": 5492.9,
"valid_targets_min": 2909
},
{
"epoch": 6.01773604590506,
"grad_norm": 0.5408708311715636,
"learning_rate": 2.3620343857065776e-06,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09408125281333923,
"step": 5770,
"valid_targets_mean": 5499.2,
"valid_targets_min": 2076
},
{
"epoch": 6.022952529994783,
"grad_norm": 0.5192312881257993,
"learning_rate": 2.3375770460340654e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06746099889278412,
"step": 5775,
"valid_targets_mean": 3975.4,
"valid_targets_min": 501
},
{
"epoch": 6.028169014084507,
"grad_norm": 0.5604784350505317,
"learning_rate": 2.313239125000841e-06,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07895144820213318,
"step": 5780,
"valid_targets_mean": 5031.9,
"valid_targets_min": 1614
},
{
"epoch": 6.033385498174231,
"grad_norm": 0.6306239061423632,
"learning_rate": 2.2890207871597192e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0700065940618515,
"step": 5785,
"valid_targets_mean": 4056.4,
"valid_targets_min": 1135
},
{
"epoch": 6.0386019822639545,
"grad_norm": 0.5089884137450019,
"learning_rate": 2.2649221962549905e-06,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07413844764232635,
"step": 5790,
"valid_targets_mean": 3877.6,
"valid_targets_min": 1967
},
{
"epoch": 6.043818466353677,
"grad_norm": 0.5490139284297806,
"learning_rate": 2.2409435152213123e-06,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07719350606203079,
"step": 5795,
"valid_targets_mean": 4704.6,
"valid_targets_min": 1875
},
{
"epoch": 6.049034950443401,
"grad_norm": 0.5200749426838338,
"learning_rate": 2.217084906182629e-06,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09560975432395935,
"step": 5800,
"valid_targets_mean": 4587.0,
"valid_targets_min": 2004
},
{
"epoch": 6.054251434533125,
"grad_norm": 0.5279382480355144,
"learning_rate": 2.1933465304510394e-06,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07469984143972397,
"step": 5805,
"valid_targets_mean": 4616.1,
"valid_targets_min": 2787
},
{
"epoch": 6.059467918622849,
"grad_norm": 0.5220287099547348,
"learning_rate": 2.1697285485257245e-06,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08868516981601715,
"step": 5810,
"valid_targets_mean": 5075.2,
"valid_targets_min": 2445
},
{
"epoch": 6.0646844027125715,
"grad_norm": 0.46278683097215284,
"learning_rate": 2.1462311200918816e-06,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08032315969467163,
"step": 5815,
"valid_targets_mean": 6912.1,
"valid_targets_min": 4191
},
{
"epoch": 6.069900886802295,
"grad_norm": 0.5398578125617447,
"learning_rate": 2.122854404019601e-06,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08614116907119751,
"step": 5820,
"valid_targets_mean": 5010.5,
"valid_targets_min": 1165
},
{
"epoch": 6.075117370892019,
"grad_norm": 0.5510448083868443,
"learning_rate": 2.0995985583628366e-06,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08615755289793015,
"step": 5825,
"valid_targets_mean": 4735.5,
"valid_targets_min": 2360
},
{
"epoch": 6.080333854981743,
"grad_norm": 0.5286206981684528,
"learning_rate": 2.076463740358299e-06,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07922375202178955,
"step": 5830,
"valid_targets_mean": 4719.9,
"valid_targets_min": 1278
},
{
"epoch": 6.085550339071466,
"grad_norm": 0.542601600303056,
"learning_rate": 2.053450106424426e-06,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09550304710865021,
"step": 5835,
"valid_targets_mean": 5393.1,
"valid_targets_min": 2149
},
{
"epoch": 6.090766823161189,
"grad_norm": 0.5306422592987686,
"learning_rate": 2.030557812160301e-06,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07130551338195801,
"step": 5840,
"valid_targets_mean": 5550.6,
"valid_targets_min": 2537
},
{
"epoch": 6.095983307250913,
"grad_norm": 0.5524670056940677,
"learning_rate": 2.0077870123446107e-06,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09660788625478745,
"step": 5845,
"valid_targets_mean": 5510.6,
"valid_targets_min": 3218
},
{
"epoch": 6.101199791340637,
"grad_norm": 0.6028201350072254,
"learning_rate": 1.985137860934594e-06,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0916367769241333,
"step": 5850,
"valid_targets_mean": 4280.0,
"valid_targets_min": 2785
},
{
"epoch": 6.10641627543036,
"grad_norm": 0.6232053815595153,
"learning_rate": 1.962610511065013e-06,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10127604007720947,
"step": 5855,
"valid_targets_mean": 4280.5,
"valid_targets_min": 2726
},
{
"epoch": 6.1116327595200834,
"grad_norm": 0.619280822162956,
"learning_rate": 1.940205115047098e-06,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12848986685276031,
"step": 5860,
"valid_targets_mean": 4106.4,
"valid_targets_min": 1269
},
{
"epoch": 6.116849243609807,
"grad_norm": 0.5292656123250503,
"learning_rate": 1.917921824367539e-06,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08275945484638214,
"step": 5865,
"valid_targets_mean": 4719.5,
"valid_targets_min": 1832
},
{
"epoch": 6.122065727699531,
"grad_norm": 0.5288161525038574,
"learning_rate": 1.8957607896874419e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08273669332265854,
"step": 5870,
"valid_targets_mean": 5099.6,
"valid_targets_min": 3109
},
{
"epoch": 6.127282211789254,
"grad_norm": 0.5663131444928124,
"learning_rate": 1.8737221608413314e-06,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07949776947498322,
"step": 5875,
"valid_targets_mean": 4202.1,
"valid_targets_min": 1950
},
{
"epoch": 6.132498695878978,
"grad_norm": 0.5866117096283481,
"learning_rate": 1.8518060868361099e-06,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07808201014995575,
"step": 5880,
"valid_targets_mean": 4536.1,
"valid_targets_min": 2511
},
{
"epoch": 6.137715179968701,
"grad_norm": 0.5630696018312298,
"learning_rate": 1.8300127158500714e-06,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09297695755958557,
"step": 5885,
"valid_targets_mean": 4877.8,
"valid_targets_min": 1476
},
{
"epoch": 6.142931664058425,
"grad_norm": 0.5508892680415837,
"learning_rate": 1.8083421952319047e-06,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08836787194013596,
"step": 5890,
"valid_targets_mean": 4473.0,
"valid_targets_min": 1981
},
{
"epoch": 6.148148148148148,
"grad_norm": 0.4665790269124101,
"learning_rate": 1.786794671499672e-06,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08136850595474243,
"step": 5895,
"valid_targets_mean": 6519.1,
"valid_targets_min": 2308
},
{
"epoch": 6.153364632237872,
"grad_norm": 0.5891418596351246,
"learning_rate": 1.7653702903398384e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0934087485074997,
"step": 5900,
"valid_targets_mean": 5352.8,
"valid_targets_min": 3204
},
{
"epoch": 6.158581116327595,
"grad_norm": 0.5608103296545519,
"learning_rate": 1.7440691966062816e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08997437357902527,
"step": 5905,
"valid_targets_mean": 4794.9,
"valid_targets_min": 2556
},
{
"epoch": 6.163797600417318,
"grad_norm": 0.5098134796184438,
"learning_rate": 1.722891534319313e-06,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06943631917238235,
"step": 5910,
"valid_targets_mean": 4535.1,
"valid_targets_min": 1853
},
{
"epoch": 6.169014084507042,
"grad_norm": 0.526164578027781,
"learning_rate": 1.7018374466646981e-06,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07023682445287704,
"step": 5915,
"valid_targets_mean": 3967.6,
"valid_targets_min": 981
},
{
"epoch": 6.174230568596766,
"grad_norm": 0.457588070414583,
"learning_rate": 1.6809070759927015e-06,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0662381500005722,
"step": 5920,
"valid_targets_mean": 5071.5,
"valid_targets_min": 1691
},
{
"epoch": 6.1794470526864895,
"grad_norm": 0.5283325738816248,
"learning_rate": 1.6601005638171065e-06,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07992766052484512,
"step": 5925,
"valid_targets_mean": 4880.5,
"valid_targets_min": 1822
},
{
"epoch": 6.184663536776213,
"grad_norm": 0.5747524763800537,
"learning_rate": 1.639418050814281e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08078983426094055,
"step": 5930,
"valid_targets_mean": 4498.0,
"valid_targets_min": 1281
},
{
"epoch": 6.189880020865936,
"grad_norm": 0.6198787612885583,
"learning_rate": 1.6188596768221976e-06,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08396267890930176,
"step": 5935,
"valid_targets_mean": 4227.2,
"valid_targets_min": 2318
},
{
"epoch": 6.19509650495566,
"grad_norm": 0.5888969905988224,
"learning_rate": 1.5984255808395198e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07747550308704376,
"step": 5940,
"valid_targets_mean": 3874.4,
"valid_targets_min": 2695
},
{
"epoch": 6.200312989045384,
"grad_norm": 0.6054536148347041,
"learning_rate": 1.5781159010246306e-06,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08089844882488251,
"step": 5945,
"valid_targets_mean": 4071.9,
"valid_targets_min": 2128
},
{
"epoch": 6.2055294731351065,
"grad_norm": 0.5858727701096971,
"learning_rate": 1.557930774694727e-06,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08756640553474426,
"step": 5950,
"valid_targets_mean": 4455.8,
"valid_targets_min": 1541
},
{
"epoch": 6.21074595722483,
"grad_norm": 0.5025857589454156,
"learning_rate": 1.5378703383248694e-06,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06149665266275406,
"step": 5955,
"valid_targets_mean": 4103.9,
"valid_targets_min": 2589
},
{
"epoch": 6.215962441314554,
"grad_norm": 0.5378682703982972,
"learning_rate": 1.5179347275470812e-06,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07153839617967606,
"step": 5960,
"valid_targets_mean": 4121.4,
"valid_targets_min": 2355
},
{
"epoch": 6.221178925404278,
"grad_norm": 0.5349205613738541,
"learning_rate": 1.4981240771494032e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08590535074472427,
"step": 5965,
"valid_targets_mean": 5365.2,
"valid_targets_min": 1035
},
{
"epoch": 6.2263954094940015,
"grad_norm": 0.5325294007196091,
"learning_rate": 1.4784385210750052e-06,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08586692810058594,
"step": 5970,
"valid_targets_mean": 5268.0,
"valid_targets_min": 2695
},
{
"epoch": 6.231611893583724,
"grad_norm": 0.4855600868655522,
"learning_rate": 1.458878192421278e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08848752081394196,
"step": 5975,
"valid_targets_mean": 6680.2,
"valid_targets_min": 4403
},
{
"epoch": 6.236828377673448,
"grad_norm": 0.6015572517875324,
"learning_rate": 1.4394432234389167e-06,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09191454201936722,
"step": 5980,
"valid_targets_mean": 4356.5,
"valid_targets_min": 1719
},
{
"epoch": 6.242044861763172,
"grad_norm": 0.4402990787358173,
"learning_rate": 1.4201337455310537e-06,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06941086053848267,
"step": 5985,
"valid_targets_mean": 6787.0,
"valid_targets_min": 2317
},
{
"epoch": 6.247261345852895,
"grad_norm": 0.5872346587921095,
"learning_rate": 1.4009498892523388e-06,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08713740855455399,
"step": 5990,
"valid_targets_mean": 3955.1,
"valid_targets_min": 1153
},
{
"epoch": 6.2524778299426185,
"grad_norm": 0.5316055760875934,
"learning_rate": 1.3818917843080848e-06,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09362940490245819,
"step": 5995,
"valid_targets_mean": 5888.6,
"valid_targets_min": 2046
},
{
"epoch": 6.257694314032342,
"grad_norm": 0.5763307643943745,
"learning_rate": 1.3629595595533673e-06,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09008698165416718,
"step": 6000,
"valid_targets_mean": 4186.6,
"valid_targets_min": 2044
},
{
"epoch": 6.262910798122066,
"grad_norm": 0.49631777502298174,
"learning_rate": 1.3441533429921804e-06,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08558864891529083,
"step": 6005,
"valid_targets_mean": 6150.6,
"valid_targets_min": 1425
},
{
"epoch": 6.26812728221179,
"grad_norm": 0.542934183154514,
"learning_rate": 1.3254732617765375e-06,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0806925892829895,
"step": 6010,
"valid_targets_mean": 5129.9,
"valid_targets_min": 1893
},
{
"epoch": 6.273343766301513,
"grad_norm": 0.597025228662152,
"learning_rate": 1.3069194422056454e-06,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09697069227695465,
"step": 6015,
"valid_targets_mean": 4211.5,
"valid_targets_min": 1074
},
{
"epoch": 6.278560250391236,
"grad_norm": 0.568551323103317,
"learning_rate": 1.2884920097250197e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08361931890249252,
"step": 6020,
"valid_targets_mean": 3935.1,
"valid_targets_min": 1387
},
{
"epoch": 6.28377673448096,
"grad_norm": 0.5386832032057025,
"learning_rate": 1.2701910889256651e-06,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07516301423311234,
"step": 6025,
"valid_targets_mean": 4690.6,
"valid_targets_min": 1490
},
{
"epoch": 6.288993218570683,
"grad_norm": 0.5096384905174148,
"learning_rate": 1.2520168035432102e-06,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06578829884529114,
"step": 6030,
"valid_targets_mean": 4611.1,
"valid_targets_min": 3188
},
{
"epoch": 6.294209702660407,
"grad_norm": 0.5078443664032133,
"learning_rate": 1.2339692764570853e-06,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08106677234172821,
"step": 6035,
"valid_targets_mean": 5301.2,
"valid_targets_min": 2076
},
{
"epoch": 6.29942618675013,
"grad_norm": 0.6013232433244711,
"learning_rate": 1.2160486296896834e-06,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08288998156785965,
"step": 6040,
"valid_targets_mean": 3733.9,
"valid_targets_min": 1111
},
{
"epoch": 6.304642670839854,
"grad_norm": 0.5419758577541648,
"learning_rate": 1.198254984405538e-06,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09677646309137344,
"step": 6045,
"valid_targets_mean": 4574.4,
"valid_targets_min": 2195
},
{
"epoch": 6.309859154929577,
"grad_norm": 0.5446277500236966,
"learning_rate": 1.1805884609105012e-06,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09340253472328186,
"step": 6050,
"valid_targets_mean": 4646.2,
"valid_targets_min": 1737
},
{
"epoch": 6.315075639019301,
"grad_norm": 0.5243574814276308,
"learning_rate": 1.1630491786509457e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07701204717159271,
"step": 6055,
"valid_targets_mean": 5141.8,
"valid_targets_min": 2266
},
{
"epoch": 6.3202921231090246,
"grad_norm": 0.6435320951413327,
"learning_rate": 1.1456372562129281e-06,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08175545930862427,
"step": 6060,
"valid_targets_mean": 5562.0,
"valid_targets_min": 1603
},
{
"epoch": 6.325508607198748,
"grad_norm": 0.5265813662985552,
"learning_rate": 1.1283528113214114e-06,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08022892475128174,
"step": 6065,
"valid_targets_mean": 4575.2,
"valid_targets_min": 208
},
{
"epoch": 6.330725091288471,
"grad_norm": 0.5119238855169547,
"learning_rate": 1.1111959608394662e-06,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061150819063186646,
"step": 6070,
"valid_targets_mean": 4400.9,
"valid_targets_min": 2043
},
{
"epoch": 6.335941575378195,
"grad_norm": 0.5238475909765726,
"learning_rate": 1.094166820767464e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07575885951519012,
"step": 6075,
"valid_targets_mean": 5175.4,
"valid_targets_min": 2431
},
{
"epoch": 6.341158059467919,
"grad_norm": 0.5587142799014,
"learning_rate": 1.0772655062423176e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07077431678771973,
"step": 6080,
"valid_targets_mean": 4443.2,
"valid_targets_min": 1914
},
{
"epoch": 6.346374543557642,
"grad_norm": 0.612857706137813,
"learning_rate": 1.0604921315366767e-06,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08608610928058624,
"step": 6085,
"valid_targets_mean": 4559.0,
"valid_targets_min": 1757
},
{
"epoch": 6.351591027647365,
"grad_norm": 0.6670742752657252,
"learning_rate": 1.0438468100581823e-06,
"loss": 0.1899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11555208265781403,
"step": 6090,
"valid_targets_mean": 3916.6,
"valid_targets_min": 2320
},
{
"epoch": 6.356807511737089,
"grad_norm": 0.5332052239349687,
"learning_rate": 1.027329654348672e-06,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06971243023872375,
"step": 6095,
"valid_targets_mean": 3657.0,
"valid_targets_min": 1091
},
{
"epoch": 6.362023995826813,
"grad_norm": 0.5501198346395842,
"learning_rate": 1.01094077608344e-06,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09527956694364548,
"step": 6100,
"valid_targets_mean": 5293.6,
"valid_targets_min": 1475
},
{
"epoch": 6.3672404799165365,
"grad_norm": 0.7035339378264363,
"learning_rate": 9.946802860704706e-07,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0827580913901329,
"step": 6105,
"valid_targets_mean": 4001.9,
"valid_targets_min": 1451
},
{
"epoch": 6.372456964006259,
"grad_norm": 0.493625895550495,
"learning_rate": 9.785482942497037e-07,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07613112032413483,
"step": 6110,
"valid_targets_mean": 4524.5,
"valid_targets_min": 1899
},
{
"epoch": 6.377673448095983,
"grad_norm": 0.5241022319748064,
"learning_rate": 9.625449096922667e-07,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09136146306991577,
"step": 6115,
"valid_targets_mean": 5662.6,
"valid_targets_min": 3728
},
{
"epoch": 6.382889932185707,
"grad_norm": 1.0353966703876931,
"learning_rate": 9.466702405997674e-07,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.067151740193367,
"step": 6120,
"valid_targets_mean": 3555.2,
"valid_targets_min": 1302
},
{
"epoch": 6.388106416275431,
"grad_norm": 0.5746423268370077,
"learning_rate": 9.309243943035295e-07,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09859921038150787,
"step": 6125,
"valid_targets_mean": 4599.2,
"valid_targets_min": 3171
},
{
"epoch": 6.3933229003651535,
"grad_norm": 0.6544515306472833,
"learning_rate": 9.153074772638937e-07,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.096698097884655,
"step": 6130,
"valid_targets_mean": 4089.5,
"valid_targets_min": 1654
},
{
"epoch": 6.398539384454877,
"grad_norm": 0.5566676155158136,
"learning_rate": 8.99819595069491e-07,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1017160415649414,
"step": 6135,
"valid_targets_mean": 5410.6,
"valid_targets_min": 1624
},
{
"epoch": 6.403755868544601,
"grad_norm": 0.5230990896861292,
"learning_rate": 8.844608524365172e-07,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08459442108869553,
"step": 6140,
"valid_targets_mean": 5277.2,
"valid_targets_min": 2523
},
{
"epoch": 6.408972352634325,
"grad_norm": 0.5274707382276024,
"learning_rate": 8.692313532080443e-07,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07985209673643112,
"step": 6145,
"valid_targets_mean": 5341.5,
"valid_targets_min": 2441
},
{
"epoch": 6.414188836724048,
"grad_norm": 0.5416031184874927,
"learning_rate": 8.54131200353292e-07,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08388903737068176,
"step": 6150,
"valid_targets_mean": 5301.2,
"valid_targets_min": 1152
},
{
"epoch": 6.419405320813771,
"grad_norm": 0.5391134609004025,
"learning_rate": 8.391604959669619e-07,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07807138562202454,
"step": 6155,
"valid_targets_mean": 4546.0,
"valid_targets_min": 1655
},
{
"epoch": 6.424621804903495,
"grad_norm": 0.4960672468122204,
"learning_rate": 8.243193412685246e-07,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07477937638759613,
"step": 6160,
"valid_targets_mean": 5704.6,
"valid_targets_min": 3157
},
{
"epoch": 6.429838288993219,
"grad_norm": 0.5500642984629969,
"learning_rate": 8.096078366015514e-07,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0865449458360672,
"step": 6165,
"valid_targets_mean": 5272.1,
"valid_targets_min": 2280
},
{
"epoch": 6.435054773082942,
"grad_norm": 0.4982969915490319,
"learning_rate": 7.950260814330169e-07,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07472272962331772,
"step": 6170,
"valid_targets_mean": 4460.2,
"valid_targets_min": 1878
},
{
"epoch": 6.4402712571726655,
"grad_norm": 0.5341667921203153,
"learning_rate": 7.805741743526441e-07,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0895976796746254,
"step": 6175,
"valid_targets_mean": 5404.6,
"valid_targets_min": 2367
},
{
"epoch": 6.445487741262389,
"grad_norm": 0.5492125654290198,
"learning_rate": 7.662522130722294e-07,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07540404051542282,
"step": 6180,
"valid_targets_mean": 4739.1,
"valid_targets_min": 1735
},
{
"epoch": 6.450704225352113,
"grad_norm": 0.5358545190242257,
"learning_rate": 7.520602944249855e-07,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10180626064538956,
"step": 6185,
"valid_targets_mean": 5684.0,
"valid_targets_min": 1306
},
{
"epoch": 6.455920709441836,
"grad_norm": 0.5091791636322476,
"learning_rate": 7.379985143648815e-07,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058316584676504135,
"step": 6190,
"valid_targets_mean": 4836.5,
"valid_targets_min": 1569
},
{
"epoch": 6.46113719353156,
"grad_norm": 0.5586442466521836,
"learning_rate": 7.240669679660017e-07,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09539739787578583,
"step": 6195,
"valid_targets_mean": 5895.9,
"valid_targets_min": 3541
},
{
"epoch": 6.466353677621283,
"grad_norm": 0.5006232216627376,
"learning_rate": 7.102657494218879e-07,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06938563287258148,
"step": 6200,
"valid_targets_mean": 4634.5,
"valid_targets_min": 1128
},
{
"epoch": 6.471570161711007,
"grad_norm": 0.5546239126291488,
"learning_rate": 6.965949520449311e-07,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0821041464805603,
"step": 6205,
"valid_targets_mean": 5086.8,
"valid_targets_min": 1856
},
{
"epoch": 6.47678664580073,
"grad_norm": 0.4910903623028209,
"learning_rate": 6.830546682657035e-07,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07834288477897644,
"step": 6210,
"valid_targets_mean": 5048.6,
"valid_targets_min": 2940
},
{
"epoch": 6.482003129890454,
"grad_norm": 0.554755174369064,
"learning_rate": 6.696449896323698e-07,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08156804740428925,
"step": 6215,
"valid_targets_mean": 4262.4,
"valid_targets_min": 1410
},
{
"epoch": 6.487219613980177,
"grad_norm": 0.5793166829491566,
"learning_rate": 6.563660068100408e-07,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08402011543512344,
"step": 6220,
"valid_targets_mean": 3359.8,
"valid_targets_min": 1691
},
{
"epoch": 6.492436098069901,
"grad_norm": 0.5586393784517392,
"learning_rate": 6.432178095801678e-07,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09661173820495605,
"step": 6225,
"valid_targets_mean": 4351.2,
"valid_targets_min": 2666
},
{
"epoch": 6.497652582159624,
"grad_norm": 0.5716779271221131,
"learning_rate": 6.302004868399514e-07,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07923077046871185,
"step": 6230,
"valid_targets_mean": 3839.8,
"valid_targets_min": 530
},
{
"epoch": 6.502869066249348,
"grad_norm": 0.5753569634982648,
"learning_rate": 6.173141266017113e-07,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07147848606109619,
"step": 6235,
"valid_targets_mean": 3394.2,
"valid_targets_min": 1401
},
{
"epoch": 6.5080855503390715,
"grad_norm": 0.5245411730700712,
"learning_rate": 6.045588159923266e-07,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08123113214969635,
"step": 6240,
"valid_targets_mean": 5400.9,
"valid_targets_min": 3096
},
{
"epoch": 6.513302034428795,
"grad_norm": 0.5374981308134168,
"learning_rate": 5.919346412526117e-07,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08702099323272705,
"step": 6245,
"valid_targets_mean": 5240.4,
"valid_targets_min": 1771
},
{
"epoch": 6.518518518518518,
"grad_norm": 0.5926256551419858,
"learning_rate": 5.794416877367526e-07,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07396068423986435,
"step": 6250,
"valid_targets_mean": 3938.5,
"valid_targets_min": 2393
},
{
"epoch": 6.523735002608242,
"grad_norm": 0.5130895160388712,
"learning_rate": 5.670800399117316e-07,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08972735702991486,
"step": 6255,
"valid_targets_mean": 5926.8,
"valid_targets_min": 2193
},
{
"epoch": 6.528951486697966,
"grad_norm": 0.6837534994812857,
"learning_rate": 5.548497813567455e-07,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09018000960350037,
"step": 6260,
"valid_targets_mean": 4145.4,
"valid_targets_min": 2124
},
{
"epoch": 6.534167970787689,
"grad_norm": 0.5858320399320168,
"learning_rate": 5.427509947626486e-07,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06871044635772705,
"step": 6265,
"valid_targets_mean": 4609.0,
"valid_targets_min": 1686
},
{
"epoch": 6.539384454877412,
"grad_norm": 0.9369134981527133,
"learning_rate": 5.307837619313949e-07,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09468284249305725,
"step": 6270,
"valid_targets_mean": 4776.0,
"valid_targets_min": 1565
},
{
"epoch": 6.544600938967136,
"grad_norm": 0.4906643606770716,
"learning_rate": 5.189481637754679e-07,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06301077455282211,
"step": 6275,
"valid_targets_mean": 4904.9,
"valid_targets_min": 2530
},
{
"epoch": 6.54981742305686,
"grad_norm": 0.5299721524580903,
"learning_rate": 5.072442803173649e-07,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0912301167845726,
"step": 6280,
"valid_targets_mean": 4950.5,
"valid_targets_min": 1084
},
{
"epoch": 6.5550339071465835,
"grad_norm": 0.6255622891103191,
"learning_rate": 4.956721906890228e-07,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09659097343683243,
"step": 6285,
"valid_targets_mean": 4950.6,
"valid_targets_min": 1533
},
{
"epoch": 6.560250391236306,
"grad_norm": 0.6174968011521565,
"learning_rate": 4.842319731313016e-07,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10585039108991623,
"step": 6290,
"valid_targets_mean": 4290.8,
"valid_targets_min": 1528
},
{
"epoch": 6.56546687532603,
"grad_norm": 0.5861852083749461,
"learning_rate": 4.729237049934621e-07,
"loss": 0.1682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08830663561820984,
"step": 6295,
"valid_targets_mean": 4821.6,
"valid_targets_min": 1612
},
{
"epoch": 6.570683359415754,
"grad_norm": 0.5463462106108242,
"learning_rate": 4.6174746273261793e-07,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08798755705356598,
"step": 6300,
"valid_targets_mean": 4962.6,
"valid_targets_min": 1741
},
{
"epoch": 6.575899843505478,
"grad_norm": 0.5532379866364969,
"learning_rate": 4.507033219132395e-07,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07625909149646759,
"step": 6305,
"valid_targets_mean": 4648.1,
"valid_targets_min": 2171
},
{
"epoch": 6.5811163275952005,
"grad_norm": 0.5065410208057752,
"learning_rate": 4.3979135720664035e-07,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06727365404367447,
"step": 6310,
"valid_targets_mean": 5517.6,
"valid_targets_min": 2833
},
{
"epoch": 6.586332811684924,
"grad_norm": 0.5493744454932743,
"learning_rate": 4.2901164239046443e-07,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09966464340686798,
"step": 6315,
"valid_targets_mean": 5292.9,
"valid_targets_min": 3144
},
{
"epoch": 6.591549295774648,
"grad_norm": 0.5761969297622763,
"learning_rate": 4.1836425034819106e-07,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08473914861679077,
"step": 6320,
"valid_targets_mean": 4597.6,
"valid_targets_min": 2802
},
{
"epoch": 6.596765779864372,
"grad_norm": 0.7363640904744337,
"learning_rate": 4.078492530686506e-07,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08203506469726562,
"step": 6325,
"valid_targets_mean": 3774.4,
"valid_targets_min": 1338
},
{
"epoch": 6.601982263954095,
"grad_norm": 0.5094006763949639,
"learning_rate": 3.9746672164551856e-07,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07795064151287079,
"step": 6330,
"valid_targets_mean": 5433.5,
"valid_targets_min": 1882
},
{
"epoch": 6.607198748043818,
"grad_norm": 0.6061614255410304,
"learning_rate": 3.872167262768578e-07,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07970091700553894,
"step": 6335,
"valid_targets_mean": 4424.8,
"valid_targets_min": 637
},
{
"epoch": 6.612415232133542,
"grad_norm": 0.505158025715867,
"learning_rate": 3.7709933626461916e-07,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07546493411064148,
"step": 6340,
"valid_targets_mean": 4831.2,
"valid_targets_min": 2092
},
{
"epoch": 6.617631716223266,
"grad_norm": 0.48956541874495973,
"learning_rate": 3.671146200142017e-07,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08042104542255402,
"step": 6345,
"valid_targets_mean": 6330.6,
"valid_targets_min": 3720
},
{
"epoch": 6.622848200312989,
"grad_norm": 0.552499065585299,
"learning_rate": 3.5726264503396e-07,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0773078203201294,
"step": 6350,
"valid_targets_mean": 4676.6,
"valid_targets_min": 1059
},
{
"epoch": 6.6280646844027125,
"grad_norm": 0.5241665236185439,
"learning_rate": 3.475434779347731e-07,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08315479755401611,
"step": 6355,
"valid_targets_mean": 4854.5,
"valid_targets_min": 2492
},
{
"epoch": 6.633281168492436,
"grad_norm": 0.5229494178000254,
"learning_rate": 3.3795718442957593e-07,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07639910280704498,
"step": 6360,
"valid_targets_mean": 4369.9,
"valid_targets_min": 2310
},
{
"epoch": 6.63849765258216,
"grad_norm": 0.6365838431533449,
"learning_rate": 3.2850382933292903e-07,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06544691324234009,
"step": 6365,
"valid_targets_mean": 4716.8,
"valid_targets_min": 1774
},
{
"epoch": 6.643714136671883,
"grad_norm": 0.6078803116735846,
"learning_rate": 3.1918347656056946e-07,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08977963775396347,
"step": 6370,
"valid_targets_mean": 4123.0,
"valid_targets_min": 2271
},
{
"epoch": 6.648930620761607,
"grad_norm": 0.5502228136170516,
"learning_rate": 3.0999618912898267e-07,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08217453956604004,
"step": 6375,
"valid_targets_mean": 5216.9,
"valid_targets_min": 2267
},
{
"epoch": 6.65414710485133,
"grad_norm": 0.4903820521932893,
"learning_rate": 3.009420291549825e-07,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07962026447057724,
"step": 6380,
"valid_targets_mean": 6445.1,
"valid_targets_min": 1973
},
{
"epoch": 6.659363588941054,
"grad_norm": 0.6635091094279434,
"learning_rate": 2.9202105785527623e-07,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10168874263763428,
"step": 6385,
"valid_targets_mean": 3914.8,
"valid_targets_min": 2387
},
{
"epoch": 6.664580073030777,
"grad_norm": 0.5674026350366216,
"learning_rate": 2.8323333554606923e-07,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09658002853393555,
"step": 6390,
"valid_targets_mean": 5366.6,
"valid_targets_min": 2041
},
{
"epoch": 6.669796557120501,
"grad_norm": 0.5317292589938676,
"learning_rate": 2.745789216426387e-07,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07777095586061478,
"step": 6395,
"valid_targets_mean": 4769.0,
"valid_targets_min": 2111
},
{
"epoch": 6.675013041210224,
"grad_norm": 0.6203666831879747,
"learning_rate": 2.660578746589515e-07,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09512919187545776,
"step": 6400,
"valid_targets_mean": 4147.4,
"valid_targets_min": 1817
},
{
"epoch": 6.680229525299948,
"grad_norm": 0.6113606882976234,
"learning_rate": 2.5767025220724717e-07,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10862178355455399,
"step": 6405,
"valid_targets_mean": 5514.9,
"valid_targets_min": 2444
},
{
"epoch": 6.685446009389671,
"grad_norm": 0.5684941882814628,
"learning_rate": 2.4941611099766896e-07,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07307954132556915,
"step": 6410,
"valid_targets_mean": 4531.8,
"valid_targets_min": 1787
},
{
"epoch": 6.690662493479395,
"grad_norm": 0.5125407630567089,
"learning_rate": 2.4129550683786194e-07,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07515746355056763,
"step": 6415,
"valid_targets_mean": 4874.9,
"valid_targets_min": 2187
},
{
"epoch": 6.6958789775691185,
"grad_norm": 0.5153495108176748,
"learning_rate": 2.3330849463261363e-07,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0719965398311615,
"step": 6420,
"valid_targets_mean": 3854.9,
"valid_targets_min": 698
},
{
"epoch": 6.701095461658842,
"grad_norm": 0.5176861251483592,
"learning_rate": 2.2545512838346716e-07,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06797109544277191,
"step": 6425,
"valid_targets_mean": 4365.1,
"valid_targets_min": 1264
},
{
"epoch": 6.706311945748565,
"grad_norm": 0.559817981189732,
"learning_rate": 2.1773546118836418e-07,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0822562575340271,
"step": 6430,
"valid_targets_mean": 4119.1,
"valid_targets_min": 1455
},
{
"epoch": 6.711528429838289,
"grad_norm": 0.5474882365834455,
"learning_rate": 2.1014954524128493e-07,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08481225371360779,
"step": 6435,
"valid_targets_mean": 5039.8,
"valid_targets_min": 1460
},
{
"epoch": 6.716744913928013,
"grad_norm": 0.5086535693869745,
"learning_rate": 2.0269743183189528e-07,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0783454105257988,
"step": 6440,
"valid_targets_mean": 4745.6,
"valid_targets_min": 1473
},
{
"epoch": 6.721961398017736,
"grad_norm": 0.5080116207115293,
"learning_rate": 1.9537917134520023e-07,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.068985216319561,
"step": 6445,
"valid_targets_mean": 4546.9,
"valid_targets_min": 3249
},
{
"epoch": 6.727177882107459,
"grad_norm": 0.5495255536817283,
"learning_rate": 1.881948132611977e-07,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06369595229625702,
"step": 6450,
"valid_targets_mean": 3474.2,
"valid_targets_min": 1267
},
{
"epoch": 6.732394366197183,
"grad_norm": 0.5994488137520114,
"learning_rate": 1.811444061545542e-07,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08287137746810913,
"step": 6455,
"valid_targets_mean": 4944.2,
"valid_targets_min": 2391
},
{
"epoch": 6.737610850286907,
"grad_norm": 0.5126567683176668,
"learning_rate": 1.7422799769426736e-07,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061244308948516846,
"step": 6460,
"valid_targets_mean": 3977.2,
"valid_targets_min": 2516
},
{
"epoch": 6.7428273343766305,
"grad_norm": 0.5831515070930245,
"learning_rate": 1.674456346433506e-07,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08915935456752777,
"step": 6465,
"valid_targets_mean": 4809.4,
"valid_targets_min": 2022
},
{
"epoch": 6.748043818466353,
"grad_norm": 0.5730307050297281,
"learning_rate": 1.607973628585091e-07,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08513954281806946,
"step": 6470,
"valid_targets_mean": 4412.6,
"valid_targets_min": 484
},
{
"epoch": 6.753260302556077,
"grad_norm": 0.5790497202571583,
"learning_rate": 1.542832272898398e-07,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09173041582107544,
"step": 6475,
"valid_targets_mean": 4468.9,
"valid_targets_min": 1852
},
{
"epoch": 6.758476786645801,
"grad_norm": 0.5159289857385856,
"learning_rate": 1.4790327198051624e-07,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07732409238815308,
"step": 6480,
"valid_targets_mean": 4268.2,
"valid_targets_min": 1460
},
{
"epoch": 6.763693270735525,
"grad_norm": 0.5261496459131189,
"learning_rate": 1.416575400664999e-07,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08644157648086548,
"step": 6485,
"valid_targets_mean": 5388.8,
"valid_targets_min": 2127
},
{
"epoch": 6.7689097548252475,
"grad_norm": 0.5229503599641532,
"learning_rate": 1.3554607377624263e-07,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07498866319656372,
"step": 6490,
"valid_targets_mean": 4785.5,
"valid_targets_min": 2022
},
{
"epoch": 6.774126238914971,
"grad_norm": 0.5073924620034521,
"learning_rate": 1.295689144304091e-07,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07597608864307404,
"step": 6495,
"valid_targets_mean": 5095.1,
"valid_targets_min": 1500
},
{
"epoch": 6.779342723004695,
"grad_norm": 0.5742958458442429,
"learning_rate": 1.237261024415881e-07,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08016721159219742,
"step": 6500,
"valid_targets_mean": 4903.2,
"valid_targets_min": 2192
},
{
"epoch": 6.784559207094419,
"grad_norm": 0.5634137025390458,
"learning_rate": 1.1801767731401958e-07,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0954822227358818,
"step": 6505,
"valid_targets_mean": 4574.5,
"valid_targets_min": 1753
},
{
"epoch": 6.789775691184142,
"grad_norm": 0.568993442444071,
"learning_rate": 1.1244367764333464e-07,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10571624338626862,
"step": 6510,
"valid_targets_mean": 5754.6,
"valid_targets_min": 3334
},
{
"epoch": 6.794992175273865,
"grad_norm": 0.5520081151531104,
"learning_rate": 1.0700414111629365e-07,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09768638759851456,
"step": 6515,
"valid_targets_mean": 3943.8,
"valid_targets_min": 965
},
{
"epoch": 6.800208659363589,
"grad_norm": 0.5760719080774065,
"learning_rate": 1.0169910451052422e-07,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07405383884906769,
"step": 6520,
"valid_targets_mean": 4556.4,
"valid_targets_min": 1193
},
{
"epoch": 6.805425143453313,
"grad_norm": 0.4978196958326634,
"learning_rate": 9.652860369428141e-08,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0769326388835907,
"step": 6525,
"valid_targets_mean": 5648.2,
"valid_targets_min": 3140
},
{
"epoch": 6.810641627543036,
"grad_norm": 0.6255097736995268,
"learning_rate": 9.149267362619895e-08,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09469383209943771,
"step": 6530,
"valid_targets_mean": 5004.4,
"valid_targets_min": 1876
},
{
"epoch": 6.8158581116327595,
"grad_norm": 0.5891644536704017,
"learning_rate": 8.659134835504956e-08,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1021219789981842,
"step": 6535,
"valid_targets_mean": 4905.6,
"valid_targets_min": 2000
},
{
"epoch": 6.821074595722483,
"grad_norm": 0.5525031252703527,
"learning_rate": 8.18246610195339e-08,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08424567431211472,
"step": 6540,
"valid_targets_mean": 4678.4,
"valid_targets_min": 1207
},
{
"epoch": 6.826291079812207,
"grad_norm": 0.5791393289700533,
"learning_rate": 7.719264384802527e-08,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07773526012897491,
"step": 6545,
"valid_targets_mean": 4099.8,
"valid_targets_min": 1625
},
{
"epoch": 6.83150756390193,
"grad_norm": 0.5161030337927414,
"learning_rate": 7.269532815838532e-08,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08431129157543182,
"step": 6550,
"valid_targets_mean": 5410.5,
"valid_targets_min": 2155
},
{
"epoch": 6.836724047991654,
"grad_norm": 0.490060135511807,
"learning_rate": 6.833274435772196e-08,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06826452910900116,
"step": 6555,
"valid_targets_mean": 5077.6,
"valid_targets_min": 2890
},
{
"epoch": 6.841940532081377,
"grad_norm": 0.6084355470618008,
"learning_rate": 6.410492194220963e-08,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09635565429925919,
"step": 6560,
"valid_targets_mean": 4256.8,
"valid_targets_min": 1858
},
{
"epoch": 6.847157016171101,
"grad_norm": 0.5464942429975727,
"learning_rate": 6.001188949687153e-08,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0908285453915596,
"step": 6565,
"valid_targets_mean": 4766.1,
"valid_targets_min": 2251
},
{
"epoch": 6.852373500260824,
"grad_norm": 0.5324427723013748,
"learning_rate": 5.6053674695395463e-08,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07651311159133911,
"step": 6570,
"valid_targets_mean": 4681.2,
"valid_targets_min": 420
},
{
"epoch": 6.857589984350548,
"grad_norm": 0.5316025405834288,
"learning_rate": 5.22303042999428e-08,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09243462979793549,
"step": 6575,
"valid_targets_mean": 5462.0,
"valid_targets_min": 2448
},
{
"epoch": 6.862806468440271,
"grad_norm": 0.5548110954612004,
"learning_rate": 4.8541804160968655e-08,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08866509795188904,
"step": 6580,
"valid_targets_mean": 4857.0,
"valid_targets_min": 2369
},
{
"epoch": 6.868022952529994,
"grad_norm": 0.6056436002002238,
"learning_rate": 4.498819921705089e-08,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08769193291664124,
"step": 6585,
"valid_targets_mean": 4305.8,
"valid_targets_min": 2471
},
{
"epoch": 6.873239436619718,
"grad_norm": 0.6181972867280068,
"learning_rate": 4.15695134947125e-08,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09733624756336212,
"step": 6590,
"valid_targets_mean": 3868.6,
"valid_targets_min": 1982
},
{
"epoch": 6.878455920709442,
"grad_norm": 0.5205648849887881,
"learning_rate": 3.8285770108272836e-08,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08204355835914612,
"step": 6595,
"valid_targets_mean": 5234.4,
"valid_targets_min": 2231
},
{
"epoch": 6.8836724047991655,
"grad_norm": 0.5328299359281365,
"learning_rate": 3.5136991259672183e-08,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06707605719566345,
"step": 6600,
"valid_targets_mean": 5658.4,
"valid_targets_min": 1472
},
{
"epoch": 6.888888888888889,
"grad_norm": 0.5526066203448274,
"learning_rate": 3.212319823834298e-08,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12305822968482971,
"step": 6605,
"valid_targets_mean": 4908.1,
"valid_targets_min": 1847
},
{
"epoch": 6.894105372978612,
"grad_norm": 0.48472299525783724,
"learning_rate": 2.9244411421049946e-08,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0804297924041748,
"step": 6610,
"valid_targets_mean": 4955.9,
"valid_targets_min": 2223
},
{
"epoch": 6.899321857068336,
"grad_norm": 0.491359095042733,
"learning_rate": 2.6500650271759077e-08,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0729602798819542,
"step": 6615,
"valid_targets_mean": 5261.2,
"valid_targets_min": 2934
},
{
"epoch": 6.90453834115806,
"grad_norm": 0.5105255246216366,
"learning_rate": 2.3891933341506636e-08,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07847601920366287,
"step": 6620,
"valid_targets_mean": 5682.6,
"valid_targets_min": 2283
},
{
"epoch": 6.9097548252477825,
"grad_norm": 0.5651999326941914,
"learning_rate": 2.1418278268270365e-08,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08119011670351028,
"step": 6625,
"valid_targets_mean": 5365.1,
"valid_targets_min": 2328
},
{
"epoch": 6.914971309337506,
"grad_norm": 0.4752856662151638,
"learning_rate": 1.907970177684737e-08,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07210240513086319,
"step": 6630,
"valid_targets_mean": 6072.9,
"valid_targets_min": 3350
},
{
"epoch": 6.92018779342723,
"grad_norm": 0.536334628512583,
"learning_rate": 1.687621967875863e-08,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08057719469070435,
"step": 6635,
"valid_targets_mean": 5156.0,
"valid_targets_min": 2835
},
{
"epoch": 6.925404277516954,
"grad_norm": 0.5605009892985632,
"learning_rate": 1.4807846872113563e-08,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08201783895492554,
"step": 6640,
"valid_targets_mean": 4241.5,
"valid_targets_min": 2650
},
{
"epoch": 6.9306207616066775,
"grad_norm": 0.5315249799499744,
"learning_rate": 1.2874597341534512e-08,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08200040459632874,
"step": 6645,
"valid_targets_mean": 4877.6,
"valid_targets_min": 2332
},
{
"epoch": 6.9358372456964,
"grad_norm": 0.6271880493962537,
"learning_rate": 1.1076484158047962e-08,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11016195267438889,
"step": 6650,
"valid_targets_mean": 4848.4,
"valid_targets_min": 2185
},
{
"epoch": 6.941053729786124,
"grad_norm": 0.4985270702899821,
"learning_rate": 9.413519479004596e-09,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06930582225322723,
"step": 6655,
"valid_targets_mean": 5042.6,
"valid_targets_min": 999
},
{
"epoch": 6.946270213875848,
"grad_norm": 0.5376613750357377,
"learning_rate": 7.885714547990475e-09,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07879330217838287,
"step": 6660,
"valid_targets_mean": 5642.0,
"valid_targets_min": 1683
},
{
"epoch": 6.951486697965571,
"grad_norm": 0.6210626987569594,
"learning_rate": 6.493079694753768e-09,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08401305973529816,
"step": 6665,
"valid_targets_mean": 4189.1,
"valid_targets_min": 1431
},
{
"epoch": 6.9567031820552945,
"grad_norm": 0.6346567450751912,
"learning_rate": 5.235624335133693e-09,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11028879135847092,
"step": 6670,
"valid_targets_mean": 4331.8,
"valid_targets_min": 1737
},
{
"epoch": 6.961919666145018,
"grad_norm": 0.5399427080559815,
"learning_rate": 4.113356971002791e-09,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06442070007324219,
"step": 6675,
"valid_targets_mean": 3822.8,
"valid_targets_min": 873
},
{
"epoch": 6.967136150234742,
"grad_norm": 0.5544017097545518,
"learning_rate": 3.126285190195866e-09,
"loss": 0.1602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061635371297597885,
"step": 6680,
"valid_targets_mean": 3973.4,
"valid_targets_min": 229
},
{
"epoch": 6.972352634324466,
"grad_norm": 0.5098397885779282,
"learning_rate": 2.2744156664766813e-09,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08478450775146484,
"step": 6685,
"valid_targets_mean": 4589.8,
"valid_targets_min": 1221
},
{
"epoch": 6.977569118414189,
"grad_norm": 0.5411222657320197,
"learning_rate": 1.5577541594802293e-09,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10507169365882874,
"step": 6690,
"valid_targets_mean": 6228.5,
"valid_targets_min": 865
},
{
"epoch": 6.982785602503912,
"grad_norm": 0.5713424510280001,
"learning_rate": 9.7630551467498e-10,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08130859583616257,
"step": 6695,
"valid_targets_mean": 4436.1,
"valid_targets_min": 1928
},
{
"epoch": 6.988002086593636,
"grad_norm": 0.49450624264968135,
"learning_rate": 5.300736633317982e-10,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07469873875379562,
"step": 6700,
"valid_targets_mean": 5284.1,
"valid_targets_min": 1889
},
{
"epoch": 6.993218570683359,
"grad_norm": 0.8620431386424838,
"learning_rate": 2.1906162250395768e-10,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08396423608064651,
"step": 6705,
"valid_targets_mean": 5400.6,
"valid_targets_min": 1757
},
{
"epoch": 6.998435054773083,
"grad_norm": 0.5780156319377473,
"learning_rate": 4.3271494996055544e-11,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0954805314540863,
"step": 6710,
"valid_targets_mean": 4702.2,
"valid_targets_min": 3222
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14267900586128235,
"step": 6712,
"total_flos": 3.0948342577517036e+18,
"train_loss": 0.11350778881926644,
"train_runtime": 136690.7198,
"train_samples_per_second": 0.785,
"train_steps_per_second": 0.049,
"valid_targets_mean": 6167.6,
"valid_targets_min": 3936
}
],
"logging_steps": 5,
"max_steps": 6713,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 3.0948342577517036e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}