a1_math_formulas / trainer_state.json
penfever's picture
End of training
26c5644 verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 5.0,
"eval_steps": 500,
"global_step": 4940,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.005063291139240506,
"grad_norm": 4.609051043616223,
"learning_rate": 3.238866396761134e-07,
"loss": 0.5035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25989317893981934,
"step": 5,
"valid_targets_mean": 3288.2,
"valid_targets_min": 815
},
{
"epoch": 0.010126582278481013,
"grad_norm": 3.6056753367980687,
"learning_rate": 7.287449392712551e-07,
"loss": 0.4979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23132257163524628,
"step": 10,
"valid_targets_mean": 4994.0,
"valid_targets_min": 1103
},
{
"epoch": 0.015189873417721518,
"grad_norm": 3.75046312941662,
"learning_rate": 1.133603238866397e-06,
"loss": 0.5107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23433995246887207,
"step": 15,
"valid_targets_mean": 4084.1,
"valid_targets_min": 1248
},
{
"epoch": 0.020253164556962026,
"grad_norm": 4.009323566522028,
"learning_rate": 1.5384615384615387e-06,
"loss": 0.4757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19289864599704742,
"step": 20,
"valid_targets_mean": 4351.0,
"valid_targets_min": 1208
},
{
"epoch": 0.02531645569620253,
"grad_norm": 3.857687726883038,
"learning_rate": 1.9433198380566803e-06,
"loss": 0.4795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25582650303840637,
"step": 25,
"valid_targets_mean": 4894.1,
"valid_targets_min": 1784
},
{
"epoch": 0.030379746835443037,
"grad_norm": 2.431783748480512,
"learning_rate": 2.348178137651822e-06,
"loss": 0.4538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21279120445251465,
"step": 30,
"valid_targets_mean": 4872.4,
"valid_targets_min": 1107
},
{
"epoch": 0.035443037974683546,
"grad_norm": 2.0913610531108153,
"learning_rate": 2.7530364372469636e-06,
"loss": 0.4576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21099823713302612,
"step": 35,
"valid_targets_mean": 4177.9,
"valid_targets_min": 1173
},
{
"epoch": 0.04050632911392405,
"grad_norm": 2.1267526423567826,
"learning_rate": 3.157894736842105e-06,
"loss": 0.4362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21998053789138794,
"step": 40,
"valid_targets_mean": 5318.6,
"valid_targets_min": 1431
},
{
"epoch": 0.04556962025316456,
"grad_norm": 1.8229308674567508,
"learning_rate": 3.562753036437247e-06,
"loss": 0.4107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21922659873962402,
"step": 45,
"valid_targets_mean": 3793.9,
"valid_targets_min": 1470
},
{
"epoch": 0.05063291139240506,
"grad_norm": 1.1764023018227465,
"learning_rate": 3.967611336032389e-06,
"loss": 0.3992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1912367194890976,
"step": 50,
"valid_targets_mean": 4403.0,
"valid_targets_min": 1320
},
{
"epoch": 0.05569620253164557,
"grad_norm": 1.0017414517719199,
"learning_rate": 4.372469635627531e-06,
"loss": 0.3867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19108061492443085,
"step": 55,
"valid_targets_mean": 4060.0,
"valid_targets_min": 1137
},
{
"epoch": 0.060759493670886074,
"grad_norm": 0.7507852394561627,
"learning_rate": 4.7773279352226725e-06,
"loss": 0.3841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16387608647346497,
"step": 60,
"valid_targets_mean": 4424.5,
"valid_targets_min": 1409
},
{
"epoch": 0.06582278481012659,
"grad_norm": 0.557594133353884,
"learning_rate": 5.1821862348178145e-06,
"loss": 0.3711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16386422514915466,
"step": 65,
"valid_targets_mean": 3916.2,
"valid_targets_min": 1045
},
{
"epoch": 0.07088607594936709,
"grad_norm": 0.421043632829371,
"learning_rate": 5.5870445344129565e-06,
"loss": 0.3875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19452455639839172,
"step": 70,
"valid_targets_mean": 5656.6,
"valid_targets_min": 1746
},
{
"epoch": 0.0759493670886076,
"grad_norm": 0.41166529544187236,
"learning_rate": 5.991902834008098e-06,
"loss": 0.3747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2017640769481659,
"step": 75,
"valid_targets_mean": 5565.6,
"valid_targets_min": 1301
},
{
"epoch": 0.0810126582278481,
"grad_norm": 0.37589937170078513,
"learning_rate": 6.39676113360324e-06,
"loss": 0.3707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13995295763015747,
"step": 80,
"valid_targets_mean": 3588.8,
"valid_targets_min": 994
},
{
"epoch": 0.08607594936708861,
"grad_norm": 0.3714038081964425,
"learning_rate": 6.801619433198381e-06,
"loss": 0.3691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21744906902313232,
"step": 85,
"valid_targets_mean": 5115.6,
"valid_targets_min": 898
},
{
"epoch": 0.09113924050632911,
"grad_norm": 0.34597741271059124,
"learning_rate": 7.206477732793523e-06,
"loss": 0.3564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17021265625953674,
"step": 90,
"valid_targets_mean": 5033.3,
"valid_targets_min": 886
},
{
"epoch": 0.09620253164556962,
"grad_norm": 0.3172791695402959,
"learning_rate": 7.611336032388664e-06,
"loss": 0.3739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16697894036769867,
"step": 95,
"valid_targets_mean": 5135.7,
"valid_targets_min": 776
},
{
"epoch": 0.10126582278481013,
"grad_norm": 0.3605571673212477,
"learning_rate": 8.016194331983806e-06,
"loss": 0.3609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17649498581886292,
"step": 100,
"valid_targets_mean": 4052.9,
"valid_targets_min": 1407
},
{
"epoch": 0.10632911392405063,
"grad_norm": 0.3126393081213533,
"learning_rate": 8.421052631578948e-06,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14957275986671448,
"step": 105,
"valid_targets_mean": 4704.9,
"valid_targets_min": 1914
},
{
"epoch": 0.11139240506329114,
"grad_norm": 0.3531313178759686,
"learning_rate": 8.82591093117409e-06,
"loss": 0.3726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16743913292884827,
"step": 110,
"valid_targets_mean": 3947.0,
"valid_targets_min": 1052
},
{
"epoch": 0.11645569620253164,
"grad_norm": 0.361312795641348,
"learning_rate": 9.230769230769232e-06,
"loss": 0.3633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1453179121017456,
"step": 115,
"valid_targets_mean": 2979.1,
"valid_targets_min": 1042
},
{
"epoch": 0.12151898734177215,
"grad_norm": 0.3118010440427671,
"learning_rate": 9.635627530364373e-06,
"loss": 0.3533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1923716962337494,
"step": 120,
"valid_targets_mean": 5371.9,
"valid_targets_min": 1279
},
{
"epoch": 0.12658227848101267,
"grad_norm": 0.35948459926380516,
"learning_rate": 1.0040485829959515e-05,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2048473060131073,
"step": 125,
"valid_targets_mean": 4750.8,
"valid_targets_min": 990
},
{
"epoch": 0.13164556962025317,
"grad_norm": 0.31537572490184773,
"learning_rate": 1.0445344129554658e-05,
"loss": 0.3713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20135825872421265,
"step": 130,
"valid_targets_mean": 4831.9,
"valid_targets_min": 1663
},
{
"epoch": 0.13670886075949368,
"grad_norm": 0.36436085249069955,
"learning_rate": 1.0850202429149799e-05,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21216928958892822,
"step": 135,
"valid_targets_mean": 4523.4,
"valid_targets_min": 1238
},
{
"epoch": 0.14177215189873418,
"grad_norm": 0.3366824015027373,
"learning_rate": 1.1255060728744939e-05,
"loss": 0.3567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17111346125602722,
"step": 140,
"valid_targets_mean": 3792.1,
"valid_targets_min": 1100
},
{
"epoch": 0.1468354430379747,
"grad_norm": 0.35533807007148477,
"learning_rate": 1.1659919028340081e-05,
"loss": 0.3589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1642487645149231,
"step": 145,
"valid_targets_mean": 4016.7,
"valid_targets_min": 1556
},
{
"epoch": 0.1518987341772152,
"grad_norm": 0.31790675871917146,
"learning_rate": 1.2064777327935225e-05,
"loss": 0.3429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.197759211063385,
"step": 150,
"valid_targets_mean": 5829.0,
"valid_targets_min": 1509
},
{
"epoch": 0.1569620253164557,
"grad_norm": 0.32375174058174566,
"learning_rate": 1.2469635627530365e-05,
"loss": 0.3571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1860826313495636,
"step": 155,
"valid_targets_mean": 4697.8,
"valid_targets_min": 1042
},
{
"epoch": 0.1620253164556962,
"grad_norm": 0.971603737593077,
"learning_rate": 1.2874493927125507e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2078309953212738,
"step": 160,
"valid_targets_mean": 5384.2,
"valid_targets_min": 1144
},
{
"epoch": 0.1670886075949367,
"grad_norm": 0.47966039195161064,
"learning_rate": 1.327935222672065e-05,
"loss": 0.3588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18700364232063293,
"step": 165,
"valid_targets_mean": 4719.9,
"valid_targets_min": 1071
},
{
"epoch": 0.17215189873417722,
"grad_norm": 0.2955436571363374,
"learning_rate": 1.3684210526315791e-05,
"loss": 0.3413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16040512919425964,
"step": 170,
"valid_targets_mean": 5175.4,
"valid_targets_min": 1035
},
{
"epoch": 0.17721518987341772,
"grad_norm": 0.2909056024011537,
"learning_rate": 1.4089068825910932e-05,
"loss": 0.3611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14239881932735443,
"step": 175,
"valid_targets_mean": 4601.9,
"valid_targets_min": 1236
},
{
"epoch": 0.18227848101265823,
"grad_norm": 0.3684074269197893,
"learning_rate": 1.4493927125506074e-05,
"loss": 0.3607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17205636203289032,
"step": 180,
"valid_targets_mean": 3363.9,
"valid_targets_min": 899
},
{
"epoch": 0.18734177215189873,
"grad_norm": 0.2978543096994537,
"learning_rate": 1.4898785425101216e-05,
"loss": 0.3606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1950611174106598,
"step": 185,
"valid_targets_mean": 5937.9,
"valid_targets_min": 1368
},
{
"epoch": 0.19240506329113924,
"grad_norm": 0.30414263404359004,
"learning_rate": 1.5303643724696356e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18548183143138885,
"step": 190,
"valid_targets_mean": 5815.7,
"valid_targets_min": 1087
},
{
"epoch": 0.19746835443037974,
"grad_norm": 0.3751151244554016,
"learning_rate": 1.5708502024291498e-05,
"loss": 0.3638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2703745365142822,
"step": 195,
"valid_targets_mean": 5632.3,
"valid_targets_min": 1444
},
{
"epoch": 0.20253164556962025,
"grad_norm": 0.3183245241372493,
"learning_rate": 1.6113360323886644e-05,
"loss": 0.3597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15712594985961914,
"step": 200,
"valid_targets_mean": 4035.7,
"valid_targets_min": 1064
},
{
"epoch": 0.20759493670886076,
"grad_norm": 0.3632627857891178,
"learning_rate": 1.6518218623481782e-05,
"loss": 0.3525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17240820825099945,
"step": 205,
"valid_targets_mean": 4021.2,
"valid_targets_min": 1114
},
{
"epoch": 0.21265822784810126,
"grad_norm": 0.34057034041346584,
"learning_rate": 1.6923076923076924e-05,
"loss": 0.3621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22665713727474213,
"step": 210,
"valid_targets_mean": 5157.8,
"valid_targets_min": 1706
},
{
"epoch": 0.21772151898734177,
"grad_norm": 0.32892662546524415,
"learning_rate": 1.7327935222672066e-05,
"loss": 0.3516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1358383297920227,
"step": 215,
"valid_targets_mean": 3612.9,
"valid_targets_min": 1015
},
{
"epoch": 0.22278481012658227,
"grad_norm": 0.3323805458845017,
"learning_rate": 1.7732793522267208e-05,
"loss": 0.3405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14480899274349213,
"step": 220,
"valid_targets_mean": 6220.1,
"valid_targets_min": 1090
},
{
"epoch": 0.22784810126582278,
"grad_norm": 0.2969456771010524,
"learning_rate": 1.813765182186235e-05,
"loss": 0.345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16806533932685852,
"step": 225,
"valid_targets_mean": 5594.2,
"valid_targets_min": 1290
},
{
"epoch": 0.23291139240506328,
"grad_norm": 0.35442807757680916,
"learning_rate": 1.8542510121457492e-05,
"loss": 0.3466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20088203251361847,
"step": 230,
"valid_targets_mean": 4364.5,
"valid_targets_min": 1537
},
{
"epoch": 0.2379746835443038,
"grad_norm": 0.32766837251688363,
"learning_rate": 1.894736842105263e-05,
"loss": 0.3597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12136702239513397,
"step": 235,
"valid_targets_mean": 2704.7,
"valid_targets_min": 1252
},
{
"epoch": 0.2430379746835443,
"grad_norm": 0.3298038015043137,
"learning_rate": 1.9352226720647776e-05,
"loss": 0.3312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17166192829608917,
"step": 240,
"valid_targets_mean": 4605.7,
"valid_targets_min": 1445
},
{
"epoch": 0.2481012658227848,
"grad_norm": 0.2811058024334916,
"learning_rate": 1.9757085020242915e-05,
"loss": 0.3647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17767693102359772,
"step": 245,
"valid_targets_mean": 5949.4,
"valid_targets_min": 992
},
{
"epoch": 0.25316455696202533,
"grad_norm": 0.3238895469625763,
"learning_rate": 2.016194331983806e-05,
"loss": 0.3542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1756962537765503,
"step": 250,
"valid_targets_mean": 4702.4,
"valid_targets_min": 1101
},
{
"epoch": 0.2582278481012658,
"grad_norm": 0.30654096002239845,
"learning_rate": 2.05668016194332e-05,
"loss": 0.3556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18253913521766663,
"step": 255,
"valid_targets_mean": 5601.0,
"valid_targets_min": 977
},
{
"epoch": 0.26329113924050634,
"grad_norm": 0.33818696625352207,
"learning_rate": 2.097165991902834e-05,
"loss": 0.3604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20197951793670654,
"step": 260,
"valid_targets_mean": 4999.4,
"valid_targets_min": 859
},
{
"epoch": 0.2683544303797468,
"grad_norm": 0.3221593835641881,
"learning_rate": 2.1376518218623487e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1421291083097458,
"step": 265,
"valid_targets_mean": 3732.8,
"valid_targets_min": 1159
},
{
"epoch": 0.27341772151898736,
"grad_norm": 0.3467001085595146,
"learning_rate": 2.1781376518218625e-05,
"loss": 0.3541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19689059257507324,
"step": 270,
"valid_targets_mean": 4544.8,
"valid_targets_min": 1627
},
{
"epoch": 0.27848101265822783,
"grad_norm": 0.3893966405259359,
"learning_rate": 2.2186234817813767e-05,
"loss": 0.3502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17629346251487732,
"step": 275,
"valid_targets_mean": 3116.6,
"valid_targets_min": 1066
},
{
"epoch": 0.28354430379746837,
"grad_norm": 0.34248011251805455,
"learning_rate": 2.2591093117408906e-05,
"loss": 0.3517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1394365131855011,
"step": 280,
"valid_targets_mean": 3400.1,
"valid_targets_min": 1015
},
{
"epoch": 0.28860759493670884,
"grad_norm": 0.34292015860444375,
"learning_rate": 2.299595141700405e-05,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18773144483566284,
"step": 285,
"valid_targets_mean": 4286.1,
"valid_targets_min": 1425
},
{
"epoch": 0.2936708860759494,
"grad_norm": 0.3527832328000518,
"learning_rate": 2.3400809716599193e-05,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18093225359916687,
"step": 290,
"valid_targets_mean": 4568.9,
"valid_targets_min": 1281
},
{
"epoch": 0.29873417721518986,
"grad_norm": 0.3222755455970598,
"learning_rate": 2.3805668016194332e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13850252330303192,
"step": 295,
"valid_targets_mean": 3603.9,
"valid_targets_min": 1101
},
{
"epoch": 0.3037974683544304,
"grad_norm": 0.3081645393207173,
"learning_rate": 2.4210526315789474e-05,
"loss": 0.3523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1911936104297638,
"step": 300,
"valid_targets_mean": 6009.3,
"valid_targets_min": 840
},
{
"epoch": 0.30886075949367087,
"grad_norm": 0.29187368241351513,
"learning_rate": 2.461538461538462e-05,
"loss": 0.3484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17911839485168457,
"step": 305,
"valid_targets_mean": 7036.5,
"valid_targets_min": 1310
},
{
"epoch": 0.3139240506329114,
"grad_norm": 0.49985981352299386,
"learning_rate": 2.5020242914979758e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16296392679214478,
"step": 310,
"valid_targets_mean": 3887.8,
"valid_targets_min": 1192
},
{
"epoch": 0.3189873417721519,
"grad_norm": 0.38261294484090613,
"learning_rate": 2.54251012145749e-05,
"loss": 0.3454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15782615542411804,
"step": 315,
"valid_targets_mean": 3376.2,
"valid_targets_min": 1185
},
{
"epoch": 0.3240506329113924,
"grad_norm": 0.45061664130339874,
"learning_rate": 2.5829959514170046e-05,
"loss": 0.3502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1975603699684143,
"step": 320,
"valid_targets_mean": 5570.6,
"valid_targets_min": 1866
},
{
"epoch": 0.3291139240506329,
"grad_norm": 0.3182602149268292,
"learning_rate": 2.6234817813765184e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14342699944972992,
"step": 325,
"valid_targets_mean": 3784.2,
"valid_targets_min": 849
},
{
"epoch": 0.3341772151898734,
"grad_norm": 0.3254644437199896,
"learning_rate": 2.6639676113360326e-05,
"loss": 0.3501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16729095578193665,
"step": 330,
"valid_targets_mean": 3966.9,
"valid_targets_min": 1392
},
{
"epoch": 0.3392405063291139,
"grad_norm": 0.32206841245268697,
"learning_rate": 2.704453441295547e-05,
"loss": 0.3476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1826034039258957,
"step": 335,
"valid_targets_mean": 4157.9,
"valid_targets_min": 1092
},
{
"epoch": 0.34430379746835443,
"grad_norm": 0.3602273548100487,
"learning_rate": 2.744939271255061e-05,
"loss": 0.3625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2222571074962616,
"step": 340,
"valid_targets_mean": 4895.1,
"valid_targets_min": 1074
},
{
"epoch": 0.3493670886075949,
"grad_norm": 0.3392767743330912,
"learning_rate": 2.7854251012145752e-05,
"loss": 0.3455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13851270079612732,
"step": 345,
"valid_targets_mean": 3250.4,
"valid_targets_min": 1001
},
{
"epoch": 0.35443037974683544,
"grad_norm": 0.32803869222957094,
"learning_rate": 2.825910931174089e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18585026264190674,
"step": 350,
"valid_targets_mean": 4607.0,
"valid_targets_min": 1164
},
{
"epoch": 0.3594936708860759,
"grad_norm": 0.2960837838285842,
"learning_rate": 2.8663967611336033e-05,
"loss": 0.3539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23394142091274261,
"step": 355,
"valid_targets_mean": 8210.9,
"valid_targets_min": 1637
},
{
"epoch": 0.36455696202531646,
"grad_norm": 0.3694811833098562,
"learning_rate": 2.906882591093118e-05,
"loss": 0.3468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16552570462226868,
"step": 360,
"valid_targets_mean": 2960.9,
"valid_targets_min": 1184
},
{
"epoch": 0.369620253164557,
"grad_norm": 0.31999701209701786,
"learning_rate": 2.9473684210526317e-05,
"loss": 0.3466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16295602917671204,
"step": 365,
"valid_targets_mean": 3841.0,
"valid_targets_min": 1068
},
{
"epoch": 0.37468354430379747,
"grad_norm": 0.29571436256727346,
"learning_rate": 2.987854251012146e-05,
"loss": 0.3567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19385173916816711,
"step": 370,
"valid_targets_mean": 5434.1,
"valid_targets_min": 904
},
{
"epoch": 0.379746835443038,
"grad_norm": 0.2794237498150064,
"learning_rate": 3.0283400809716605e-05,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17324280738830566,
"step": 375,
"valid_targets_mean": 6533.0,
"valid_targets_min": 914
},
{
"epoch": 0.3848101265822785,
"grad_norm": 0.46097531086569304,
"learning_rate": 3.068825910931174e-05,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1612202525138855,
"step": 380,
"valid_targets_mean": 4019.0,
"valid_targets_min": 1578
},
{
"epoch": 0.389873417721519,
"grad_norm": 0.33386509179906093,
"learning_rate": 3.1093117408906885e-05,
"loss": 0.3495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14520494639873505,
"step": 385,
"valid_targets_mean": 3415.9,
"valid_targets_min": 1118
},
{
"epoch": 0.3949367088607595,
"grad_norm": 0.3319526543378725,
"learning_rate": 3.149797570850203e-05,
"loss": 0.3487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1795864999294281,
"step": 390,
"valid_targets_mean": 4239.8,
"valid_targets_min": 991
},
{
"epoch": 0.4,
"grad_norm": 0.3406949335779596,
"learning_rate": 3.190283400809717e-05,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16871468722820282,
"step": 395,
"valid_targets_mean": 3474.5,
"valid_targets_min": 1133
},
{
"epoch": 0.4050632911392405,
"grad_norm": 0.36838681719013816,
"learning_rate": 3.230769230769231e-05,
"loss": 0.3522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1932060271501541,
"step": 400,
"valid_targets_mean": 3488.6,
"valid_targets_min": 1164
},
{
"epoch": 0.41012658227848103,
"grad_norm": 0.35042164458126773,
"learning_rate": 3.271255060728745e-05,
"loss": 0.3588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17853647470474243,
"step": 405,
"valid_targets_mean": 3956.2,
"valid_targets_min": 1293
},
{
"epoch": 0.4151898734177215,
"grad_norm": 0.3489327841744588,
"learning_rate": 3.311740890688259e-05,
"loss": 0.3585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16795890033245087,
"step": 410,
"valid_targets_mean": 3783.9,
"valid_targets_min": 1206
},
{
"epoch": 0.42025316455696204,
"grad_norm": 0.3454446525690692,
"learning_rate": 3.352226720647774e-05,
"loss": 0.3516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2117060422897339,
"step": 415,
"valid_targets_mean": 4945.9,
"valid_targets_min": 1096
},
{
"epoch": 0.4253164556962025,
"grad_norm": 0.3098825126338765,
"learning_rate": 3.3927125506072876e-05,
"loss": 0.3574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20046228170394897,
"step": 420,
"valid_targets_mean": 6020.4,
"valid_targets_min": 1220
},
{
"epoch": 0.43037974683544306,
"grad_norm": 0.37532962252838115,
"learning_rate": 3.433198380566802e-05,
"loss": 0.3467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1575276255607605,
"step": 425,
"valid_targets_mean": 3148.8,
"valid_targets_min": 1434
},
{
"epoch": 0.43544303797468353,
"grad_norm": 0.41731233709453813,
"learning_rate": 3.473684210526316e-05,
"loss": 0.3536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18151873350143433,
"step": 430,
"valid_targets_mean": 4121.1,
"valid_targets_min": 882
},
{
"epoch": 0.44050632911392407,
"grad_norm": 0.2834549547224196,
"learning_rate": 3.51417004048583e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21482950448989868,
"step": 435,
"valid_targets_mean": 7190.4,
"valid_targets_min": 980
},
{
"epoch": 0.44556962025316454,
"grad_norm": 0.30073688146062255,
"learning_rate": 3.5546558704453444e-05,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1362500786781311,
"step": 440,
"valid_targets_mean": 4360.6,
"valid_targets_min": 1118
},
{
"epoch": 0.4506329113924051,
"grad_norm": 0.3750594432228394,
"learning_rate": 3.595141700404859e-05,
"loss": 0.3531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20675930380821228,
"step": 445,
"valid_targets_mean": 4531.2,
"valid_targets_min": 1680
},
{
"epoch": 0.45569620253164556,
"grad_norm": 0.3568782095433956,
"learning_rate": 3.635627530364373e-05,
"loss": 0.3454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17187099158763885,
"step": 450,
"valid_targets_mean": 4279.3,
"valid_targets_min": 1210
},
{
"epoch": 0.4607594936708861,
"grad_norm": 0.31010973542926373,
"learning_rate": 3.676113360323887e-05,
"loss": 0.349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1888793706893921,
"step": 455,
"valid_targets_mean": 5464.9,
"valid_targets_min": 540
},
{
"epoch": 0.46582278481012657,
"grad_norm": 0.30672819186326156,
"learning_rate": 3.716599190283401e-05,
"loss": 0.3369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19805072247982025,
"step": 460,
"valid_targets_mean": 5570.1,
"valid_targets_min": 1257
},
{
"epoch": 0.4708860759493671,
"grad_norm": 0.33237701694635524,
"learning_rate": 3.757085020242915e-05,
"loss": 0.3443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17327673733234406,
"step": 465,
"valid_targets_mean": 4441.7,
"valid_targets_min": 1062
},
{
"epoch": 0.4759493670886076,
"grad_norm": 0.3157269440092307,
"learning_rate": 3.7975708502024296e-05,
"loss": 0.3523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2036791741847992,
"step": 470,
"valid_targets_mean": 5480.2,
"valid_targets_min": 1147
},
{
"epoch": 0.4810126582278481,
"grad_norm": 0.3385448591385259,
"learning_rate": 3.8380566801619435e-05,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18548253178596497,
"step": 475,
"valid_targets_mean": 5158.2,
"valid_targets_min": 1322
},
{
"epoch": 0.4860759493670886,
"grad_norm": 0.3229813339259753,
"learning_rate": 3.878542510121458e-05,
"loss": 0.3539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19486048817634583,
"step": 480,
"valid_targets_mean": 5207.5,
"valid_targets_min": 1234
},
{
"epoch": 0.4911392405063291,
"grad_norm": 0.39888632177896866,
"learning_rate": 3.919028340080972e-05,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15041330456733704,
"step": 485,
"valid_targets_mean": 2910.4,
"valid_targets_min": 826
},
{
"epoch": 0.4962025316455696,
"grad_norm": 0.3216838457166851,
"learning_rate": 3.959514170040486e-05,
"loss": 0.3535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18031927943229675,
"step": 490,
"valid_targets_mean": 5146.9,
"valid_targets_min": 1318
},
{
"epoch": 0.5012658227848101,
"grad_norm": 0.3463812343689675,
"learning_rate": 4e-05,
"loss": 0.3538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13655783236026764,
"step": 495,
"valid_targets_mean": 3592.6,
"valid_targets_min": 977
},
{
"epoch": 0.5063291139240507,
"grad_norm": 0.36468197040198047,
"learning_rate": 3.999987517534179e-05,
"loss": 0.3298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17994073033332825,
"step": 500,
"valid_targets_mean": 3419.4,
"valid_targets_min": 997
},
{
"epoch": 0.5113924050632911,
"grad_norm": 0.3123011360513197,
"learning_rate": 3.999950070292526e-05,
"loss": 0.3514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13850685954093933,
"step": 505,
"valid_targets_mean": 4406.6,
"valid_targets_min": 1006
},
{
"epoch": 0.5164556962025316,
"grad_norm": 0.3110207165348701,
"learning_rate": 3.9998876587424764e-05,
"loss": 0.3437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13691280782222748,
"step": 510,
"valid_targets_mean": 4396.4,
"valid_targets_min": 1417
},
{
"epoch": 0.5215189873417722,
"grad_norm": 0.32363025722531935,
"learning_rate": 3.99980028366308e-05,
"loss": 0.3569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24637667834758759,
"step": 515,
"valid_targets_mean": 5892.6,
"valid_targets_min": 1208
},
{
"epoch": 0.5265822784810127,
"grad_norm": 0.3650846632854969,
"learning_rate": 3.999687946144992e-05,
"loss": 0.3581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18719391524791718,
"step": 520,
"valid_targets_mean": 4166.3,
"valid_targets_min": 1384
},
{
"epoch": 0.5316455696202531,
"grad_norm": 0.380513757297641,
"learning_rate": 3.999550647590464e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21175450086593628,
"step": 525,
"valid_targets_mean": 3908.1,
"valid_targets_min": 1057
},
{
"epoch": 0.5367088607594936,
"grad_norm": 0.3303089638050748,
"learning_rate": 3.9993883897133174e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1324310302734375,
"step": 530,
"valid_targets_mean": 3035.0,
"valid_targets_min": 1176
},
{
"epoch": 0.5417721518987342,
"grad_norm": 0.3065345335498946,
"learning_rate": 3.9992011745389335e-05,
"loss": 0.3564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18349391222000122,
"step": 535,
"valid_targets_mean": 5569.8,
"valid_targets_min": 1419
},
{
"epoch": 0.5468354430379747,
"grad_norm": 0.3593697878507127,
"learning_rate": 3.998989004404217e-05,
"loss": 0.3477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1619454324245453,
"step": 540,
"valid_targets_mean": 3932.5,
"valid_targets_min": 1196
},
{
"epoch": 0.5518987341772152,
"grad_norm": 0.25234558053757633,
"learning_rate": 3.998751881957576e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16338235139846802,
"step": 545,
"valid_targets_mean": 5379.0,
"valid_targets_min": 977
},
{
"epoch": 0.5569620253164557,
"grad_norm": 0.3445664068863559,
"learning_rate": 3.998489810158883e-05,
"loss": 0.3475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1785704791545868,
"step": 550,
"valid_targets_mean": 3962.2,
"valid_targets_min": 1209
},
{
"epoch": 0.5620253164556962,
"grad_norm": 0.3556936347323425,
"learning_rate": 3.99820279227944e-05,
"loss": 0.3345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18062683939933777,
"step": 555,
"valid_targets_mean": 4593.2,
"valid_targets_min": 1615
},
{
"epoch": 0.5670886075949367,
"grad_norm": 0.3792686598578621,
"learning_rate": 3.997890831901938e-05,
"loss": 0.3413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19577497243881226,
"step": 560,
"valid_targets_mean": 4658.2,
"valid_targets_min": 1474
},
{
"epoch": 0.5721518987341773,
"grad_norm": 0.32913492636939423,
"learning_rate": 3.9975539329204116e-05,
"loss": 0.3387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17351575195789337,
"step": 565,
"valid_targets_mean": 4210.6,
"valid_targets_min": 743
},
{
"epoch": 0.5772151898734177,
"grad_norm": 0.296950123523885,
"learning_rate": 3.9971920995401905e-05,
"loss": 0.3443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20880410075187683,
"step": 570,
"valid_targets_mean": 6590.1,
"valid_targets_min": 1899
},
{
"epoch": 0.5822784810126582,
"grad_norm": 0.34173998557875557,
"learning_rate": 3.996805336277848e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1291336864233017,
"step": 575,
"valid_targets_mean": 4007.8,
"valid_targets_min": 1380
},
{
"epoch": 0.5873417721518988,
"grad_norm": 0.30049566187413324,
"learning_rate": 3.996393647961143e-05,
"loss": 0.34,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13710632920265198,
"step": 580,
"valid_targets_mean": 4320.4,
"valid_targets_min": 1110
},
{
"epoch": 0.5924050632911393,
"grad_norm": 0.3451273067980245,
"learning_rate": 3.995957039728962e-05,
"loss": 0.3456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18673017621040344,
"step": 585,
"valid_targets_mean": 4318.7,
"valid_targets_min": 1318
},
{
"epoch": 0.5974683544303797,
"grad_norm": 0.3248655593711836,
"learning_rate": 3.9954955170312504e-05,
"loss": 0.335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15301413834095,
"step": 590,
"valid_targets_mean": 4103.9,
"valid_targets_min": 1260
},
{
"epoch": 0.6025316455696202,
"grad_norm": 0.3874469407061254,
"learning_rate": 3.995009085628951e-05,
"loss": 0.3417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17825846374034882,
"step": 595,
"valid_targets_mean": 3280.8,
"valid_targets_min": 1303
},
{
"epoch": 0.6075949367088608,
"grad_norm": 0.32514023580791557,
"learning_rate": 3.994497751593927e-05,
"loss": 0.3417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17784975469112396,
"step": 600,
"valid_targets_mean": 4897.2,
"valid_targets_min": 1343
},
{
"epoch": 0.6126582278481013,
"grad_norm": 0.32015309031323297,
"learning_rate": 3.9939615213088865e-05,
"loss": 0.3461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1702687293291092,
"step": 605,
"valid_targets_mean": 5160.1,
"valid_targets_min": 787
},
{
"epoch": 0.6177215189873417,
"grad_norm": 0.29531423820767827,
"learning_rate": 3.993400401467308e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1590127795934677,
"step": 610,
"valid_targets_mean": 5178.2,
"valid_targets_min": 1187
},
{
"epoch": 0.6227848101265823,
"grad_norm": 0.30956228742996816,
"learning_rate": 3.992814399073349e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1777225136756897,
"step": 615,
"valid_targets_mean": 5224.1,
"valid_targets_min": 1044
},
{
"epoch": 0.6278481012658228,
"grad_norm": 0.2946569197224124,
"learning_rate": 3.992203521441765e-05,
"loss": 0.3566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16454584896564484,
"step": 620,
"valid_targets_mean": 5873.6,
"valid_targets_min": 1522
},
{
"epoch": 0.6329113924050633,
"grad_norm": 0.3566548256792116,
"learning_rate": 3.991567776197815e-05,
"loss": 0.3423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1757839322090149,
"step": 625,
"valid_targets_mean": 5280.0,
"valid_targets_min": 1179
},
{
"epoch": 0.6379746835443038,
"grad_norm": 0.34702302453822725,
"learning_rate": 3.990907171277168e-05,
"loss": 0.3406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16491375863552094,
"step": 630,
"valid_targets_mean": 3738.1,
"valid_targets_min": 1437
},
{
"epoch": 0.6430379746835443,
"grad_norm": 0.3122025130697409,
"learning_rate": 3.990221714925802e-05,
"loss": 0.3425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19272474944591522,
"step": 635,
"valid_targets_mean": 5090.6,
"valid_targets_min": 858
},
{
"epoch": 0.6481012658227848,
"grad_norm": 0.3289259973223097,
"learning_rate": 3.989511415699901e-05,
"loss": 0.3492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21416299045085907,
"step": 640,
"valid_targets_mean": 5687.4,
"valid_targets_min": 1558
},
{
"epoch": 0.6531645569620254,
"grad_norm": 0.31628182785649794,
"learning_rate": 3.988776282465752e-05,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16229850053787231,
"step": 645,
"valid_targets_mean": 5641.7,
"valid_targets_min": 1228
},
{
"epoch": 0.6582278481012658,
"grad_norm": 0.32370069272186214,
"learning_rate": 3.9880163243996314e-05,
"loss": 0.3439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1790936440229416,
"step": 650,
"valid_targets_mean": 4757.5,
"valid_targets_min": 828
},
{
"epoch": 0.6632911392405063,
"grad_norm": 0.331462646919884,
"learning_rate": 3.9872315509876885e-05,
"loss": 0.3465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2034873068332672,
"step": 655,
"valid_targets_mean": 6825.2,
"valid_targets_min": 1430
},
{
"epoch": 0.6683544303797468,
"grad_norm": 0.2773031962593845,
"learning_rate": 3.986421972025831e-05,
"loss": 0.3362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13872382044792175,
"step": 660,
"valid_targets_mean": 5178.6,
"valid_targets_min": 1303
},
{
"epoch": 0.6734177215189874,
"grad_norm": 0.3282605048208077,
"learning_rate": 3.9855875976196e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442852020263672,
"step": 665,
"valid_targets_mean": 3767.0,
"valid_targets_min": 1309
},
{
"epoch": 0.6784810126582278,
"grad_norm": 0.5817158484637879,
"learning_rate": 3.984728438184047e-05,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1867026388645172,
"step": 670,
"valid_targets_mean": 4197.3,
"valid_targets_min": 1119
},
{
"epoch": 0.6835443037974683,
"grad_norm": 0.3539656970185502,
"learning_rate": 3.9838445044435997e-05,
"loss": 0.3543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16187211871147156,
"step": 675,
"valid_targets_mean": 4067.3,
"valid_targets_min": 1024
},
{
"epoch": 0.6886075949367089,
"grad_norm": 0.33229865798563013,
"learning_rate": 3.9829358074319295e-05,
"loss": 0.343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17157503962516785,
"step": 680,
"valid_targets_mean": 4686.7,
"valid_targets_min": 1496
},
{
"epoch": 0.6936708860759494,
"grad_norm": 0.2791093667927135,
"learning_rate": 3.982002358491817e-05,
"loss": 0.3385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1936018466949463,
"step": 685,
"valid_targets_mean": 6395.1,
"valid_targets_min": 1038
},
{
"epoch": 0.6987341772151898,
"grad_norm": 0.3350209099910488,
"learning_rate": 3.981044169275006e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1778436303138733,
"step": 690,
"valid_targets_mean": 4567.5,
"valid_targets_min": 1080
},
{
"epoch": 0.7037974683544304,
"grad_norm": 0.3531099254353881,
"learning_rate": 3.9800612517420626e-05,
"loss": 0.3469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16938315331935883,
"step": 695,
"valid_targets_mean": 3896.1,
"valid_targets_min": 1641
},
{
"epoch": 0.7088607594936709,
"grad_norm": 0.318049795345604,
"learning_rate": 3.979053618162219e-05,
"loss": 0.3564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1946740746498108,
"step": 700,
"valid_targets_mean": 5408.9,
"valid_targets_min": 1410
},
{
"epoch": 0.7139240506329114,
"grad_norm": 0.3320763821369659,
"learning_rate": 3.978021281113228e-05,
"loss": 0.3393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17016340792179108,
"step": 705,
"valid_targets_mean": 4967.0,
"valid_targets_min": 882
},
{
"epoch": 0.7189873417721518,
"grad_norm": 0.2847828838514781,
"learning_rate": 3.9769642534812e-05,
"loss": 0.3414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1707335114479065,
"step": 710,
"valid_targets_mean": 6450.3,
"valid_targets_min": 1014
},
{
"epoch": 0.7240506329113924,
"grad_norm": 0.3321384385821899,
"learning_rate": 3.9758825484604494e-05,
"loss": 0.3447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1961357295513153,
"step": 715,
"valid_targets_mean": 4652.9,
"valid_targets_min": 1387
},
{
"epoch": 0.7291139240506329,
"grad_norm": 0.3032184720855355,
"learning_rate": 3.9747761795533194e-05,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1426798403263092,
"step": 720,
"valid_targets_mean": 6012.8,
"valid_targets_min": 1966
},
{
"epoch": 0.7341772151898734,
"grad_norm": 0.3448777606898466,
"learning_rate": 3.973645160570023e-05,
"loss": 0.3546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1586744487285614,
"step": 725,
"valid_targets_mean": 4090.4,
"valid_targets_min": 1678
},
{
"epoch": 0.739240506329114,
"grad_norm": 0.3156506831386379,
"learning_rate": 3.9724895056284665e-05,
"loss": 0.3376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1619202196598053,
"step": 730,
"valid_targets_mean": 4218.2,
"valid_targets_min": 1064
},
{
"epoch": 0.7443037974683544,
"grad_norm": 0.35504669537877936,
"learning_rate": 3.971309229154072e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21181583404541016,
"step": 735,
"valid_targets_mean": 4926.1,
"valid_targets_min": 1207
},
{
"epoch": 0.7493670886075949,
"grad_norm": 0.3201734939222349,
"learning_rate": 3.9701043458796015e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22177475690841675,
"step": 740,
"valid_targets_mean": 6330.8,
"valid_targets_min": 1448
},
{
"epoch": 0.7544303797468355,
"grad_norm": 0.3323013925433624,
"learning_rate": 3.9688748708449686e-05,
"loss": 0.3383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15360356867313385,
"step": 745,
"valid_targets_mean": 4397.9,
"valid_targets_min": 1528
},
{
"epoch": 0.759493670886076,
"grad_norm": 0.2700426394697059,
"learning_rate": 3.967620819397053e-05,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15975482761859894,
"step": 750,
"valid_targets_mean": 5138.0,
"valid_targets_min": 1494
},
{
"epoch": 0.7645569620253164,
"grad_norm": 0.32491869195537754,
"learning_rate": 3.9663422071895103e-05,
"loss": 0.3534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1329491138458252,
"step": 755,
"valid_targets_mean": 3496.6,
"valid_targets_min": 1333
},
{
"epoch": 0.769620253164557,
"grad_norm": 0.30201583766650153,
"learning_rate": 3.965039050182573e-05,
"loss": 0.3444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17797686159610748,
"step": 760,
"valid_targets_mean": 5996.1,
"valid_targets_min": 1405
},
{
"epoch": 0.7746835443037975,
"grad_norm": 0.28815946203036474,
"learning_rate": 3.963711364642854e-05,
"loss": 0.3397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19754289090633392,
"step": 765,
"valid_targets_mean": 6895.8,
"valid_targets_min": 1767
},
{
"epoch": 0.779746835443038,
"grad_norm": 0.3154202174762482,
"learning_rate": 3.9623591671431416e-05,
"loss": 0.355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18379993736743927,
"step": 770,
"valid_targets_mean": 5009.2,
"valid_targets_min": 1303
},
{
"epoch": 0.7848101265822784,
"grad_norm": 0.3575700176888927,
"learning_rate": 3.960982474562196e-05,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17523907124996185,
"step": 775,
"valid_targets_mean": 4694.8,
"valid_targets_min": 1661
},
{
"epoch": 0.789873417721519,
"grad_norm": 0.3310517991000096,
"learning_rate": 3.959581304084536e-05,
"loss": 0.345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1610376238822937,
"step": 780,
"valid_targets_mean": 4332.1,
"valid_targets_min": 863
},
{
"epoch": 0.7949367088607595,
"grad_norm": 0.31363025202931233,
"learning_rate": 3.958155673200223e-05,
"loss": 0.3547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2106252908706665,
"step": 785,
"valid_targets_mean": 5876.1,
"valid_targets_min": 1285
},
{
"epoch": 0.8,
"grad_norm": 0.2999707270623021,
"learning_rate": 3.956705599704645e-05,
"loss": 0.3307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19507791101932526,
"step": 790,
"valid_targets_mean": 5528.2,
"valid_targets_min": 1012
},
{
"epoch": 0.8050632911392405,
"grad_norm": 0.34798398865892316,
"learning_rate": 3.9552311016982964e-05,
"loss": 0.3301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1592869609594345,
"step": 795,
"valid_targets_mean": 3994.4,
"valid_targets_min": 1020
},
{
"epoch": 0.810126582278481,
"grad_norm": 0.3486093165843197,
"learning_rate": 3.953732197586549e-05,
"loss": 0.3299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14387521147727966,
"step": 800,
"valid_targets_mean": 3136.8,
"valid_targets_min": 969
},
{
"epoch": 0.8151898734177215,
"grad_norm": 0.34294729405636676,
"learning_rate": 3.952208906079419e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14744120836257935,
"step": 805,
"valid_targets_mean": 3541.7,
"valid_targets_min": 1023
},
{
"epoch": 0.8202531645569621,
"grad_norm": 0.29811481034198406,
"learning_rate": 3.950661246191344e-05,
"loss": 0.3327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20451560616493225,
"step": 810,
"valid_targets_mean": 5959.1,
"valid_targets_min": 1170
},
{
"epoch": 0.8253164556962025,
"grad_norm": 0.29859308801266926,
"learning_rate": 3.949089237240933e-05,
"loss": 0.3261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17102043330669403,
"step": 815,
"valid_targets_mean": 5425.9,
"valid_targets_min": 1281
},
{
"epoch": 0.830379746835443,
"grad_norm": 0.33822208957438105,
"learning_rate": 3.947492898850736e-05,
"loss": 0.3379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12047713249921799,
"step": 820,
"valid_targets_mean": 2989.9,
"valid_targets_min": 1525
},
{
"epoch": 0.8354430379746836,
"grad_norm": 0.30589016543655284,
"learning_rate": 3.94587225094699e-05,
"loss": 0.3466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16248869895935059,
"step": 825,
"valid_targets_mean": 4684.8,
"valid_targets_min": 1392
},
{
"epoch": 0.8405063291139241,
"grad_norm": 0.2936931469479608,
"learning_rate": 3.94422731375938e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12211855500936508,
"step": 830,
"valid_targets_mean": 3796.8,
"valid_targets_min": 1392
},
{
"epoch": 0.8455696202531645,
"grad_norm": 0.37559686297102585,
"learning_rate": 3.9425581078207764e-05,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12265650928020477,
"step": 835,
"valid_targets_mean": 2870.8,
"valid_targets_min": 1300
},
{
"epoch": 0.850632911392405,
"grad_norm": 0.35124796916797185,
"learning_rate": 3.940864653966985e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1492408812046051,
"step": 840,
"valid_targets_mean": 3748.4,
"valid_targets_min": 1108
},
{
"epoch": 0.8556962025316456,
"grad_norm": 0.3196010195709303,
"learning_rate": 3.939146973336487e-05,
"loss": 0.3411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21070614457130432,
"step": 845,
"valid_targets_mean": 5815.2,
"valid_targets_min": 1741
},
{
"epoch": 0.8607594936708861,
"grad_norm": 0.278654689286952,
"learning_rate": 3.937405087370171e-05,
"loss": 0.3373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16281408071517944,
"step": 850,
"valid_targets_mean": 6301.6,
"valid_targets_min": 1867
},
{
"epoch": 0.8658227848101265,
"grad_norm": 0.32174716361043904,
"learning_rate": 3.9356390178110694e-05,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11544165015220642,
"step": 855,
"valid_targets_mean": 3471.2,
"valid_targets_min": 1247
},
{
"epoch": 0.8708860759493671,
"grad_norm": 0.31597886690897176,
"learning_rate": 3.9338487867040855e-05,
"loss": 0.3514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1751353144645691,
"step": 860,
"valid_targets_mean": 4752.5,
"valid_targets_min": 1271
},
{
"epoch": 0.8759493670886076,
"grad_norm": 0.3376382881344058,
"learning_rate": 3.9320344163957177e-05,
"loss": 0.3505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628148853778839,
"step": 865,
"valid_targets_mean": 4121.5,
"valid_targets_min": 1412
},
{
"epoch": 0.8810126582278481,
"grad_norm": 0.3174487269237297,
"learning_rate": 3.9301959295337816e-05,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19904953241348267,
"step": 870,
"valid_targets_mean": 6095.4,
"valid_targets_min": 1694
},
{
"epoch": 0.8860759493670886,
"grad_norm": 0.29589750599326486,
"learning_rate": 3.928333349067125e-05,
"loss": 0.3319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22740904986858368,
"step": 875,
"valid_targets_mean": 6433.5,
"valid_targets_min": 979
},
{
"epoch": 0.8911392405063291,
"grad_norm": 0.28879537949688816,
"learning_rate": 3.926446698245347e-05,
"loss": 0.3262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1922253668308258,
"step": 880,
"valid_targets_mean": 5540.3,
"valid_targets_min": 1526
},
{
"epoch": 0.8962025316455696,
"grad_norm": 0.3183527697451739,
"learning_rate": 3.924536000618501e-05,
"loss": 0.3435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1510843187570572,
"step": 885,
"valid_targets_mean": 4520.7,
"valid_targets_min": 1446
},
{
"epoch": 0.9012658227848102,
"grad_norm": 0.3190560534322978,
"learning_rate": 3.922601280036805e-05,
"loss": 0.328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19017574191093445,
"step": 890,
"valid_targets_mean": 4967.6,
"valid_targets_min": 1199
},
{
"epoch": 0.9063291139240506,
"grad_norm": 0.4456031002758009,
"learning_rate": 3.920642560650343e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22871103882789612,
"step": 895,
"valid_targets_mean": 5971.6,
"valid_targets_min": 1331
},
{
"epoch": 0.9113924050632911,
"grad_norm": 0.30090137054069316,
"learning_rate": 3.918659866908762e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15791599452495575,
"step": 900,
"valid_targets_mean": 5456.4,
"valid_targets_min": 1469
},
{
"epoch": 0.9164556962025316,
"grad_norm": 0.33133512730966574,
"learning_rate": 3.9166532235609695e-05,
"loss": 0.3397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21240505576133728,
"step": 905,
"valid_targets_mean": 5933.7,
"valid_targets_min": 1591
},
{
"epoch": 0.9215189873417722,
"grad_norm": 0.3573450052442163,
"learning_rate": 3.914622655654822e-05,
"loss": 0.3434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13716688752174377,
"step": 910,
"valid_targets_mean": 5188.8,
"valid_targets_min": 1591
},
{
"epoch": 0.9265822784810127,
"grad_norm": 0.3538932529953643,
"learning_rate": 3.912568188536814e-05,
"loss": 0.3537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16137436032295227,
"step": 915,
"valid_targets_mean": 3634.4,
"valid_targets_min": 1339
},
{
"epoch": 0.9316455696202531,
"grad_norm": 0.3208113773796828,
"learning_rate": 3.910489847851761e-05,
"loss": 0.3444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17828276753425598,
"step": 920,
"valid_targets_mean": 4550.2,
"valid_targets_min": 1178
},
{
"epoch": 0.9367088607594937,
"grad_norm": 0.3094131187909477,
"learning_rate": 3.908387659542481e-05,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14312776923179626,
"step": 925,
"valid_targets_mean": 4335.3,
"valid_targets_min": 1291
},
{
"epoch": 0.9417721518987342,
"grad_norm": 0.33010185993106733,
"learning_rate": 3.9062616498494656e-05,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17049264907836914,
"step": 930,
"valid_targets_mean": 3559.0,
"valid_targets_min": 1428
},
{
"epoch": 0.9468354430379747,
"grad_norm": 0.3152672156222691,
"learning_rate": 3.904111845310559e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16469566524028778,
"step": 935,
"valid_targets_mean": 4357.5,
"valid_targets_min": 1218
},
{
"epoch": 0.9518987341772152,
"grad_norm": 0.3201518158080734,
"learning_rate": 3.901938272760623e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1640382707118988,
"step": 940,
"valid_targets_mean": 4409.8,
"valid_targets_min": 696
},
{
"epoch": 0.9569620253164557,
"grad_norm": 0.3422558014341276,
"learning_rate": 3.899740959331204e-05,
"loss": 0.3411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14299672842025757,
"step": 945,
"valid_targets_mean": 3149.9,
"valid_targets_min": 866
},
{
"epoch": 0.9620253164556962,
"grad_norm": 0.3039490414348751,
"learning_rate": 3.897519932450189e-05,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14147335290908813,
"step": 950,
"valid_targets_mean": 4333.5,
"valid_targets_min": 1238
},
{
"epoch": 0.9670886075949368,
"grad_norm": 0.3264243877990281,
"learning_rate": 3.8952752198414716e-05,
"loss": 0.3515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17327773571014404,
"step": 955,
"valid_targets_mean": 4177.0,
"valid_targets_min": 1111
},
{
"epoch": 0.9721518987341772,
"grad_norm": 0.3108694369949979,
"learning_rate": 3.893006849524601e-05,
"loss": 0.3335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16756384074687958,
"step": 960,
"valid_targets_mean": 4619.9,
"valid_targets_min": 1156
},
{
"epoch": 0.9772151898734177,
"grad_norm": 0.3448421182167878,
"learning_rate": 3.890714849814431e-05,
"loss": 0.343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15267406404018402,
"step": 965,
"valid_targets_mean": 4085.4,
"valid_targets_min": 1188
},
{
"epoch": 0.9822784810126582,
"grad_norm": 0.30352124369356204,
"learning_rate": 3.8883992493207696e-05,
"loss": 0.3489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2034776359796524,
"step": 970,
"valid_targets_mean": 5403.8,
"valid_targets_min": 1133
},
{
"epoch": 0.9873417721518988,
"grad_norm": 0.2876598919430634,
"learning_rate": 3.8860600769480215e-05,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17782637476921082,
"step": 975,
"valid_targets_mean": 5421.9,
"valid_targets_min": 876
},
{
"epoch": 0.9924050632911392,
"grad_norm": 0.33380559486032607,
"learning_rate": 3.883697361894825e-05,
"loss": 0.3439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2117309868335724,
"step": 980,
"valid_targets_mean": 4499.0,
"valid_targets_min": 1184
},
{
"epoch": 0.9974683544303797,
"grad_norm": 0.3618917728963476,
"learning_rate": 3.881311133653691e-05,
"loss": 0.3412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16749724745750427,
"step": 985,
"valid_targets_mean": 3879.4,
"valid_targets_min": 966
},
{
"epoch": 1.0020253164556963,
"grad_norm": 0.3195092960965727,
"learning_rate": 3.878901422010632e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21217718720436096,
"step": 990,
"valid_targets_mean": 6226.9,
"valid_targets_min": 1827
},
{
"epoch": 1.0070886075949368,
"grad_norm": 0.32404855006530575,
"learning_rate": 3.87646825704479e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1381339430809021,
"step": 995,
"valid_targets_mean": 3916.4,
"valid_targets_min": 1401
},
{
"epoch": 1.0121518987341773,
"grad_norm": 0.3141166003779331,
"learning_rate": 3.874011669128065e-05,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1709311306476593,
"step": 1000,
"valid_targets_mean": 4634.4,
"valid_targets_min": 1322
},
{
"epoch": 1.0172151898734176,
"grad_norm": 0.33255131568231555,
"learning_rate": 3.871531688924731e-05,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11075881123542786,
"step": 1005,
"valid_targets_mean": 2777.5,
"valid_targets_min": 899
},
{
"epoch": 1.0222784810126582,
"grad_norm": 0.3551119238834457,
"learning_rate": 3.8690283473910555e-05,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18998833000659943,
"step": 1010,
"valid_targets_mean": 5065.8,
"valid_targets_min": 1392
},
{
"epoch": 1.0273417721518987,
"grad_norm": 0.36295431013252033,
"learning_rate": 3.866501675774914e-05,
"loss": 0.3282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1773543804883957,
"step": 1015,
"valid_targets_mean": 3819.9,
"valid_targets_min": 1174
},
{
"epoch": 1.0324050632911392,
"grad_norm": 0.33540491774621956,
"learning_rate": 3.8639517056153997e-05,
"loss": 0.3362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16152143478393555,
"step": 1020,
"valid_targets_mean": 4223.1,
"valid_targets_min": 858
},
{
"epoch": 1.0374683544303798,
"grad_norm": 0.32077100355601573,
"learning_rate": 3.8613784687424275e-05,
"loss": 0.3378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19795547425746918,
"step": 1025,
"valid_targets_mean": 5295.2,
"valid_targets_min": 1496
},
{
"epoch": 1.0425316455696203,
"grad_norm": 0.3216906551189178,
"learning_rate": 3.858781997276337e-05,
"loss": 0.3318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16188682615756989,
"step": 1030,
"valid_targets_mean": 5138.4,
"valid_targets_min": 947
},
{
"epoch": 1.0475949367088608,
"grad_norm": 0.4486889227248024,
"learning_rate": 3.856162323627497e-05,
"loss": 0.3251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09634960442781448,
"step": 1035,
"valid_targets_mean": 3724.6,
"valid_targets_min": 934
},
{
"epoch": 1.0526582278481014,
"grad_norm": 0.2934117207565638,
"learning_rate": 3.8535194804958924e-05,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1526038944721222,
"step": 1040,
"valid_targets_mean": 4829.0,
"valid_targets_min": 1401
},
{
"epoch": 1.0577215189873417,
"grad_norm": 0.2931878952686227,
"learning_rate": 3.8508535008707236e-05,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20354345440864563,
"step": 1045,
"valid_targets_mean": 6153.3,
"valid_targets_min": 1336
},
{
"epoch": 1.0627848101265822,
"grad_norm": 0.322713813844516,
"learning_rate": 3.848164418029989e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1375882625579834,
"step": 1050,
"valid_targets_mean": 4300.9,
"valid_targets_min": 1361
},
{
"epoch": 1.0678481012658227,
"grad_norm": 0.31096701689662554,
"learning_rate": 3.845452265540074e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1565578281879425,
"step": 1055,
"valid_targets_mean": 4115.1,
"valid_targets_min": 1141
},
{
"epoch": 1.0729113924050633,
"grad_norm": 0.31792661099154035,
"learning_rate": 3.842717077255329e-05,
"loss": 0.3265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18725517392158508,
"step": 1060,
"valid_targets_mean": 5399.2,
"valid_targets_min": 1440
},
{
"epoch": 1.0779746835443038,
"grad_norm": 0.2966357451403385,
"learning_rate": 3.839958887317649e-05,
"loss": 0.3267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1931026577949524,
"step": 1065,
"valid_targets_mean": 6788.4,
"valid_targets_min": 1285
},
{
"epoch": 1.0830379746835443,
"grad_norm": 0.32526509145376603,
"learning_rate": 3.837177730156045e-05,
"loss": 0.3283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18849416077136993,
"step": 1070,
"valid_targets_mean": 5493.9,
"valid_targets_min": 884
},
{
"epoch": 1.0881012658227849,
"grad_norm": 0.3176994766517001,
"learning_rate": 3.834373640486216e-05,
"loss": 0.329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13460056483745575,
"step": 1075,
"valid_targets_mean": 3655.2,
"valid_targets_min": 1173
},
{
"epoch": 1.0931645569620254,
"grad_norm": 0.3802547345823635,
"learning_rate": 3.8315466533101154e-05,
"loss": 0.3191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1390688419342041,
"step": 1080,
"valid_targets_mean": 3724.8,
"valid_targets_min": 686
},
{
"epoch": 1.0982278481012657,
"grad_norm": 0.30409901587440336,
"learning_rate": 3.828696803915515e-05,
"loss": 0.3295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19093772768974304,
"step": 1085,
"valid_targets_mean": 5509.2,
"valid_targets_min": 1316
},
{
"epoch": 1.1032911392405063,
"grad_norm": 0.31857188574561196,
"learning_rate": 3.8258241278755613e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18015238642692566,
"step": 1090,
"valid_targets_mean": 5178.9,
"valid_targets_min": 1381
},
{
"epoch": 1.1083544303797468,
"grad_norm": 0.32050011818280044,
"learning_rate": 3.8229286610483356e-05,
"loss": 0.3233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18884283304214478,
"step": 1095,
"valid_targets_mean": 5116.2,
"valid_targets_min": 1159
},
{
"epoch": 1.1134177215189873,
"grad_norm": 0.3113272756450795,
"learning_rate": 3.820010439576403e-05,
"loss": 0.3164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16775749623775482,
"step": 1100,
"valid_targets_mean": 4514.6,
"valid_targets_min": 1605
},
{
"epoch": 1.1184810126582279,
"grad_norm": 0.33153340730169845,
"learning_rate": 3.817069499886364e-05,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12046626210212708,
"step": 1105,
"valid_targets_mean": 3291.4,
"valid_targets_min": 962
},
{
"epoch": 1.1235443037974684,
"grad_norm": 0.3013874756589958,
"learning_rate": 3.814105878688397e-05,
"loss": 0.3325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16391009092330933,
"step": 1110,
"valid_targets_mean": 6036.4,
"valid_targets_min": 1055
},
{
"epoch": 1.128607594936709,
"grad_norm": 0.331804851918644,
"learning_rate": 3.8111196129758025e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1217694953083992,
"step": 1115,
"valid_targets_mean": 2960.4,
"valid_targets_min": 1255
},
{
"epoch": 1.1336708860759495,
"grad_norm": 0.35058089757688515,
"learning_rate": 3.808110740024541e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18976081907749176,
"step": 1120,
"valid_targets_mean": 4311.5,
"valid_targets_min": 1573
},
{
"epoch": 1.13873417721519,
"grad_norm": 0.2598654453403866,
"learning_rate": 3.8050792973927654e-05,
"loss": 0.3227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16648131608963013,
"step": 1125,
"valid_targets_mean": 6690.9,
"valid_targets_min": 1006
},
{
"epoch": 1.1437974683544303,
"grad_norm": 0.36580297380970445,
"learning_rate": 3.8020253229203555e-05,
"loss": 0.327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.173434779047966,
"step": 1130,
"valid_targets_mean": 3429.3,
"valid_targets_min": 1217
},
{
"epoch": 1.1488607594936708,
"grad_norm": 0.3170699501916741,
"learning_rate": 3.798948854728441e-05,
"loss": 0.3303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12679925560951233,
"step": 1135,
"valid_targets_mean": 3721.6,
"valid_targets_min": 726
},
{
"epoch": 1.1539240506329114,
"grad_norm": 0.3315048726728199,
"learning_rate": 3.7958499312189344e-05,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11187270283699036,
"step": 1140,
"valid_targets_mean": 3303.8,
"valid_targets_min": 954
},
{
"epoch": 1.158987341772152,
"grad_norm": 0.2969536976332786,
"learning_rate": 3.792728591074041e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11002499610185623,
"step": 1145,
"valid_targets_mean": 4168.6,
"valid_targets_min": 1316
},
{
"epoch": 1.1640506329113924,
"grad_norm": 0.29906816062312314,
"learning_rate": 3.7895848732557815e-05,
"loss": 0.3329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1309490203857422,
"step": 1150,
"valid_targets_mean": 4264.5,
"valid_targets_min": 945
},
{
"epoch": 1.169113924050633,
"grad_norm": 0.3373393294160328,
"learning_rate": 3.786418817005507e-05,
"loss": 0.3299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16449810564517975,
"step": 1155,
"valid_targets_mean": 4430.1,
"valid_targets_min": 1548
},
{
"epoch": 1.1741772151898735,
"grad_norm": 0.31814918332777564,
"learning_rate": 3.783230461843406e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1603396236896515,
"step": 1160,
"valid_targets_mean": 4611.4,
"valid_targets_min": 1192
},
{
"epoch": 1.1792405063291138,
"grad_norm": 0.37957067548492934,
"learning_rate": 3.7800198475680136e-05,
"loss": 0.3264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09246158599853516,
"step": 1165,
"valid_targets_mean": 2677.1,
"valid_targets_min": 1357
},
{
"epoch": 1.1843037974683543,
"grad_norm": 0.3094282166752189,
"learning_rate": 3.776787014255712e-05,
"loss": 0.3292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1497591733932495,
"step": 1170,
"valid_targets_mean": 4014.9,
"valid_targets_min": 1510
},
{
"epoch": 1.1893670886075949,
"grad_norm": 0.35082198305199175,
"learning_rate": 3.773532002260233e-05,
"loss": 0.3276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1902400553226471,
"step": 1175,
"valid_targets_mean": 4051.2,
"valid_targets_min": 926
},
{
"epoch": 1.1944303797468354,
"grad_norm": 0.3363300235759021,
"learning_rate": 3.770254852212152e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1484481394290924,
"step": 1180,
"valid_targets_mean": 4022.1,
"valid_targets_min": 949
},
{
"epoch": 1.199493670886076,
"grad_norm": 0.2959219712023686,
"learning_rate": 3.766955605018384e-05,
"loss": 0.3197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17988604307174683,
"step": 1185,
"valid_targets_mean": 5788.9,
"valid_targets_min": 927
},
{
"epoch": 1.2045569620253165,
"grad_norm": 0.30513862700761135,
"learning_rate": 3.7636343018616675e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.162398099899292,
"step": 1190,
"valid_targets_mean": 4152.4,
"valid_targets_min": 1183
},
{
"epoch": 1.209620253164557,
"grad_norm": 0.3256099867852839,
"learning_rate": 3.7602909842000565e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1604665219783783,
"step": 1195,
"valid_targets_mean": 4510.4,
"valid_targets_min": 1107
},
{
"epoch": 1.2146835443037975,
"grad_norm": 0.31652452857276137,
"learning_rate": 3.7569256937663995e-05,
"loss": 0.3228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11722761392593384,
"step": 1200,
"valid_targets_mean": 3867.2,
"valid_targets_min": 1428
},
{
"epoch": 1.219746835443038,
"grad_norm": 0.3570058144248121,
"learning_rate": 3.753538472567819e-05,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.132009819149971,
"step": 1205,
"valid_targets_mean": 3776.8,
"valid_targets_min": 1444
},
{
"epoch": 1.2248101265822784,
"grad_norm": 0.3253492095946553,
"learning_rate": 3.750129362885188e-05,
"loss": 0.3491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20971378684043884,
"step": 1210,
"valid_targets_mean": 5854.2,
"valid_targets_min": 895
},
{
"epoch": 1.229873417721519,
"grad_norm": 0.31813799271358817,
"learning_rate": 3.7466984072726014e-05,
"loss": 0.3278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14392566680908203,
"step": 1215,
"valid_targets_mean": 4255.3,
"valid_targets_min": 1377
},
{
"epoch": 1.2349367088607595,
"grad_norm": 0.3161090773410782,
"learning_rate": 3.743245648556845e-05,
"loss": 0.333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15600383281707764,
"step": 1220,
"valid_targets_mean": 4627.6,
"valid_targets_min": 1186
},
{
"epoch": 1.24,
"grad_norm": 0.3383098606932185,
"learning_rate": 3.739771129836863e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15630879998207092,
"step": 1225,
"valid_targets_mean": 3907.4,
"valid_targets_min": 1318
},
{
"epoch": 1.2450632911392405,
"grad_norm": 0.380311170159032,
"learning_rate": 3.736274894483215e-05,
"loss": 0.3443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17396849393844604,
"step": 1230,
"valid_targets_mean": 3654.8,
"valid_targets_min": 1228
},
{
"epoch": 1.250126582278481,
"grad_norm": 0.29633634831203143,
"learning_rate": 3.7327569861375404e-05,
"loss": 0.3368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20720690488815308,
"step": 1235,
"valid_targets_mean": 6698.7,
"valid_targets_min": 1554
},
{
"epoch": 1.2551898734177216,
"grad_norm": 0.32181581382324975,
"learning_rate": 3.729217448712009e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15546496212482452,
"step": 1240,
"valid_targets_mean": 4598.5,
"valid_targets_min": 1081
},
{
"epoch": 1.260253164556962,
"grad_norm": 0.2876370801591027,
"learning_rate": 3.725656326388776e-05,
"loss": 0.312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12497955560684204,
"step": 1245,
"valid_targets_mean": 4425.2,
"valid_targets_min": 1167
},
{
"epoch": 1.2653164556962024,
"grad_norm": 0.3193054610028216,
"learning_rate": 3.722073663619429e-05,
"loss": 0.3268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15073925256729126,
"step": 1250,
"valid_targets_mean": 4511.2,
"valid_targets_min": 1143
},
{
"epoch": 1.270379746835443,
"grad_norm": 0.39145813292181675,
"learning_rate": 3.718469505124434e-05,
"loss": 0.3246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15670371055603027,
"step": 1255,
"valid_targets_mean": 4593.4,
"valid_targets_min": 885
},
{
"epoch": 1.2754430379746835,
"grad_norm": 0.3007158793143366,
"learning_rate": 3.714843895892576e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14526674151420593,
"step": 1260,
"valid_targets_mean": 4201.2,
"valid_targets_min": 1015
},
{
"epoch": 1.280506329113924,
"grad_norm": 0.3431473760602178,
"learning_rate": 3.7111968811803985e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11407409608364105,
"step": 1265,
"valid_targets_mean": 2609.9,
"valid_targets_min": 1008
},
{
"epoch": 1.2855696202531646,
"grad_norm": 0.31430226120597105,
"learning_rate": 3.7075285065116376e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21788525581359863,
"step": 1270,
"valid_targets_mean": 5227.1,
"valid_targets_min": 1159
},
{
"epoch": 1.290632911392405,
"grad_norm": 0.2942207875130029,
"learning_rate": 3.703838817676654e-05,
"loss": 0.3248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16078102588653564,
"step": 1275,
"valid_targets_mean": 5179.4,
"valid_targets_min": 966
},
{
"epoch": 1.2956962025316456,
"grad_norm": 0.33801133523700155,
"learning_rate": 3.7001278607318646e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13204364478588104,
"step": 1280,
"valid_targets_mean": 3593.9,
"valid_targets_min": 1351
},
{
"epoch": 1.3007594936708862,
"grad_norm": 0.36194997437445076,
"learning_rate": 3.696395681999161e-05,
"loss": 0.3315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15205729007720947,
"step": 1285,
"valid_targets_mean": 3709.8,
"valid_targets_min": 1456
},
{
"epoch": 1.3058227848101267,
"grad_norm": 0.37635182260044775,
"learning_rate": 3.692642328065337e-05,
"loss": 0.3373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12143959850072861,
"step": 1290,
"valid_targets_mean": 3222.8,
"valid_targets_min": 1077
},
{
"epoch": 1.310886075949367,
"grad_norm": 0.3080355652465348,
"learning_rate": 3.688867845781506e-05,
"loss": 0.327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14508505165576935,
"step": 1295,
"valid_targets_mean": 3859.7,
"valid_targets_min": 1113
},
{
"epoch": 1.3159493670886075,
"grad_norm": 0.3439159780043492,
"learning_rate": 3.685072282262511e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14666421711444855,
"step": 1300,
"valid_targets_mean": 3587.8,
"valid_targets_min": 1142
},
{
"epoch": 1.321012658227848,
"grad_norm": 0.30506292484752023,
"learning_rate": 3.6812556848863474e-05,
"loss": 0.3253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15456736087799072,
"step": 1305,
"valid_targets_mean": 3908.8,
"valid_targets_min": 1305
},
{
"epoch": 1.3260759493670886,
"grad_norm": 0.32896698136778196,
"learning_rate": 3.6774181012935595e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14750021696090698,
"step": 1310,
"valid_targets_mean": 3579.4,
"valid_targets_min": 696
},
{
"epoch": 1.3311392405063291,
"grad_norm": 0.3494681443588045,
"learning_rate": 3.673559579386653e-05,
"loss": 0.3329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16966864466667175,
"step": 1315,
"valid_targets_mean": 3639.5,
"valid_targets_min": 1136
},
{
"epoch": 1.3362025316455697,
"grad_norm": 0.3191056529939702,
"learning_rate": 3.6696801673294984e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2022847682237625,
"step": 1320,
"valid_targets_mean": 6126.2,
"valid_targets_min": 1760
},
{
"epoch": 1.34126582278481,
"grad_norm": 0.40439808049151743,
"learning_rate": 3.665779913546721e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1815149486064911,
"step": 1325,
"valid_targets_mean": 3929.4,
"valid_targets_min": 1092
},
{
"epoch": 1.3463291139240505,
"grad_norm": 0.29566683990417303,
"learning_rate": 3.6618588667231064e-05,
"loss": 0.3244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440686285495758,
"step": 1330,
"valid_targets_mean": 4236.4,
"valid_targets_min": 1086
},
{
"epoch": 1.351392405063291,
"grad_norm": 0.3344359616665295,
"learning_rate": 3.6579170758029885e-05,
"loss": 0.324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15648147463798523,
"step": 1335,
"valid_targets_mean": 3588.6,
"valid_targets_min": 1635
},
{
"epoch": 1.3564556962025316,
"grad_norm": 0.2879031761545053,
"learning_rate": 3.653954589989637e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16395555436611176,
"step": 1340,
"valid_targets_mean": 4903.5,
"valid_targets_min": 1401
},
{
"epoch": 1.3615189873417721,
"grad_norm": 0.3076034430138629,
"learning_rate": 3.649971458744645e-05,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14920540153980255,
"step": 1345,
"valid_targets_mean": 4404.3,
"valid_targets_min": 1479
},
{
"epoch": 1.3665822784810127,
"grad_norm": 0.37728920822736073,
"learning_rate": 3.645967731787313e-05,
"loss": 0.3273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16919684410095215,
"step": 1350,
"valid_targets_mean": 3916.3,
"valid_targets_min": 1491
},
{
"epoch": 1.3716455696202532,
"grad_norm": 0.2944205665752948,
"learning_rate": 3.641943459094026e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20011773705482483,
"step": 1355,
"valid_targets_mean": 6104.8,
"valid_targets_min": 1110
},
{
"epoch": 1.3767088607594937,
"grad_norm": 0.31998862065193057,
"learning_rate": 3.63789869089763e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17156195640563965,
"step": 1360,
"valid_targets_mean": 4435.9,
"valid_targets_min": 1056
},
{
"epoch": 1.3817721518987343,
"grad_norm": 0.3359058600132148,
"learning_rate": 3.633833477686805e-05,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1116013303399086,
"step": 1365,
"valid_targets_mean": 2720.7,
"valid_targets_min": 1100
},
{
"epoch": 1.3868354430379748,
"grad_norm": 0.3167283899854193,
"learning_rate": 3.629747870205438e-05,
"loss": 0.3375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15123698115348816,
"step": 1370,
"valid_targets_mean": 4809.0,
"valid_targets_min": 1288
},
{
"epoch": 1.3918987341772153,
"grad_norm": 0.3176638421764831,
"learning_rate": 3.625641919451982e-05,
"loss": 0.3251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.116270050406456,
"step": 1375,
"valid_targets_mean": 3099.4,
"valid_targets_min": 1302
},
{
"epoch": 1.3969620253164556,
"grad_norm": 0.3567607135105218,
"learning_rate": 3.621515676678829e-05,
"loss": 0.3403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18901550769805908,
"step": 1380,
"valid_targets_mean": 4234.6,
"valid_targets_min": 1078
},
{
"epoch": 1.4020253164556962,
"grad_norm": 0.33150001426521647,
"learning_rate": 3.617369193391663e-05,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14285731315612793,
"step": 1385,
"valid_targets_mean": 3883.8,
"valid_targets_min": 1292
},
{
"epoch": 1.4070886075949367,
"grad_norm": 0.32040861152447253,
"learning_rate": 3.61320252134882e-05,
"loss": 0.3202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15014925599098206,
"step": 1390,
"valid_targets_mean": 4633.4,
"valid_targets_min": 1150
},
{
"epoch": 1.4121518987341772,
"grad_norm": 0.3364407178912512,
"learning_rate": 3.6090157125606405e-05,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19701796770095825,
"step": 1395,
"valid_targets_mean": 4298.4,
"valid_targets_min": 1055
},
{
"epoch": 1.4172151898734178,
"grad_norm": 0.2998592984370577,
"learning_rate": 3.604808819288823e-05,
"loss": 0.3213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21334891021251678,
"step": 1400,
"valid_targets_mean": 6774.6,
"valid_targets_min": 1471
},
{
"epoch": 1.4222784810126583,
"grad_norm": 0.32266679078127786,
"learning_rate": 3.600581894045768e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10229863971471786,
"step": 1405,
"valid_targets_mean": 2818.3,
"valid_targets_min": 1002
},
{
"epoch": 1.4273417721518986,
"grad_norm": 0.2989355644726402,
"learning_rate": 3.596334989593927e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16216593980789185,
"step": 1410,
"valid_targets_mean": 4271.4,
"valid_targets_min": 773
},
{
"epoch": 1.4324050632911391,
"grad_norm": 0.33686789223908364,
"learning_rate": 3.5920681589451385e-05,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16129520535469055,
"step": 1415,
"valid_targets_mean": 3987.1,
"valid_targets_min": 776
},
{
"epoch": 1.4374683544303797,
"grad_norm": 0.2948991655130385,
"learning_rate": 3.58778145535997e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14479148387908936,
"step": 1420,
"valid_targets_mean": 4191.2,
"valid_targets_min": 1049
},
{
"epoch": 1.4425316455696202,
"grad_norm": 0.278153706236472,
"learning_rate": 3.583474932347054e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15073184669017792,
"step": 1425,
"valid_targets_mean": 5600.0,
"valid_targets_min": 978
},
{
"epoch": 1.4475949367088607,
"grad_norm": 0.2989703152632012,
"learning_rate": 3.5791486436624145e-05,
"loss": 0.322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1581433117389679,
"step": 1430,
"valid_targets_mean": 4557.4,
"valid_targets_min": 1311
},
{
"epoch": 1.4526582278481013,
"grad_norm": 0.3156763543957603,
"learning_rate": 3.5748026433088036e-05,
"loss": 0.3234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1554793417453766,
"step": 1435,
"valid_targets_mean": 5105.0,
"valid_targets_min": 1086
},
{
"epoch": 1.4577215189873418,
"grad_norm": 0.30549649598454104,
"learning_rate": 3.5704369855350226e-05,
"loss": 0.3285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10838840901851654,
"step": 1440,
"valid_targets_mean": 2855.1,
"valid_targets_min": 1382
},
{
"epoch": 1.4627848101265823,
"grad_norm": 0.37394597619150627,
"learning_rate": 3.566051724835245e-05,
"loss": 0.3409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13602185249328613,
"step": 1445,
"valid_targets_mean": 3419.4,
"valid_targets_min": 1146
},
{
"epoch": 1.4678481012658229,
"grad_norm": 0.3156375413907948,
"learning_rate": 3.5616469159483363e-05,
"loss": 0.3224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14657479524612427,
"step": 1450,
"valid_targets_mean": 4287.6,
"valid_targets_min": 1162
},
{
"epoch": 1.4729113924050634,
"grad_norm": 0.32282455141307365,
"learning_rate": 3.5572226138571753e-05,
"loss": 0.3428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21434099972248077,
"step": 1455,
"valid_targets_mean": 6099.5,
"valid_targets_min": 1650
},
{
"epoch": 1.4779746835443037,
"grad_norm": 0.3934165636040704,
"learning_rate": 3.5527788737879595e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13554619252681732,
"step": 1460,
"valid_targets_mean": 3898.6,
"valid_targets_min": 749
},
{
"epoch": 1.4830379746835443,
"grad_norm": 0.3532333332147838,
"learning_rate": 3.548315751209524e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1423749029636383,
"step": 1465,
"valid_targets_mean": 3396.2,
"valid_targets_min": 1245
},
{
"epoch": 1.4881012658227848,
"grad_norm": 0.3046035862379382,
"learning_rate": 3.543833301832642e-05,
"loss": 0.3092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11005077511072159,
"step": 1470,
"valid_targets_mean": 3165.8,
"valid_targets_min": 1018
},
{
"epoch": 1.4931645569620253,
"grad_norm": 0.2934515113132098,
"learning_rate": 3.539331581609337e-05,
"loss": 0.3228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16373209655284882,
"step": 1475,
"valid_targets_mean": 5422.3,
"valid_targets_min": 938
},
{
"epoch": 1.4982278481012659,
"grad_norm": 0.29330851366159866,
"learning_rate": 3.5348106467321756e-05,
"loss": 0.3204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1334601640701294,
"step": 1480,
"valid_targets_mean": 4623.2,
"valid_targets_min": 1060
},
{
"epoch": 1.5032911392405062,
"grad_norm": 0.3494149115756711,
"learning_rate": 3.530270553633574e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14463084936141968,
"step": 1485,
"valid_targets_mean": 3681.4,
"valid_targets_min": 1175
},
{
"epoch": 1.5083544303797467,
"grad_norm": 0.34094476372572885,
"learning_rate": 3.5257113589850895e-05,
"loss": 0.3283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13542452454566956,
"step": 1490,
"valid_targets_mean": 3142.8,
"valid_targets_min": 1338
},
{
"epoch": 1.5134177215189872,
"grad_norm": 0.33689606267312805,
"learning_rate": 3.521133119696712e-05,
"loss": 0.3264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16328886151313782,
"step": 1495,
"valid_targets_mean": 4708.0,
"valid_targets_min": 1214
},
{
"epoch": 1.5184810126582278,
"grad_norm": 0.8587040130178458,
"learning_rate": 3.516535892916159e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.166406512260437,
"step": 1500,
"valid_targets_mean": 4267.1,
"valid_targets_min": 1066
},
{
"epoch": 1.5235443037974683,
"grad_norm": 0.31747165527732263,
"learning_rate": 3.5119197360281553e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1378452181816101,
"step": 1505,
"valid_targets_mean": 3656.2,
"valid_targets_min": 1064
},
{
"epoch": 1.5286075949367088,
"grad_norm": 0.3521429432867297,
"learning_rate": 3.507284706653722e-05,
"loss": 0.3369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22082693874835968,
"step": 1510,
"valid_targets_mean": 4618.8,
"valid_targets_min": 1392
},
{
"epoch": 1.5336708860759494,
"grad_norm": 0.3319407091362445,
"learning_rate": 3.5026308626494545e-05,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18031668663024902,
"step": 1515,
"valid_targets_mean": 3750.2,
"valid_targets_min": 977
},
{
"epoch": 1.53873417721519,
"grad_norm": 0.33498834727615584,
"learning_rate": 3.497958262106801e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1643165647983551,
"step": 1520,
"valid_targets_mean": 3328.2,
"valid_targets_min": 1474
},
{
"epoch": 1.5437974683544304,
"grad_norm": 0.3537186281988192,
"learning_rate": 3.493266963351339e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1584773063659668,
"step": 1525,
"valid_targets_mean": 3274.9,
"valid_targets_min": 1245
},
{
"epoch": 1.548860759493671,
"grad_norm": 0.30657928098680826,
"learning_rate": 3.4885570249420454e-05,
"loss": 0.3272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1703530102968216,
"step": 1530,
"valid_targets_mean": 5461.6,
"valid_targets_min": 1154
},
{
"epoch": 1.5539240506329115,
"grad_norm": 0.338680368171272,
"learning_rate": 3.483828505670563e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15479744970798492,
"step": 1535,
"valid_targets_mean": 4522.8,
"valid_targets_min": 1326
},
{
"epoch": 1.558987341772152,
"grad_norm": 0.369309200288726,
"learning_rate": 3.479081464560475e-05,
"loss": 0.3191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12721368670463562,
"step": 1540,
"valid_targets_mean": 2568.1,
"valid_targets_min": 1187
},
{
"epoch": 1.5640506329113926,
"grad_norm": 0.3519884099657949,
"learning_rate": 3.474315960866558e-05,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21022453904151917,
"step": 1545,
"valid_targets_mean": 5003.4,
"valid_targets_min": 1333
},
{
"epoch": 1.5691139240506329,
"grad_norm": 0.33365501094495986,
"learning_rate": 3.469532054074049e-05,
"loss": 0.3275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11454639583826065,
"step": 1550,
"valid_targets_mean": 3473.1,
"valid_targets_min": 1181
},
{
"epoch": 1.5741772151898734,
"grad_norm": 0.3487036569312814,
"learning_rate": 3.464729803897902e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0789409726858139,
"step": 1555,
"valid_targets_mean": 2519.6,
"valid_targets_min": 1102
},
{
"epoch": 1.579240506329114,
"grad_norm": 0.33603816281790033,
"learning_rate": 3.4599092702820394e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11025889217853546,
"step": 1560,
"valid_targets_mean": 2999.4,
"valid_targets_min": 1318
},
{
"epoch": 1.5843037974683545,
"grad_norm": 0.33746214929234886,
"learning_rate": 3.4550705133986085e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1540479212999344,
"step": 1565,
"valid_targets_mean": 3550.0,
"valid_targets_min": 1130
},
{
"epoch": 1.5893670886075948,
"grad_norm": 0.3700007824527567,
"learning_rate": 3.450213593647226e-05,
"loss": 0.3235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.179176926612854,
"step": 1570,
"valid_targets_mean": 3797.9,
"valid_targets_min": 1468
},
{
"epoch": 1.5944303797468353,
"grad_norm": 0.43557784622964635,
"learning_rate": 3.445338571654227e-05,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12111867964267731,
"step": 1575,
"valid_targets_mean": 3459.7,
"valid_targets_min": 1321
},
{
"epoch": 1.5994936708860759,
"grad_norm": 0.3234005911683535,
"learning_rate": 3.440445508271907e-05,
"loss": 0.3303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11545059829950333,
"step": 1580,
"valid_targets_mean": 3151.1,
"valid_targets_min": 966
},
{
"epoch": 1.6045569620253164,
"grad_norm": 0.31481487050082757,
"learning_rate": 3.435534464577762e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14349615573883057,
"step": 1585,
"valid_targets_mean": 4098.8,
"valid_targets_min": 1553
},
{
"epoch": 1.609620253164557,
"grad_norm": 0.3263020753319533,
"learning_rate": 3.4306055018737274e-05,
"loss": 0.3262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1886909306049347,
"step": 1590,
"valid_targets_mean": 5531.9,
"valid_targets_min": 1290
},
{
"epoch": 1.6146835443037975,
"grad_norm": 0.3440773642804762,
"learning_rate": 3.425658681685412e-05,
"loss": 0.3247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17707081139087677,
"step": 1595,
"valid_targets_mean": 3534.2,
"valid_targets_min": 1301
},
{
"epoch": 1.619746835443038,
"grad_norm": 0.32440177535383535,
"learning_rate": 3.420694065761328e-05,
"loss": 0.3282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16896334290504456,
"step": 1600,
"valid_targets_mean": 4122.1,
"valid_targets_min": 965
},
{
"epoch": 1.6248101265822785,
"grad_norm": 0.2928837040048521,
"learning_rate": 3.415711716072126e-05,
"loss": 0.3318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17395883798599243,
"step": 1605,
"valid_targets_mean": 5510.7,
"valid_targets_min": 1836
},
{
"epoch": 1.629873417721519,
"grad_norm": 0.29996111358110616,
"learning_rate": 3.4107116948098155e-05,
"loss": 0.3208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16087687015533447,
"step": 1610,
"valid_targets_mean": 5291.1,
"valid_targets_min": 812
},
{
"epoch": 1.6349367088607596,
"grad_norm": 0.3391636106718898,
"learning_rate": 3.4056940643869905e-05,
"loss": 0.328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12102165073156357,
"step": 1615,
"valid_targets_mean": 2991.2,
"valid_targets_min": 987
},
{
"epoch": 1.6400000000000001,
"grad_norm": 0.30250385799846535,
"learning_rate": 3.400658887436051e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15453828871250153,
"step": 1620,
"valid_targets_mean": 4200.3,
"valid_targets_min": 1171
},
{
"epoch": 1.6450632911392407,
"grad_norm": 0.31602413877978186,
"learning_rate": 3.3956062268084215e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1669228971004486,
"step": 1625,
"valid_targets_mean": 4059.0,
"valid_targets_min": 1494
},
{
"epoch": 1.650126582278481,
"grad_norm": 0.3430073741627476,
"learning_rate": 3.390536145573766e-05,
"loss": 0.3311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15472730994224548,
"step": 1630,
"valid_targets_mean": 4020.9,
"valid_targets_min": 1121
},
{
"epoch": 1.6551898734177215,
"grad_norm": 0.30844530157775457,
"learning_rate": 3.385448707019199e-05,
"loss": 0.3353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13865000009536743,
"step": 1635,
"valid_targets_mean": 3493.1,
"valid_targets_min": 1516
},
{
"epoch": 1.660253164556962,
"grad_norm": 0.29309820401088355,
"learning_rate": 3.3803439746484996e-05,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18344934284687042,
"step": 1640,
"valid_targets_mean": 5938.8,
"valid_targets_min": 1370
},
{
"epoch": 1.6653164556962026,
"grad_norm": 0.2917099753276015,
"learning_rate": 3.375222012181315e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15374572575092316,
"step": 1645,
"valid_targets_mean": 4424.8,
"valid_targets_min": 1247
},
{
"epoch": 1.6703797468354429,
"grad_norm": 0.31174326634371047,
"learning_rate": 3.370082883552366e-05,
"loss": 0.3248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18676675856113434,
"step": 1650,
"valid_targets_mean": 4577.7,
"valid_targets_min": 1153
},
{
"epoch": 1.6754430379746834,
"grad_norm": 0.2937468748877549,
"learning_rate": 3.364926652910651e-05,
"loss": 0.328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14714813232421875,
"step": 1655,
"valid_targets_mean": 4791.8,
"valid_targets_min": 1213
},
{
"epoch": 1.680506329113924,
"grad_norm": 0.2879601888076102,
"learning_rate": 3.359753384618641e-05,
"loss": 0.3339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19825273752212524,
"step": 1660,
"valid_targets_mean": 6597.8,
"valid_targets_min": 1694
},
{
"epoch": 1.6855696202531645,
"grad_norm": 0.28734174588103684,
"learning_rate": 3.354563143251483e-05,
"loss": 0.3251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13350191712379456,
"step": 1665,
"valid_targets_mean": 4193.6,
"valid_targets_min": 1311
},
{
"epoch": 1.690632911392405,
"grad_norm": 0.3163624678749021,
"learning_rate": 3.3493559935961854e-05,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19836895167827606,
"step": 1670,
"valid_targets_mean": 4911.9,
"valid_targets_min": 1235
},
{
"epoch": 1.6956962025316455,
"grad_norm": 0.26723388677186943,
"learning_rate": 3.344132000650817e-05,
"loss": 0.3229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14954085648059845,
"step": 1675,
"valid_targets_mean": 5300.8,
"valid_targets_min": 1208
},
{
"epoch": 1.700759493670886,
"grad_norm": 0.3367011427653921,
"learning_rate": 3.3388912296236906e-05,
"loss": 0.3369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15727460384368896,
"step": 1680,
"valid_targets_mean": 3988.7,
"valid_targets_min": 1264
},
{
"epoch": 1.7058227848101266,
"grad_norm": 0.46226016366837236,
"learning_rate": 3.3336337459325526e-05,
"loss": 0.3267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18564224243164062,
"step": 1685,
"valid_targets_mean": 6143.1,
"valid_targets_min": 1246
},
{
"epoch": 1.7108860759493671,
"grad_norm": 0.3175894026472926,
"learning_rate": 3.328359615203762e-05,
"loss": 0.3183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19139517843723297,
"step": 1690,
"valid_targets_mean": 5133.2,
"valid_targets_min": 1080
},
{
"epoch": 1.7159493670886077,
"grad_norm": 0.27972490266827565,
"learning_rate": 3.323068903271476e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11912492662668228,
"step": 1695,
"valid_targets_mean": 4236.9,
"valid_targets_min": 1213
},
{
"epoch": 1.7210126582278482,
"grad_norm": 0.28905133463909916,
"learning_rate": 3.317761676176825e-05,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1582462191581726,
"step": 1700,
"valid_targets_mean": 5365.8,
"valid_targets_min": 1347
},
{
"epoch": 1.7260759493670887,
"grad_norm": 0.2928951231194897,
"learning_rate": 3.31243800016709e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16399666666984558,
"step": 1705,
"valid_targets_mean": 4478.1,
"valid_targets_min": 913
},
{
"epoch": 1.7311392405063293,
"grad_norm": 0.3067909993527847,
"learning_rate": 3.307097941694876e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1793975532054901,
"step": 1710,
"valid_targets_mean": 4923.8,
"valid_targets_min": 1793
},
{
"epoch": 1.7362025316455696,
"grad_norm": 0.29679310025747774,
"learning_rate": 3.3017415674172795e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1398848444223404,
"step": 1715,
"valid_targets_mean": 3729.8,
"valid_targets_min": 1281
},
{
"epoch": 1.7412658227848101,
"grad_norm": 0.33157110353633035,
"learning_rate": 3.296368944195059e-05,
"loss": 0.3258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16532516479492188,
"step": 1720,
"valid_targets_mean": 4614.5,
"valid_targets_min": 1146
},
{
"epoch": 1.7463291139240507,
"grad_norm": 0.3237383031466305,
"learning_rate": 3.2909801390918e-05,
"loss": 0.3165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16484834253787994,
"step": 1725,
"valid_targets_mean": 4277.1,
"valid_targets_min": 1022
},
{
"epoch": 1.7513924050632912,
"grad_norm": 0.30303998742275196,
"learning_rate": 3.285575219373079e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1231764703989029,
"step": 1730,
"valid_targets_mean": 3492.9,
"valid_targets_min": 908
},
{
"epoch": 1.7564556962025315,
"grad_norm": 0.3131204074959935,
"learning_rate": 3.2801542525056204e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16018734872341156,
"step": 1735,
"valid_targets_mean": 4216.1,
"valid_targets_min": 909
},
{
"epoch": 1.761518987341772,
"grad_norm": 0.5226006047690179,
"learning_rate": 3.27471730615646e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13336879014968872,
"step": 1740,
"valid_targets_mean": 3926.2,
"valid_targets_min": 1825
},
{
"epoch": 1.7665822784810126,
"grad_norm": 0.288468699839479,
"learning_rate": 3.2692644481920926e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1637478768825531,
"step": 1745,
"valid_targets_mean": 5375.8,
"valid_targets_min": 1193
},
{
"epoch": 1.771645569620253,
"grad_norm": 0.3345448593431147,
"learning_rate": 3.263795746677633e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1924804151058197,
"step": 1750,
"valid_targets_mean": 4262.6,
"valid_targets_min": 1246
},
{
"epoch": 1.7767088607594936,
"grad_norm": 0.31362215927542564,
"learning_rate": 3.258311269875959e-05,
"loss": 0.3295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17079243063926697,
"step": 1755,
"valid_targets_mean": 4860.1,
"valid_targets_min": 1270
},
{
"epoch": 1.7817721518987342,
"grad_norm": 0.2881402537381144,
"learning_rate": 3.2528110862468664e-05,
"loss": 0.3212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1843501329421997,
"step": 1760,
"valid_targets_mean": 5736.6,
"valid_targets_min": 1442
},
{
"epoch": 1.7868354430379747,
"grad_norm": 0.33940507923082636,
"learning_rate": 3.247295264446209e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14896419644355774,
"step": 1765,
"valid_targets_mean": 4003.1,
"valid_targets_min": 960
},
{
"epoch": 1.7918987341772152,
"grad_norm": 0.305481958944062,
"learning_rate": 3.241763873325044e-05,
"loss": 0.3321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1464659869670868,
"step": 1770,
"valid_targets_mean": 4571.4,
"valid_targets_min": 1342
},
{
"epoch": 1.7969620253164558,
"grad_norm": 0.3372959294620817,
"learning_rate": 3.2362169819287714e-05,
"loss": 0.3198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17976534366607666,
"step": 1775,
"valid_targets_mean": 4028.4,
"valid_targets_min": 1261
},
{
"epoch": 1.8020253164556963,
"grad_norm": 0.3104430678347615,
"learning_rate": 3.2306546594962744e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16419640183448792,
"step": 1780,
"valid_targets_mean": 4230.2,
"valid_targets_min": 1132
},
{
"epoch": 1.8070886075949368,
"grad_norm": 0.3241781257834898,
"learning_rate": 3.225076975459051e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21455496549606323,
"step": 1785,
"valid_targets_mean": 7327.5,
"valid_targets_min": 1343
},
{
"epoch": 1.8121518987341774,
"grad_norm": 0.3169044936479542,
"learning_rate": 3.219483999440354e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12079709023237228,
"step": 1790,
"valid_targets_mean": 3173.1,
"valid_targets_min": 1329
},
{
"epoch": 1.8172151898734177,
"grad_norm": 0.331980276874436,
"learning_rate": 3.213875801254314e-05,
"loss": 0.3276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14299997687339783,
"step": 1795,
"valid_targets_mean": 3476.8,
"valid_targets_min": 942
},
{
"epoch": 1.8222784810126582,
"grad_norm": 0.25978521097127444,
"learning_rate": 3.2082524509050723e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14637430012226105,
"step": 1800,
"valid_targets_mean": 5356.4,
"valid_targets_min": 1492
},
{
"epoch": 1.8273417721518987,
"grad_norm": 0.4563427674089283,
"learning_rate": 3.20261401858591e-05,
"loss": 0.3246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16923454403877258,
"step": 1805,
"valid_targets_mean": 4621.6,
"valid_targets_min": 954
},
{
"epoch": 1.8324050632911393,
"grad_norm": 0.28306126650762187,
"learning_rate": 3.196960574678363e-05,
"loss": 0.3335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11796549707651138,
"step": 1810,
"valid_targets_mean": 4214.6,
"valid_targets_min": 1296
},
{
"epoch": 1.8374683544303796,
"grad_norm": 0.32499866336342004,
"learning_rate": 3.191292189751353e-05,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1776324212551117,
"step": 1815,
"valid_targets_mean": 5706.0,
"valid_targets_min": 1377
},
{
"epoch": 1.8425316455696201,
"grad_norm": 0.29118017187843964,
"learning_rate": 3.185608934560301e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12048833072185516,
"step": 1820,
"valid_targets_mean": 3490.6,
"valid_targets_min": 1465
},
{
"epoch": 1.8475949367088607,
"grad_norm": 0.3114271880772345,
"learning_rate": 3.1799108800462466e-05,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14511121809482574,
"step": 1825,
"valid_targets_mean": 3770.2,
"valid_targets_min": 1165
},
{
"epoch": 1.8526582278481012,
"grad_norm": 0.28385385385120393,
"learning_rate": 3.174198097334959e-05,
"loss": 0.3248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16951501369476318,
"step": 1830,
"valid_targets_mean": 4812.1,
"valid_targets_min": 995
},
{
"epoch": 1.8577215189873417,
"grad_norm": 0.33205815359378843,
"learning_rate": 3.168470657736053e-05,
"loss": 0.3306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1585332751274109,
"step": 1835,
"valid_targets_mean": 5364.6,
"valid_targets_min": 1166
},
{
"epoch": 1.8627848101265823,
"grad_norm": 0.31689534847164214,
"learning_rate": 3.162728632742098e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16908031702041626,
"step": 1840,
"valid_targets_mean": 4225.1,
"valid_targets_min": 1101
},
{
"epoch": 1.8678481012658228,
"grad_norm": 0.3087921045352938,
"learning_rate": 3.1569720940277267e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17665991187095642,
"step": 1845,
"valid_targets_mean": 4580.1,
"valid_targets_min": 1284
},
{
"epoch": 1.8729113924050633,
"grad_norm": 0.28162350739466746,
"learning_rate": 3.151201113448735e-05,
"loss": 0.3198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16834816336631775,
"step": 1850,
"valid_targets_mean": 5581.1,
"valid_targets_min": 1362
},
{
"epoch": 1.8779746835443039,
"grad_norm": 0.33622728572725646,
"learning_rate": 3.1454157630411905e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13378959894180298,
"step": 1855,
"valid_targets_mean": 3264.8,
"valid_targets_min": 1178
},
{
"epoch": 1.8830379746835444,
"grad_norm": 0.2888883767197038,
"learning_rate": 3.1396161150205324e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15173028409481049,
"step": 1860,
"valid_targets_mean": 5245.6,
"valid_targets_min": 1061
},
{
"epoch": 1.888101265822785,
"grad_norm": 0.3008873149690533,
"learning_rate": 3.133802241780669e-05,
"loss": 0.3417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.168132483959198,
"step": 1865,
"valid_targets_mean": 5342.9,
"valid_targets_min": 1360
},
{
"epoch": 1.8931645569620255,
"grad_norm": 0.30961408751335806,
"learning_rate": 3.127974215893075e-05,
"loss": 0.3319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15519672632217407,
"step": 1870,
"valid_targets_mean": 4829.4,
"valid_targets_min": 1051
},
{
"epoch": 1.8982278481012658,
"grad_norm": 0.3375894079078535,
"learning_rate": 3.1221321101058826e-05,
"loss": 0.3233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2031598687171936,
"step": 1875,
"valid_targets_mean": 4846.2,
"valid_targets_min": 1616
},
{
"epoch": 1.9032911392405063,
"grad_norm": 0.30102939403192525,
"learning_rate": 3.116275997342979e-05,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1768466830253601,
"step": 1880,
"valid_targets_mean": 5417.4,
"valid_targets_min": 1149
},
{
"epoch": 1.9083544303797468,
"grad_norm": 0.31204461528240096,
"learning_rate": 3.110405950703091e-05,
"loss": 0.3286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15786431729793549,
"step": 1885,
"valid_targets_mean": 4424.1,
"valid_targets_min": 1590
},
{
"epoch": 1.9134177215189874,
"grad_norm": 0.3212411559315451,
"learning_rate": 3.104522043458875e-05,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15173178911209106,
"step": 1890,
"valid_targets_mean": 3546.5,
"valid_targets_min": 1048
},
{
"epoch": 1.918481012658228,
"grad_norm": 0.3477054279687247,
"learning_rate": 3.098624349056003e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09834770858287811,
"step": 1895,
"valid_targets_mean": 3314.4,
"valid_targets_min": 1081
},
{
"epoch": 1.9235443037974682,
"grad_norm": 0.3224350947488976,
"learning_rate": 3.0927129411122433e-05,
"loss": 0.3307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1967785656452179,
"step": 1900,
"valid_targets_mean": 5401.0,
"valid_targets_min": 1631
},
{
"epoch": 1.9286075949367087,
"grad_norm": 0.3407210065894635,
"learning_rate": 3.086787893416543e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15977072715759277,
"step": 1905,
"valid_targets_mean": 3843.9,
"valid_targets_min": 1465
},
{
"epoch": 1.9336708860759493,
"grad_norm": 0.3048824087454436,
"learning_rate": 3.080849279928108e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21388033032417297,
"step": 1910,
"valid_targets_mean": 5811.2,
"valid_targets_min": 735
},
{
"epoch": 1.9387341772151898,
"grad_norm": 0.3220507717171466,
"learning_rate": 3.074897174775478e-05,
"loss": 0.3231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17468535900115967,
"step": 1915,
"valid_targets_mean": 4189.4,
"valid_targets_min": 1442
},
{
"epoch": 1.9437974683544303,
"grad_norm": 0.33220201972445723,
"learning_rate": 3.0689316522556026e-05,
"loss": 0.3242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1948956400156021,
"step": 1920,
"valid_targets_mean": 4742.3,
"valid_targets_min": 1598
},
{
"epoch": 1.9488607594936709,
"grad_norm": 0.32448507249493624,
"learning_rate": 3.062952786832912e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440562605857849,
"step": 1925,
"valid_targets_mean": 4186.6,
"valid_targets_min": 1640
},
{
"epoch": 1.9539240506329114,
"grad_norm": 0.29766519811078285,
"learning_rate": 3.05696065313839e-05,
"loss": 0.3306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18304754793643951,
"step": 1930,
"valid_targets_mean": 6132.7,
"valid_targets_min": 1516
},
{
"epoch": 1.958987341772152,
"grad_norm": 0.2949900786324887,
"learning_rate": 3.050955325968641e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15778782963752747,
"step": 1935,
"valid_targets_mean": 5078.4,
"valid_targets_min": 1196
},
{
"epoch": 1.9640506329113925,
"grad_norm": 0.3263199970381054,
"learning_rate": 3.0449368802849553e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14029563963413239,
"step": 1940,
"valid_targets_mean": 4289.6,
"valid_targets_min": 1207
},
{
"epoch": 1.969113924050633,
"grad_norm": 0.3116697424009326,
"learning_rate": 3.0389053912123755e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1622355878353119,
"step": 1945,
"valid_targets_mean": 4043.3,
"valid_targets_min": 1217
},
{
"epoch": 1.9741772151898735,
"grad_norm": 0.33957146598689614,
"learning_rate": 3.0328609340387584e-05,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1829889565706253,
"step": 1950,
"valid_targets_mean": 3790.2,
"valid_targets_min": 768
},
{
"epoch": 1.979240506329114,
"grad_norm": 0.31004887940586384,
"learning_rate": 3.026803584213834e-05,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1571284979581833,
"step": 1955,
"valid_targets_mean": 4538.4,
"valid_targets_min": 956
},
{
"epoch": 1.9843037974683544,
"grad_norm": 0.2945095160712328,
"learning_rate": 3.0207334173482635e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14519169926643372,
"step": 1960,
"valid_targets_mean": 3616.2,
"valid_targets_min": 1058
},
{
"epoch": 1.989367088607595,
"grad_norm": 0.29690655635239654,
"learning_rate": 3.0146505092126987e-05,
"loss": 0.3159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14115923643112183,
"step": 1965,
"valid_targets_mean": 4046.1,
"valid_targets_min": 1832
},
{
"epoch": 1.9944303797468355,
"grad_norm": 0.3836659337432429,
"learning_rate": 3.0085549357368316e-05,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16044825315475464,
"step": 1970,
"valid_targets_mean": 4667.9,
"valid_targets_min": 1443
},
{
"epoch": 1.999493670886076,
"grad_norm": 0.3322124150108135,
"learning_rate": 3.0024467730084508e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12640810012817383,
"step": 1975,
"valid_targets_mean": 3170.9,
"valid_targets_min": 832
},
{
"epoch": 2.0040506329113925,
"grad_norm": 0.3291075554103832,
"learning_rate": 2.996326097272487e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16433456540107727,
"step": 1980,
"valid_targets_mean": 4258.9,
"valid_targets_min": 1370
},
{
"epoch": 2.009113924050633,
"grad_norm": 0.28624539538450133,
"learning_rate": 2.9901929849300676e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.156062513589859,
"step": 1985,
"valid_targets_mean": 5479.2,
"valid_targets_min": 1383
},
{
"epoch": 2.0141772151898736,
"grad_norm": 0.31864237413570884,
"learning_rate": 2.984047512537557e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17700161039829254,
"step": 1990,
"valid_targets_mean": 4326.2,
"valid_targets_min": 1491
},
{
"epoch": 2.019240506329114,
"grad_norm": 0.29138155253699194,
"learning_rate": 2.977889756805604e-05,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19598735868930817,
"step": 1995,
"valid_targets_mean": 5823.9,
"valid_targets_min": 1470
},
{
"epoch": 2.0243037974683546,
"grad_norm": 0.32618376749689376,
"learning_rate": 2.9717197945981844e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14639677107334137,
"step": 2000,
"valid_targets_mean": 3956.3,
"valid_targets_min": 1251
},
{
"epoch": 2.0293670886075947,
"grad_norm": 0.3231822134904899,
"learning_rate": 2.9655377029316415e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1973341703414917,
"step": 2005,
"valid_targets_mean": 6070.5,
"valid_targets_min": 1268
},
{
"epoch": 2.0344303797468353,
"grad_norm": 0.4445885950556669,
"learning_rate": 2.9593435589737212e-05,
"loss": 0.3081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1424170434474945,
"step": 2010,
"valid_targets_mean": 3355.1,
"valid_targets_min": 1257
},
{
"epoch": 2.039493670886076,
"grad_norm": 0.31012702805843667,
"learning_rate": 2.9531374400426158e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17267721891403198,
"step": 2015,
"valid_targets_mean": 5018.6,
"valid_targets_min": 803
},
{
"epoch": 2.0445569620253163,
"grad_norm": 0.27456099255552485,
"learning_rate": 2.9469194236059916e-05,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18913531303405762,
"step": 2020,
"valid_targets_mean": 6316.9,
"valid_targets_min": 1565
},
{
"epoch": 2.049620253164557,
"grad_norm": 0.30759866121772944,
"learning_rate": 2.940689587280027e-05,
"loss": 0.3056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17620842158794403,
"step": 2025,
"valid_targets_mean": 5025.1,
"valid_targets_min": 1103
},
{
"epoch": 2.0546835443037974,
"grad_norm": 0.3107498769401775,
"learning_rate": 2.9344480088284403e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14356273412704468,
"step": 2030,
"valid_targets_mean": 3878.3,
"valid_targets_min": 1435
},
{
"epoch": 2.059746835443038,
"grad_norm": 0.3272342894958522,
"learning_rate": 2.9281947661615206e-05,
"loss": 0.3141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11045265197753906,
"step": 2035,
"valid_targets_mean": 2769.6,
"valid_targets_min": 775
},
{
"epoch": 2.0648101265822785,
"grad_norm": 0.28376297804532025,
"learning_rate": 2.921929937335157e-05,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18254786729812622,
"step": 2040,
"valid_targets_mean": 6384.8,
"valid_targets_min": 726
},
{
"epoch": 2.069873417721519,
"grad_norm": 0.3494712370742931,
"learning_rate": 2.9156536005498616e-05,
"loss": 0.3226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15539231896400452,
"step": 2045,
"valid_targets_mean": 3678.8,
"valid_targets_min": 558
},
{
"epoch": 2.0749367088607595,
"grad_norm": 0.36306320132408093,
"learning_rate": 2.909365834149792e-05,
"loss": 0.3188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16074064373970032,
"step": 2050,
"valid_targets_mean": 3803.6,
"valid_targets_min": 992
},
{
"epoch": 2.08,
"grad_norm": 0.28771743850152404,
"learning_rate": 2.903066716621779e-05,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17194947600364685,
"step": 2055,
"valid_targets_mean": 6007.1,
"valid_targets_min": 788
},
{
"epoch": 2.0850632911392406,
"grad_norm": 0.3176958806269076,
"learning_rate": 2.896756326594341e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15832051634788513,
"step": 2060,
"valid_targets_mean": 4807.6,
"valid_targets_min": 1533
},
{
"epoch": 2.090126582278481,
"grad_norm": 0.30643347389492315,
"learning_rate": 2.890434742836706e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17868554592132568,
"step": 2065,
"valid_targets_mean": 5870.9,
"valid_targets_min": 1477
},
{
"epoch": 2.0951898734177217,
"grad_norm": 0.328300503212321,
"learning_rate": 2.8841020442578274e-05,
"loss": 0.3219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15090826153755188,
"step": 2070,
"valid_targets_mean": 4159.4,
"valid_targets_min": 767
},
{
"epoch": 2.100253164556962,
"grad_norm": 0.3116451598810816,
"learning_rate": 2.8777583099053985e-05,
"loss": 0.3096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15223953127861023,
"step": 2075,
"valid_targets_mean": 4922.9,
"valid_targets_min": 1236
},
{
"epoch": 2.1053164556962027,
"grad_norm": 0.32927381366700853,
"learning_rate": 2.871403618964867e-05,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18153706192970276,
"step": 2080,
"valid_targets_mean": 4833.8,
"valid_targets_min": 1513
},
{
"epoch": 2.110379746835443,
"grad_norm": 0.30099077420276216,
"learning_rate": 2.8650380507584444e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11155495047569275,
"step": 2085,
"valid_targets_mean": 3890.5,
"valid_targets_min": 1469
},
{
"epoch": 2.1154430379746834,
"grad_norm": 0.304896658143913,
"learning_rate": 2.8586616847441192e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.143421471118927,
"step": 2090,
"valid_targets_mean": 4747.4,
"valid_targets_min": 849
},
{
"epoch": 2.120506329113924,
"grad_norm": 0.33627609235395134,
"learning_rate": 2.852274600514662e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17665691673755646,
"step": 2095,
"valid_targets_mean": 4558.9,
"valid_targets_min": 1540
},
{
"epoch": 2.1255696202531644,
"grad_norm": 0.3025889533254811,
"learning_rate": 2.8458768777966333e-05,
"loss": 0.3151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16682836413383484,
"step": 2100,
"valid_targets_mean": 5740.6,
"valid_targets_min": 1809
},
{
"epoch": 2.130632911392405,
"grad_norm": 0.3039388867958498,
"learning_rate": 2.8394685964493886e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0811905711889267,
"step": 2105,
"valid_targets_mean": 3185.6,
"valid_targets_min": 1428
},
{
"epoch": 2.1356962025316455,
"grad_norm": 0.34645798201468236,
"learning_rate": 2.8330498364640803e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20455661416053772,
"step": 2110,
"valid_targets_mean": 5101.9,
"valid_targets_min": 1051
},
{
"epoch": 2.140759493670886,
"grad_norm": 0.2965620255799478,
"learning_rate": 2.8266206779626604e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15685412287712097,
"step": 2115,
"valid_targets_mean": 5286.0,
"valid_targets_min": 1289
},
{
"epoch": 2.1458227848101266,
"grad_norm": 0.3555931137634147,
"learning_rate": 2.8201812011968807e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16602477431297302,
"step": 2120,
"valid_targets_mean": 4031.6,
"valid_targets_min": 1147
},
{
"epoch": 2.150886075949367,
"grad_norm": 0.31549642905504277,
"learning_rate": 2.8137314865472896e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2147747278213501,
"step": 2125,
"valid_targets_mean": 5917.6,
"valid_targets_min": 1516
},
{
"epoch": 2.1559493670886076,
"grad_norm": 0.3817360788487001,
"learning_rate": 2.8072716145222295e-05,
"loss": 0.3204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1429363489151001,
"step": 2130,
"valid_targets_mean": 4846.5,
"valid_targets_min": 1233
},
{
"epoch": 2.161012658227848,
"grad_norm": 0.29099253723913165,
"learning_rate": 2.800801665756833e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1667858213186264,
"step": 2135,
"valid_targets_mean": 5250.2,
"valid_targets_min": 1352
},
{
"epoch": 2.1660759493670887,
"grad_norm": 0.31033307443976493,
"learning_rate": 2.794321721012013e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15342216193675995,
"step": 2140,
"valid_targets_mean": 4172.6,
"valid_targets_min": 959
},
{
"epoch": 2.1711392405063292,
"grad_norm": 0.32002549909894445,
"learning_rate": 2.78783186117346e-05,
"loss": 0.3136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1935744285583496,
"step": 2145,
"valid_targets_mean": 5775.0,
"valid_targets_min": 1696
},
{
"epoch": 2.1762025316455698,
"grad_norm": 0.3337487659466844,
"learning_rate": 2.7813321672506268e-05,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19408701360225677,
"step": 2150,
"valid_targets_mean": 5285.5,
"valid_targets_min": 1837
},
{
"epoch": 2.1812658227848103,
"grad_norm": 0.30999599957531293,
"learning_rate": 2.77482272037572e-05,
"loss": 0.3085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16555137932300568,
"step": 2155,
"valid_targets_mean": 4545.2,
"valid_targets_min": 1035
},
{
"epoch": 2.186329113924051,
"grad_norm": 0.32893298945558314,
"learning_rate": 2.768303601802689e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15684665739536285,
"step": 2160,
"valid_targets_mean": 3914.8,
"valid_targets_min": 1135
},
{
"epoch": 2.191392405063291,
"grad_norm": 0.32177861173163685,
"learning_rate": 2.7617748929062084e-05,
"loss": 0.3113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13835042715072632,
"step": 2165,
"valid_targets_mean": 4624.2,
"valid_targets_min": 911
},
{
"epoch": 2.1964556962025314,
"grad_norm": 0.2604316010544582,
"learning_rate": 2.7552366751806624e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14997389912605286,
"step": 2170,
"valid_targets_mean": 6796.2,
"valid_targets_min": 1292
},
{
"epoch": 2.201518987341772,
"grad_norm": 0.30476092949327993,
"learning_rate": 2.7486890302391316e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1621738076210022,
"step": 2175,
"valid_targets_mean": 5079.0,
"valid_targets_min": 1369
},
{
"epoch": 2.2065822784810125,
"grad_norm": 0.3322580301103298,
"learning_rate": 2.7421320398123702e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1476869136095047,
"step": 2180,
"valid_targets_mean": 3784.2,
"valid_targets_min": 1640
},
{
"epoch": 2.211645569620253,
"grad_norm": 0.2990722276821268,
"learning_rate": 2.735565785747787e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13568082451820374,
"step": 2185,
"valid_targets_mean": 4330.4,
"valid_targets_min": 815
},
{
"epoch": 2.2167088607594936,
"grad_norm": 0.30616718547526817,
"learning_rate": 2.728990350008423e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17533037066459656,
"step": 2190,
"valid_targets_mean": 5132.6,
"valid_targets_min": 949
},
{
"epoch": 2.221772151898734,
"grad_norm": 0.28127500881615763,
"learning_rate": 2.722405814671931e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.134933739900589,
"step": 2195,
"valid_targets_mean": 5636.6,
"valid_targets_min": 732
},
{
"epoch": 2.2268354430379746,
"grad_norm": 0.27748602615715384,
"learning_rate": 2.715812261929548e-05,
"loss": 0.3208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1636897474527359,
"step": 2200,
"valid_targets_mean": 5998.6,
"valid_targets_min": 1351
},
{
"epoch": 2.231898734177215,
"grad_norm": 0.3255757575300295,
"learning_rate": 2.7092097740850712e-05,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1682029664516449,
"step": 2205,
"valid_targets_mean": 4255.6,
"valid_targets_min": 1238
},
{
"epoch": 2.2369620253164557,
"grad_norm": 0.30015032841488015,
"learning_rate": 2.7025984335538297e-05,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1712615191936493,
"step": 2210,
"valid_targets_mean": 5242.7,
"valid_targets_min": 968
},
{
"epoch": 2.2420253164556962,
"grad_norm": 0.35257346632541897,
"learning_rate": 2.6959783228616543e-05,
"loss": 0.3258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14988690614700317,
"step": 2215,
"valid_targets_mean": 3744.8,
"valid_targets_min": 1368
},
{
"epoch": 2.247088607594937,
"grad_norm": 0.34270763531215714,
"learning_rate": 2.6893495246438512e-05,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13658785820007324,
"step": 2220,
"valid_targets_mean": 3438.7,
"valid_targets_min": 1173
},
{
"epoch": 2.2521518987341773,
"grad_norm": 0.3370660380071177,
"learning_rate": 2.682712121644168e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1949615478515625,
"step": 2225,
"valid_targets_mean": 4599.9,
"valid_targets_min": 1016
},
{
"epoch": 2.257215189873418,
"grad_norm": 0.348355336462014,
"learning_rate": 2.6760661967137597e-05,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16294927895069122,
"step": 2230,
"valid_targets_mean": 4107.5,
"valid_targets_min": 1022
},
{
"epoch": 2.2622784810126584,
"grad_norm": 0.3249186301351007,
"learning_rate": 2.6694118328101592e-05,
"loss": 0.3144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09672749042510986,
"step": 2235,
"valid_targets_mean": 2920.3,
"valid_targets_min": 950
},
{
"epoch": 2.267341772151899,
"grad_norm": 0.30303571071751967,
"learning_rate": 2.6627491129962343e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442355215549469,
"step": 2240,
"valid_targets_mean": 4454.2,
"valid_targets_min": 1369
},
{
"epoch": 2.2724050632911394,
"grad_norm": 0.31715305103924707,
"learning_rate": 2.6560781204391584e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10361987352371216,
"step": 2245,
"valid_targets_mean": 3143.1,
"valid_targets_min": 1447
},
{
"epoch": 2.27746835443038,
"grad_norm": 0.28484792889639327,
"learning_rate": 2.6493989384093674e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14160794019699097,
"step": 2250,
"valid_targets_mean": 4650.6,
"valid_targets_min": 954
},
{
"epoch": 2.28253164556962,
"grad_norm": 0.2878082890562957,
"learning_rate": 2.642711650279523e-05,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1957184076309204,
"step": 2255,
"valid_targets_mean": 5700.1,
"valid_targets_min": 1450
},
{
"epoch": 2.2875949367088606,
"grad_norm": 0.28921634890872305,
"learning_rate": 2.636016339523472e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1497688591480255,
"step": 2260,
"valid_targets_mean": 5892.9,
"valid_targets_min": 1182
},
{
"epoch": 2.292658227848101,
"grad_norm": 0.374304372121314,
"learning_rate": 2.6293130897152005e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10483106970787048,
"step": 2265,
"valid_targets_mean": 2732.1,
"valid_targets_min": 909
},
{
"epoch": 2.2977215189873417,
"grad_norm": 0.360265224368032,
"learning_rate": 2.6226019845277954e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15251410007476807,
"step": 2270,
"valid_targets_mean": 3089.3,
"valid_targets_min": 1121
},
{
"epoch": 2.302784810126582,
"grad_norm": 0.3076018448534471,
"learning_rate": 2.615883107732398e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10678346455097198,
"step": 2275,
"valid_targets_mean": 3471.9,
"valid_targets_min": 1050
},
{
"epoch": 2.3078481012658227,
"grad_norm": 0.30671877576562406,
"learning_rate": 2.609156543197158e-05,
"loss": 0.3101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18611571192741394,
"step": 2280,
"valid_targets_mean": 5213.1,
"valid_targets_min": 1379
},
{
"epoch": 2.3129113924050633,
"grad_norm": 0.42457395280342314,
"learning_rate": 2.6024223748861883e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17773228883743286,
"step": 2285,
"valid_targets_mean": 5313.4,
"valid_targets_min": 929
},
{
"epoch": 2.317974683544304,
"grad_norm": 0.343397113662205,
"learning_rate": 2.5956806868585136e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1606595367193222,
"step": 2290,
"valid_targets_mean": 3827.6,
"valid_targets_min": 1248
},
{
"epoch": 2.3230379746835443,
"grad_norm": 0.2808278753890521,
"learning_rate": 2.5889315632670247e-05,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11440195143222809,
"step": 2295,
"valid_targets_mean": 3889.9,
"valid_targets_min": 1216
},
{
"epoch": 2.328101265822785,
"grad_norm": 0.3112053561319972,
"learning_rate": 2.582175088357426e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14229443669319153,
"step": 2300,
"valid_targets_mean": 3906.9,
"valid_targets_min": 1129
},
{
"epoch": 2.3331645569620254,
"grad_norm": 0.29738973838136984,
"learning_rate": 2.575411346467185e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12370048463344574,
"step": 2305,
"valid_targets_mean": 4034.3,
"valid_targets_min": 1620
},
{
"epoch": 2.338227848101266,
"grad_norm": 0.3012147807699108,
"learning_rate": 2.568640422024478e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2278967797756195,
"step": 2310,
"valid_targets_mean": 5961.9,
"valid_targets_min": 1399
},
{
"epoch": 2.3432911392405065,
"grad_norm": 0.2922942701946769,
"learning_rate": 2.5618623995471394e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16622743010520935,
"step": 2315,
"valid_targets_mean": 5404.4,
"valid_targets_min": 1235
},
{
"epoch": 2.348354430379747,
"grad_norm": 0.36432427585365534,
"learning_rate": 2.5550773636416008e-05,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1854952722787857,
"step": 2320,
"valid_targets_mean": 3965.4,
"valid_targets_min": 1201
},
{
"epoch": 2.353417721518987,
"grad_norm": 0.33468505049542446,
"learning_rate": 2.548285399001843e-05,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15984870493412018,
"step": 2325,
"valid_targets_mean": 3767.3,
"valid_targets_min": 900
},
{
"epoch": 2.3584810126582276,
"grad_norm": 0.30206170793614096,
"learning_rate": 2.5414865904083314e-05,
"loss": 0.3161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18496757745742798,
"step": 2330,
"valid_targets_mean": 5605.0,
"valid_targets_min": 1244
},
{
"epoch": 2.363544303797468,
"grad_norm": 0.3069574368019458,
"learning_rate": 2.534681022726962e-05,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20892611145973206,
"step": 2335,
"valid_targets_mean": 5443.6,
"valid_targets_min": 1904
},
{
"epoch": 2.3686075949367087,
"grad_norm": 0.324406187683953,
"learning_rate": 2.5278687809080017e-05,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13418112695217133,
"step": 2340,
"valid_targets_mean": 3362.5,
"valid_targets_min": 1043
},
{
"epoch": 2.3736708860759492,
"grad_norm": 0.32283224636579144,
"learning_rate": 2.5210499499850252e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14372019469738007,
"step": 2345,
"valid_targets_mean": 3757.2,
"valid_targets_min": 1046
},
{
"epoch": 2.3787341772151898,
"grad_norm": 0.2954201993306155,
"learning_rate": 2.5142246150738566e-05,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16226419806480408,
"step": 2350,
"valid_targets_mean": 5083.2,
"valid_targets_min": 1909
},
{
"epoch": 2.3837974683544303,
"grad_norm": 0.278033728430402,
"learning_rate": 2.5073928613715053e-05,
"loss": 0.3122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13732075691223145,
"step": 2355,
"valid_targets_mean": 5177.6,
"valid_targets_min": 1378
},
{
"epoch": 2.388860759493671,
"grad_norm": 0.3406821151852307,
"learning_rate": 2.5005547741551045e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1702435463666916,
"step": 2360,
"valid_targets_mean": 3885.0,
"valid_targets_min": 1146
},
{
"epoch": 2.3939240506329114,
"grad_norm": 0.2924901782943758,
"learning_rate": 2.4937104387808434e-05,
"loss": 0.3117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17096886038780212,
"step": 2365,
"valid_targets_mean": 5283.7,
"valid_targets_min": 1374
},
{
"epoch": 2.398987341772152,
"grad_norm": 0.30986779863862535,
"learning_rate": 2.4868599406829045e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17868509888648987,
"step": 2370,
"valid_targets_mean": 4610.5,
"valid_targets_min": 824
},
{
"epoch": 2.4040506329113924,
"grad_norm": 0.2951664773380052,
"learning_rate": 2.4800033653723962e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14138385653495789,
"step": 2375,
"valid_targets_mean": 4383.0,
"valid_targets_min": 1267
},
{
"epoch": 2.409113924050633,
"grad_norm": 0.3206066119244924,
"learning_rate": 2.473140798436285e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.150266632437706,
"step": 2380,
"valid_targets_mean": 3835.7,
"valid_targets_min": 1476
},
{
"epoch": 2.4141772151898735,
"grad_norm": 0.30473370037176944,
"learning_rate": 2.466272325536329e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19058401882648468,
"step": 2385,
"valid_targets_mean": 6384.8,
"valid_targets_min": 935
},
{
"epoch": 2.419240506329114,
"grad_norm": 0.31479938811797176,
"learning_rate": 2.4593980324080054e-05,
"loss": 0.3267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11872898042201996,
"step": 2390,
"valid_targets_mean": 3557.1,
"valid_targets_min": 1099
},
{
"epoch": 2.4243037974683546,
"grad_norm": 0.3392666541666469,
"learning_rate": 2.4525180048594452e-05,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15524475276470184,
"step": 2395,
"valid_targets_mean": 4042.5,
"valid_targets_min": 1334
},
{
"epoch": 2.429367088607595,
"grad_norm": 0.3116160865837986,
"learning_rate": 2.445632328770354e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14736303687095642,
"step": 2400,
"valid_targets_mean": 4778.8,
"valid_targets_min": 1194
},
{
"epoch": 2.4344303797468356,
"grad_norm": 0.3248761370284341,
"learning_rate": 2.438741090090951e-05,
"loss": 0.3148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1985064595937729,
"step": 2405,
"valid_targets_mean": 6140.9,
"valid_targets_min": 1429
},
{
"epoch": 2.439493670886076,
"grad_norm": 0.2819598660386808,
"learning_rate": 2.431844374840886e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13578057289123535,
"step": 2410,
"valid_targets_mean": 4853.0,
"valid_targets_min": 1602
},
{
"epoch": 2.4445569620253167,
"grad_norm": 0.31885986982040326,
"learning_rate": 2.4249422691081722e-05,
"loss": 0.3057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15936186909675598,
"step": 2415,
"valid_targets_mean": 4181.2,
"valid_targets_min": 1349
},
{
"epoch": 2.449620253164557,
"grad_norm": 0.30296726343845826,
"learning_rate": 2.4180348590481075e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12165558338165283,
"step": 2420,
"valid_targets_mean": 3419.1,
"valid_targets_min": 883
},
{
"epoch": 2.4546835443037973,
"grad_norm": 0.309483869681844,
"learning_rate": 2.411122230882203e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1562597155570984,
"step": 2425,
"valid_targets_mean": 4920.2,
"valid_targets_min": 983
},
{
"epoch": 2.459746835443038,
"grad_norm": 1.2885193054997446,
"learning_rate": 2.4042044708971027e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1394486129283905,
"step": 2430,
"valid_targets_mean": 4328.4,
"valid_targets_min": 1162
},
{
"epoch": 2.4648101265822784,
"grad_norm": 0.27206002510649857,
"learning_rate": 2.3972816654435103e-05,
"loss": 0.3161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16065040230751038,
"step": 2435,
"valid_targets_mean": 6525.3,
"valid_targets_min": 1098
},
{
"epoch": 2.469873417721519,
"grad_norm": 0.3427940884240252,
"learning_rate": 2.390353900935107e-05,
"loss": 0.3198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19091764092445374,
"step": 2440,
"valid_targets_mean": 4360.0,
"valid_targets_min": 1133
},
{
"epoch": 2.4749367088607594,
"grad_norm": 0.42327373841330385,
"learning_rate": 2.3834212638474773e-05,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12319037318229675,
"step": 2445,
"valid_targets_mean": 3837.3,
"valid_targets_min": 873
},
{
"epoch": 2.48,
"grad_norm": 0.49287136211086113,
"learning_rate": 2.376483840717026e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15457025170326233,
"step": 2450,
"valid_targets_mean": 3929.6,
"valid_targets_min": 1205
},
{
"epoch": 2.4850632911392405,
"grad_norm": 0.32265608836896076,
"learning_rate": 2.3695417181399004e-05,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13117042183876038,
"step": 2455,
"valid_targets_mean": 3683.8,
"valid_targets_min": 1015
},
{
"epoch": 2.490126582278481,
"grad_norm": 0.28497626230687617,
"learning_rate": 2.362594982770909e-05,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13846123218536377,
"step": 2460,
"valid_targets_mean": 4725.8,
"valid_targets_min": 1651
},
{
"epoch": 2.4951898734177216,
"grad_norm": 0.30556606202877784,
"learning_rate": 2.3556437213224378e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1903924196958542,
"step": 2465,
"valid_targets_mean": 5195.9,
"valid_targets_min": 1317
},
{
"epoch": 2.500253164556962,
"grad_norm": 0.2957801020557521,
"learning_rate": 2.348688020563371e-05,
"loss": 0.3202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15225407481193542,
"step": 2470,
"valid_targets_mean": 4614.5,
"valid_targets_min": 892
},
{
"epoch": 2.5053164556962026,
"grad_norm": 0.29068264222113155,
"learning_rate": 2.3417279673180048e-05,
"loss": 0.312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15005727112293243,
"step": 2475,
"valid_targets_mean": 5253.2,
"valid_targets_min": 1364
},
{
"epoch": 2.510379746835443,
"grad_norm": 0.34824655792906656,
"learning_rate": 2.3347636484649662e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11774547398090363,
"step": 2480,
"valid_targets_mean": 3077.8,
"valid_targets_min": 1062
},
{
"epoch": 2.5154430379746833,
"grad_norm": 0.3255931573908884,
"learning_rate": 2.3277951509361273e-05,
"loss": 0.3317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20479710400104523,
"step": 2485,
"valid_targets_mean": 5133.7,
"valid_targets_min": 1091
},
{
"epoch": 2.520506329113924,
"grad_norm": 0.30263280385351665,
"learning_rate": 2.3208225617155206e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14676184952259064,
"step": 2490,
"valid_targets_mean": 4788.9,
"valid_targets_min": 1004
},
{
"epoch": 2.5255696202531643,
"grad_norm": 0.34344447055299104,
"learning_rate": 2.3138459678382524e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18363483250141144,
"step": 2495,
"valid_targets_mean": 4170.4,
"valid_targets_min": 1007
},
{
"epoch": 2.530632911392405,
"grad_norm": 0.2844384480121892,
"learning_rate": 2.3068654563894183e-05,
"loss": 0.3172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12592104077339172,
"step": 2500,
"valid_targets_mean": 4493.2,
"valid_targets_min": 1334
},
{
"epoch": 2.5356962025316454,
"grad_norm": 0.32631729959150463,
"learning_rate": 2.2998811145030117e-05,
"loss": 0.3101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15357106924057007,
"step": 2505,
"valid_targets_mean": 4361.8,
"valid_targets_min": 1071
},
{
"epoch": 2.540759493670886,
"grad_norm": 0.2650853449197667,
"learning_rate": 2.2928930293608435e-05,
"loss": 0.307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13759788870811462,
"step": 2510,
"valid_targets_mean": 5130.8,
"valid_targets_min": 1080
},
{
"epoch": 2.5458227848101265,
"grad_norm": 0.3267807848788021,
"learning_rate": 2.2859012881914464e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16794613003730774,
"step": 2515,
"valid_targets_mean": 4673.6,
"valid_targets_min": 1083
},
{
"epoch": 2.550886075949367,
"grad_norm": 0.278879282582265,
"learning_rate": 2.278905978268992e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11442182958126068,
"step": 2520,
"valid_targets_mean": 4874.6,
"valid_targets_min": 1101
},
{
"epoch": 2.5559493670886075,
"grad_norm": 0.32085560175743244,
"learning_rate": 2.271907186912196e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12187394499778748,
"step": 2525,
"valid_targets_mean": 3503.1,
"valid_targets_min": 882
},
{
"epoch": 2.561012658227848,
"grad_norm": 0.3284259732307929,
"learning_rate": 2.2649050014832326e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16201844811439514,
"step": 2530,
"valid_targets_mean": 4727.4,
"valid_targets_min": 1505
},
{
"epoch": 2.5660759493670886,
"grad_norm": 0.2991569094124765,
"learning_rate": 2.2578995093866424e-05,
"loss": 0.3126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1367436945438385,
"step": 2535,
"valid_targets_mean": 5286.4,
"valid_targets_min": 1301
},
{
"epoch": 2.571139240506329,
"grad_norm": 0.2923839601296598,
"learning_rate": 2.2508907980682406e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15937817096710205,
"step": 2540,
"valid_targets_mean": 5033.3,
"valid_targets_min": 1409
},
{
"epoch": 2.5762025316455697,
"grad_norm": 0.29834149017437644,
"learning_rate": 2.2438789550140272e-05,
"loss": 0.3208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1662355363368988,
"step": 2545,
"valid_targets_mean": 4474.9,
"valid_targets_min": 1458
},
{
"epoch": 2.58126582278481,
"grad_norm": 0.31248285204558157,
"learning_rate": 2.2368640677490935e-05,
"loss": 0.3111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12987586855888367,
"step": 2550,
"valid_targets_mean": 4253.7,
"valid_targets_min": 1334
},
{
"epoch": 2.5863291139240507,
"grad_norm": 0.2913592791130016,
"learning_rate": 2.2298462238365293e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20642492175102234,
"step": 2555,
"valid_targets_mean": 6304.3,
"valid_targets_min": 1349
},
{
"epoch": 2.5913924050632913,
"grad_norm": 0.35349413261981677,
"learning_rate": 2.222825510876332e-05,
"loss": 0.3202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17145583033561707,
"step": 2560,
"valid_targets_mean": 4713.6,
"valid_targets_min": 1409
},
{
"epoch": 2.596455696202532,
"grad_norm": 0.3451688511848506,
"learning_rate": 2.2158020165043114e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16764461994171143,
"step": 2565,
"valid_targets_mean": 3924.4,
"valid_targets_min": 1285
},
{
"epoch": 2.6015189873417723,
"grad_norm": 0.2797909726976478,
"learning_rate": 2.2087758283909954e-05,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1547449380159378,
"step": 2570,
"valid_targets_mean": 5481.8,
"valid_targets_min": 1376
},
{
"epoch": 2.606582278481013,
"grad_norm": 0.3101010476898593,
"learning_rate": 2.201747034240537e-05,
"loss": 0.3135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1627534031867981,
"step": 2575,
"valid_targets_mean": 4466.9,
"valid_targets_min": 987
},
{
"epoch": 2.6116455696202534,
"grad_norm": 1.1618173704395123,
"learning_rate": 2.1947157217896188e-05,
"loss": 0.3095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.165956050157547,
"step": 2580,
"valid_targets_mean": 4300.5,
"valid_targets_min": 778
},
{
"epoch": 2.616708860759494,
"grad_norm": 0.31858634458407287,
"learning_rate": 2.1876819788063586e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15230509638786316,
"step": 2585,
"valid_targets_mean": 3920.5,
"valid_targets_min": 1479
},
{
"epoch": 2.621772151898734,
"grad_norm": 0.30557996470586596,
"learning_rate": 2.1806458930892127e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18883772194385529,
"step": 2590,
"valid_targets_mean": 6008.9,
"valid_targets_min": 1408
},
{
"epoch": 2.6268354430379746,
"grad_norm": 0.2883450262202285,
"learning_rate": 2.173607552465881e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17338699102401733,
"step": 2595,
"valid_targets_mean": 5570.2,
"valid_targets_min": 1526
},
{
"epoch": 2.631898734177215,
"grad_norm": 0.33234113394369846,
"learning_rate": 2.1665670447922084e-05,
"loss": 0.3129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12816452980041504,
"step": 2600,
"valid_targets_mean": 4282.2,
"valid_targets_min": 812
},
{
"epoch": 2.6369620253164556,
"grad_norm": 0.31643919888427663,
"learning_rate": 2.1595244579510933e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17621192336082458,
"step": 2605,
"valid_targets_mean": 5060.8,
"valid_targets_min": 1369
},
{
"epoch": 2.642025316455696,
"grad_norm": 0.30039427757871706,
"learning_rate": 2.1524798798513835e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16294711828231812,
"step": 2610,
"valid_targets_mean": 4472.4,
"valid_targets_min": 1304
},
{
"epoch": 2.6470886075949367,
"grad_norm": 0.3231328181820057,
"learning_rate": 2.1454333984267852e-05,
"loss": 0.322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16857695579528809,
"step": 2615,
"valid_targets_mean": 5128.5,
"valid_targets_min": 1215
},
{
"epoch": 2.6521518987341772,
"grad_norm": 0.331376941255876,
"learning_rate": 2.1383851016347614e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1293996274471283,
"step": 2620,
"valid_targets_mean": 3696.2,
"valid_targets_min": 781
},
{
"epoch": 2.6572151898734178,
"grad_norm": 0.2898986778677013,
"learning_rate": 2.1313350774554366e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14066889882087708,
"step": 2625,
"valid_targets_mean": 4409.5,
"valid_targets_min": 1181
},
{
"epoch": 2.6622784810126583,
"grad_norm": 0.3792545064079998,
"learning_rate": 2.1242834138904962e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14408881962299347,
"step": 2630,
"valid_targets_mean": 3892.1,
"valid_targets_min": 1313
},
{
"epoch": 2.667341772151899,
"grad_norm": 0.34582044479522395,
"learning_rate": 2.1172301989620898e-05,
"loss": 0.3087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15445685386657715,
"step": 2635,
"valid_targets_mean": 4015.2,
"valid_targets_min": 743
},
{
"epoch": 2.6724050632911394,
"grad_norm": 0.31734348855671907,
"learning_rate": 2.110175520711731e-05,
"loss": 0.3182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14247769117355347,
"step": 2640,
"valid_targets_mean": 4152.1,
"valid_targets_min": 1532
},
{
"epoch": 2.67746835443038,
"grad_norm": 0.3108375470698165,
"learning_rate": 2.1031194671992013e-05,
"loss": 0.3145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13973818719387054,
"step": 2645,
"valid_targets_mean": 4321.8,
"valid_targets_min": 1096
},
{
"epoch": 2.68253164556962,
"grad_norm": 0.3378134291776038,
"learning_rate": 2.0960621265014462e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17127710580825806,
"step": 2650,
"valid_targets_mean": 4009.1,
"valid_targets_min": 1241
},
{
"epoch": 2.6875949367088605,
"grad_norm": 0.29939660412855834,
"learning_rate": 2.0890035867114808e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15695559978485107,
"step": 2655,
"valid_targets_mean": 5238.8,
"valid_targets_min": 1128
},
{
"epoch": 2.692658227848101,
"grad_norm": 0.3230482978021318,
"learning_rate": 2.081943935937286e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1587713658809662,
"step": 2660,
"valid_targets_mean": 4748.3,
"valid_targets_min": 1323
},
{
"epoch": 2.6977215189873416,
"grad_norm": 0.29402248645547446,
"learning_rate": 2.0748832623007117e-05,
"loss": 0.3217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10896088182926178,
"step": 2665,
"valid_targets_mean": 3750.2,
"valid_targets_min": 1426
},
{
"epoch": 2.702784810126582,
"grad_norm": 0.27936531158953143,
"learning_rate": 2.067821653936375e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1711559295654297,
"step": 2670,
"valid_targets_mean": 6852.6,
"valid_targets_min": 1209
},
{
"epoch": 2.7078481012658226,
"grad_norm": 0.28924656402783777,
"learning_rate": 2.060759198990561e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14176371693611145,
"step": 2675,
"valid_targets_mean": 5084.8,
"valid_targets_min": 1430
},
{
"epoch": 2.712911392405063,
"grad_norm": 0.3123266627731589,
"learning_rate": 2.053695985620123e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15624725818634033,
"step": 2680,
"valid_targets_mean": 4276.9,
"valid_targets_min": 1150
},
{
"epoch": 2.7179746835443037,
"grad_norm": 0.30428837341523135,
"learning_rate": 2.0466321019913787e-05,
"loss": 0.3083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12444409728050232,
"step": 2685,
"valid_targets_mean": 5104.2,
"valid_targets_min": 1036
},
{
"epoch": 2.7230379746835442,
"grad_norm": 0.2899541063761625,
"learning_rate": 2.0395676362790157e-05,
"loss": 0.3139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18925632536411285,
"step": 2690,
"valid_targets_mean": 6929.8,
"valid_targets_min": 1156
},
{
"epoch": 2.728101265822785,
"grad_norm": 0.3000387772557557,
"learning_rate": 2.032502676664985e-05,
"loss": 0.3256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15346036851406097,
"step": 2695,
"valid_targets_mean": 4285.7,
"valid_targets_min": 1379
},
{
"epoch": 2.7331645569620253,
"grad_norm": 0.3021057118413619,
"learning_rate": 2.025437311337404e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14610332250595093,
"step": 2700,
"valid_targets_mean": 4591.1,
"valid_targets_min": 1675
},
{
"epoch": 2.738227848101266,
"grad_norm": 0.32691877516784146,
"learning_rate": 2.0183716284894533e-05,
"loss": 0.3225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14551448822021484,
"step": 2705,
"valid_targets_mean": 3989.2,
"valid_targets_min": 919
},
{
"epoch": 2.7432911392405064,
"grad_norm": 0.3657473594680315,
"learning_rate": 2.011305716318278e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22241473197937012,
"step": 2710,
"valid_targets_mean": 6030.1,
"valid_targets_min": 1316
},
{
"epoch": 2.748354430379747,
"grad_norm": 0.3038961961226564,
"learning_rate": 2.004239663023885e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16947516798973083,
"step": 2715,
"valid_targets_mean": 5248.6,
"valid_targets_min": 1555
},
{
"epoch": 2.7534177215189874,
"grad_norm": 0.3050248442776484,
"learning_rate": 1.997173556808043e-05,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1630948781967163,
"step": 2720,
"valid_targets_mean": 5884.7,
"valid_targets_min": 895
},
{
"epoch": 2.758481012658228,
"grad_norm": 0.35402206211471576,
"learning_rate": 1.9901074858731825e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1823733150959015,
"step": 2725,
"valid_targets_mean": 4029.6,
"valid_targets_min": 1404
},
{
"epoch": 2.7635443037974685,
"grad_norm": 0.2902629337004639,
"learning_rate": 1.98304153842129e-05,
"loss": 0.313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1647607535123825,
"step": 2730,
"valid_targets_mean": 5231.3,
"valid_targets_min": 1100
},
{
"epoch": 2.768607594936709,
"grad_norm": 0.2844550099011252,
"learning_rate": 1.9759758026528162e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20809857547283173,
"step": 2735,
"valid_targets_mean": 6735.6,
"valid_targets_min": 1644
},
{
"epoch": 2.7736708860759496,
"grad_norm": 0.3348579330081765,
"learning_rate": 1.9689103667655634e-05,
"loss": 0.3088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1527232825756073,
"step": 2740,
"valid_targets_mean": 3877.4,
"valid_targets_min": 1491
},
{
"epoch": 2.77873417721519,
"grad_norm": 0.33857120124730805,
"learning_rate": 1.9618453189535958e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20601877570152283,
"step": 2745,
"valid_targets_mean": 4548.2,
"valid_targets_min": 1232
},
{
"epoch": 2.7837974683544306,
"grad_norm": 0.3346701582946249,
"learning_rate": 1.9547807474061303e-05,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13511428236961365,
"step": 2750,
"valid_targets_mean": 3345.6,
"valid_targets_min": 1298
},
{
"epoch": 2.7888607594936707,
"grad_norm": 0.3375591584241796,
"learning_rate": 1.947716740306439e-05,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16758695244789124,
"step": 2755,
"valid_targets_mean": 3964.9,
"valid_targets_min": 1047
},
{
"epoch": 2.7939240506329113,
"grad_norm": 0.340384343325027,
"learning_rate": 1.9406533858307503e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1304406374692917,
"step": 2760,
"valid_targets_mean": 3351.9,
"valid_targets_min": 1109
},
{
"epoch": 2.798987341772152,
"grad_norm": 0.29188887212643894,
"learning_rate": 1.9335907721471438e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15948455035686493,
"step": 2765,
"valid_targets_mean": 4508.9,
"valid_targets_min": 970
},
{
"epoch": 2.8040506329113923,
"grad_norm": 0.2914363526376243,
"learning_rate": 1.9265289874144554e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18582302331924438,
"step": 2770,
"valid_targets_mean": 6648.4,
"valid_targets_min": 2048
},
{
"epoch": 2.809113924050633,
"grad_norm": 0.3447263204953251,
"learning_rate": 1.9194681197811703e-05,
"loss": 0.3154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11537902057170868,
"step": 2775,
"valid_targets_mean": 3061.1,
"valid_targets_min": 1261
},
{
"epoch": 2.8141772151898734,
"grad_norm": 0.28824906654455074,
"learning_rate": 1.912408257384327e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18753370642662048,
"step": 2780,
"valid_targets_mean": 6277.4,
"valid_targets_min": 1561
},
{
"epoch": 2.819240506329114,
"grad_norm": 0.31551057795248955,
"learning_rate": 1.9053494883484177e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1113462746143341,
"step": 2785,
"valid_targets_mean": 3603.0,
"valid_targets_min": 966
},
{
"epoch": 2.8243037974683545,
"grad_norm": 0.3130169957194376,
"learning_rate": 1.898291900784284e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17591753602027893,
"step": 2790,
"valid_targets_mean": 4849.0,
"valid_targets_min": 1241
},
{
"epoch": 2.829367088607595,
"grad_norm": 0.36153291519489483,
"learning_rate": 1.8912355827880237e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13046428561210632,
"step": 2795,
"valid_targets_mean": 3138.6,
"valid_targets_min": 1174
},
{
"epoch": 2.8344303797468355,
"grad_norm": 0.35818567026601295,
"learning_rate": 1.884180622439884e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15154902637004852,
"step": 2800,
"valid_targets_mean": 3774.6,
"valid_targets_min": 731
},
{
"epoch": 2.839493670886076,
"grad_norm": 0.33153674409005546,
"learning_rate": 1.8771271078031648e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17227354645729065,
"step": 2805,
"valid_targets_mean": 5559.2,
"valid_targets_min": 981
},
{
"epoch": 2.8445569620253166,
"grad_norm": 0.30646195273462673,
"learning_rate": 1.8700751269231243e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17971369624137878,
"step": 2810,
"valid_targets_mean": 5315.5,
"valid_targets_min": 1235
},
{
"epoch": 2.8496202531645567,
"grad_norm": 0.3147470597121468,
"learning_rate": 1.86302476782587e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1408463716506958,
"step": 2815,
"valid_targets_mean": 3962.4,
"valid_targets_min": 820
},
{
"epoch": 2.8546835443037972,
"grad_norm": 0.35549269402291417,
"learning_rate": 1.855976118517271e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19130544364452362,
"step": 2820,
"valid_targets_mean": 4855.5,
"valid_targets_min": 959
},
{
"epoch": 2.8597468354430378,
"grad_norm": 0.2823602428424915,
"learning_rate": 1.8489292669818494e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1796441674232483,
"step": 2825,
"valid_targets_mean": 5933.9,
"valid_targets_min": 1652
},
{
"epoch": 2.8648101265822783,
"grad_norm": 0.3086469012489834,
"learning_rate": 1.8418843011816894e-05,
"loss": 0.3113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14876966178417206,
"step": 2830,
"valid_targets_mean": 4459.1,
"valid_targets_min": 1431
},
{
"epoch": 2.869873417721519,
"grad_norm": 0.33219619271405165,
"learning_rate": 1.8348413090553356e-05,
"loss": 0.3147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1837439239025116,
"step": 2835,
"valid_targets_mean": 5042.5,
"valid_targets_min": 1015
},
{
"epoch": 2.8749367088607594,
"grad_norm": 0.28160060670414677,
"learning_rate": 1.8278003785166967e-05,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13023114204406738,
"step": 2840,
"valid_targets_mean": 4408.2,
"valid_targets_min": 1093
},
{
"epoch": 2.88,
"grad_norm": 0.2701611603230975,
"learning_rate": 1.8207615974539476e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12874723970890045,
"step": 2845,
"valid_targets_mean": 4858.8,
"valid_targets_min": 863
},
{
"epoch": 2.8850632911392404,
"grad_norm": 0.33079935847646824,
"learning_rate": 1.8137250537284325e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17800703644752502,
"step": 2850,
"valid_targets_mean": 4857.1,
"valid_targets_min": 1713
},
{
"epoch": 2.890126582278481,
"grad_norm": 0.23595757958591787,
"learning_rate": 1.8066908351735666e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1269092708826065,
"step": 2855,
"valid_targets_mean": 5766.2,
"valid_targets_min": 1183
},
{
"epoch": 2.8951898734177215,
"grad_norm": 0.33538165041242207,
"learning_rate": 1.7996590295937448e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1899298131465912,
"step": 2860,
"valid_targets_mean": 5260.9,
"valid_targets_min": 1500
},
{
"epoch": 2.900253164556962,
"grad_norm": 0.3124645131733068,
"learning_rate": 1.7926297247632383e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1435328722000122,
"step": 2865,
"valid_targets_mean": 3785.1,
"valid_targets_min": 1048
},
{
"epoch": 2.9053164556962026,
"grad_norm": 0.3305614452127962,
"learning_rate": 1.7856030084251045e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1552894562482834,
"step": 2870,
"valid_targets_mean": 4255.3,
"valid_targets_min": 844
},
{
"epoch": 2.910379746835443,
"grad_norm": 0.34874837954634086,
"learning_rate": 1.7785789682900908e-05,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14497388899326324,
"step": 2875,
"valid_targets_mean": 3286.0,
"valid_targets_min": 1279
},
{
"epoch": 2.9154430379746836,
"grad_norm": 0.3321474887097409,
"learning_rate": 1.771557692035537e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14671984314918518,
"step": 2880,
"valid_targets_mean": 4362.1,
"valid_targets_min": 897
},
{
"epoch": 2.920506329113924,
"grad_norm": 0.36664765144869893,
"learning_rate": 1.7645392673042853e-05,
"loss": 0.3298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20450638234615326,
"step": 2885,
"valid_targets_mean": 3744.9,
"valid_targets_min": 536
},
{
"epoch": 2.9255696202531647,
"grad_norm": 0.30800064070091415,
"learning_rate": 1.757523781703581e-05,
"loss": 0.3135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13620543479919434,
"step": 2890,
"valid_targets_mean": 4010.2,
"valid_targets_min": 739
},
{
"epoch": 2.9306329113924052,
"grad_norm": 0.39874064817665694,
"learning_rate": 1.7505113228039848e-05,
"loss": 0.3146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17097340524196625,
"step": 2895,
"valid_targets_mean": 4104.1,
"valid_targets_min": 1037
},
{
"epoch": 2.9356962025316458,
"grad_norm": 0.30804629166037306,
"learning_rate": 1.7435019781382737e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14079098403453827,
"step": 2900,
"valid_targets_mean": 4534.0,
"valid_targets_min": 887
},
{
"epoch": 2.9407594936708863,
"grad_norm": 0.306220364172818,
"learning_rate": 1.7364958352003548e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17645467817783356,
"step": 2905,
"valid_targets_mean": 4994.2,
"valid_targets_min": 1148
},
{
"epoch": 2.945822784810127,
"grad_norm": 0.3179633647838338,
"learning_rate": 1.7294929814441666e-05,
"loss": 0.3231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16111071407794952,
"step": 2910,
"valid_targets_mean": 4938.6,
"valid_targets_min": 1387
},
{
"epoch": 2.9508860759493674,
"grad_norm": 0.31641771807614866,
"learning_rate": 1.7224935042825912e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16131725907325745,
"step": 2915,
"valid_targets_mean": 4423.9,
"valid_targets_min": 810
},
{
"epoch": 2.9559493670886074,
"grad_norm": 0.2900729323232742,
"learning_rate": 1.7154974910863646e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10794432461261749,
"step": 2920,
"valid_targets_mean": 3454.4,
"valid_targets_min": 1456
},
{
"epoch": 2.961012658227848,
"grad_norm": 0.3432477720018123,
"learning_rate": 1.7085050291829813e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15215110778808594,
"step": 2925,
"valid_targets_mean": 4236.8,
"valid_targets_min": 1238
},
{
"epoch": 2.9660759493670885,
"grad_norm": 0.31507659068073507,
"learning_rate": 1.7015162058556088e-05,
"loss": 0.3208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16133321821689606,
"step": 2930,
"valid_targets_mean": 4263.9,
"valid_targets_min": 795
},
{
"epoch": 2.971139240506329,
"grad_norm": 0.29285158348676216,
"learning_rate": 1.6945311083419947e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1742202341556549,
"step": 2935,
"valid_targets_mean": 5417.0,
"valid_targets_min": 1360
},
{
"epoch": 2.9762025316455696,
"grad_norm": 0.2918602342182722,
"learning_rate": 1.68754982383338e-05,
"loss": 0.3007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1684986650943756,
"step": 2940,
"valid_targets_mean": 5456.4,
"valid_targets_min": 1200
},
{
"epoch": 2.98126582278481,
"grad_norm": 0.30561630865463585,
"learning_rate": 1.6805724394734107e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10106837749481201,
"step": 2945,
"valid_targets_mean": 3017.5,
"valid_targets_min": 1279
},
{
"epoch": 2.9863291139240506,
"grad_norm": 0.29442534234659645,
"learning_rate": 1.6735990423570477e-05,
"loss": 0.3234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13497650623321533,
"step": 2950,
"valid_targets_mean": 3993.2,
"valid_targets_min": 1015
},
{
"epoch": 2.991392405063291,
"grad_norm": 0.2700507094407274,
"learning_rate": 1.666629719529483e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15681613981723785,
"step": 2955,
"valid_targets_mean": 4630.2,
"valid_targets_min": 1176
},
{
"epoch": 2.9964556962025317,
"grad_norm": 0.3447693878105072,
"learning_rate": 1.6596645579850505e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1600763201713562,
"step": 2960,
"valid_targets_mean": 3677.3,
"valid_targets_min": 1107
},
{
"epoch": 3.001012658227848,
"grad_norm": 0.29622484390463744,
"learning_rate": 1.6527036446661396e-05,
"loss": 0.3123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14927029609680176,
"step": 2965,
"valid_targets_mean": 4862.4,
"valid_targets_min": 1322
},
{
"epoch": 3.0060759493670886,
"grad_norm": 0.29785828676100873,
"learning_rate": 1.645747066462115e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19526249170303345,
"step": 2970,
"valid_targets_mean": 5885.6,
"valid_targets_min": 1447
},
{
"epoch": 3.011139240506329,
"grad_norm": 0.35112230405979555,
"learning_rate": 1.638794910208225e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10469535738229752,
"step": 2975,
"valid_targets_mean": 2940.2,
"valid_targets_min": 1159
},
{
"epoch": 3.0162025316455696,
"grad_norm": 0.3772315133305102,
"learning_rate": 1.631847262684523e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16602087020874023,
"step": 2980,
"valid_targets_mean": 4357.8,
"valid_targets_min": 1389
},
{
"epoch": 3.02126582278481,
"grad_norm": 0.30911220110322923,
"learning_rate": 1.624904210614782e-05,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1612570881843567,
"step": 2985,
"valid_targets_mean": 4494.7,
"valid_targets_min": 1244
},
{
"epoch": 3.0263291139240507,
"grad_norm": 0.3517033326754291,
"learning_rate": 1.6179658406654113e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17958399653434753,
"step": 2990,
"valid_targets_mean": 4044.6,
"valid_targets_min": 1324
},
{
"epoch": 3.031392405063291,
"grad_norm": 0.28226563989162823,
"learning_rate": 1.6110322394443773e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11023816466331482,
"step": 2995,
"valid_targets_mean": 4105.8,
"valid_targets_min": 1267
},
{
"epoch": 3.0364556962025318,
"grad_norm": 0.3395674314450887,
"learning_rate": 1.60410349350012e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17015889286994934,
"step": 3000,
"valid_targets_mean": 5613.8,
"valid_targets_min": 1423
},
{
"epoch": 3.0415189873417723,
"grad_norm": 0.3328019254619737,
"learning_rate": 1.597179689320474e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16885250806808472,
"step": 3005,
"valid_targets_mean": 4626.2,
"valid_targets_min": 1034
},
{
"epoch": 3.046582278481013,
"grad_norm": 0.30137258092800007,
"learning_rate": 1.5902609133315888e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14555740356445312,
"step": 3010,
"valid_targets_mean": 5118.1,
"valid_targets_min": 1378
},
{
"epoch": 3.0516455696202534,
"grad_norm": 0.32251822208809916,
"learning_rate": 1.5833472518968478e-05,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13226641714572906,
"step": 3015,
"valid_targets_mean": 4081.9,
"valid_targets_min": 1428
},
{
"epoch": 3.056708860759494,
"grad_norm": 0.3211101552341726,
"learning_rate": 1.5764387913157952e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0971713736653328,
"step": 3020,
"valid_targets_mean": 3146.8,
"valid_targets_min": 1380
},
{
"epoch": 3.061772151898734,
"grad_norm": 0.3360390373855527,
"learning_rate": 1.5695356178230527e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12469463050365448,
"step": 3025,
"valid_targets_mean": 3152.8,
"valid_targets_min": 1004
},
{
"epoch": 3.0668354430379745,
"grad_norm": 0.29385960506365055,
"learning_rate": 1.5626378175872486e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16584698855876923,
"step": 3030,
"valid_targets_mean": 5578.9,
"valid_targets_min": 1238
},
{
"epoch": 3.071898734177215,
"grad_norm": 0.32789137808560437,
"learning_rate": 1.5557454767099382e-05,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17390216886997223,
"step": 3035,
"valid_targets_mean": 4741.9,
"valid_targets_min": 1219
},
{
"epoch": 3.0769620253164556,
"grad_norm": 0.3234941533877886,
"learning_rate": 1.5488586812245302e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17046749591827393,
"step": 3040,
"valid_targets_mean": 4481.4,
"valid_targets_min": 1174
},
{
"epoch": 3.082025316455696,
"grad_norm": 0.28075430375987626,
"learning_rate": 1.541977517095215e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14547553658485413,
"step": 3045,
"valid_targets_mean": 5410.0,
"valid_targets_min": 1228
},
{
"epoch": 3.0870886075949366,
"grad_norm": 0.28635813947594835,
"learning_rate": 1.5351020702158875e-05,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13441359996795654,
"step": 3050,
"valid_targets_mean": 5051.8,
"valid_targets_min": 960
},
{
"epoch": 3.092151898734177,
"grad_norm": 0.34800039286889395,
"learning_rate": 1.52823242640908e-05,
"loss": 0.3096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15158754587173462,
"step": 3055,
"valid_targets_mean": 3697.4,
"valid_targets_min": 1086
},
{
"epoch": 3.0972151898734177,
"grad_norm": 0.32310977392742785,
"learning_rate": 1.5213686714248852e-05,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16765525937080383,
"step": 3060,
"valid_targets_mean": 4845.2,
"valid_targets_min": 1334
},
{
"epoch": 3.1022784810126582,
"grad_norm": 0.296724917732042,
"learning_rate": 1.5145108909398896e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14354108273983002,
"step": 3065,
"valid_targets_mean": 4783.9,
"valid_targets_min": 1333
},
{
"epoch": 3.1073417721518988,
"grad_norm": 0.42288485229336514,
"learning_rate": 1.5076591705561056e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16323769092559814,
"step": 3070,
"valid_targets_mean": 3961.5,
"valid_targets_min": 1451
},
{
"epoch": 3.1124050632911393,
"grad_norm": 0.29888536735808585,
"learning_rate": 1.5008135957998968e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16281160712242126,
"step": 3075,
"valid_targets_mean": 5095.7,
"valid_targets_min": 989
},
{
"epoch": 3.11746835443038,
"grad_norm": 0.32246738234879885,
"learning_rate": 1.4939742521209178e-05,
"loss": 0.3136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.142366424202919,
"step": 3080,
"valid_targets_mean": 3786.1,
"valid_targets_min": 776
},
{
"epoch": 3.1225316455696204,
"grad_norm": 0.2885458143447489,
"learning_rate": 1.4871412248910416e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1399984061717987,
"step": 3085,
"valid_targets_mean": 5652.7,
"valid_targets_min": 1058
},
{
"epoch": 3.127594936708861,
"grad_norm": 0.3436698843544968,
"learning_rate": 1.480314599403296e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12947720289230347,
"step": 3090,
"valid_targets_mean": 3113.7,
"valid_targets_min": 1129
},
{
"epoch": 3.1326582278481014,
"grad_norm": 0.3034361762747695,
"learning_rate": 1.4734944608708022e-05,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1270906925201416,
"step": 3095,
"valid_targets_mean": 4283.6,
"valid_targets_min": 1371
},
{
"epoch": 3.137721518987342,
"grad_norm": 0.2910061490791564,
"learning_rate": 1.4666808944257044e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1065504252910614,
"step": 3100,
"valid_targets_mean": 4013.8,
"valid_targets_min": 1748
},
{
"epoch": 3.1427848101265825,
"grad_norm": 0.29375562777524983,
"learning_rate": 1.459873985118115e-05,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20948265492916107,
"step": 3105,
"valid_targets_mean": 6254.6,
"valid_targets_min": 855
},
{
"epoch": 3.1478481012658226,
"grad_norm": 0.32610939195307226,
"learning_rate": 1.4530738179150445e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16477391123771667,
"step": 3110,
"valid_targets_mean": 4672.6,
"valid_targets_min": 1423
},
{
"epoch": 3.152911392405063,
"grad_norm": 0.34376610077811187,
"learning_rate": 1.44628047769935e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12125621736049652,
"step": 3115,
"valid_targets_mean": 3024.9,
"valid_targets_min": 1154
},
{
"epoch": 3.1579746835443037,
"grad_norm": 0.24961470242170858,
"learning_rate": 1.4394940492686666e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18956081569194794,
"step": 3120,
"valid_targets_mean": 8850.2,
"valid_targets_min": 1106
},
{
"epoch": 3.163037974683544,
"grad_norm": 0.3213177133533683,
"learning_rate": 1.4327146173343561e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16393819451332092,
"step": 3125,
"valid_targets_mean": 4351.1,
"valid_targets_min": 1322
},
{
"epoch": 3.1681012658227847,
"grad_norm": 0.3207864682050949,
"learning_rate": 1.4259422665204458e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19772255420684814,
"step": 3130,
"valid_targets_mean": 5234.6,
"valid_targets_min": 1247
},
{
"epoch": 3.1731645569620253,
"grad_norm": 0.3306680712851493,
"learning_rate": 1.4191770813625732e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1288958340883255,
"step": 3135,
"valid_targets_mean": 3816.3,
"valid_targets_min": 1339
},
{
"epoch": 3.178227848101266,
"grad_norm": 0.33226796696180216,
"learning_rate": 1.4124191463069305e-05,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1820456087589264,
"step": 3140,
"valid_targets_mean": 4462.9,
"valid_targets_min": 1300
},
{
"epoch": 3.1832911392405063,
"grad_norm": 0.25066525871506057,
"learning_rate": 1.4056685457092122e-05,
"loss": 0.2981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.108408123254776,
"step": 3145,
"valid_targets_mean": 4348.1,
"valid_targets_min": 954
},
{
"epoch": 3.188354430379747,
"grad_norm": 0.2799683914898738,
"learning_rate": 1.3989253638335577e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.140926331281662,
"step": 3150,
"valid_targets_mean": 5334.3,
"valid_targets_min": 686
},
{
"epoch": 3.1934177215189874,
"grad_norm": 0.364904271269176,
"learning_rate": 1.3921896848515064e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1611071527004242,
"step": 3155,
"valid_targets_mean": 3846.9,
"valid_targets_min": 1050
},
{
"epoch": 3.198481012658228,
"grad_norm": 0.31469570152651777,
"learning_rate": 1.385461592840939e-05,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16711470484733582,
"step": 3160,
"valid_targets_mean": 4945.6,
"valid_targets_min": 1265
},
{
"epoch": 3.2035443037974685,
"grad_norm": 0.40871004437684494,
"learning_rate": 1.3787411717850358e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14797160029411316,
"step": 3165,
"valid_targets_mean": 3367.9,
"valid_targets_min": 1380
},
{
"epoch": 3.208607594936709,
"grad_norm": 0.3063676754341602,
"learning_rate": 1.3720285055712222e-05,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12202514708042145,
"step": 3170,
"valid_targets_mean": 3846.6,
"valid_targets_min": 1062
},
{
"epoch": 3.2136708860759495,
"grad_norm": 0.33920699542879207,
"learning_rate": 1.3653236779901236e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08881708979606628,
"step": 3175,
"valid_targets_mean": 2589.6,
"valid_targets_min": 1310
},
{
"epoch": 3.21873417721519,
"grad_norm": 0.3118478710909973,
"learning_rate": 1.3586267727345232e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13673335313796997,
"step": 3180,
"valid_targets_mean": 4171.1,
"valid_targets_min": 1119
},
{
"epoch": 3.22379746835443,
"grad_norm": 0.3657648017370462,
"learning_rate": 1.35193787339831e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13656803965568542,
"step": 3185,
"valid_targets_mean": 4186.0,
"valid_targets_min": 1616
},
{
"epoch": 3.2288607594936707,
"grad_norm": 0.29575714520451474,
"learning_rate": 1.3452570634754434e-05,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14770013093948364,
"step": 3190,
"valid_targets_mean": 5272.9,
"valid_targets_min": 1046
},
{
"epoch": 3.233924050632911,
"grad_norm": 0.29496009702650783,
"learning_rate": 1.3385844263589033e-05,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17479810118675232,
"step": 3195,
"valid_targets_mean": 5597.1,
"valid_targets_min": 1196
},
{
"epoch": 3.2389873417721518,
"grad_norm": 0.35581177858551544,
"learning_rate": 1.3319200453396548e-05,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15500982105731964,
"step": 3200,
"valid_targets_mean": 4076.4,
"valid_targets_min": 1070
},
{
"epoch": 3.2440506329113923,
"grad_norm": 0.292951167708079,
"learning_rate": 1.3252640036056068e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1567637026309967,
"step": 3205,
"valid_targets_mean": 5367.4,
"valid_targets_min": 1424
},
{
"epoch": 3.249113924050633,
"grad_norm": 0.3182836504556952,
"learning_rate": 1.318616384240572e-05,
"loss": 0.3043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1862029880285263,
"step": 3210,
"valid_targets_mean": 5235.2,
"valid_targets_min": 1150
},
{
"epoch": 3.2541772151898734,
"grad_norm": 0.5962356962936214,
"learning_rate": 1.3119772702232325e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15173543989658356,
"step": 3215,
"valid_targets_mean": 3896.9,
"valid_targets_min": 1293
},
{
"epoch": 3.259240506329114,
"grad_norm": 0.30446119131111943,
"learning_rate": 1.3053467444261021e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16218072175979614,
"step": 3220,
"valid_targets_mean": 5058.7,
"valid_targets_min": 1443
},
{
"epoch": 3.2643037974683544,
"grad_norm": 0.30100968288795926,
"learning_rate": 1.2987248896144915e-05,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1766858994960785,
"step": 3225,
"valid_targets_mean": 5638.7,
"valid_targets_min": 1494
},
{
"epoch": 3.269367088607595,
"grad_norm": 0.3043172862585619,
"learning_rate": 1.2921117884454784e-05,
"loss": 0.3111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13346105813980103,
"step": 3230,
"valid_targets_mean": 4191.2,
"valid_targets_min": 886
},
{
"epoch": 3.2744303797468355,
"grad_norm": 0.30601688850305675,
"learning_rate": 1.2855075234668708e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17442500591278076,
"step": 3235,
"valid_targets_mean": 5185.5,
"valid_targets_min": 1463
},
{
"epoch": 3.279493670886076,
"grad_norm": 0.32710194023512384,
"learning_rate": 1.278912177116182e-05,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18517401814460754,
"step": 3240,
"valid_targets_mean": 4748.3,
"valid_targets_min": 1001
},
{
"epoch": 3.2845569620253166,
"grad_norm": 0.2832311914633299,
"learning_rate": 1.2723258317195965e-05,
"loss": 0.3118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1336306631565094,
"step": 3245,
"valid_targets_mean": 4846.2,
"valid_targets_min": 1184
},
{
"epoch": 3.289620253164557,
"grad_norm": 0.2859981419544709,
"learning_rate": 1.2657485694909451e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12190467119216919,
"step": 3250,
"valid_targets_mean": 4372.2,
"valid_targets_min": 1012
},
{
"epoch": 3.2946835443037976,
"grad_norm": 0.3133461443068576,
"learning_rate": 1.2591804725306802e-05,
"loss": 0.3056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09984530508518219,
"step": 3255,
"valid_targets_mean": 3387.1,
"valid_targets_min": 1020
},
{
"epoch": 3.299746835443038,
"grad_norm": 0.3066068642940143,
"learning_rate": 1.252621622824846e-05,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10505147278308868,
"step": 3260,
"valid_targets_mean": 3119.9,
"valid_targets_min": 1415
},
{
"epoch": 3.3048101265822787,
"grad_norm": 0.30638690017522713,
"learning_rate": 1.2460721022440617e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1329905241727829,
"step": 3265,
"valid_targets_mean": 3749.8,
"valid_targets_min": 1247
},
{
"epoch": 3.309873417721519,
"grad_norm": 0.3893581538313894,
"learning_rate": 1.2395319925424922e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12106384336948395,
"step": 3270,
"valid_targets_mean": 3750.2,
"valid_targets_min": 1170
},
{
"epoch": 3.3149367088607593,
"grad_norm": 0.2915580190067732,
"learning_rate": 1.2330013753568345e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15587478876113892,
"step": 3275,
"valid_targets_mean": 5153.9,
"valid_targets_min": 884
},
{
"epoch": 3.32,
"grad_norm": 0.32454051814127005,
"learning_rate": 1.2264803322052938e-05,
"loss": 0.2902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14347532391548157,
"step": 3280,
"valid_targets_mean": 3715.8,
"valid_targets_min": 1109
},
{
"epoch": 3.3250632911392404,
"grad_norm": 0.3014718100183408,
"learning_rate": 1.2199689444865688e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11024832725524902,
"step": 3285,
"valid_targets_mean": 3356.6,
"valid_targets_min": 1346
},
{
"epoch": 3.330126582278481,
"grad_norm": 0.3180605843827969,
"learning_rate": 1.2134672934788338e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1348501592874527,
"step": 3290,
"valid_targets_mean": 4180.2,
"valid_targets_min": 1405
},
{
"epoch": 3.3351898734177214,
"grad_norm": 0.31070898369108957,
"learning_rate": 1.206975460338726e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14836883544921875,
"step": 3295,
"valid_targets_mean": 4112.2,
"valid_targets_min": 1401
},
{
"epoch": 3.340253164556962,
"grad_norm": 0.28528395978629406,
"learning_rate": 1.2004935261003292e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11711958050727844,
"step": 3300,
"valid_targets_mean": 5100.1,
"valid_targets_min": 1029
},
{
"epoch": 3.3453164556962025,
"grad_norm": 0.3708665183674031,
"learning_rate": 1.194021571674168e-05,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13884302973747253,
"step": 3305,
"valid_targets_mean": 4049.6,
"valid_targets_min": 974
},
{
"epoch": 3.350379746835443,
"grad_norm": 0.3298858637588618,
"learning_rate": 1.1875596778461903e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1451665610074997,
"step": 3310,
"valid_targets_mean": 4987.6,
"valid_targets_min": 1624
},
{
"epoch": 3.3554430379746836,
"grad_norm": 0.30292570807469854,
"learning_rate": 1.1811079252767663e-05,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12376505136489868,
"step": 3315,
"valid_targets_mean": 3583.1,
"valid_targets_min": 1257
},
{
"epoch": 3.360506329113924,
"grad_norm": 0.32294869729997133,
"learning_rate": 1.174666394499677e-05,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11844268441200256,
"step": 3320,
"valid_targets_mean": 3262.4,
"valid_targets_min": 1554
},
{
"epoch": 3.3655696202531646,
"grad_norm": 0.3438389100269291,
"learning_rate": 1.1682351659211088e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1457480937242508,
"step": 3325,
"valid_targets_mean": 3745.7,
"valid_targets_min": 1190
},
{
"epoch": 3.370632911392405,
"grad_norm": 0.33249792748827744,
"learning_rate": 1.1618143198186544e-05,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15856462717056274,
"step": 3330,
"valid_targets_mean": 4305.5,
"valid_targets_min": 910
},
{
"epoch": 3.3756962025316457,
"grad_norm": 0.3173034049275177,
"learning_rate": 1.155403936340304e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18826264142990112,
"step": 3335,
"valid_targets_mean": 5404.1,
"valid_targets_min": 1023
},
{
"epoch": 3.3807594936708862,
"grad_norm": 0.3178276101310362,
"learning_rate": 1.149004095503452e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15395784378051758,
"step": 3340,
"valid_targets_mean": 5008.1,
"valid_targets_min": 1032
},
{
"epoch": 3.3858227848101268,
"grad_norm": 0.3025604254884791,
"learning_rate": 1.1426148771938915e-05,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1488351970911026,
"step": 3345,
"valid_targets_mean": 4703.1,
"valid_targets_min": 1506
},
{
"epoch": 3.390886075949367,
"grad_norm": 0.3037731465395097,
"learning_rate": 1.1362363611648228e-05,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11465154588222504,
"step": 3350,
"valid_targets_mean": 3727.4,
"valid_targets_min": 921
},
{
"epoch": 3.3959493670886074,
"grad_norm": 0.3441348411116797,
"learning_rate": 1.1298686270358542e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17264041304588318,
"step": 3355,
"valid_targets_mean": 3737.4,
"valid_targets_min": 1599
},
{
"epoch": 3.401012658227848,
"grad_norm": 0.2922925569041438,
"learning_rate": 1.1235117542920077e-05,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11297699809074402,
"step": 3360,
"valid_targets_mean": 4023.7,
"valid_targets_min": 1052
},
{
"epoch": 3.4060759493670885,
"grad_norm": 0.3304527382358981,
"learning_rate": 1.1171658222827321e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21652498841285706,
"step": 3365,
"valid_targets_mean": 5499.5,
"valid_targets_min": 949
},
{
"epoch": 3.411139240506329,
"grad_norm": 0.34098724945316766,
"learning_rate": 1.110830910220905e-05,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17756357789039612,
"step": 3370,
"valid_targets_mean": 3859.3,
"valid_targets_min": 961
},
{
"epoch": 3.4162025316455695,
"grad_norm": 0.29556792434414897,
"learning_rate": 1.1045070971818515e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.130351722240448,
"step": 3375,
"valid_targets_mean": 3860.4,
"valid_targets_min": 1126
},
{
"epoch": 3.42126582278481,
"grad_norm": 0.2817393837564735,
"learning_rate": 1.0981944621023508e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.172260582447052,
"step": 3380,
"valid_targets_mean": 6195.1,
"valid_targets_min": 1065
},
{
"epoch": 3.4263291139240506,
"grad_norm": 0.3019678707113778,
"learning_rate": 1.0918930837796538e-05,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14187800884246826,
"step": 3385,
"valid_targets_mean": 4729.5,
"valid_targets_min": 1024
},
{
"epoch": 3.431392405063291,
"grad_norm": 0.32014190449807,
"learning_rate": 1.0856030408705016e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15517304837703705,
"step": 3390,
"valid_targets_mean": 4351.6,
"valid_targets_min": 1381
},
{
"epoch": 3.4364556962025317,
"grad_norm": 0.28577315150998106,
"learning_rate": 1.0793244118901383e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16560965776443481,
"step": 3395,
"valid_targets_mean": 5708.4,
"valid_targets_min": 1323
},
{
"epoch": 3.441518987341772,
"grad_norm": 0.2895330117490245,
"learning_rate": 1.0730572752113368e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16116517782211304,
"step": 3400,
"valid_targets_mean": 6122.2,
"valid_targets_min": 1191
},
{
"epoch": 3.4465822784810127,
"grad_norm": 0.3276147158732667,
"learning_rate": 1.0668017090634164e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1463163197040558,
"step": 3405,
"valid_targets_mean": 3868.4,
"valid_targets_min": 1560
},
{
"epoch": 3.4516455696202533,
"grad_norm": 0.27522935687650096,
"learning_rate": 1.0605577915312662e-05,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14057275652885437,
"step": 3410,
"valid_targets_mean": 5501.4,
"valid_targets_min": 1198
},
{
"epoch": 3.456708860759494,
"grad_norm": 0.2546793488548092,
"learning_rate": 1.0543256005543752e-05,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17178791761398315,
"step": 3415,
"valid_targets_mean": 6257.9,
"valid_targets_min": 1159
},
{
"epoch": 3.4617721518987343,
"grad_norm": 0.2887049078859965,
"learning_rate": 1.048105213925853e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15336082875728607,
"step": 3420,
"valid_targets_mean": 5676.3,
"valid_targets_min": 1581
},
{
"epoch": 3.466835443037975,
"grad_norm": 0.3248981947583244,
"learning_rate": 1.0418967092914643e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12593376636505127,
"step": 3425,
"valid_targets_mean": 3572.3,
"valid_targets_min": 1200
},
{
"epoch": 3.4718987341772154,
"grad_norm": 0.33097897236242024,
"learning_rate": 1.0357001641486556e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16061154007911682,
"step": 3430,
"valid_targets_mean": 6276.2,
"valid_targets_min": 1499
},
{
"epoch": 3.476962025316456,
"grad_norm": 0.29614677485829893,
"learning_rate": 1.0295156558455885e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1872052550315857,
"step": 3435,
"valid_targets_mean": 6640.8,
"valid_targets_min": 1160
},
{
"epoch": 3.482025316455696,
"grad_norm": 0.27705637796463173,
"learning_rate": 1.0233432615801786e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14229699969291687,
"step": 3440,
"valid_targets_mean": 5945.9,
"valid_targets_min": 1284
},
{
"epoch": 3.4870886075949366,
"grad_norm": 0.26237225876364956,
"learning_rate": 1.0171830583991245e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17002148926258087,
"step": 3445,
"valid_targets_mean": 6348.2,
"valid_targets_min": 1431
},
{
"epoch": 3.492151898734177,
"grad_norm": 0.33818695188520737,
"learning_rate": 1.0110351231969532e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19817857444286346,
"step": 3450,
"valid_targets_mean": 4845.8,
"valid_targets_min": 1227
},
{
"epoch": 3.4972151898734176,
"grad_norm": 0.27766136414994197,
"learning_rate": 1.0048995327150556e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17715927958488464,
"step": 3455,
"valid_targets_mean": 6080.2,
"valid_targets_min": 1024
},
{
"epoch": 3.502278481012658,
"grad_norm": 0.3385690737736752,
"learning_rate": 9.987763635407293e-06,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18266132473945618,
"step": 3460,
"valid_targets_mean": 4562.4,
"valid_targets_min": 1570
},
{
"epoch": 3.5073417721518987,
"grad_norm": 0.35240157099060987,
"learning_rate": 9.926656921062254e-06,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18275323510169983,
"step": 3465,
"valid_targets_mean": 4161.0,
"valid_targets_min": 1086
},
{
"epoch": 3.512405063291139,
"grad_norm": 0.37082127798975295,
"learning_rate": 9.865675946877897e-06,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.137416809797287,
"step": 3470,
"valid_targets_mean": 3108.2,
"valid_targets_min": 1222
},
{
"epoch": 3.5174683544303798,
"grad_norm": 0.32990352870182205,
"learning_rate": 9.804821474047166e-06,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13373905420303345,
"step": 3475,
"valid_targets_mean": 3385.4,
"valid_targets_min": 1094
},
{
"epoch": 3.5225316455696203,
"grad_norm": 0.3159470821550788,
"learning_rate": 9.744094262183922e-06,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1414027214050293,
"step": 3480,
"valid_targets_mean": 3928.0,
"valid_targets_min": 1133
},
{
"epoch": 3.527594936708861,
"grad_norm": 0.2903957000330617,
"learning_rate": 9.683495069313527e-06,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1404920518398285,
"step": 3485,
"valid_targets_mean": 4963.7,
"valid_targets_min": 1699
},
{
"epoch": 3.5326582278481014,
"grad_norm": 0.28971614608089746,
"learning_rate": 9.623024651863317e-06,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12896308302879333,
"step": 3490,
"valid_targets_mean": 4057.2,
"valid_targets_min": 1028
},
{
"epoch": 3.537721518987342,
"grad_norm": 0.32570265544900434,
"learning_rate": 9.56268376465323e-06,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14747750759124756,
"step": 3495,
"valid_targets_mean": 3836.9,
"valid_targets_min": 858
},
{
"epoch": 3.5427848101265824,
"grad_norm": 0.3186509490983858,
"learning_rate": 9.502473160886309e-06,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13043725490570068,
"step": 3500,
"valid_targets_mean": 3738.1,
"valid_targets_min": 908
},
{
"epoch": 3.547848101265823,
"grad_norm": 0.2738590358023834,
"learning_rate": 9.442393592139378e-06,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14587613940238953,
"step": 3505,
"valid_targets_mean": 4865.2,
"valid_targets_min": 1410
},
{
"epoch": 3.552911392405063,
"grad_norm": 0.3247037129452682,
"learning_rate": 9.382445808353582e-06,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1686377227306366,
"step": 3510,
"valid_targets_mean": 4436.3,
"valid_targets_min": 1010
},
{
"epoch": 3.5579746835443036,
"grad_norm": 0.3180620836755935,
"learning_rate": 9.322630557825099e-06,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.181858628988266,
"step": 3515,
"valid_targets_mean": 5233.6,
"valid_targets_min": 1452
},
{
"epoch": 3.563037974683544,
"grad_norm": 0.389889167724953,
"learning_rate": 9.262948587195733e-06,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15717878937721252,
"step": 3520,
"valid_targets_mean": 3013.9,
"valid_targets_min": 1243
},
{
"epoch": 3.5681012658227846,
"grad_norm": 0.29747778586225904,
"learning_rate": 9.203400641443659e-06,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1657101958990097,
"step": 3525,
"valid_targets_mean": 5011.9,
"valid_targets_min": 1171
},
{
"epoch": 3.573164556962025,
"grad_norm": 0.32589494828857773,
"learning_rate": 9.143987463874067e-06,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1313675493001938,
"step": 3530,
"valid_targets_mean": 3697.8,
"valid_targets_min": 1024
},
{
"epoch": 3.5782278481012657,
"grad_norm": 0.3014059728019354,
"learning_rate": 9.084709796109907e-06,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1120418906211853,
"step": 3535,
"valid_targets_mean": 3755.7,
"valid_targets_min": 1198
},
{
"epoch": 3.5832911392405062,
"grad_norm": 0.2948674668221632,
"learning_rate": 9.025568378082656e-06,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535429894924164,
"step": 3540,
"valid_targets_mean": 5356.3,
"valid_targets_min": 1015
},
{
"epoch": 3.5883544303797468,
"grad_norm": 0.33956864916271323,
"learning_rate": 8.96656394802303e-06,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18608632683753967,
"step": 3545,
"valid_targets_mean": 4867.1,
"valid_targets_min": 1215
},
{
"epoch": 3.5934177215189873,
"grad_norm": 0.2894977962731721,
"learning_rate": 8.907697242451825e-06,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1488334834575653,
"step": 3550,
"valid_targets_mean": 4891.0,
"valid_targets_min": 1716
},
{
"epoch": 3.598481012658228,
"grad_norm": 0.3343791939565901,
"learning_rate": 8.84896899617067e-06,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.141134113073349,
"step": 3555,
"valid_targets_mean": 3341.7,
"valid_targets_min": 890
},
{
"epoch": 3.6035443037974684,
"grad_norm": 0.33452158631970796,
"learning_rate": 8.790379942252888e-06,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10691896080970764,
"step": 3560,
"valid_targets_mean": 2877.1,
"valid_targets_min": 1216
},
{
"epoch": 3.608607594936709,
"grad_norm": 0.36142037308609365,
"learning_rate": 8.73193081203436e-06,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11998053640127182,
"step": 3565,
"valid_targets_mean": 2745.8,
"valid_targets_min": 1146
},
{
"epoch": 3.6136708860759494,
"grad_norm": 0.29136587900708333,
"learning_rate": 8.673622335104335e-06,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1345549076795578,
"step": 3570,
"valid_targets_mean": 4353.7,
"valid_targets_min": 1408
},
{
"epoch": 3.61873417721519,
"grad_norm": 0.3065976409246481,
"learning_rate": 8.6154552392964e-06,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10774962604045868,
"step": 3575,
"valid_targets_mean": 3904.3,
"valid_targets_min": 1176
},
{
"epoch": 3.6237974683544305,
"grad_norm": 0.31612983755964325,
"learning_rate": 8.557430250679329e-06,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13469217717647552,
"step": 3580,
"valid_targets_mean": 3963.2,
"valid_targets_min": 1302
},
{
"epoch": 3.628860759493671,
"grad_norm": 0.355565500659515,
"learning_rate": 8.499548093548069e-06,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1492483913898468,
"step": 3585,
"valid_targets_mean": 3815.0,
"valid_targets_min": 998
},
{
"epoch": 3.6339240506329116,
"grad_norm": 0.3209640823808966,
"learning_rate": 8.441809490414664e-06,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10731847584247589,
"step": 3590,
"valid_targets_mean": 3390.2,
"valid_targets_min": 1205
},
{
"epoch": 3.638987341772152,
"grad_norm": 0.3111850353285487,
"learning_rate": 8.384215161999245e-06,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12559540569782257,
"step": 3595,
"valid_targets_mean": 3864.8,
"valid_targets_min": 1279
},
{
"epoch": 3.6440506329113926,
"grad_norm": 0.3021980554963678,
"learning_rate": 8.326765827221066e-06,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16643747687339783,
"step": 3600,
"valid_targets_mean": 4737.3,
"valid_targets_min": 980
},
{
"epoch": 3.649113924050633,
"grad_norm": 0.3299126612802994,
"learning_rate": 8.269462203189467e-06,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1495143473148346,
"step": 3605,
"valid_targets_mean": 4373.2,
"valid_targets_min": 1652
},
{
"epoch": 3.6541772151898733,
"grad_norm": 0.3046029741964782,
"learning_rate": 8.212305005194992e-06,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12610015273094177,
"step": 3610,
"valid_targets_mean": 4068.0,
"valid_targets_min": 990
},
{
"epoch": 3.659240506329114,
"grad_norm": 0.2889811661916004,
"learning_rate": 8.155294946700402e-06,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14253506064414978,
"step": 3615,
"valid_targets_mean": 4970.4,
"valid_targets_min": 1268
},
{
"epoch": 3.6643037974683543,
"grad_norm": 0.3058585932521842,
"learning_rate": 8.098432739331803e-06,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14140847325325012,
"step": 3620,
"valid_targets_mean": 4990.8,
"valid_targets_min": 1162
},
{
"epoch": 3.669367088607595,
"grad_norm": 0.3078512961350209,
"learning_rate": 8.041719092869761e-06,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13041014969348907,
"step": 3625,
"valid_targets_mean": 4127.6,
"valid_targets_min": 1226
},
{
"epoch": 3.6744303797468354,
"grad_norm": 0.2557971332829355,
"learning_rate": 7.98515471524042e-06,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13294486701488495,
"step": 3630,
"valid_targets_mean": 5826.9,
"valid_targets_min": 1621
},
{
"epoch": 3.679493670886076,
"grad_norm": 0.3421960754823531,
"learning_rate": 7.928740312506704e-06,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11804340779781342,
"step": 3635,
"valid_targets_mean": 3220.9,
"valid_targets_min": 1529
},
{
"epoch": 3.6845569620253165,
"grad_norm": 0.30370702242210657,
"learning_rate": 7.87247658885946e-06,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1813192367553711,
"step": 3640,
"valid_targets_mean": 5260.7,
"valid_targets_min": 1428
},
{
"epoch": 3.689620253164557,
"grad_norm": 0.3275936364034654,
"learning_rate": 7.816364246608688e-06,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16349400579929352,
"step": 3645,
"valid_targets_mean": 4485.0,
"valid_targets_min": 891
},
{
"epoch": 3.6946835443037975,
"grad_norm": 0.36264702848645247,
"learning_rate": 7.760403986174796e-06,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13801871240139008,
"step": 3650,
"valid_targets_mean": 3051.1,
"valid_targets_min": 1057
},
{
"epoch": 3.699746835443038,
"grad_norm": 0.2776099144093922,
"learning_rate": 7.70459650607981e-06,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1680225133895874,
"step": 3655,
"valid_targets_mean": 6631.8,
"valid_targets_min": 1456
},
{
"epoch": 3.7048101265822786,
"grad_norm": 0.34172337758905963,
"learning_rate": 7.648942502938705e-06,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16763363778591156,
"step": 3660,
"valid_targets_mean": 4061.8,
"valid_targets_min": 1209
},
{
"epoch": 3.709873417721519,
"grad_norm": 0.31939393718066644,
"learning_rate": 7.593442671450666e-06,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17321282625198364,
"step": 3665,
"valid_targets_mean": 4894.1,
"valid_targets_min": 1043
},
{
"epoch": 3.714936708860759,
"grad_norm": 0.32132553979600637,
"learning_rate": 7.5380977043904365e-06,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16710880398750305,
"step": 3670,
"valid_targets_mean": 4925.1,
"valid_targets_min": 1393
},
{
"epoch": 3.7199999999999998,
"grad_norm": 0.32445408393836617,
"learning_rate": 7.482908292599689e-06,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12341426312923431,
"step": 3675,
"valid_targets_mean": 3606.6,
"valid_targets_min": 1214
},
{
"epoch": 3.7250632911392403,
"grad_norm": 0.3064797642539383,
"learning_rate": 7.427875124978359e-06,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1298845112323761,
"step": 3680,
"valid_targets_mean": 4494.2,
"valid_targets_min": 1211
},
{
"epoch": 3.730126582278481,
"grad_norm": 0.2891043975748266,
"learning_rate": 7.372998888476091e-06,
"loss": 0.307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14520198106765747,
"step": 3685,
"valid_targets_mean": 4642.1,
"valid_targets_min": 1350
},
{
"epoch": 3.7351898734177214,
"grad_norm": 0.2986519000501888,
"learning_rate": 7.318280268083624e-06,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19568581879138947,
"step": 3690,
"valid_targets_mean": 5491.8,
"valid_targets_min": 1141
},
{
"epoch": 3.740253164556962,
"grad_norm": 0.32054148131031535,
"learning_rate": 7.263719946824264e-06,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12194908410310745,
"step": 3695,
"valid_targets_mean": 3993.2,
"valid_targets_min": 1248
},
{
"epoch": 3.7453164556962024,
"grad_norm": 0.29536657640379355,
"learning_rate": 7.209318605745368e-06,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14819620549678802,
"step": 3700,
"valid_targets_mean": 4433.9,
"valid_targets_min": 1426
},
{
"epoch": 3.750379746835443,
"grad_norm": 0.28146869288224746,
"learning_rate": 7.1550769239098e-06,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18099471926689148,
"step": 3705,
"valid_targets_mean": 7152.2,
"valid_targets_min": 1449
},
{
"epoch": 3.7554430379746835,
"grad_norm": 0.31596675118829165,
"learning_rate": 7.100995578387519e-06,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13141889870166779,
"step": 3710,
"valid_targets_mean": 3884.0,
"valid_targets_min": 1459
},
{
"epoch": 3.760506329113924,
"grad_norm": 0.31422332389376245,
"learning_rate": 7.047075244247061e-06,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1718595027923584,
"step": 3715,
"valid_targets_mean": 4909.5,
"valid_targets_min": 1774
},
{
"epoch": 3.7655696202531646,
"grad_norm": 0.3058451914869696,
"learning_rate": 6.993316594547148e-06,
"loss": 0.3043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12041142582893372,
"step": 3720,
"valid_targets_mean": 3857.4,
"valid_targets_min": 1341
},
{
"epoch": 3.770632911392405,
"grad_norm": 0.3285101705687896,
"learning_rate": 6.939720300328303e-06,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15424466133117676,
"step": 3725,
"valid_targets_mean": 4029.8,
"valid_targets_min": 1388
},
{
"epoch": 3.7756962025316456,
"grad_norm": 0.2852711508998474,
"learning_rate": 6.886287030604422e-06,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15062718093395233,
"step": 3730,
"valid_targets_mean": 5311.7,
"valid_targets_min": 1383
},
{
"epoch": 3.780759493670886,
"grad_norm": 0.32830150851392953,
"learning_rate": 6.83301745235448e-06,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1865895390510559,
"step": 3735,
"valid_targets_mean": 4781.8,
"valid_targets_min": 1034
},
{
"epoch": 3.7858227848101267,
"grad_norm": 0.33756549066729197,
"learning_rate": 6.779912230514161e-06,
"loss": 0.2807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12055318802595139,
"step": 3740,
"valid_targets_mean": 3463.3,
"valid_targets_min": 1599
},
{
"epoch": 3.790886075949367,
"grad_norm": 0.3152172059583756,
"learning_rate": 6.7269720279675755e-06,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17137764394283295,
"step": 3745,
"valid_targets_mean": 4888.2,
"valid_targets_min": 1432
},
{
"epoch": 3.7959493670886078,
"grad_norm": 0.3239318373383687,
"learning_rate": 6.674197505539006e-06,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14893168210983276,
"step": 3750,
"valid_targets_mean": 4158.4,
"valid_targets_min": 1285
},
{
"epoch": 3.8010126582278483,
"grad_norm": 0.2919220688770005,
"learning_rate": 6.621589321984611e-06,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14690950512886047,
"step": 3755,
"valid_targets_mean": 4748.6,
"valid_targets_min": 1607
},
{
"epoch": 3.806075949367089,
"grad_norm": 0.3025582373018823,
"learning_rate": 6.569148133984258e-06,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17515698075294495,
"step": 3760,
"valid_targets_mean": 5047.3,
"valid_targets_min": 1082
},
{
"epoch": 3.8111392405063294,
"grad_norm": 0.2952019372668243,
"learning_rate": 6.516874596133269e-06,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15086880326271057,
"step": 3765,
"valid_targets_mean": 5131.5,
"valid_targets_min": 1253
},
{
"epoch": 3.81620253164557,
"grad_norm": 0.29724809214492576,
"learning_rate": 6.464769360934306e-06,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19773977994918823,
"step": 3770,
"valid_targets_mean": 6146.5,
"valid_targets_min": 1366
},
{
"epoch": 3.82126582278481,
"grad_norm": 0.33270725662814826,
"learning_rate": 6.412833078789178e-06,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15699324011802673,
"step": 3775,
"valid_targets_mean": 4472.4,
"valid_targets_min": 1350
},
{
"epoch": 3.8263291139240505,
"grad_norm": 0.2963372278675901,
"learning_rate": 6.361066397990758e-06,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1388930231332779,
"step": 3780,
"valid_targets_mean": 4676.4,
"valid_targets_min": 971
},
{
"epoch": 3.831392405063291,
"grad_norm": 0.2786191474125972,
"learning_rate": 6.309469964714863e-06,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14243824779987335,
"step": 3785,
"valid_targets_mean": 4964.9,
"valid_targets_min": 1391
},
{
"epoch": 3.8364556962025316,
"grad_norm": 0.3057769621782611,
"learning_rate": 6.2580444230122175e-06,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1198386549949646,
"step": 3790,
"valid_targets_mean": 3840.2,
"valid_targets_min": 745
},
{
"epoch": 3.841518987341772,
"grad_norm": 0.31205008704708975,
"learning_rate": 6.2067904148003764e-06,
"loss": 0.3096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17915937304496765,
"step": 3795,
"valid_targets_mean": 5550.8,
"valid_targets_min": 1392
},
{
"epoch": 3.8465822784810126,
"grad_norm": 0.3072712018089592,
"learning_rate": 6.155708579855759e-06,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15422801673412323,
"step": 3800,
"valid_targets_mean": 4714.1,
"valid_targets_min": 970
},
{
"epoch": 3.851645569620253,
"grad_norm": 0.3056625890719376,
"learning_rate": 6.104799555805607e-06,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10852354019880295,
"step": 3805,
"valid_targets_mean": 3481.8,
"valid_targets_min": 1001
},
{
"epoch": 3.8567088607594937,
"grad_norm": 0.33415927615785906,
"learning_rate": 6.054063978120093e-06,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16793662309646606,
"step": 3810,
"valid_targets_mean": 3962.6,
"valid_targets_min": 1458
},
{
"epoch": 3.8617721518987342,
"grad_norm": 0.2859437483451691,
"learning_rate": 6.00350248010431e-06,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11396883428096771,
"step": 3815,
"valid_targets_mean": 4421.5,
"valid_targets_min": 1527
},
{
"epoch": 3.8668354430379748,
"grad_norm": 0.32446773366076725,
"learning_rate": 5.95311569289045e-06,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14191418886184692,
"step": 3820,
"valid_targets_mean": 3904.6,
"valid_targets_min": 1346
},
{
"epoch": 3.8718987341772153,
"grad_norm": 0.33241644171629736,
"learning_rate": 5.902904245429852e-06,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15994411706924438,
"step": 3825,
"valid_targets_mean": 4205.2,
"valid_targets_min": 1211
},
{
"epoch": 3.876962025316456,
"grad_norm": 0.33295558620330956,
"learning_rate": 5.852868764485185e-06,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11764267832040787,
"step": 3830,
"valid_targets_mean": 3148.9,
"valid_targets_min": 992
},
{
"epoch": 3.882025316455696,
"grad_norm": 0.3094377142586556,
"learning_rate": 5.803009874622645e-06,
"loss": 0.3014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13288931548595428,
"step": 3835,
"valid_targets_mean": 3723.9,
"valid_targets_min": 1009
},
{
"epoch": 3.8870886075949365,
"grad_norm": 0.28966742570043214,
"learning_rate": 5.753328198204107e-06,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14470314979553223,
"step": 3840,
"valid_targets_mean": 5011.6,
"valid_targets_min": 1536
},
{
"epoch": 3.892151898734177,
"grad_norm": 0.3556764011843303,
"learning_rate": 5.7038243553794105e-06,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15663528442382812,
"step": 3845,
"valid_targets_mean": 3704.3,
"valid_targets_min": 938
},
{
"epoch": 3.8972151898734175,
"grad_norm": 0.4434641609697601,
"learning_rate": 5.654498964078578e-06,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15775218605995178,
"step": 3850,
"valid_targets_mean": 5224.2,
"valid_targets_min": 1008
},
{
"epoch": 3.902278481012658,
"grad_norm": 0.28354591909624743,
"learning_rate": 5.605352640004111e-06,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20830413699150085,
"step": 3855,
"valid_targets_mean": 6659.2,
"valid_targets_min": 1634
},
{
"epoch": 3.9073417721518986,
"grad_norm": 0.31278015955485905,
"learning_rate": 5.556385996623334e-06,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1927700638771057,
"step": 3860,
"valid_targets_mean": 6460.9,
"valid_targets_min": 1493
},
{
"epoch": 3.912405063291139,
"grad_norm": 0.3183546633710576,
"learning_rate": 5.507599645160688e-06,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14958074688911438,
"step": 3865,
"valid_targets_mean": 4336.2,
"valid_targets_min": 1153
},
{
"epoch": 3.9174683544303797,
"grad_norm": 0.2926146837393363,
"learning_rate": 5.45899419459015e-06,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11325857788324356,
"step": 3870,
"valid_targets_mean": 3313.8,
"valid_targets_min": 775
},
{
"epoch": 3.92253164556962,
"grad_norm": 0.2947057963950262,
"learning_rate": 5.410570251627587e-06,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1467699259519577,
"step": 3875,
"valid_targets_mean": 5764.1,
"valid_targets_min": 1283
},
{
"epoch": 3.9275949367088607,
"grad_norm": 0.29570913844534924,
"learning_rate": 5.362328420723208e-06,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14309361577033997,
"step": 3880,
"valid_targets_mean": 4847.8,
"valid_targets_min": 927
},
{
"epoch": 3.9326582278481013,
"grad_norm": 0.3026281684204848,
"learning_rate": 5.314269304054029e-06,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19492954015731812,
"step": 3885,
"valid_targets_mean": 5634.2,
"valid_targets_min": 1361
},
{
"epoch": 3.937721518987342,
"grad_norm": 0.30964406158183067,
"learning_rate": 5.26639350151632e-06,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13411834836006165,
"step": 3890,
"valid_targets_mean": 4035.8,
"valid_targets_min": 1199
},
{
"epoch": 3.9427848101265823,
"grad_norm": 0.3111439221332038,
"learning_rate": 5.218701610718162e-06,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1787598729133606,
"step": 3895,
"valid_targets_mean": 5102.0,
"valid_targets_min": 1779
},
{
"epoch": 3.947848101265823,
"grad_norm": 0.256548917813654,
"learning_rate": 5.171194226971947e-06,
"loss": 0.3164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15520493686199188,
"step": 3900,
"valid_targets_mean": 5819.2,
"valid_targets_min": 913
},
{
"epoch": 3.9529113924050634,
"grad_norm": 0.35240271321787325,
"learning_rate": 5.12387194328696e-06,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.100287064909935,
"step": 3905,
"valid_targets_mean": 2803.6,
"valid_targets_min": 1229
},
{
"epoch": 3.957974683544304,
"grad_norm": 0.28051305016909855,
"learning_rate": 5.0767353503620055e-06,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11824625730514526,
"step": 3910,
"valid_targets_mean": 4403.1,
"valid_targets_min": 1454
},
{
"epoch": 3.9630379746835445,
"grad_norm": 0.33648253442313436,
"learning_rate": 5.029785036577976e-06,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12415116280317307,
"step": 3915,
"valid_targets_mean": 3484.4,
"valid_targets_min": 1290
},
{
"epoch": 3.968101265822785,
"grad_norm": 0.3051655834868841,
"learning_rate": 4.983021587990577e-06,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16038689017295837,
"step": 3920,
"valid_targets_mean": 4039.8,
"valid_targets_min": 1423
},
{
"epoch": 3.9731645569620255,
"grad_norm": 0.3149366075705648,
"learning_rate": 4.936445588322947e-06,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17041844129562378,
"step": 3925,
"valid_targets_mean": 4645.1,
"valid_targets_min": 1388
},
{
"epoch": 3.978227848101266,
"grad_norm": 0.3104948744129676,
"learning_rate": 4.890057618958406e-06,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13706716895103455,
"step": 3930,
"valid_targets_mean": 4148.2,
"valid_targets_min": 918
},
{
"epoch": 3.9832911392405066,
"grad_norm": 0.4596385567964535,
"learning_rate": 4.843858258933207e-06,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12977036833763123,
"step": 3935,
"valid_targets_mean": 4589.1,
"valid_targets_min": 1135
},
{
"epoch": 3.9883544303797467,
"grad_norm": 0.35205194291692793,
"learning_rate": 4.797848084929271e-06,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16180771589279175,
"step": 3940,
"valid_targets_mean": 4005.4,
"valid_targets_min": 1682
},
{
"epoch": 3.993417721518987,
"grad_norm": 0.3115344869207087,
"learning_rate": 4.7520276712670344e-06,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1245289221405983,
"step": 3945,
"valid_targets_mean": 3869.5,
"valid_targets_min": 1814
},
{
"epoch": 3.9984810126582278,
"grad_norm": 0.3447482808883552,
"learning_rate": 4.706397589898237e-06,
"loss": 0.2992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21260038018226624,
"step": 3950,
"valid_targets_mean": 4663.9,
"valid_targets_min": 1153
},
{
"epoch": 4.0030379746835445,
"grad_norm": 0.31704002367241657,
"learning_rate": 4.660958410398808e-06,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11520913243293762,
"step": 3955,
"valid_targets_mean": 3230.5,
"valid_targets_min": 1024
},
{
"epoch": 4.008101265822785,
"grad_norm": 0.3107759512067684,
"learning_rate": 4.61571069996176e-06,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15815721452236176,
"step": 3960,
"valid_targets_mean": 4538.7,
"valid_targets_min": 763
},
{
"epoch": 4.013164556962026,
"grad_norm": 0.3240449542122713,
"learning_rate": 4.5706550233900825e-06,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1527724266052246,
"step": 3965,
"valid_targets_mean": 4152.1,
"valid_targets_min": 1278
},
{
"epoch": 4.018227848101266,
"grad_norm": 0.3371371879535488,
"learning_rate": 4.5257919430897305e-06,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14754730463027954,
"step": 3970,
"valid_targets_mean": 3785.3,
"valid_targets_min": 1269
},
{
"epoch": 4.023291139240507,
"grad_norm": 0.28767581366652223,
"learning_rate": 4.481122019062562e-06,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14282898604869843,
"step": 3975,
"valid_targets_mean": 4653.0,
"valid_targets_min": 1265
},
{
"epoch": 4.028354430379747,
"grad_norm": 0.29732809453534903,
"learning_rate": 4.436645808899374e-06,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18286307156085968,
"step": 3980,
"valid_targets_mean": 5864.7,
"valid_targets_min": 1531
},
{
"epoch": 4.033417721518988,
"grad_norm": 0.29104777332578374,
"learning_rate": 4.3923638677729506e-06,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15134663879871368,
"step": 3985,
"valid_targets_mean": 5712.8,
"valid_targets_min": 923
},
{
"epoch": 4.038481012658228,
"grad_norm": 0.34370328700294156,
"learning_rate": 4.348276748431095e-06,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16227614879608154,
"step": 3990,
"valid_targets_mean": 4682.2,
"valid_targets_min": 1365
},
{
"epoch": 4.043544303797469,
"grad_norm": 0.2853726249793705,
"learning_rate": 4.304385001189781e-06,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15851733088493347,
"step": 3995,
"valid_targets_mean": 5396.8,
"valid_targets_min": 1278
},
{
"epoch": 4.048607594936709,
"grad_norm": 0.2664334385740433,
"learning_rate": 4.260689173926238e-06,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1690644472837448,
"step": 4000,
"valid_targets_mean": 6774.5,
"valid_targets_min": 1292
},
{
"epoch": 4.053670886075949,
"grad_norm": 0.27904233780454435,
"learning_rate": 4.217189812072131e-06,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13511596620082855,
"step": 4005,
"valid_targets_mean": 4486.5,
"valid_targets_min": 1562
},
{
"epoch": 4.0587341772151895,
"grad_norm": 0.3231775999779525,
"learning_rate": 4.173887458606767e-06,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11682070791721344,
"step": 4010,
"valid_targets_mean": 3668.7,
"valid_targets_min": 1126
},
{
"epoch": 4.06379746835443,
"grad_norm": 0.2770166025598625,
"learning_rate": 4.130782654050283e-06,
"loss": 0.3007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15404465794563293,
"step": 4015,
"valid_targets_mean": 5586.6,
"valid_targets_min": 1272
},
{
"epoch": 4.0688607594936705,
"grad_norm": 0.27479033637998745,
"learning_rate": 4.087875936456937e-06,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12938356399536133,
"step": 4020,
"valid_targets_mean": 5243.8,
"valid_targets_min": 1267
},
{
"epoch": 4.073924050632911,
"grad_norm": 0.31378983164450186,
"learning_rate": 4.045167841408359e-06,
"loss": 0.3017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15723198652267456,
"step": 4025,
"valid_targets_mean": 4392.6,
"valid_targets_min": 1232
},
{
"epoch": 4.078987341772152,
"grad_norm": 0.29002739575691505,
"learning_rate": 4.002658902006893e-06,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15544429421424866,
"step": 4030,
"valid_targets_mean": 5350.4,
"valid_targets_min": 909
},
{
"epoch": 4.084050632911392,
"grad_norm": 0.3087847959185058,
"learning_rate": 3.9603496488689174e-06,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16527938842773438,
"step": 4035,
"valid_targets_mean": 5526.1,
"valid_targets_min": 1129
},
{
"epoch": 4.089113924050633,
"grad_norm": 0.3085791674780826,
"learning_rate": 3.918240610118234e-06,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1917693018913269,
"step": 4040,
"valid_targets_mean": 6275.9,
"valid_targets_min": 1748
},
{
"epoch": 4.094177215189873,
"grad_norm": 0.286080067957159,
"learning_rate": 3.876332311379489e-06,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1519317775964737,
"step": 4045,
"valid_targets_mean": 5526.4,
"valid_targets_min": 1127
},
{
"epoch": 4.099240506329114,
"grad_norm": 0.2837484355272842,
"learning_rate": 3.834625275771582e-06,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.123206228017807,
"step": 4050,
"valid_targets_mean": 4113.7,
"valid_targets_min": 1252
},
{
"epoch": 4.104303797468354,
"grad_norm": 0.2999251731420047,
"learning_rate": 3.7931200239011643e-06,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13318127393722534,
"step": 4055,
"valid_targets_mean": 4568.8,
"valid_targets_min": 1236
},
{
"epoch": 4.109367088607595,
"grad_norm": 0.2816382941308749,
"learning_rate": 3.7518170738561168e-06,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14610666036605835,
"step": 4060,
"valid_targets_mean": 4928.9,
"valid_targets_min": 826
},
{
"epoch": 4.114430379746835,
"grad_norm": 0.32554297974189644,
"learning_rate": 3.7107169411991127e-06,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12090884894132614,
"step": 4065,
"valid_targets_mean": 3398.6,
"valid_targets_min": 1385
},
{
"epoch": 4.119493670886076,
"grad_norm": 0.3170024428197897,
"learning_rate": 3.6698201389611423e-06,
"loss": 0.2839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13328410685062408,
"step": 4070,
"valid_targets_mean": 4025.0,
"valid_targets_min": 901
},
{
"epoch": 4.124556962025316,
"grad_norm": 0.3205485924763668,
"learning_rate": 3.62912717763515e-06,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21576707065105438,
"step": 4075,
"valid_targets_mean": 6120.9,
"valid_targets_min": 1421
},
{
"epoch": 4.129620253164557,
"grad_norm": 0.38654381765739637,
"learning_rate": 3.5886385651696267e-06,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14297889173030853,
"step": 4080,
"valid_targets_mean": 4917.6,
"valid_targets_min": 1098
},
{
"epoch": 4.1346835443037975,
"grad_norm": 0.3524477589713149,
"learning_rate": 3.5483548069623043e-06,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14278902113437653,
"step": 4085,
"valid_targets_mean": 3844.8,
"valid_targets_min": 1260
},
{
"epoch": 4.139746835443038,
"grad_norm": 0.3197809913122213,
"learning_rate": 3.5082764058538056e-06,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12523522973060608,
"step": 4090,
"valid_targets_mean": 3690.5,
"valid_targets_min": 885
},
{
"epoch": 4.1448101265822785,
"grad_norm": 0.30886469526940097,
"learning_rate": 3.4684038621214124e-06,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16583015024662018,
"step": 4095,
"valid_targets_mean": 5001.4,
"valid_targets_min": 1243
},
{
"epoch": 4.149873417721519,
"grad_norm": 0.28226754473975985,
"learning_rate": 3.4287376734727817e-06,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16582466661930084,
"step": 4100,
"valid_targets_mean": 5544.1,
"valid_targets_min": 1022
},
{
"epoch": 4.15493670886076,
"grad_norm": 0.3051843817153008,
"learning_rate": 3.3892783350397675e-06,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11235642433166504,
"step": 4105,
"valid_targets_mean": 3728.7,
"valid_targets_min": 1019
},
{
"epoch": 4.16,
"grad_norm": 0.28561421446674784,
"learning_rate": 3.3500263393722033e-06,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14730824530124664,
"step": 4110,
"valid_targets_mean": 5325.3,
"valid_targets_min": 1247
},
{
"epoch": 4.165063291139241,
"grad_norm": 0.3396963845435047,
"learning_rate": 3.310982176431785e-06,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1362554281949997,
"step": 4115,
"valid_targets_mean": 4046.4,
"valid_targets_min": 974
},
{
"epoch": 4.170126582278481,
"grad_norm": 0.3604026125994517,
"learning_rate": 3.2721463335859484e-06,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12034134566783905,
"step": 4120,
"valid_targets_mean": 2845.9,
"valid_targets_min": 1453
},
{
"epoch": 4.175189873417722,
"grad_norm": 0.3047812123169994,
"learning_rate": 3.2335192956017634e-06,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1503809243440628,
"step": 4125,
"valid_targets_mean": 4877.8,
"valid_targets_min": 1783
},
{
"epoch": 4.180253164556962,
"grad_norm": 0.36835014889244666,
"learning_rate": 3.1951015446399247e-06,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11517144739627838,
"step": 4130,
"valid_targets_mean": 2904.6,
"valid_targets_min": 909
},
{
"epoch": 4.185316455696203,
"grad_norm": 0.32918669737266704,
"learning_rate": 3.156893560248688e-06,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.140342578291893,
"step": 4135,
"valid_targets_mean": 4083.8,
"valid_targets_min": 1081
},
{
"epoch": 4.190379746835443,
"grad_norm": 0.33957836205604514,
"learning_rate": 3.118895819357908e-06,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1507326364517212,
"step": 4140,
"valid_targets_mean": 4652.1,
"valid_targets_min": 1298
},
{
"epoch": 4.195443037974684,
"grad_norm": 0.285494983139607,
"learning_rate": 3.081108796273098e-06,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12487950921058655,
"step": 4145,
"valid_targets_mean": 4737.4,
"valid_targets_min": 1243
},
{
"epoch": 4.200506329113924,
"grad_norm": 0.32355832904009185,
"learning_rate": 3.0435329626694733e-06,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18284101784229279,
"step": 4150,
"valid_targets_mean": 4946.2,
"valid_targets_min": 1066
},
{
"epoch": 4.205569620253165,
"grad_norm": 0.2901811873935047,
"learning_rate": 3.006168787586097e-06,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13859279453754425,
"step": 4155,
"valid_targets_mean": 5316.1,
"valid_targets_min": 1099
},
{
"epoch": 4.2106329113924055,
"grad_norm": 0.5190123284320625,
"learning_rate": 2.9690167374200075e-06,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1444871723651886,
"step": 4160,
"valid_targets_mean": 4388.6,
"valid_targets_min": 1162
},
{
"epoch": 4.215696202531646,
"grad_norm": 0.31722642981901594,
"learning_rate": 2.9320772759203975e-06,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13206876814365387,
"step": 4165,
"valid_targets_mean": 4130.3,
"valid_targets_min": 1281
},
{
"epoch": 4.220759493670886,
"grad_norm": 0.30916942149206356,
"learning_rate": 2.8953508641828375e-06,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1427369862794876,
"step": 4170,
"valid_targets_mean": 4538.5,
"valid_targets_min": 1313
},
{
"epoch": 4.225822784810126,
"grad_norm": 0.3075492109138346,
"learning_rate": 2.858837960643499e-06,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17169958353042603,
"step": 4175,
"valid_targets_mean": 4840.8,
"valid_targets_min": 1296
},
{
"epoch": 4.230886075949367,
"grad_norm": 0.29933826061321767,
"learning_rate": 2.822539021073463e-06,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16137537360191345,
"step": 4180,
"valid_targets_mean": 5634.3,
"valid_targets_min": 1130
},
{
"epoch": 4.235949367088607,
"grad_norm": 0.29690888264127147,
"learning_rate": 2.786454498572997e-06,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.135961651802063,
"step": 4185,
"valid_targets_mean": 4399.6,
"valid_targets_min": 732
},
{
"epoch": 4.241012658227848,
"grad_norm": 0.3246955608047686,
"learning_rate": 2.7505848435659156e-06,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1551479548215866,
"step": 4190,
"valid_targets_mean": 4534.1,
"valid_targets_min": 1082
},
{
"epoch": 4.246075949367088,
"grad_norm": 0.29829478040788515,
"learning_rate": 2.7149305037939687e-06,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18227550387382507,
"step": 4195,
"valid_targets_mean": 5650.3,
"valid_targets_min": 1359
},
{
"epoch": 4.251139240506329,
"grad_norm": 0.3491396172417171,
"learning_rate": 2.679491924311226e-06,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13989317417144775,
"step": 4200,
"valid_targets_mean": 3527.8,
"valid_targets_min": 1094
},
{
"epoch": 4.256202531645569,
"grad_norm": 0.3062465471975927,
"learning_rate": 2.644269547478555e-06,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16212749481201172,
"step": 4205,
"valid_targets_mean": 4856.2,
"valid_targets_min": 850
},
{
"epoch": 4.26126582278481,
"grad_norm": 0.31154484975672075,
"learning_rate": 2.609263812958065e-06,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10032152384519577,
"step": 4210,
"valid_targets_mean": 3391.6,
"valid_targets_min": 1245
},
{
"epoch": 4.2663291139240505,
"grad_norm": 0.3276187265653155,
"learning_rate": 2.5744751577076343e-06,
"loss": 0.2924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16798563301563263,
"step": 4215,
"valid_targets_mean": 4301.5,
"valid_targets_min": 828
},
{
"epoch": 4.271392405063291,
"grad_norm": 0.31771678562930245,
"learning_rate": 2.539904015975476e-06,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14239826798439026,
"step": 4220,
"valid_targets_mean": 4702.1,
"valid_targets_min": 1064
},
{
"epoch": 4.2764556962025315,
"grad_norm": 0.2979983224769533,
"learning_rate": 2.5055508192946732e-06,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15499252080917358,
"step": 4225,
"valid_targets_mean": 4931.4,
"valid_targets_min": 1420
},
{
"epoch": 4.281518987341772,
"grad_norm": 0.3378145372579719,
"learning_rate": 2.4714159964778394e-06,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15219071507453918,
"step": 4230,
"valid_targets_mean": 4131.9,
"valid_targets_min": 1088
},
{
"epoch": 4.286582278481013,
"grad_norm": 0.3132928788106069,
"learning_rate": 2.437499973611728e-06,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17868193984031677,
"step": 4235,
"valid_targets_mean": 5772.8,
"valid_targets_min": 1773
},
{
"epoch": 4.291645569620253,
"grad_norm": 0.3049108704834252,
"learning_rate": 2.403803174051933e-06,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17676058411598206,
"step": 4240,
"valid_targets_mean": 5360.8,
"valid_targets_min": 1400
},
{
"epoch": 4.296708860759494,
"grad_norm": 0.2674881690807918,
"learning_rate": 2.3703260184176103e-06,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11438636481761932,
"step": 4245,
"valid_targets_mean": 4663.1,
"valid_targets_min": 991
},
{
"epoch": 4.301772151898734,
"grad_norm": 0.3381875004506121,
"learning_rate": 2.337068924586203e-06,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14016669988632202,
"step": 4250,
"valid_targets_mean": 3257.6,
"valid_targets_min": 973
},
{
"epoch": 4.306835443037975,
"grad_norm": 0.33566799216440724,
"learning_rate": 2.3040323076882578e-06,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1721951961517334,
"step": 4255,
"valid_targets_mean": 4602.8,
"valid_targets_min": 1312
},
{
"epoch": 4.311898734177215,
"grad_norm": 0.39194447138918637,
"learning_rate": 2.2712165801022046e-06,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1366182416677475,
"step": 4260,
"valid_targets_mean": 2721.6,
"valid_targets_min": 913
},
{
"epoch": 4.316962025316456,
"grad_norm": 0.3637100172839474,
"learning_rate": 2.2386221514492502e-06,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11843443661928177,
"step": 4265,
"valid_targets_mean": 3167.0,
"valid_targets_min": 1022
},
{
"epoch": 4.322025316455696,
"grad_norm": 0.32727869850436964,
"learning_rate": 2.2062494285882363e-06,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1746322512626648,
"step": 4270,
"valid_targets_mean": 4557.8,
"valid_targets_min": 939
},
{
"epoch": 4.327088607594937,
"grad_norm": 0.35219909889872136,
"learning_rate": 2.1740988156105593e-06,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08915197849273682,
"step": 4275,
"valid_targets_mean": 2497.8,
"valid_targets_min": 1172
},
{
"epoch": 4.332151898734177,
"grad_norm": 0.3312024847124787,
"learning_rate": 2.142170713835161e-06,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16628465056419373,
"step": 4280,
"valid_targets_mean": 4481.7,
"valid_targets_min": 1417
},
{
"epoch": 4.337215189873418,
"grad_norm": 0.26123810507474954,
"learning_rate": 2.1104655218034685e-06,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.136556938290596,
"step": 4285,
"valid_targets_mean": 5086.1,
"valid_targets_min": 1214
},
{
"epoch": 4.3422784810126585,
"grad_norm": 0.28913080019288895,
"learning_rate": 2.0789836352744653e-06,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1929275244474411,
"step": 4290,
"valid_targets_mean": 6718.0,
"valid_targets_min": 666
},
{
"epoch": 4.347341772151899,
"grad_norm": 0.2856092567973034,
"learning_rate": 2.0477254472197237e-06,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12290873378515244,
"step": 4295,
"valid_targets_mean": 4296.3,
"valid_targets_min": 828
},
{
"epoch": 4.3524050632911395,
"grad_norm": 0.376756316497093,
"learning_rate": 2.0166913478185004e-06,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1333305984735489,
"step": 4300,
"valid_targets_mean": 4643.4,
"valid_targets_min": 1007
},
{
"epoch": 4.35746835443038,
"grad_norm": 0.37269967571373286,
"learning_rate": 1.9858817244528896e-06,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16167780756950378,
"step": 4305,
"valid_targets_mean": 3327.0,
"valid_targets_min": 1248
},
{
"epoch": 4.362531645569621,
"grad_norm": 0.36507367284654024,
"learning_rate": 1.955296961702955e-06,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1149420514702797,
"step": 4310,
"valid_targets_mean": 3484.9,
"valid_targets_min": 1218
},
{
"epoch": 4.367594936708861,
"grad_norm": 0.3549138995526032,
"learning_rate": 1.9249374413419584e-06,
"loss": 0.3209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16552500426769257,
"step": 4315,
"valid_targets_mean": 4319.2,
"valid_targets_min": 1166
},
{
"epoch": 4.372658227848102,
"grad_norm": 0.30961509363434114,
"learning_rate": 1.894803542331567e-06,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12911680340766907,
"step": 4320,
"valid_targets_mean": 3623.0,
"valid_targets_min": 1170
},
{
"epoch": 4.377721518987342,
"grad_norm": 0.30219606387390835,
"learning_rate": 1.8648956408171547e-06,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1574065387248993,
"step": 4325,
"valid_targets_mean": 4955.6,
"valid_targets_min": 1679
},
{
"epoch": 4.382784810126582,
"grad_norm": 0.3279169523694041,
"learning_rate": 1.8352141101230758e-06,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1483180820941925,
"step": 4330,
"valid_targets_mean": 3969.1,
"valid_targets_min": 1428
},
{
"epoch": 4.387848101265822,
"grad_norm": 0.3105228186529775,
"learning_rate": 1.8057593207480194e-06,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11923258006572723,
"step": 4335,
"valid_targets_mean": 3387.1,
"valid_targets_min": 1009
},
{
"epoch": 4.392911392405063,
"grad_norm": 0.33881080054396395,
"learning_rate": 1.7765316403603927e-06,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13051745295524597,
"step": 4340,
"valid_targets_mean": 3938.3,
"valid_targets_min": 1204
},
{
"epoch": 4.397974683544303,
"grad_norm": 0.2859920210081916,
"learning_rate": 1.7475314337937099e-06,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14054298400878906,
"step": 4345,
"valid_targets_mean": 4863.8,
"valid_targets_min": 1288
},
{
"epoch": 4.403037974683544,
"grad_norm": 0.3222088763676915,
"learning_rate": 1.7187590630420681e-06,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15554268658161163,
"step": 4350,
"valid_targets_mean": 3944.6,
"valid_targets_min": 1256
},
{
"epoch": 4.4081012658227845,
"grad_norm": 0.32147293328088156,
"learning_rate": 1.6902148872555924e-06,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13429546356201172,
"step": 4355,
"valid_targets_mean": 3537.0,
"valid_targets_min": 1501
},
{
"epoch": 4.413164556962025,
"grad_norm": 0.2873112295172894,
"learning_rate": 1.661899262735991e-06,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11225029826164246,
"step": 4360,
"valid_targets_mean": 3726.2,
"valid_targets_min": 1432
},
{
"epoch": 4.418227848101266,
"grad_norm": 0.3137420905534193,
"learning_rate": 1.6338125429320694e-06,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628667116165161,
"step": 4365,
"valid_targets_mean": 4489.4,
"valid_targets_min": 1251
},
{
"epoch": 4.423291139240506,
"grad_norm": 0.2980697010922971,
"learning_rate": 1.605955078435355e-06,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1740245670080185,
"step": 4370,
"valid_targets_mean": 5941.4,
"valid_targets_min": 949
},
{
"epoch": 4.428354430379747,
"grad_norm": 0.29655956780164205,
"learning_rate": 1.5783272169756903e-06,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12947620451450348,
"step": 4375,
"valid_targets_mean": 4607.8,
"valid_targets_min": 1670
},
{
"epoch": 4.433417721518987,
"grad_norm": 0.28159919536576594,
"learning_rate": 1.550929303416917e-06,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11871195584535599,
"step": 4380,
"valid_targets_mean": 4622.2,
"valid_targets_min": 1319
},
{
"epoch": 4.438481012658228,
"grad_norm": 0.3159849176088272,
"learning_rate": 1.5237616797525512e-06,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13893471658229828,
"step": 4385,
"valid_targets_mean": 4139.4,
"valid_targets_min": 1377
},
{
"epoch": 4.443544303797468,
"grad_norm": 0.3103371076544768,
"learning_rate": 1.49682468510153e-06,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17314529418945312,
"step": 4390,
"valid_targets_mean": 5825.6,
"valid_targets_min": 1000
},
{
"epoch": 4.448607594936709,
"grad_norm": 0.28729653443614084,
"learning_rate": 1.4701186557039648e-06,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13900840282440186,
"step": 4395,
"valid_targets_mean": 4918.3,
"valid_targets_min": 1337
},
{
"epoch": 4.453670886075949,
"grad_norm": 0.3411738428471954,
"learning_rate": 1.4436439249169554e-06,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13948732614517212,
"step": 4400,
"valid_targets_mean": 5576.6,
"valid_targets_min": 1142
},
{
"epoch": 4.45873417721519,
"grad_norm": 0.3118105881962252,
"learning_rate": 1.4174008232104285e-06,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13870777189731598,
"step": 4405,
"valid_targets_mean": 4355.1,
"valid_targets_min": 1522
},
{
"epoch": 4.46379746835443,
"grad_norm": 0.32978343142383926,
"learning_rate": 1.3913896781629954e-06,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13087686896324158,
"step": 4410,
"valid_targets_mean": 3731.3,
"valid_targets_min": 540
},
{
"epoch": 4.468860759493671,
"grad_norm": 0.2618923931315447,
"learning_rate": 1.3656108144578962e-06,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13182973861694336,
"step": 4415,
"valid_targets_mean": 4776.1,
"valid_targets_min": 889
},
{
"epoch": 4.473924050632911,
"grad_norm": 0.27864898068700833,
"learning_rate": 1.340064553878908e-06,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14037862420082092,
"step": 4420,
"valid_targets_mean": 5322.2,
"valid_targets_min": 1116
},
{
"epoch": 4.478987341772152,
"grad_norm": 0.2935646123466447,
"learning_rate": 1.3147512153063558e-06,
"loss": 0.2848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18074341118335724,
"step": 4425,
"valid_targets_mean": 6079.2,
"valid_targets_min": 1329
},
{
"epoch": 4.4840506329113925,
"grad_norm": 0.34486016144946086,
"learning_rate": 1.289671114713129e-06,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1330321580171585,
"step": 4430,
"valid_targets_mean": 3942.1,
"valid_targets_min": 906
},
{
"epoch": 4.489113924050633,
"grad_norm": 0.3344555372523651,
"learning_rate": 1.264824565160716e-06,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1601177453994751,
"step": 4435,
"valid_targets_mean": 5832.6,
"valid_targets_min": 1133
},
{
"epoch": 4.494177215189874,
"grad_norm": 0.31338693723543865,
"learning_rate": 1.2402118767953342e-06,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11089809238910675,
"step": 4440,
"valid_targets_mean": 3433.5,
"valid_targets_min": 1255
},
{
"epoch": 4.499240506329114,
"grad_norm": 0.32257737557743127,
"learning_rate": 1.2158333568440183e-06,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19272515177726746,
"step": 4445,
"valid_targets_mean": 5173.0,
"valid_targets_min": 1505
},
{
"epoch": 4.504303797468355,
"grad_norm": 0.31362483355013254,
"learning_rate": 1.1916893096108063e-06,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1500798463821411,
"step": 4450,
"valid_targets_mean": 4663.4,
"valid_targets_min": 1370
},
{
"epoch": 4.509367088607595,
"grad_norm": 0.3261715632472016,
"learning_rate": 1.167780036472952e-06,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13341718912124634,
"step": 4455,
"valid_targets_mean": 3426.2,
"valid_targets_min": 1364
},
{
"epoch": 4.514430379746836,
"grad_norm": 0.30597584635072983,
"learning_rate": 1.1441058358771317e-06,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16293524205684662,
"step": 4460,
"valid_targets_mean": 4787.8,
"valid_targets_min": 1378
},
{
"epoch": 4.519493670886076,
"grad_norm": 0.2817037355554941,
"learning_rate": 1.1206670033357537e-06,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15130957961082458,
"step": 4465,
"valid_targets_mean": 5285.4,
"valid_targets_min": 1543
},
{
"epoch": 4.524556962025317,
"grad_norm": 0.31694092622996994,
"learning_rate": 1.0974638314232355e-06,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15193693339824677,
"step": 4470,
"valid_targets_mean": 4457.0,
"valid_targets_min": 1065
},
{
"epoch": 4.529620253164557,
"grad_norm": 0.3521199068866329,
"learning_rate": 1.074496609772384e-06,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12703898549079895,
"step": 4475,
"valid_targets_mean": 3699.0,
"valid_targets_min": 1328
},
{
"epoch": 4.534683544303798,
"grad_norm": 0.33021283919153493,
"learning_rate": 1.0517656250707575e-06,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17758193612098694,
"step": 4480,
"valid_targets_mean": 5269.1,
"valid_targets_min": 1336
},
{
"epoch": 4.539746835443038,
"grad_norm": 0.29305233423571464,
"learning_rate": 1.0292711610570904e-06,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17428819835186005,
"step": 4485,
"valid_targets_mean": 6173.5,
"valid_targets_min": 1377
},
{
"epoch": 4.544810126582279,
"grad_norm": 0.28819969743794543,
"learning_rate": 1.007013498517766e-06,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11772993206977844,
"step": 4490,
"valid_targets_mean": 4622.6,
"valid_targets_min": 1404
},
{
"epoch": 4.549873417721519,
"grad_norm": 0.28436809731542273,
"learning_rate": 9.849929152832937e-07,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1377575397491455,
"step": 4495,
"valid_targets_mean": 4425.2,
"valid_targets_min": 1292
},
{
"epoch": 4.55493670886076,
"grad_norm": 0.3150381879092353,
"learning_rate": 9.63209686224853e-07,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13312697410583496,
"step": 4500,
"valid_targets_mean": 3467.1,
"valid_targets_min": 826
},
{
"epoch": 4.5600000000000005,
"grad_norm": 0.2911980506543601,
"learning_rate": 9.416640832508572e-07,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16458618640899658,
"step": 4505,
"valid_targets_mean": 5330.3,
"valid_targets_min": 980
},
{
"epoch": 4.56506329113924,
"grad_norm": 0.32761330476726724,
"learning_rate": 9.203563753035527e-07,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15134479105472565,
"step": 4510,
"valid_targets_mean": 4789.5,
"valid_targets_min": 1240
},
{
"epoch": 4.570126582278481,
"grad_norm": 0.27610230646497064,
"learning_rate": 8.992868283556833e-07,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14713215827941895,
"step": 4515,
"valid_targets_mean": 5446.5,
"valid_targets_min": 810
},
{
"epoch": 4.575189873417721,
"grad_norm": 0.33737396503280603,
"learning_rate": 8.78455705407144e-07,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15195101499557495,
"step": 4520,
"valid_targets_mean": 4126.9,
"valid_targets_min": 866
},
{
"epoch": 4.580253164556962,
"grad_norm": 0.421939799277528,
"learning_rate": 8.578632664817177e-07,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15855969488620758,
"step": 4525,
"valid_targets_mean": 4059.2,
"valid_targets_min": 1162
},
{
"epoch": 4.585316455696202,
"grad_norm": 0.30679616072425525,
"learning_rate": 8.375097686238187e-07,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15983693301677704,
"step": 4530,
"valid_targets_mean": 4688.2,
"valid_targets_min": 844
},
{
"epoch": 4.590379746835443,
"grad_norm": 0.33783626379593873,
"learning_rate": 8.173954658952854e-07,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13029304146766663,
"step": 4535,
"valid_targets_mean": 3584.9,
"valid_targets_min": 1132
},
{
"epoch": 4.595443037974683,
"grad_norm": 0.409725960177412,
"learning_rate": 7.975206093722176e-07,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1639317274093628,
"step": 4540,
"valid_targets_mean": 4393.8,
"valid_targets_min": 981
},
{
"epoch": 4.600506329113924,
"grad_norm": 0.34883872064169896,
"learning_rate": 7.778854471418306e-07,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1438419073820114,
"step": 4545,
"valid_targets_mean": 3598.3,
"valid_targets_min": 1015
},
{
"epoch": 4.605569620253164,
"grad_norm": 0.3163445155831429,
"learning_rate": 7.584902242993708e-07,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19004172086715698,
"step": 4550,
"valid_targets_mean": 5218.9,
"valid_targets_min": 1337
},
{
"epoch": 4.610632911392405,
"grad_norm": 0.28908020066387696,
"learning_rate": 7.393351829450379e-07,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12715786695480347,
"step": 4555,
"valid_targets_mean": 4291.9,
"valid_targets_min": 1068
},
{
"epoch": 4.6156962025316455,
"grad_norm": 0.3390758182489428,
"learning_rate": 7.204205621809813e-07,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16513592004776,
"step": 4560,
"valid_targets_mean": 4141.6,
"valid_targets_min": 1241
},
{
"epoch": 4.620759493670886,
"grad_norm": 0.3707332505274512,
"learning_rate": 7.017465981083127e-07,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18795087933540344,
"step": 4565,
"valid_targets_mean": 6154.2,
"valid_targets_min": 1174
},
{
"epoch": 4.6258227848101265,
"grad_norm": 0.3431279755640469,
"learning_rate": 6.833135238241473e-07,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1402522623538971,
"step": 4570,
"valid_targets_mean": 3705.2,
"valid_targets_min": 1346
},
{
"epoch": 4.630886075949367,
"grad_norm": 0.3201150073208208,
"learning_rate": 6.651215694187074e-07,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13963478803634644,
"step": 4575,
"valid_targets_mean": 4570.6,
"valid_targets_min": 1027
},
{
"epoch": 4.635949367088608,
"grad_norm": 0.32083737479519586,
"learning_rate": 6.471709619724386e-07,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1721346378326416,
"step": 4580,
"valid_targets_mean": 4410.9,
"valid_targets_min": 1268
},
{
"epoch": 4.641012658227848,
"grad_norm": 0.3413968428656355,
"learning_rate": 6.294619255531853e-07,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1746809184551239,
"step": 4585,
"valid_targets_mean": 4543.4,
"valid_targets_min": 1503
},
{
"epoch": 4.646075949367089,
"grad_norm": 0.2984905883347286,
"learning_rate": 6.119946812133926e-07,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2020062506198883,
"step": 4590,
"valid_targets_mean": 7061.8,
"valid_targets_min": 1615
},
{
"epoch": 4.651139240506329,
"grad_norm": 0.2957015403668056,
"learning_rate": 5.947694469873377e-07,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1912672221660614,
"step": 4595,
"valid_targets_mean": 6352.6,
"valid_targets_min": 1115
},
{
"epoch": 4.65620253164557,
"grad_norm": 0.3177142897029759,
"learning_rate": 5.777864378884212e-07,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1385997235774994,
"step": 4600,
"valid_targets_mean": 4380.5,
"valid_targets_min": 1184
},
{
"epoch": 4.66126582278481,
"grad_norm": 0.30671392692985,
"learning_rate": 5.610458659064688e-07,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17495407164096832,
"step": 4605,
"valid_targets_mean": 5155.4,
"valid_targets_min": 1128
},
{
"epoch": 4.666329113924051,
"grad_norm": 0.32460623503028924,
"learning_rate": 5.445479400051046e-07,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1435496062040329,
"step": 4610,
"valid_targets_mean": 4002.2,
"valid_targets_min": 1103
},
{
"epoch": 4.671392405063291,
"grad_norm": 0.3077758754022733,
"learning_rate": 5.282928661191178e-07,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11725576967000961,
"step": 4615,
"valid_targets_mean": 3599.3,
"valid_targets_min": 1270
},
{
"epoch": 4.676455696202532,
"grad_norm": 0.2920943225927082,
"learning_rate": 5.12280847151918e-07,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15268352627754211,
"step": 4620,
"valid_targets_mean": 4974.8,
"valid_targets_min": 1238
},
{
"epoch": 4.681518987341772,
"grad_norm": 0.3310902814879114,
"learning_rate": 4.965120829729819e-07,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1577180027961731,
"step": 4625,
"valid_targets_mean": 4892.1,
"valid_targets_min": 1480
},
{
"epoch": 4.686582278481013,
"grad_norm": 0.3364738036743787,
"learning_rate": 4.809867704153726e-07,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11956533789634705,
"step": 4630,
"valid_targets_mean": 3546.2,
"valid_targets_min": 914
},
{
"epoch": 4.6916455696202535,
"grad_norm": 0.34774374236202665,
"learning_rate": 4.657051032732707e-07,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14325565099716187,
"step": 4635,
"valid_targets_mean": 3353.1,
"valid_targets_min": 908
},
{
"epoch": 4.696708860759494,
"grad_norm": 0.32445866672285933,
"learning_rate": 4.506672722995609e-07,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1779376119375229,
"step": 4640,
"valid_targets_mean": 5084.9,
"valid_targets_min": 1254
},
{
"epoch": 4.7017721518987345,
"grad_norm": 0.3370837185705519,
"learning_rate": 4.358734652034624e-07,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12637917697429657,
"step": 4645,
"valid_targets_mean": 3544.5,
"valid_targets_min": 1283
},
{
"epoch": 4.706835443037974,
"grad_norm": 0.3141292209016846,
"learning_rate": 4.2132386664815783e-07,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13325795531272888,
"step": 4650,
"valid_targets_mean": 4623.6,
"valid_targets_min": 1232
},
{
"epoch": 4.711898734177215,
"grad_norm": 0.3052040124075767,
"learning_rate": 4.070186582485214e-07,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14848539233207703,
"step": 4655,
"valid_targets_mean": 3974.2,
"valid_targets_min": 1752
},
{
"epoch": 4.716962025316455,
"grad_norm": 0.3485398015143201,
"learning_rate": 3.9295801856882307e-07,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15560302138328552,
"step": 4660,
"valid_targets_mean": 3853.7,
"valid_targets_min": 1331
},
{
"epoch": 4.722025316455696,
"grad_norm": 0.30603263342163534,
"learning_rate": 3.791421231205217e-07,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1302764117717743,
"step": 4665,
"valid_targets_mean": 4759.7,
"valid_targets_min": 980
},
{
"epoch": 4.727088607594936,
"grad_norm": 0.36206047089808735,
"learning_rate": 3.6557114436005516e-07,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11317434906959534,
"step": 4670,
"valid_targets_mean": 2750.8,
"valid_targets_min": 1281
},
{
"epoch": 4.732151898734177,
"grad_norm": 0.31924377751088473,
"learning_rate": 3.522452516867048e-07,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19149929285049438,
"step": 4675,
"valid_targets_mean": 5680.5,
"valid_targets_min": 1070
},
{
"epoch": 4.737215189873417,
"grad_norm": 0.40142669703450146,
"learning_rate": 3.391646114404701e-07,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1676904857158661,
"step": 4680,
"valid_targets_mean": 5601.9,
"valid_targets_min": 1777
},
{
"epoch": 4.742278481012658,
"grad_norm": 0.33298593772917773,
"learning_rate": 3.263293868999928e-07,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1185358390212059,
"step": 4685,
"valid_targets_mean": 2993.5,
"valid_targets_min": 1244
},
{
"epoch": 4.7473417721518985,
"grad_norm": 0.28590139808721005,
"learning_rate": 3.1373973828052964e-07,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1383609175682068,
"step": 4690,
"valid_targets_mean": 4685.9,
"valid_targets_min": 1897
},
{
"epoch": 4.752405063291139,
"grad_norm": 0.33045699934667616,
"learning_rate": 3.013958227319358e-07,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.128380686044693,
"step": 4695,
"valid_targets_mean": 3661.8,
"valid_targets_min": 1102
},
{
"epoch": 4.7574683544303795,
"grad_norm": 0.3175505591380564,
"learning_rate": 2.892977943367159e-07,
"loss": 0.2774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19775532186031342,
"step": 4700,
"valid_targets_mean": 5166.0,
"valid_targets_min": 954
},
{
"epoch": 4.76253164556962,
"grad_norm": 0.2773796894575858,
"learning_rate": 2.774458041080963e-07,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12263042479753494,
"step": 4705,
"valid_targets_mean": 4538.4,
"valid_targets_min": 1559
},
{
"epoch": 4.767594936708861,
"grad_norm": 0.3292357564608315,
"learning_rate": 2.6583999998814e-07,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14571279287338257,
"step": 4710,
"valid_targets_mean": 3984.7,
"valid_targets_min": 1195
},
{
"epoch": 4.772658227848101,
"grad_norm": 0.3368831623026044,
"learning_rate": 2.544805268459016e-07,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21459759771823883,
"step": 4715,
"valid_targets_mean": 4702.3,
"valid_targets_min": 1266
},
{
"epoch": 4.777721518987342,
"grad_norm": 0.335601220973268,
"learning_rate": 2.4336752647561304e-07,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14298905432224274,
"step": 4720,
"valid_targets_mean": 3874.7,
"valid_targets_min": 965
},
{
"epoch": 4.782784810126582,
"grad_norm": 0.28413880966924987,
"learning_rate": 2.3250113759492266e-07,
"loss": 0.2862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1618804931640625,
"step": 4725,
"valid_targets_mean": 5582.7,
"valid_targets_min": 868
},
{
"epoch": 4.787848101265823,
"grad_norm": 0.3021482607745952,
"learning_rate": 2.2188149584315922e-07,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15998998284339905,
"step": 4730,
"valid_targets_mean": 4565.1,
"valid_targets_min": 1149
},
{
"epoch": 4.792911392405063,
"grad_norm": 0.3011882542828061,
"learning_rate": 2.1150873377963954e-07,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1401754915714264,
"step": 4735,
"valid_targets_mean": 5010.8,
"valid_targets_min": 998
},
{
"epoch": 4.797974683544304,
"grad_norm": 0.3507567997328214,
"learning_rate": 2.0138298088201004e-07,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0675700232386589,
"step": 4740,
"valid_targets_mean": 2630.8,
"valid_targets_min": 1155
},
{
"epoch": 4.803037974683544,
"grad_norm": 0.3187910514753291,
"learning_rate": 1.915043635446323e-07,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12245633453130722,
"step": 4745,
"valid_targets_mean": 3394.0,
"valid_targets_min": 1403
},
{
"epoch": 4.808101265822785,
"grad_norm": 0.2967133708531598,
"learning_rate": 1.8187300507701345e-07,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1302807629108429,
"step": 4750,
"valid_targets_mean": 3881.6,
"valid_targets_min": 1033
},
{
"epoch": 4.813164556962025,
"grad_norm": 0.30044714660435673,
"learning_rate": 1.7248902570225378e-07,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13116371631622314,
"step": 4755,
"valid_targets_mean": 4054.7,
"valid_targets_min": 886
},
{
"epoch": 4.818227848101266,
"grad_norm": 0.3161774057323668,
"learning_rate": 1.6335254255555933e-07,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14581556618213654,
"step": 4760,
"valid_targets_mean": 4080.4,
"valid_targets_min": 1368
},
{
"epoch": 4.8232911392405065,
"grad_norm": 0.30034489171760914,
"learning_rate": 1.5446366968276283e-07,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1464047133922577,
"step": 4765,
"valid_targets_mean": 4359.5,
"valid_targets_min": 1093
},
{
"epoch": 4.828354430379747,
"grad_norm": 0.30396263421785596,
"learning_rate": 1.4582251803892055e-07,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14488472044467926,
"step": 4770,
"valid_targets_mean": 4854.4,
"valid_targets_min": 956
},
{
"epoch": 4.8334177215189875,
"grad_norm": 0.25886849889886787,
"learning_rate": 1.3742919548691114e-07,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13551469147205353,
"step": 4775,
"valid_targets_mean": 5292.5,
"valid_targets_min": 1085
},
{
"epoch": 4.838481012658228,
"grad_norm": 0.3369536866060149,
"learning_rate": 1.2928380679609442e-07,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20701755583286285,
"step": 4780,
"valid_targets_mean": 5313.5,
"valid_targets_min": 1444
},
{
"epoch": 4.843544303797469,
"grad_norm": 0.2981209270612857,
"learning_rate": 1.2138645364101032e-07,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11797007918357849,
"step": 4785,
"valid_targets_mean": 4077.7,
"valid_targets_min": 1058
},
{
"epoch": 4.848607594936709,
"grad_norm": 0.2923056085103413,
"learning_rate": 1.1373723460009756e-07,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18645049631595612,
"step": 4790,
"valid_targets_mean": 6275.9,
"valid_targets_min": 1356
},
{
"epoch": 4.85367088607595,
"grad_norm": 0.31520564975094073,
"learning_rate": 1.0633624515447027e-07,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1347823590040207,
"step": 4795,
"valid_targets_mean": 3709.9,
"valid_targets_min": 1143
},
{
"epoch": 4.85873417721519,
"grad_norm": 0.330282900217264,
"learning_rate": 9.918357768673004e-08,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10554465651512146,
"step": 4800,
"valid_targets_mean": 3067.8,
"valid_targets_min": 1042
},
{
"epoch": 4.863797468354431,
"grad_norm": 0.34394007944621313,
"learning_rate": 9.22793214797979e-08,
"loss": 0.3043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1265249103307724,
"step": 4805,
"valid_targets_mean": 3206.9,
"valid_targets_min": 972
},
{
"epoch": 4.868860759493671,
"grad_norm": 0.3066301892656282,
"learning_rate": 8.562356271582194e-08,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11144056916236877,
"step": 4810,
"valid_targets_mean": 3448.4,
"valid_targets_min": 1079
},
{
"epoch": 4.873924050632912,
"grad_norm": 0.31898550298505707,
"learning_rate": 7.92163844750804e-08,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17169725894927979,
"step": 4815,
"valid_targets_mean": 4453.8,
"valid_targets_min": 1086
},
{
"epoch": 4.878987341772152,
"grad_norm": 0.35072783756221276,
"learning_rate": 7.305786673495796e-08,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1834912747144699,
"step": 4820,
"valid_targets_mean": 4796.1,
"valid_targets_min": 1290
},
{
"epoch": 4.884050632911393,
"grad_norm": 0.30086828019346806,
"learning_rate": 6.714808636893999e-08,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19445079565048218,
"step": 4825,
"valid_targets_mean": 5488.9,
"valid_targets_min": 1013
},
{
"epoch": 4.889113924050633,
"grad_norm": 0.29066248451169346,
"learning_rate": 6.148711714565992e-08,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14921297132968903,
"step": 4830,
"valid_targets_mean": 5289.1,
"valid_targets_min": 1279
},
{
"epoch": 4.894177215189873,
"grad_norm": 0.3206808977051651,
"learning_rate": 5.6075029727971075e-08,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15516558289527893,
"step": 4835,
"valid_targets_mean": 4284.6,
"valid_targets_min": 1465
},
{
"epoch": 4.899240506329114,
"grad_norm": 0.34136663563954944,
"learning_rate": 5.091189167207189e-08,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16188789904117584,
"step": 4840,
"valid_targets_mean": 4162.2,
"valid_targets_min": 1536
},
{
"epoch": 4.904303797468354,
"grad_norm": 0.2892291641651244,
"learning_rate": 4.5997767426653183e-08,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11494030058383942,
"step": 4845,
"valid_targets_mean": 3805.9,
"valid_targets_min": 950
},
{
"epoch": 4.909367088607595,
"grad_norm": 0.3310728562870818,
"learning_rate": 4.133271833210772e-08,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15285596251487732,
"step": 4850,
"valid_targets_mean": 4150.3,
"valid_targets_min": 1408
},
{
"epoch": 4.914430379746835,
"grad_norm": 0.29329622685622975,
"learning_rate": 3.6916802619746395e-08,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16643556952476501,
"step": 4855,
"valid_targets_mean": 5756.4,
"valid_targets_min": 1791
},
{
"epoch": 4.919493670886076,
"grad_norm": 0.3795378130128926,
"learning_rate": 3.2750075411087654e-08,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20965784788131714,
"step": 4860,
"valid_targets_mean": 5036.8,
"valid_targets_min": 1359
},
{
"epoch": 4.924556962025316,
"grad_norm": 0.3227285897594828,
"learning_rate": 2.8832588717164766e-08,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13055765628814697,
"step": 4865,
"valid_targets_mean": 3481.6,
"valid_targets_min": 1608
},
{
"epoch": 4.929620253164557,
"grad_norm": 0.30074655411206147,
"learning_rate": 2.516439143786631e-08,
"loss": 0.3002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17739662528038025,
"step": 4870,
"valid_targets_mean": 5336.9,
"valid_targets_min": 786
},
{
"epoch": 4.934683544303797,
"grad_norm": 0.37988249749008485,
"learning_rate": 2.1745529361343333e-08,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18349409103393555,
"step": 4875,
"valid_targets_mean": 5208.7,
"valid_targets_min": 1284
},
{
"epoch": 4.939746835443038,
"grad_norm": 0.3022387792298933,
"learning_rate": 1.857604516342315e-08,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1349787563085556,
"step": 4880,
"valid_targets_mean": 4001.4,
"valid_targets_min": 1055
},
{
"epoch": 4.944810126582278,
"grad_norm": 0.3239022765036362,
"learning_rate": 1.5655978407085326e-08,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15572325885295868,
"step": 4885,
"valid_targets_mean": 4256.0,
"valid_targets_min": 1282
},
{
"epoch": 4.949873417721519,
"grad_norm": 0.3484022919664308,
"learning_rate": 1.2985365541959838e-08,
"loss": 0.2871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1123068630695343,
"step": 4890,
"valid_targets_mean": 3383.1,
"valid_targets_min": 1353
},
{
"epoch": 4.954936708860759,
"grad_norm": 0.2766076122909068,
"learning_rate": 1.0564239903885221e-08,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13588979840278625,
"step": 4895,
"valid_targets_mean": 5022.2,
"valid_targets_min": 1687
},
{
"epoch": 4.96,
"grad_norm": 0.3637031857594984,
"learning_rate": 8.392631714477794e-09,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22151219844818115,
"step": 4900,
"valid_targets_mean": 4548.4,
"valid_targets_min": 1055
},
{
"epoch": 4.9650632911392405,
"grad_norm": 0.3070617643850501,
"learning_rate": 6.470568080760853e-09,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1599656343460083,
"step": 4905,
"valid_targets_mean": 5380.0,
"valid_targets_min": 696
},
{
"epoch": 4.970126582278481,
"grad_norm": 0.2982099706698035,
"learning_rate": 4.798072994827152e-09,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13907426595687866,
"step": 4910,
"valid_targets_mean": 4511.9,
"valid_targets_min": 1282
},
{
"epoch": 4.975189873417722,
"grad_norm": 0.34819560371210506,
"learning_rate": 3.3751673335458147e-09,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14076785743236542,
"step": 4915,
"valid_targets_mean": 3422.9,
"valid_targets_min": 1383
},
{
"epoch": 4.980253164556962,
"grad_norm": 0.3120620502259134,
"learning_rate": 2.2018688582803315e-09,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17987266182899475,
"step": 4920,
"valid_targets_mean": 5285.9,
"valid_targets_min": 1137
},
{
"epoch": 4.985316455696203,
"grad_norm": 0.28626460706538365,
"learning_rate": 1.2781922146931635e-09,
"loss": 0.3007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15345998108386993,
"step": 4925,
"valid_targets_mean": 5331.3,
"valid_targets_min": 781
},
{
"epoch": 4.990379746835443,
"grad_norm": 0.30214318111472815,
"learning_rate": 6.041489325459004e-10,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14609292149543762,
"step": 4930,
"valid_targets_mean": 4398.6,
"valid_targets_min": 1460
},
{
"epoch": 4.995443037974684,
"grad_norm": 0.36710406768986703,
"learning_rate": 1.7974742556159386e-10,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17454470694065094,
"step": 4935,
"valid_targets_mean": 4667.4,
"valid_targets_min": 949
},
{
"epoch": 5.0,
"grad_norm": 0.42711913533675244,
"learning_rate": 4.992991313734763e-12,
"loss": 0.2954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29739144444465637,
"step": 4940,
"valid_targets_mean": 4348.2,
"valid_targets_min": 876
},
{
"epoch": 5.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29739144444465637,
"step": 4940,
"total_flos": 1.3775029894633226e+18,
"train_loss": 0.31707094306887884,
"train_runtime": 34760.1149,
"train_samples_per_second": 4.545,
"train_steps_per_second": 0.142,
"valid_targets_mean": 4348.2,
"valid_targets_min": 876
}
],
"logging_steps": 5,
"max_steps": 4940,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": false,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 1.3775029894633226e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}