exp_tas_parser_xml_traces / trainer_state.json
hf-reset
Reset repository without checkpoints directories
71c3757
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4060,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008620689655172414,
"grad_norm": 9.24550457643599,
"learning_rate": 3.9408866995073894e-07,
"loss": 0.9873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43203049898147583,
"step": 5,
"valid_targets_mean": 3287.9,
"valid_targets_min": 901
},
{
"epoch": 0.017241379310344827,
"grad_norm": 7.335533460597348,
"learning_rate": 8.866995073891626e-07,
"loss": 1.0212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5148377418518066,
"step": 10,
"valid_targets_mean": 3855.8,
"valid_targets_min": 1359
},
{
"epoch": 0.02586206896551724,
"grad_norm": 7.854592614384845,
"learning_rate": 1.3793103448275862e-06,
"loss": 1.0819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5726603865623474,
"step": 15,
"valid_targets_mean": 2505.0,
"valid_targets_min": 764
},
{
"epoch": 0.034482758620689655,
"grad_norm": 4.719130380535508,
"learning_rate": 1.8719211822660098e-06,
"loss": 1.0174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6978442668914795,
"step": 20,
"valid_targets_mean": 5433.6,
"valid_targets_min": 502
},
{
"epoch": 0.04310344827586207,
"grad_norm": 4.179075473275818,
"learning_rate": 2.3645320197044334e-06,
"loss": 0.9749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37579989433288574,
"step": 25,
"valid_targets_mean": 2919.2,
"valid_targets_min": 695
},
{
"epoch": 0.05172413793103448,
"grad_norm": 3.2866656076565355,
"learning_rate": 2.8571428571428573e-06,
"loss": 0.8866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3706856369972229,
"step": 30,
"valid_targets_mean": 3500.5,
"valid_targets_min": 643
},
{
"epoch": 0.0603448275862069,
"grad_norm": 2.5424063865240134,
"learning_rate": 3.349753694581281e-06,
"loss": 0.9536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4894193708896637,
"step": 35,
"valid_targets_mean": 3924.0,
"valid_targets_min": 1668
},
{
"epoch": 0.06896551724137931,
"grad_norm": 2.0545621588279888,
"learning_rate": 3.842364532019705e-06,
"loss": 0.8279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41704902052879333,
"step": 40,
"valid_targets_mean": 2984.0,
"valid_targets_min": 840
},
{
"epoch": 0.07758620689655173,
"grad_norm": 1.287657343571009,
"learning_rate": 4.334975369458129e-06,
"loss": 0.8506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40100449323654175,
"step": 45,
"valid_targets_mean": 4369.2,
"valid_targets_min": 619
},
{
"epoch": 0.08620689655172414,
"grad_norm": 1.1918469853583982,
"learning_rate": 4.8275862068965525e-06,
"loss": 0.8647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4594336450099945,
"step": 50,
"valid_targets_mean": 4147.5,
"valid_targets_min": 1578
},
{
"epoch": 0.09482758620689655,
"grad_norm": 0.9441218490186954,
"learning_rate": 5.320197044334976e-06,
"loss": 0.7806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4251787066459656,
"step": 55,
"valid_targets_mean": 5269.2,
"valid_targets_min": 2325
},
{
"epoch": 0.10344827586206896,
"grad_norm": 1.0388853131448057,
"learning_rate": 5.812807881773399e-06,
"loss": 0.7767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3979467749595642,
"step": 60,
"valid_targets_mean": 2872.6,
"valid_targets_min": 1303
},
{
"epoch": 0.11206896551724138,
"grad_norm": 0.9660370233248622,
"learning_rate": 6.305418719211823e-06,
"loss": 0.8294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32068926095962524,
"step": 65,
"valid_targets_mean": 2370.2,
"valid_targets_min": 737
},
{
"epoch": 0.1206896551724138,
"grad_norm": 0.8930917300505489,
"learning_rate": 6.798029556650246e-06,
"loss": 0.8083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3917607069015503,
"step": 70,
"valid_targets_mean": 3463.4,
"valid_targets_min": 1465
},
{
"epoch": 0.12931034482758622,
"grad_norm": 0.7389990882620856,
"learning_rate": 7.290640394088671e-06,
"loss": 0.7757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3763599991798401,
"step": 75,
"valid_targets_mean": 4467.6,
"valid_targets_min": 772
},
{
"epoch": 0.13793103448275862,
"grad_norm": 0.7472214279722299,
"learning_rate": 7.783251231527095e-06,
"loss": 0.7342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3860183656215668,
"step": 80,
"valid_targets_mean": 3997.8,
"valid_targets_min": 1795
},
{
"epoch": 0.14655172413793102,
"grad_norm": 0.7218339941398133,
"learning_rate": 8.275862068965518e-06,
"loss": 0.7617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4559746980667114,
"step": 85,
"valid_targets_mean": 5640.1,
"valid_targets_min": 274
},
{
"epoch": 0.15517241379310345,
"grad_norm": 0.7425167868253314,
"learning_rate": 8.768472906403942e-06,
"loss": 0.7697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43732425570487976,
"step": 90,
"valid_targets_mean": 4439.5,
"valid_targets_min": 1082
},
{
"epoch": 0.16379310344827586,
"grad_norm": 0.8784728083131768,
"learning_rate": 9.261083743842364e-06,
"loss": 0.6829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3236698806285858,
"step": 95,
"valid_targets_mean": 2221.5,
"valid_targets_min": 583
},
{
"epoch": 0.1724137931034483,
"grad_norm": 0.668610432068481,
"learning_rate": 9.75369458128079e-06,
"loss": 0.7028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3175450563430786,
"step": 100,
"valid_targets_mean": 4900.4,
"valid_targets_min": 412
},
{
"epoch": 0.1810344827586207,
"grad_norm": 0.762868705154042,
"learning_rate": 1.0246305418719214e-05,
"loss": 0.7046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33831289410591125,
"step": 105,
"valid_targets_mean": 3072.5,
"valid_targets_min": 1802
},
{
"epoch": 0.1896551724137931,
"grad_norm": 0.771147983381667,
"learning_rate": 1.0738916256157637e-05,
"loss": 0.6963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3214723765850067,
"step": 110,
"valid_targets_mean": 3625.2,
"valid_targets_min": 756
},
{
"epoch": 0.19827586206896552,
"grad_norm": 1.640623528697079,
"learning_rate": 1.123152709359606e-05,
"loss": 0.7089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23830479383468628,
"step": 115,
"valid_targets_mean": 3252.0,
"valid_targets_min": 679
},
{
"epoch": 0.20689655172413793,
"grad_norm": 0.7019602281567701,
"learning_rate": 1.1724137931034483e-05,
"loss": 0.7265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32230842113494873,
"step": 120,
"valid_targets_mean": 4071.5,
"valid_targets_min": 1946
},
{
"epoch": 0.21551724137931033,
"grad_norm": 0.7339495236828748,
"learning_rate": 1.2216748768472909e-05,
"loss": 0.7463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3007355332374573,
"step": 125,
"valid_targets_mean": 2948.8,
"valid_targets_min": 1718
},
{
"epoch": 0.22413793103448276,
"grad_norm": 0.5110196587530477,
"learning_rate": 1.2709359605911331e-05,
"loss": 0.6675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22014601528644562,
"step": 130,
"valid_targets_mean": 4781.5,
"valid_targets_min": 1996
},
{
"epoch": 0.23275862068965517,
"grad_norm": 0.6846953537064482,
"learning_rate": 1.3201970443349755e-05,
"loss": 0.6993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17798146605491638,
"step": 135,
"valid_targets_mean": 2210.0,
"valid_targets_min": 728
},
{
"epoch": 0.2413793103448276,
"grad_norm": 0.8179902129138006,
"learning_rate": 1.369458128078818e-05,
"loss": 0.7097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47994717955589294,
"step": 140,
"valid_targets_mean": 5659.4,
"valid_targets_min": 890
},
{
"epoch": 0.25,
"grad_norm": 0.5915590286522948,
"learning_rate": 1.4187192118226602e-05,
"loss": 0.6907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24744611978530884,
"step": 145,
"valid_targets_mean": 3455.5,
"valid_targets_min": 553
},
{
"epoch": 0.25862068965517243,
"grad_norm": 0.7578130027178461,
"learning_rate": 1.4679802955665026e-05,
"loss": 0.7072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4918016195297241,
"step": 150,
"valid_targets_mean": 3785.9,
"valid_targets_min": 708
},
{
"epoch": 0.2672413793103448,
"grad_norm": 0.8118636484819712,
"learning_rate": 1.5172413793103448e-05,
"loss": 0.7223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3037732243537903,
"step": 155,
"valid_targets_mean": 2365.0,
"valid_targets_min": 338
},
{
"epoch": 0.27586206896551724,
"grad_norm": 0.8417411826914287,
"learning_rate": 1.5665024630541875e-05,
"loss": 0.7179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25301000475883484,
"step": 160,
"valid_targets_mean": 2006.4,
"valid_targets_min": 754
},
{
"epoch": 0.28448275862068967,
"grad_norm": 1.0078060923241636,
"learning_rate": 1.6157635467980298e-05,
"loss": 0.6841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5394257307052612,
"step": 165,
"valid_targets_mean": 3262.0,
"valid_targets_min": 946
},
{
"epoch": 0.29310344827586204,
"grad_norm": 0.8509294072085292,
"learning_rate": 1.665024630541872e-05,
"loss": 0.6869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.293990820646286,
"step": 170,
"valid_targets_mean": 2501.8,
"valid_targets_min": 606
},
{
"epoch": 0.3017241379310345,
"grad_norm": 1.5110699028438686,
"learning_rate": 1.7142857142857142e-05,
"loss": 0.6406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42483076453208923,
"step": 175,
"valid_targets_mean": 5015.8,
"valid_targets_min": 571
},
{
"epoch": 0.3103448275862069,
"grad_norm": 0.829361033344782,
"learning_rate": 1.7635467980295567e-05,
"loss": 0.6593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3968130350112915,
"step": 180,
"valid_targets_mean": 4155.6,
"valid_targets_min": 1366
},
{
"epoch": 0.31896551724137934,
"grad_norm": 2.2132799203163036,
"learning_rate": 1.8128078817733993e-05,
"loss": 0.6668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41700565814971924,
"step": 185,
"valid_targets_mean": 3660.1,
"valid_targets_min": 1274
},
{
"epoch": 0.3275862068965517,
"grad_norm": 0.7201258507954451,
"learning_rate": 1.8620689655172415e-05,
"loss": 0.6377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3403915762901306,
"step": 190,
"valid_targets_mean": 3456.1,
"valid_targets_min": 811
},
{
"epoch": 0.33620689655172414,
"grad_norm": 0.7496831909974342,
"learning_rate": 1.911330049261084e-05,
"loss": 0.6633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3048527240753174,
"step": 195,
"valid_targets_mean": 3633.9,
"valid_targets_min": 1775
},
{
"epoch": 0.3448275862068966,
"grad_norm": 1.0466424956418392,
"learning_rate": 1.9605911330049263e-05,
"loss": 0.6995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32808586955070496,
"step": 200,
"valid_targets_mean": 3535.2,
"valid_targets_min": 586
},
{
"epoch": 0.35344827586206895,
"grad_norm": 0.8218255448633348,
"learning_rate": 2.0098522167487688e-05,
"loss": 0.6917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2928812801837921,
"step": 205,
"valid_targets_mean": 3240.9,
"valid_targets_min": 834
},
{
"epoch": 0.3620689655172414,
"grad_norm": 0.8029280949690537,
"learning_rate": 2.059113300492611e-05,
"loss": 0.7323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30598652362823486,
"step": 210,
"valid_targets_mean": 2593.9,
"valid_targets_min": 623
},
{
"epoch": 0.3706896551724138,
"grad_norm": 1.2032672924578944,
"learning_rate": 2.1083743842364536e-05,
"loss": 0.6665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2592845559120178,
"step": 215,
"valid_targets_mean": 4767.8,
"valid_targets_min": 1062
},
{
"epoch": 0.3793103448275862,
"grad_norm": 0.7836032078966709,
"learning_rate": 2.1576354679802954e-05,
"loss": 0.6655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27402517199516296,
"step": 220,
"valid_targets_mean": 2645.8,
"valid_targets_min": 955
},
{
"epoch": 0.3879310344827586,
"grad_norm": 0.7223820678613246,
"learning_rate": 2.206896551724138e-05,
"loss": 0.6182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2808302640914917,
"step": 225,
"valid_targets_mean": 2963.4,
"valid_targets_min": 1475
},
{
"epoch": 0.39655172413793105,
"grad_norm": 0.6050302790875435,
"learning_rate": 2.2561576354679805e-05,
"loss": 0.6178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4045502543449402,
"step": 230,
"valid_targets_mean": 5649.1,
"valid_targets_min": 1876
},
{
"epoch": 0.4051724137931034,
"grad_norm": 0.6999663949451717,
"learning_rate": 2.3054187192118228e-05,
"loss": 0.633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23481211066246033,
"step": 235,
"valid_targets_mean": 3052.0,
"valid_targets_min": 1318
},
{
"epoch": 0.41379310344827586,
"grad_norm": 0.7423530530074394,
"learning_rate": 2.3546798029556653e-05,
"loss": 0.6828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3373368978500366,
"step": 240,
"valid_targets_mean": 3396.6,
"valid_targets_min": 464
},
{
"epoch": 0.4224137931034483,
"grad_norm": 0.7379312877310925,
"learning_rate": 2.403940886699508e-05,
"loss": 0.7037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21787698566913605,
"step": 245,
"valid_targets_mean": 2163.5,
"valid_targets_min": 534
},
{
"epoch": 0.43103448275862066,
"grad_norm": 0.8063509127084881,
"learning_rate": 2.4532019704433497e-05,
"loss": 0.6382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2792884111404419,
"step": 250,
"valid_targets_mean": 3017.1,
"valid_targets_min": 1032
},
{
"epoch": 0.4396551724137931,
"grad_norm": 0.6706813958825989,
"learning_rate": 2.5024630541871923e-05,
"loss": 0.657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3086356520652771,
"step": 255,
"valid_targets_mean": 4803.4,
"valid_targets_min": 357
},
{
"epoch": 0.4482758620689655,
"grad_norm": 0.9310469728000066,
"learning_rate": 2.551724137931035e-05,
"loss": 0.7131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2496461719274521,
"step": 260,
"valid_targets_mean": 1765.0,
"valid_targets_min": 470
},
{
"epoch": 0.45689655172413796,
"grad_norm": 0.7289154684935432,
"learning_rate": 2.600985221674877e-05,
"loss": 0.6566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2873595654964447,
"step": 265,
"valid_targets_mean": 3518.4,
"valid_targets_min": 785
},
{
"epoch": 0.46551724137931033,
"grad_norm": 0.7491930663891365,
"learning_rate": 2.6502463054187196e-05,
"loss": 0.6191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3568354845046997,
"step": 270,
"valid_targets_mean": 3725.4,
"valid_targets_min": 937
},
{
"epoch": 0.47413793103448276,
"grad_norm": 0.6869919899460102,
"learning_rate": 2.6995073891625615e-05,
"loss": 0.6547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.300902396440506,
"step": 275,
"valid_targets_mean": 3223.5,
"valid_targets_min": 1041
},
{
"epoch": 0.4827586206896552,
"grad_norm": 0.7219971094287305,
"learning_rate": 2.748768472906404e-05,
"loss": 0.6283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22700543701648712,
"step": 280,
"valid_targets_mean": 2332.5,
"valid_targets_min": 1321
},
{
"epoch": 0.49137931034482757,
"grad_norm": 0.7840522944810209,
"learning_rate": 2.7980295566502466e-05,
"loss": 0.6794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.429918497800827,
"step": 285,
"valid_targets_mean": 4372.2,
"valid_targets_min": 2070
},
{
"epoch": 0.5,
"grad_norm": 0.7168472411052416,
"learning_rate": 2.8472906403940888e-05,
"loss": 0.6222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3090544641017914,
"step": 290,
"valid_targets_mean": 3569.8,
"valid_targets_min": 1793
},
{
"epoch": 0.5086206896551724,
"grad_norm": 0.6401065575292432,
"learning_rate": 2.8965517241379313e-05,
"loss": 0.6535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3025968670845032,
"step": 295,
"valid_targets_mean": 4973.6,
"valid_targets_min": 917
},
{
"epoch": 0.5172413793103449,
"grad_norm": 0.5902560458840668,
"learning_rate": 2.945812807881774e-05,
"loss": 0.6428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35170048475265503,
"step": 300,
"valid_targets_mean": 6022.5,
"valid_targets_min": 1054
},
{
"epoch": 0.5258620689655172,
"grad_norm": 0.7483408537338351,
"learning_rate": 2.9950738916256158e-05,
"loss": 0.6253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22863270342350006,
"step": 305,
"valid_targets_mean": 3410.6,
"valid_targets_min": 1894
},
{
"epoch": 0.5344827586206896,
"grad_norm": 0.8333505264909917,
"learning_rate": 3.0443349753694583e-05,
"loss": 0.6544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38335931301116943,
"step": 310,
"valid_targets_mean": 3636.6,
"valid_targets_min": 1483
},
{
"epoch": 0.5431034482758621,
"grad_norm": 0.7569810094427996,
"learning_rate": 3.093596059113301e-05,
"loss": 0.5966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2640477418899536,
"step": 315,
"valid_targets_mean": 3758.2,
"valid_targets_min": 1159
},
{
"epoch": 0.5517241379310345,
"grad_norm": 0.8703377303462938,
"learning_rate": 3.142857142857143e-05,
"loss": 0.6108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3582964241504669,
"step": 320,
"valid_targets_mean": 2754.5,
"valid_targets_min": 1437
},
{
"epoch": 0.5603448275862069,
"grad_norm": 0.6746278227062145,
"learning_rate": 3.1921182266009856e-05,
"loss": 0.6329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2840624749660492,
"step": 325,
"valid_targets_mean": 3434.4,
"valid_targets_min": 534
},
{
"epoch": 0.5689655172413793,
"grad_norm": 0.6661913423851306,
"learning_rate": 3.2413793103448275e-05,
"loss": 0.6354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3681085407733917,
"step": 330,
"valid_targets_mean": 4702.4,
"valid_targets_min": 1024
},
{
"epoch": 0.5775862068965517,
"grad_norm": 0.6413649397859758,
"learning_rate": 3.29064039408867e-05,
"loss": 0.6488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29207906126976013,
"step": 335,
"valid_targets_mean": 3462.1,
"valid_targets_min": 1725
},
{
"epoch": 0.5862068965517241,
"grad_norm": 0.8651344005129311,
"learning_rate": 3.3399014778325126e-05,
"loss": 0.6268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3141361176967621,
"step": 340,
"valid_targets_mean": 2540.4,
"valid_targets_min": 1181
},
{
"epoch": 0.5948275862068966,
"grad_norm": 0.7769867467422841,
"learning_rate": 3.389162561576355e-05,
"loss": 0.5976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33586743474006653,
"step": 345,
"valid_targets_mean": 3471.5,
"valid_targets_min": 2102
},
{
"epoch": 0.603448275862069,
"grad_norm": 0.7670895081874297,
"learning_rate": 3.438423645320197e-05,
"loss": 0.6091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30461496114730835,
"step": 350,
"valid_targets_mean": 3081.5,
"valid_targets_min": 1388
},
{
"epoch": 0.6120689655172413,
"grad_norm": 0.7050722350888959,
"learning_rate": 3.4876847290640396e-05,
"loss": 0.6474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4162551164627075,
"step": 355,
"valid_targets_mean": 4125.9,
"valid_targets_min": 1195
},
{
"epoch": 0.6206896551724138,
"grad_norm": 0.6332661299318986,
"learning_rate": 3.536945812807882e-05,
"loss": 0.6514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37823486328125,
"step": 360,
"valid_targets_mean": 6009.8,
"valid_targets_min": 1362
},
{
"epoch": 0.6293103448275862,
"grad_norm": 0.6793271986969113,
"learning_rate": 3.586206896551725e-05,
"loss": 0.6152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2917017936706543,
"step": 365,
"valid_targets_mean": 4666.1,
"valid_targets_min": 379
},
{
"epoch": 0.6379310344827587,
"grad_norm": 0.6450087890703107,
"learning_rate": 3.6354679802955665e-05,
"loss": 0.6331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29983556270599365,
"step": 370,
"valid_targets_mean": 4020.2,
"valid_targets_min": 940
},
{
"epoch": 0.646551724137931,
"grad_norm": 0.7471314078072796,
"learning_rate": 3.684729064039409e-05,
"loss": 0.6443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3147204518318176,
"step": 375,
"valid_targets_mean": 3499.0,
"valid_targets_min": 636
},
{
"epoch": 0.6551724137931034,
"grad_norm": 0.709612006208998,
"learning_rate": 3.7339901477832516e-05,
"loss": 0.6724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23856517672538757,
"step": 380,
"valid_targets_mean": 3519.8,
"valid_targets_min": 1031
},
{
"epoch": 0.6637931034482759,
"grad_norm": 0.697296078256357,
"learning_rate": 3.7832512315270935e-05,
"loss": 0.6477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26525959372520447,
"step": 385,
"valid_targets_mean": 3800.0,
"valid_targets_min": 636
},
{
"epoch": 0.6724137931034483,
"grad_norm": 0.7964944660649016,
"learning_rate": 3.832512315270936e-05,
"loss": 0.6174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2790738344192505,
"step": 390,
"valid_targets_mean": 3369.2,
"valid_targets_min": 2124
},
{
"epoch": 0.6810344827586207,
"grad_norm": 0.7391646482654692,
"learning_rate": 3.8817733990147786e-05,
"loss": 0.6382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2945958375930786,
"step": 395,
"valid_targets_mean": 3164.6,
"valid_targets_min": 1496
},
{
"epoch": 0.6896551724137931,
"grad_norm": 0.7017054297069276,
"learning_rate": 3.931034482758621e-05,
"loss": 0.5758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24679553508758545,
"step": 400,
"valid_targets_mean": 3879.5,
"valid_targets_min": 1781
},
{
"epoch": 0.6982758620689655,
"grad_norm": 0.784443324981124,
"learning_rate": 3.980295566502464e-05,
"loss": 0.6421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3295668959617615,
"step": 405,
"valid_targets_mean": 3656.9,
"valid_targets_min": 2311
},
{
"epoch": 0.7068965517241379,
"grad_norm": 0.6669603608079032,
"learning_rate": 3.999993347192948e-05,
"loss": 0.6026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2392359972000122,
"step": 410,
"valid_targets_mean": 2878.8,
"valid_targets_min": 786
},
{
"epoch": 0.7155172413793104,
"grad_norm": 0.5869402914374651,
"learning_rate": 3.9999526913101334e-05,
"loss": 0.6044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2842877507209778,
"step": 415,
"valid_targets_mean": 4819.2,
"valid_targets_min": 1604
},
{
"epoch": 0.7241379310344828,
"grad_norm": 0.712850243180447,
"learning_rate": 3.999875076298832e-05,
"loss": 0.6093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45204976201057434,
"step": 420,
"valid_targets_mean": 5218.8,
"valid_targets_min": 980
},
{
"epoch": 0.7327586206896551,
"grad_norm": 0.6287529479538014,
"learning_rate": 3.9997605035933704e-05,
"loss": 0.6427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23647578060626984,
"step": 425,
"valid_targets_mean": 3042.9,
"valid_targets_min": 1884
},
{
"epoch": 0.7413793103448276,
"grad_norm": 0.613243349326708,
"learning_rate": 3.99960897531105e-05,
"loss": 0.6482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23709192872047424,
"step": 430,
"valid_targets_mean": 3435.1,
"valid_targets_min": 1558
},
{
"epoch": 0.75,
"grad_norm": 0.6562955349817724,
"learning_rate": 3.999420494252116e-05,
"loss": 0.5951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3045341968536377,
"step": 435,
"valid_targets_mean": 4663.6,
"valid_targets_min": 1470
},
{
"epoch": 0.7586206896551724,
"grad_norm": 0.7627463901707322,
"learning_rate": 3.9991950638996976e-05,
"loss": 0.6301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4783356785774231,
"step": 440,
"valid_targets_mean": 4428.6,
"valid_targets_min": 2142
},
{
"epoch": 0.7672413793103449,
"grad_norm": 0.646915086795381,
"learning_rate": 3.998932688419748e-05,
"loss": 0.6333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2336660921573639,
"step": 445,
"valid_targets_mean": 3231.2,
"valid_targets_min": 1201
},
{
"epoch": 0.7758620689655172,
"grad_norm": 0.6989419952214646,
"learning_rate": 3.9986333726609674e-05,
"loss": 0.5952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34037575125694275,
"step": 450,
"valid_targets_mean": 4055.6,
"valid_targets_min": 2316
},
{
"epoch": 0.7844827586206896,
"grad_norm": 0.6629583343519574,
"learning_rate": 3.99829712215471e-05,
"loss": 0.6399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17064107954502106,
"step": 455,
"valid_targets_mean": 2590.6,
"valid_targets_min": 1968
},
{
"epoch": 0.7931034482758621,
"grad_norm": 0.78890938920922,
"learning_rate": 3.997923943114886e-05,
"loss": 0.6104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29810309410095215,
"step": 460,
"valid_targets_mean": 2791.9,
"valid_targets_min": 379
},
{
"epoch": 0.8017241379310345,
"grad_norm": 0.7272042315596238,
"learning_rate": 3.997513842437845e-05,
"loss": 0.6096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.364572137594223,
"step": 465,
"valid_targets_mean": 3626.4,
"valid_targets_min": 426
},
{
"epoch": 0.8103448275862069,
"grad_norm": 0.6577433648661997,
"learning_rate": 3.997066827702248e-05,
"loss": 0.6063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37066060304641724,
"step": 470,
"valid_targets_mean": 4684.1,
"valid_targets_min": 656
},
{
"epoch": 0.8189655172413793,
"grad_norm": 0.9374920706442889,
"learning_rate": 3.996582907168928e-05,
"loss": 0.6019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33479398488998413,
"step": 475,
"valid_targets_mean": 2754.0,
"valid_targets_min": 819
},
{
"epoch": 0.8275862068965517,
"grad_norm": 0.6973024921577812,
"learning_rate": 3.996062089780737e-05,
"loss": 0.611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128424286842346,
"step": 480,
"valid_targets_mean": 5124.0,
"valid_targets_min": 1016
},
{
"epoch": 0.8362068965517241,
"grad_norm": 0.8674122403376363,
"learning_rate": 3.99550438516238e-05,
"loss": 0.6519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37676799297332764,
"step": 485,
"valid_targets_mean": 2540.9,
"valid_targets_min": 1171
},
{
"epoch": 0.8448275862068966,
"grad_norm": 0.8139547580639379,
"learning_rate": 3.994909803620241e-05,
"loss": 0.6309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30208778381347656,
"step": 490,
"valid_targets_mean": 3834.2,
"valid_targets_min": 1779
},
{
"epoch": 0.853448275862069,
"grad_norm": 0.6703455605697158,
"learning_rate": 3.994278356142187e-05,
"loss": 0.5802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3729390501976013,
"step": 495,
"valid_targets_mean": 4426.1,
"valid_targets_min": 1333
},
{
"epoch": 0.8620689655172413,
"grad_norm": 0.7773046757336888,
"learning_rate": 3.993610054397368e-05,
"loss": 0.6127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28395596146583557,
"step": 500,
"valid_targets_mean": 2704.4,
"valid_targets_min": 492
},
{
"epoch": 0.8706896551724138,
"grad_norm": 0.6933830157899125,
"learning_rate": 3.992904910736001e-05,
"loss": 0.6275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3321034908294678,
"step": 505,
"valid_targets_mean": 2750.9,
"valid_targets_min": 781
},
{
"epoch": 0.8793103448275862,
"grad_norm": 0.6899491978796316,
"learning_rate": 3.9921629381891425e-05,
"loss": 0.6128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2895788550376892,
"step": 510,
"valid_targets_mean": 3737.8,
"valid_targets_min": 1953
},
{
"epoch": 0.8879310344827587,
"grad_norm": 0.6461401658273619,
"learning_rate": 3.991384150468445e-05,
"loss": 0.632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2809222936630249,
"step": 515,
"valid_targets_mean": 3917.4,
"valid_targets_min": 2273
},
{
"epoch": 0.896551724137931,
"grad_norm": 1.2440232141350356,
"learning_rate": 3.9905685619659074e-05,
"loss": 0.6162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2755066752433777,
"step": 520,
"valid_targets_mean": 2479.9,
"valid_targets_min": 935
},
{
"epoch": 0.9051724137931034,
"grad_norm": 0.8153879328655858,
"learning_rate": 3.9897161877536076e-05,
"loss": 0.6054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3150935173034668,
"step": 525,
"valid_targets_mean": 2985.4,
"valid_targets_min": 1461
},
{
"epoch": 0.9137931034482759,
"grad_norm": 0.610080365395153,
"learning_rate": 3.9888270435834196e-05,
"loss": 0.5662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2674276828765869,
"step": 530,
"valid_targets_mean": 4293.4,
"valid_targets_min": 854
},
{
"epoch": 0.9224137931034483,
"grad_norm": 0.7289184888115173,
"learning_rate": 3.987901145886731e-05,
"loss": 0.6252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40158599615097046,
"step": 535,
"valid_targets_mean": 3920.5,
"valid_targets_min": 1234
},
{
"epoch": 0.9310344827586207,
"grad_norm": 0.9065353440528913,
"learning_rate": 3.9869385117741314e-05,
"loss": 0.6004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.262065052986145,
"step": 540,
"valid_targets_mean": 2458.5,
"valid_targets_min": 1032
},
{
"epoch": 0.9396551724137931,
"grad_norm": 0.8075182485003022,
"learning_rate": 3.985939159035101e-05,
"loss": 0.6231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27840715646743774,
"step": 545,
"valid_targets_mean": 2088.2,
"valid_targets_min": 815
},
{
"epoch": 0.9482758620689655,
"grad_norm": 0.8932299994242785,
"learning_rate": 3.98490310613768e-05,
"loss": 0.6197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31527039408683777,
"step": 550,
"valid_targets_mean": 2544.9,
"valid_targets_min": 377
},
{
"epoch": 0.9568965517241379,
"grad_norm": 0.600637076017398,
"learning_rate": 3.983830372228127e-05,
"loss": 0.6074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.384111225605011,
"step": 555,
"valid_targets_mean": 5281.6,
"valid_targets_min": 1035
},
{
"epoch": 0.9655172413793104,
"grad_norm": 0.6461798471784225,
"learning_rate": 3.982720977130567e-05,
"loss": 0.6061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39894336462020874,
"step": 560,
"valid_targets_mean": 4568.5,
"valid_targets_min": 594
},
{
"epoch": 0.9741379310344828,
"grad_norm": 0.785625646117963,
"learning_rate": 3.9815749413466204e-05,
"loss": 0.6221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33625924587249756,
"step": 565,
"valid_targets_mean": 2459.2,
"valid_targets_min": 494
},
{
"epoch": 0.9827586206896551,
"grad_norm": 0.6826434190898227,
"learning_rate": 3.980392286055033e-05,
"loss": 0.613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2937217354774475,
"step": 570,
"valid_targets_mean": 3124.0,
"valid_targets_min": 1630
},
{
"epoch": 0.9913793103448276,
"grad_norm": 0.7113889514712743,
"learning_rate": 3.979173033111275e-05,
"loss": 0.5836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29601383209228516,
"step": 575,
"valid_targets_mean": 3815.6,
"valid_targets_min": 1390
},
{
"epoch": 1.0,
"grad_norm": 0.7978906605998085,
"learning_rate": 3.977917205047142e-05,
"loss": 0.6345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4608190059661865,
"step": 580,
"valid_targets_mean": 3223.1,
"valid_targets_min": 706
},
{
"epoch": 1.0086206896551724,
"grad_norm": 0.6005717129590061,
"learning_rate": 3.976624825070339e-05,
"loss": 0.5683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41373294591903687,
"step": 585,
"valid_targets_mean": 5931.6,
"valid_targets_min": 1471
},
{
"epoch": 1.0172413793103448,
"grad_norm": 0.6552336478289915,
"learning_rate": 3.97529591706405e-05,
"loss": 0.5455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23430368304252625,
"step": 590,
"valid_targets_mean": 2999.2,
"valid_targets_min": 941
},
{
"epoch": 1.0258620689655173,
"grad_norm": 0.7195300818386714,
"learning_rate": 3.973930505586496e-05,
"loss": 0.5861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23183020949363708,
"step": 595,
"valid_targets_mean": 2522.2,
"valid_targets_min": 734
},
{
"epoch": 1.0344827586206897,
"grad_norm": 0.6737625154821479,
"learning_rate": 3.972528615870483e-05,
"loss": 0.5762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3226555585861206,
"step": 600,
"valid_targets_mean": 3511.2,
"valid_targets_min": 1281
},
{
"epoch": 1.043103448275862,
"grad_norm": 0.6574075084965194,
"learning_rate": 3.9710902738229354e-05,
"loss": 0.576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3020402193069458,
"step": 605,
"valid_targets_mean": 4075.6,
"valid_targets_min": 592
},
{
"epoch": 1.0517241379310345,
"grad_norm": 0.6361634659488868,
"learning_rate": 3.9696155060244166e-05,
"loss": 0.6074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31071919202804565,
"step": 610,
"valid_targets_mean": 4625.1,
"valid_targets_min": 1577
},
{
"epoch": 1.0603448275862069,
"grad_norm": 0.6865688750734892,
"learning_rate": 3.968104339728636e-05,
"loss": 0.5529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22631359100341797,
"step": 615,
"valid_targets_mean": 3810.9,
"valid_targets_min": 1016
},
{
"epoch": 1.0689655172413792,
"grad_norm": 0.7847925685737638,
"learning_rate": 3.966556802861951e-05,
"loss": 0.5722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21570219099521637,
"step": 620,
"valid_targets_mean": 3329.9,
"valid_targets_min": 541
},
{
"epoch": 1.0775862068965518,
"grad_norm": 0.6508403733170468,
"learning_rate": 3.964972924022843e-05,
"loss": 0.5917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25959932804107666,
"step": 625,
"valid_targets_mean": 3226.6,
"valid_targets_min": 544
},
{
"epoch": 1.0862068965517242,
"grad_norm": 0.6393748831001188,
"learning_rate": 3.963352732481396e-05,
"loss": 0.5649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24320468306541443,
"step": 630,
"valid_targets_mean": 3234.1,
"valid_targets_min": 1606
},
{
"epoch": 1.0948275862068966,
"grad_norm": 0.6464744061619221,
"learning_rate": 3.961696258178752e-05,
"loss": 0.56,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23860612511634827,
"step": 635,
"valid_targets_mean": 3424.6,
"valid_targets_min": 281
},
{
"epoch": 1.103448275862069,
"grad_norm": 0.7130411239086852,
"learning_rate": 3.960003531726559e-05,
"loss": 0.5978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2414039522409439,
"step": 640,
"valid_targets_mean": 2692.5,
"valid_targets_min": 1147
},
{
"epoch": 1.1120689655172413,
"grad_norm": 0.6067056941197266,
"learning_rate": 3.958274584406403e-05,
"loss": 0.5889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2696046233177185,
"step": 645,
"valid_targets_mean": 3656.6,
"valid_targets_min": 1580
},
{
"epoch": 1.1206896551724137,
"grad_norm": 0.6794563652987848,
"learning_rate": 3.956509448169233e-05,
"loss": 0.5579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25545477867126465,
"step": 650,
"valid_targets_mean": 3386.6,
"valid_targets_min": 1070
},
{
"epoch": 1.1293103448275863,
"grad_norm": 0.5907805691902701,
"learning_rate": 3.9547081556347693e-05,
"loss": 0.55,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3312992453575134,
"step": 655,
"valid_targets_mean": 5166.6,
"valid_targets_min": 1067
},
{
"epoch": 1.1379310344827587,
"grad_norm": 0.6929733973909208,
"learning_rate": 3.952870740090901e-05,
"loss": 0.5628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20063847303390503,
"step": 660,
"valid_targets_mean": 2974.2,
"valid_targets_min": 1165
},
{
"epoch": 1.146551724137931,
"grad_norm": 0.6362204985300633,
"learning_rate": 3.950997235493069e-05,
"loss": 0.5549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19708850979804993,
"step": 665,
"valid_targets_mean": 2985.6,
"valid_targets_min": 753
},
{
"epoch": 1.1551724137931034,
"grad_norm": 0.6358110533727936,
"learning_rate": 3.9490876764636414e-05,
"loss": 0.5738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28072255849838257,
"step": 670,
"valid_targets_mean": 3981.6,
"valid_targets_min": 904
},
{
"epoch": 1.1637931034482758,
"grad_norm": 0.7492089400612849,
"learning_rate": 3.947142098291272e-05,
"loss": 0.5969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18699270486831665,
"step": 675,
"valid_targets_mean": 2234.5,
"valid_targets_min": 520
},
{
"epoch": 1.1724137931034484,
"grad_norm": 0.6757843817064915,
"learning_rate": 3.945160536930247e-05,
"loss": 0.6009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26428648829460144,
"step": 680,
"valid_targets_mean": 3843.4,
"valid_targets_min": 1182
},
{
"epoch": 1.1810344827586208,
"grad_norm": 0.634931931587929,
"learning_rate": 3.9431430289998235e-05,
"loss": 0.5489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3300395607948303,
"step": 685,
"valid_targets_mean": 4375.2,
"valid_targets_min": 1305
},
{
"epoch": 1.1896551724137931,
"grad_norm": 0.6151851916260583,
"learning_rate": 3.941089611783551e-05,
"loss": 0.5548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18444105982780457,
"step": 690,
"valid_targets_mean": 3105.9,
"valid_targets_min": 1484
},
{
"epoch": 1.1982758620689655,
"grad_norm": 0.6068354631280605,
"learning_rate": 3.939000323228583e-05,
"loss": 0.5517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2512916922569275,
"step": 695,
"valid_targets_mean": 4222.9,
"valid_targets_min": 1393
},
{
"epoch": 1.206896551724138,
"grad_norm": 0.7634427474132905,
"learning_rate": 3.9368752019449744e-05,
"loss": 0.5944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21794426441192627,
"step": 700,
"valid_targets_mean": 2043.1,
"valid_targets_min": 581
},
{
"epoch": 1.2155172413793103,
"grad_norm": 0.6191064830788139,
"learning_rate": 3.934714287204969e-05,
"loss": 0.5532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3472103476524353,
"step": 705,
"valid_targets_mean": 4762.0,
"valid_targets_min": 1397
},
{
"epoch": 1.2241379310344827,
"grad_norm": 0.7037462902349687,
"learning_rate": 3.932517618942275e-05,
"loss": 0.5717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27132099866867065,
"step": 710,
"valid_targets_mean": 3573.6,
"valid_targets_min": 1746
},
{
"epoch": 1.2327586206896552,
"grad_norm": 0.7072106217368744,
"learning_rate": 3.930285237751324e-05,
"loss": 0.6102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2910650670528412,
"step": 715,
"valid_targets_mean": 3287.1,
"valid_targets_min": 663
},
{
"epoch": 1.2413793103448276,
"grad_norm": 0.6650108596305829,
"learning_rate": 3.928017184886525e-05,
"loss": 0.5893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2076074481010437,
"step": 720,
"valid_targets_mean": 2658.0,
"valid_targets_min": 1354
},
{
"epoch": 1.25,
"grad_norm": 0.7113696936170891,
"learning_rate": 3.925713502261496e-05,
"loss": 0.5793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28718888759613037,
"step": 725,
"valid_targets_mean": 2900.5,
"valid_targets_min": 274
},
{
"epoch": 1.2586206896551724,
"grad_norm": 0.6066075532383515,
"learning_rate": 3.9233742324482965e-05,
"loss": 0.5675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.182432159781456,
"step": 730,
"valid_targets_mean": 4086.9,
"valid_targets_min": 599
},
{
"epoch": 1.2672413793103448,
"grad_norm": 0.6322789893306922,
"learning_rate": 3.920999418676636e-05,
"loss": 0.5827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.340463250875473,
"step": 735,
"valid_targets_mean": 4901.2,
"valid_targets_min": 1812
},
{
"epoch": 1.2758620689655173,
"grad_norm": 0.645804554200195,
"learning_rate": 3.918589104833075e-05,
"loss": 0.5825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30338525772094727,
"step": 740,
"valid_targets_mean": 4204.6,
"valid_targets_min": 1376
},
{
"epoch": 1.2844827586206897,
"grad_norm": 0.7050655189214021,
"learning_rate": 3.916143335460218e-05,
"loss": 0.5499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33188706636428833,
"step": 745,
"valid_targets_mean": 3245.9,
"valid_targets_min": 1098
},
{
"epoch": 1.293103448275862,
"grad_norm": 0.6445820272212374,
"learning_rate": 3.913662155755885e-05,
"loss": 0.5595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24519510567188263,
"step": 750,
"valid_targets_mean": 3186.8,
"valid_targets_min": 509
},
{
"epoch": 1.3017241379310345,
"grad_norm": 0.7975036037110392,
"learning_rate": 3.911145611572282e-05,
"loss": 0.5481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2782052755355835,
"step": 755,
"valid_targets_mean": 2524.6,
"valid_targets_min": 426
},
{
"epoch": 1.3103448275862069,
"grad_norm": 0.7281950316071065,
"learning_rate": 3.908593749415148e-05,
"loss": 0.6545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1945173144340515,
"step": 760,
"valid_targets_mean": 2425.2,
"valid_targets_min": 478
},
{
"epoch": 1.3189655172413794,
"grad_norm": 0.6366615373153709,
"learning_rate": 3.9060066164428986e-05,
"loss": 0.5524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2992849349975586,
"step": 765,
"valid_targets_mean": 4045.9,
"valid_targets_min": 1069
},
{
"epoch": 1.3275862068965516,
"grad_norm": 0.7551529366816231,
"learning_rate": 3.903384260465756e-05,
"loss": 0.58,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27485474944114685,
"step": 770,
"valid_targets_mean": 2762.9,
"valid_targets_min": 377
},
{
"epoch": 1.3362068965517242,
"grad_norm": 0.6821396675191562,
"learning_rate": 3.900726729944861e-05,
"loss": 0.5618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30889642238616943,
"step": 775,
"valid_targets_mean": 3370.8,
"valid_targets_min": 438
},
{
"epoch": 1.3448275862068966,
"grad_norm": 0.6717238345792034,
"learning_rate": 3.898034073991382e-05,
"loss": 0.5625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41013768315315247,
"step": 780,
"valid_targets_mean": 4358.2,
"valid_targets_min": 1786
},
{
"epoch": 1.353448275862069,
"grad_norm": 0.7992752610314047,
"learning_rate": 3.8953063423656055e-05,
"loss": 0.5849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28634825348854065,
"step": 785,
"valid_targets_mean": 2582.8,
"valid_targets_min": 1188
},
{
"epoch": 1.3620689655172413,
"grad_norm": 0.6925451862529552,
"learning_rate": 3.892543585476014e-05,
"loss": 0.5691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2935306429862976,
"step": 790,
"valid_targets_mean": 5148.4,
"valid_targets_min": 1771
},
{
"epoch": 1.3706896551724137,
"grad_norm": 0.7842287612668596,
"learning_rate": 3.88974585437836e-05,
"loss": 0.5681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19979897141456604,
"step": 795,
"valid_targets_mean": 2904.8,
"valid_targets_min": 547
},
{
"epoch": 1.3793103448275863,
"grad_norm": 0.6401163459314333,
"learning_rate": 3.886913200774717e-05,
"loss": 0.5899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28293904662132263,
"step": 800,
"valid_targets_mean": 3463.2,
"valid_targets_min": 1594
},
{
"epoch": 1.3879310344827587,
"grad_norm": 0.6807319952123996,
"learning_rate": 3.884045677012528e-05,
"loss": 0.5806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20955102145671844,
"step": 805,
"valid_targets_mean": 2845.8,
"valid_targets_min": 367
},
{
"epoch": 1.396551724137931,
"grad_norm": 0.6675497158755671,
"learning_rate": 3.8811433360836364e-05,
"loss": 0.5345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2397671937942505,
"step": 810,
"valid_targets_mean": 3195.6,
"valid_targets_min": 1550
},
{
"epoch": 1.4051724137931034,
"grad_norm": 0.742052701853441,
"learning_rate": 3.878206231623306e-05,
"loss": 0.5727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2547149658203125,
"step": 815,
"valid_targets_mean": 2620.4,
"valid_targets_min": 408
},
{
"epoch": 1.4137931034482758,
"grad_norm": 0.7070815970934397,
"learning_rate": 3.8752344179092315e-05,
"loss": 0.5722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28830042481422424,
"step": 820,
"valid_targets_mean": 3540.2,
"valid_targets_min": 754
},
{
"epoch": 1.4224137931034484,
"grad_norm": 0.6308183596674323,
"learning_rate": 3.8722279498605344e-05,
"loss": 0.5937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23384696245193481,
"step": 825,
"valid_targets_mean": 3138.0,
"valid_targets_min": 682
},
{
"epoch": 1.4310344827586206,
"grad_norm": 0.6233028809186425,
"learning_rate": 3.869186883036748e-05,
"loss": 0.5749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2825425863265991,
"step": 830,
"valid_targets_mean": 3813.5,
"valid_targets_min": 1404
},
{
"epoch": 1.4396551724137931,
"grad_norm": 0.6315819587869369,
"learning_rate": 3.8661112736367924e-05,
"loss": 0.5418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27093827724456787,
"step": 835,
"valid_targets_mean": 3958.6,
"valid_targets_min": 1813
},
{
"epoch": 1.4482758620689655,
"grad_norm": 0.8002481201902519,
"learning_rate": 3.863001178497933e-05,
"loss": 0.5521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3411499261856079,
"step": 840,
"valid_targets_mean": 3449.6,
"valid_targets_min": 1562
},
{
"epoch": 1.456896551724138,
"grad_norm": 0.5646014000758687,
"learning_rate": 3.8598566550947316e-05,
"loss": 0.571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.267992228269577,
"step": 845,
"valid_targets_mean": 4902.5,
"valid_targets_min": 1685
},
{
"epoch": 1.4655172413793103,
"grad_norm": 0.6276978940722122,
"learning_rate": 3.856677761537986e-05,
"loss": 0.5893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31473422050476074,
"step": 850,
"valid_targets_mean": 4601.8,
"valid_targets_min": 1341
},
{
"epoch": 1.4741379310344827,
"grad_norm": 0.7348376830947169,
"learning_rate": 3.853464556573652e-05,
"loss": 0.5466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2999240458011627,
"step": 855,
"valid_targets_mean": 3640.1,
"valid_targets_min": 916
},
{
"epoch": 1.4827586206896552,
"grad_norm": 0.8978611329491114,
"learning_rate": 3.850217099581764e-05,
"loss": 0.5616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27713045477867126,
"step": 860,
"valid_targets_mean": 2290.8,
"valid_targets_min": 1201
},
{
"epoch": 1.4913793103448276,
"grad_norm": 0.77046321533511,
"learning_rate": 3.8469354505753305e-05,
"loss": 0.5693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24054045975208282,
"step": 865,
"valid_targets_mean": 2118.1,
"valid_targets_min": 938
},
{
"epoch": 1.5,
"grad_norm": 0.7222989825813173,
"learning_rate": 3.843619670199229e-05,
"loss": 0.544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27719244360923767,
"step": 870,
"valid_targets_mean": 3316.0,
"valid_targets_min": 300
},
{
"epoch": 1.5086206896551724,
"grad_norm": 0.6285334439850424,
"learning_rate": 3.8402698197290865e-05,
"loss": 0.612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40034905076026917,
"step": 875,
"valid_targets_mean": 4616.9,
"valid_targets_min": 279
},
{
"epoch": 1.5172413793103448,
"grad_norm": 0.5988467971800734,
"learning_rate": 3.8368859610701443e-05,
"loss": 0.5665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3291173577308655,
"step": 880,
"valid_targets_mean": 5205.2,
"valid_targets_min": 1111
},
{
"epoch": 1.5258620689655173,
"grad_norm": 0.6221097934601042,
"learning_rate": 3.833468156756114e-05,
"loss": 0.5594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20184822380542755,
"step": 885,
"valid_targets_mean": 3121.1,
"valid_targets_min": 1996
},
{
"epoch": 1.5344827586206895,
"grad_norm": 0.6088881299880774,
"learning_rate": 3.8300164699480246e-05,
"loss": 0.5604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29023054242134094,
"step": 890,
"valid_targets_mean": 4022.2,
"valid_targets_min": 1170
},
{
"epoch": 1.543103448275862,
"grad_norm": 0.5851660013826078,
"learning_rate": 3.8265309644330535e-05,
"loss": 0.5475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22081995010375977,
"step": 895,
"valid_targets_mean": 3288.5,
"valid_targets_min": 775
},
{
"epoch": 1.5517241379310345,
"grad_norm": 0.5601559917028126,
"learning_rate": 3.823011704623347e-05,
"loss": 0.5356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25190994143486023,
"step": 900,
"valid_targets_mean": 4485.5,
"valid_targets_min": 1709
},
{
"epoch": 1.5603448275862069,
"grad_norm": 0.7111127459782094,
"learning_rate": 3.81945875555483e-05,
"loss": 0.6294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37708738446235657,
"step": 905,
"valid_targets_mean": 2716.1,
"valid_targets_min": 754
},
{
"epoch": 1.5689655172413794,
"grad_norm": 0.6241213259356158,
"learning_rate": 3.8158721828860094e-05,
"loss": 0.5732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25017252564430237,
"step": 910,
"valid_targets_mean": 2699.0,
"valid_targets_min": 908
},
{
"epoch": 1.5775862068965516,
"grad_norm": 1.5933254202486349,
"learning_rate": 3.81225205289675e-05,
"loss": 0.5779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41490495204925537,
"step": 915,
"valid_targets_mean": 4895.0,
"valid_targets_min": 1272
},
{
"epoch": 1.5862068965517242,
"grad_norm": 0.5280871052538816,
"learning_rate": 3.808598432487061e-05,
"loss": 0.5613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.259874165058136,
"step": 920,
"valid_targets_mean": 5779.0,
"valid_targets_min": 1994
},
{
"epoch": 1.5948275862068966,
"grad_norm": 0.549604024077637,
"learning_rate": 3.8049113891758506e-05,
"loss": 0.5666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.215641051530838,
"step": 925,
"valid_targets_mean": 4589.5,
"valid_targets_min": 856
},
{
"epoch": 1.603448275862069,
"grad_norm": 0.764713960290603,
"learning_rate": 3.8011909910996856e-05,
"loss": 0.5534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3771178424358368,
"step": 930,
"valid_targets_mean": 5157.5,
"valid_targets_min": 1677
},
{
"epoch": 1.6120689655172413,
"grad_norm": 0.6691714653562654,
"learning_rate": 3.797437307011527e-05,
"loss": 0.5525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23908597230911255,
"step": 935,
"valid_targets_mean": 3168.0,
"valid_targets_min": 1366
},
{
"epoch": 1.6206896551724137,
"grad_norm": 0.7097924121846054,
"learning_rate": 3.793650406279463e-05,
"loss": 0.5983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20683707296848297,
"step": 940,
"valid_targets_mean": 2603.0,
"valid_targets_min": 1098
},
{
"epoch": 1.6293103448275863,
"grad_norm": 0.6521675166491431,
"learning_rate": 3.789830358885423e-05,
"loss": 0.5752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32541143894195557,
"step": 945,
"valid_targets_mean": 4503.4,
"valid_targets_min": 863
},
{
"epoch": 1.6379310344827587,
"grad_norm": 0.6127301186437016,
"learning_rate": 3.7859772354238885e-05,
"loss": 0.5737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24941956996917725,
"step": 950,
"valid_targets_mean": 3997.9,
"valid_targets_min": 1318
},
{
"epoch": 1.646551724137931,
"grad_norm": 0.8107486435337788,
"learning_rate": 3.782091107100587e-05,
"loss": 0.5631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38626742362976074,
"step": 955,
"valid_targets_mean": 3198.8,
"valid_targets_min": 1015
},
{
"epoch": 1.6551724137931034,
"grad_norm": 0.6709100944181071,
"learning_rate": 3.7781720457311746e-05,
"loss": 0.5458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23467305302619934,
"step": 960,
"valid_targets_mean": 2846.6,
"valid_targets_min": 1638
},
{
"epoch": 1.6637931034482758,
"grad_norm": 0.7378895599046713,
"learning_rate": 3.7742201237399105e-05,
"loss": 0.5371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2540317177772522,
"step": 965,
"valid_targets_mean": 2416.0,
"valid_targets_min": 752
},
{
"epoch": 1.6724137931034484,
"grad_norm": 0.8032206453205488,
"learning_rate": 3.77023541415832e-05,
"loss": 0.5284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24500620365142822,
"step": 970,
"valid_targets_mean": 2129.1,
"valid_targets_min": 338
},
{
"epoch": 1.6810344827586206,
"grad_norm": 0.7327397961798686,
"learning_rate": 3.7662179906238405e-05,
"loss": 0.5712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32717061042785645,
"step": 975,
"valid_targets_mean": 3676.8,
"valid_targets_min": 1039
},
{
"epoch": 1.6896551724137931,
"grad_norm": 0.6867767089756939,
"learning_rate": 3.762167927378464e-05,
"loss": 0.5624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27892693877220154,
"step": 980,
"valid_targets_mean": 3443.0,
"valid_targets_min": 1785
},
{
"epoch": 1.6982758620689655,
"grad_norm": 0.6052211747597286,
"learning_rate": 3.7580852992673656e-05,
"loss": 0.5641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21629683673381805,
"step": 985,
"valid_targets_mean": 3518.9,
"valid_targets_min": 1496
},
{
"epoch": 1.706896551724138,
"grad_norm": 0.5922892058837835,
"learning_rate": 3.7539701817375185e-05,
"loss": 0.5866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31934842467308044,
"step": 990,
"valid_targets_mean": 4224.4,
"valid_targets_min": 1416
},
{
"epoch": 1.7155172413793105,
"grad_norm": 1.0493692424194028,
"learning_rate": 3.7498226508362996e-05,
"loss": 0.5721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24411314725875854,
"step": 995,
"valid_targets_mean": 3659.2,
"valid_targets_min": 1365
},
{
"epoch": 1.7241379310344827,
"grad_norm": 0.6364551146606927,
"learning_rate": 3.7456427832100864e-05,
"loss": 0.5801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3116251826286316,
"step": 1000,
"valid_targets_mean": 3976.9,
"valid_targets_min": 1273
},
{
"epoch": 1.7327586206896552,
"grad_norm": 0.6729473015193449,
"learning_rate": 3.7414306561028385e-05,
"loss": 0.5628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3718431890010834,
"step": 1005,
"valid_targets_mean": 3988.6,
"valid_targets_min": 505
},
{
"epoch": 1.7413793103448276,
"grad_norm": 0.5651344642180671,
"learning_rate": 3.73718634735467e-05,
"loss": 0.5792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30802202224731445,
"step": 1010,
"valid_targets_mean": 4792.2,
"valid_targets_min": 1894
},
{
"epoch": 1.75,
"grad_norm": 0.8160406841638043,
"learning_rate": 3.732909935400412e-05,
"loss": 0.5709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2621057629585266,
"step": 1015,
"valid_targets_mean": 3583.6,
"valid_targets_min": 1468
},
{
"epoch": 1.7586206896551724,
"grad_norm": 0.6185222015980905,
"learning_rate": 3.7286014992681645e-05,
"loss": 0.5687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2619808316230774,
"step": 1020,
"valid_targets_mean": 3748.1,
"valid_targets_min": 585
},
{
"epoch": 1.7672413793103448,
"grad_norm": 0.640359359009962,
"learning_rate": 3.7242611185778325e-05,
"loss": 0.5421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3694639801979065,
"step": 1025,
"valid_targets_mean": 4001.2,
"valid_targets_min": 449
},
{
"epoch": 1.7758620689655173,
"grad_norm": 0.8925661522909636,
"learning_rate": 3.7198888735396574e-05,
"loss": 0.5703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37001776695251465,
"step": 1030,
"valid_targets_mean": 3830.2,
"valid_targets_min": 1482
},
{
"epoch": 1.7844827586206895,
"grad_norm": 0.6379804791552203,
"learning_rate": 3.7154848449527334e-05,
"loss": 0.5647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17609938979148865,
"step": 1035,
"valid_targets_mean": 1858.1,
"valid_targets_min": 777
},
{
"epoch": 1.793103448275862,
"grad_norm": 0.7359978586481348,
"learning_rate": 3.7110491142035145e-05,
"loss": 0.6291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3263494372367859,
"step": 1040,
"valid_targets_mean": 3026.8,
"valid_targets_min": 782
},
{
"epoch": 1.8017241379310345,
"grad_norm": 0.5501378819443856,
"learning_rate": 3.7065817632643115e-05,
"loss": 0.6026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22044426202774048,
"step": 1045,
"valid_targets_mean": 4140.5,
"valid_targets_min": 358
},
{
"epoch": 1.8103448275862069,
"grad_norm": 0.5146610646097317,
"learning_rate": 3.702082874691776e-05,
"loss": 0.5362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27138766646385193,
"step": 1050,
"valid_targets_mean": 5316.9,
"valid_targets_min": 1629
},
{
"epoch": 1.8189655172413794,
"grad_norm": 0.6383974478414849,
"learning_rate": 3.6975525316253744e-05,
"loss": 0.5958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22577664256095886,
"step": 1055,
"valid_targets_mean": 2754.6,
"valid_targets_min": 1739
},
{
"epoch": 1.8275862068965516,
"grad_norm": 0.6577167966442022,
"learning_rate": 3.692990817785853e-05,
"loss": 0.5482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1972791999578476,
"step": 1060,
"valid_targets_mean": 2684.1,
"valid_targets_min": 714
},
{
"epoch": 1.8362068965517242,
"grad_norm": 0.762753066575453,
"learning_rate": 3.68839781747369e-05,
"loss": 0.5723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2219727784395218,
"step": 1065,
"valid_targets_mean": 2217.9,
"valid_targets_min": 672
},
{
"epoch": 1.8448275862068966,
"grad_norm": 0.5593369703101698,
"learning_rate": 3.683773615567538e-05,
"loss": 0.5535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3015214204788208,
"step": 1070,
"valid_targets_mean": 5070.4,
"valid_targets_min": 1527
},
{
"epoch": 1.853448275862069,
"grad_norm": 0.7393362257169361,
"learning_rate": 3.679118297522654e-05,
"loss": 0.5468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.355376273393631,
"step": 1075,
"valid_targets_mean": 3456.8,
"valid_targets_min": 1585
},
{
"epoch": 1.8620689655172413,
"grad_norm": 0.5691065100419264,
"learning_rate": 3.674431949369321e-05,
"loss": 0.5659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14589709043502808,
"step": 1080,
"valid_targets_mean": 2719.9,
"valid_targets_min": 1349
},
{
"epoch": 1.8706896551724137,
"grad_norm": 0.6450842387622542,
"learning_rate": 3.6697146577112614e-05,
"loss": 0.5337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23650528490543365,
"step": 1085,
"valid_targets_mean": 3103.2,
"valid_targets_min": 1011
},
{
"epoch": 1.8793103448275863,
"grad_norm": 0.5385390273419834,
"learning_rate": 3.6649665097240304e-05,
"loss": 0.5297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18768148124217987,
"step": 1090,
"valid_targets_mean": 3738.4,
"valid_targets_min": 946
},
{
"epoch": 1.8879310344827587,
"grad_norm": 0.6826042526112265,
"learning_rate": 3.660187593153408e-05,
"loss": 0.5874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2879507541656494,
"step": 1095,
"valid_targets_mean": 3481.0,
"valid_targets_min": 899
},
{
"epoch": 1.896551724137931,
"grad_norm": 0.5991426639597468,
"learning_rate": 3.655377996313782e-05,
"loss": 0.5689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3126043379306793,
"step": 1100,
"valid_targets_mean": 3764.6,
"valid_targets_min": 1376
},
{
"epoch": 1.9051724137931034,
"grad_norm": 0.7434156428546637,
"learning_rate": 3.6505378080865054e-05,
"loss": 0.5656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29617348313331604,
"step": 1105,
"valid_targets_mean": 3182.0,
"valid_targets_min": 376
},
{
"epoch": 1.9137931034482758,
"grad_norm": 0.7376220507013634,
"learning_rate": 3.645667117918265e-05,
"loss": 0.598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2663417458534241,
"step": 1110,
"valid_targets_mean": 2946.8,
"valid_targets_min": 845
},
{
"epoch": 1.9224137931034484,
"grad_norm": 0.8093067307919336,
"learning_rate": 3.640766015819423e-05,
"loss": 0.5685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27129626274108887,
"step": 1115,
"valid_targets_mean": 2276.5,
"valid_targets_min": 644
},
{
"epoch": 1.9310344827586206,
"grad_norm": 0.5931648105041701,
"learning_rate": 3.6358345923623506e-05,
"loss": 0.5883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2597714364528656,
"step": 1120,
"valid_targets_mean": 3566.5,
"valid_targets_min": 360
},
{
"epoch": 1.9396551724137931,
"grad_norm": 0.738013686632746,
"learning_rate": 3.630872938679761e-05,
"loss": 0.5421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23417630791664124,
"step": 1125,
"valid_targets_mean": 2241.8,
"valid_targets_min": 578
},
{
"epoch": 1.9482758620689655,
"grad_norm": 0.6536051717630208,
"learning_rate": 3.6258811464630215e-05,
"loss": 0.5475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.274051696062088,
"step": 1130,
"valid_targets_mean": 4223.8,
"valid_targets_min": 1954
},
{
"epoch": 1.956896551724138,
"grad_norm": 0.6558108915171494,
"learning_rate": 3.620859307960458e-05,
"loss": 0.5642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24242520332336426,
"step": 1135,
"valid_targets_mean": 3583.0,
"valid_targets_min": 573
},
{
"epoch": 1.9655172413793105,
"grad_norm": 0.6073167182222721,
"learning_rate": 3.615807515975654e-05,
"loss": 0.5769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3692033290863037,
"step": 1140,
"valid_targets_mean": 4391.9,
"valid_targets_min": 1444
},
{
"epoch": 1.9741379310344827,
"grad_norm": 0.6930399535333776,
"learning_rate": 3.6107258638657324e-05,
"loss": 0.6037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3953619599342346,
"step": 1145,
"valid_targets_mean": 3482.9,
"valid_targets_min": 687
},
{
"epoch": 1.9827586206896552,
"grad_norm": 0.7208553198716309,
"learning_rate": 3.60561444553963e-05,
"loss": 0.545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.300916850566864,
"step": 1150,
"valid_targets_mean": 2875.0,
"valid_targets_min": 543
},
{
"epoch": 1.9913793103448276,
"grad_norm": 0.6244319777954573,
"learning_rate": 3.600473355456366e-05,
"loss": 0.5711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2742713689804077,
"step": 1155,
"valid_targets_mean": 3724.2,
"valid_targets_min": 669
},
{
"epoch": 2.0,
"grad_norm": 0.48027221325927555,
"learning_rate": 3.595302688623291e-05,
"loss": 0.5181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2375207096338272,
"step": 1160,
"valid_targets_mean": 5709.9,
"valid_targets_min": 988
},
{
"epoch": 2.0086206896551726,
"grad_norm": 0.5856447431662087,
"learning_rate": 3.590102540594337e-05,
"loss": 0.5453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30319711565971375,
"step": 1165,
"valid_targets_mean": 5402.0,
"valid_targets_min": 1635
},
{
"epoch": 2.0172413793103448,
"grad_norm": 0.7330528758146855,
"learning_rate": 3.584873007468244e-05,
"loss": 0.5198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27307698130607605,
"step": 1170,
"valid_targets_mean": 2848.5,
"valid_targets_min": 1847
},
{
"epoch": 2.0258620689655173,
"grad_norm": 0.7161268600907155,
"learning_rate": 3.5796141858867935e-05,
"loss": 0.5027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34653913974761963,
"step": 1175,
"valid_targets_mean": 4229.5,
"valid_targets_min": 1459
},
{
"epoch": 2.0344827586206895,
"grad_norm": 0.5659681020477086,
"learning_rate": 3.5743261730330144e-05,
"loss": 0.525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24164336919784546,
"step": 1180,
"valid_targets_mean": 4535.0,
"valid_targets_min": 1595
},
{
"epoch": 2.043103448275862,
"grad_norm": 0.4950635871322631,
"learning_rate": 3.569009066629392e-05,
"loss": 0.4908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23670178651809692,
"step": 1185,
"valid_targets_mean": 6254.8,
"valid_targets_min": 1354
},
{
"epoch": 2.0517241379310347,
"grad_norm": 0.6259920795782811,
"learning_rate": 3.56366296493606e-05,
"loss": 0.4903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27048274874687195,
"step": 1190,
"valid_targets_mean": 4885.5,
"valid_targets_min": 746
},
{
"epoch": 2.060344827586207,
"grad_norm": 0.6708662248079352,
"learning_rate": 3.558287966748985e-05,
"loss": 0.5362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30487942695617676,
"step": 1195,
"valid_targets_mean": 3506.9,
"valid_targets_min": 699
},
{
"epoch": 2.0689655172413794,
"grad_norm": 0.6187149631493275,
"learning_rate": 3.552884171398141e-05,
"loss": 0.5058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3041895925998688,
"step": 1200,
"valid_targets_mean": 4673.4,
"valid_targets_min": 1416
},
{
"epoch": 2.0775862068965516,
"grad_norm": 0.6913500596782618,
"learning_rate": 3.547451678745673e-05,
"loss": 0.5435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3575402498245239,
"step": 1205,
"valid_targets_mean": 3261.8,
"valid_targets_min": 585
},
{
"epoch": 2.086206896551724,
"grad_norm": 0.5514253157032389,
"learning_rate": 3.541990589184053e-05,
"loss": 0.5061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2519359290599823,
"step": 1210,
"valid_targets_mean": 4331.5,
"valid_targets_min": 1142
},
{
"epoch": 2.0948275862068964,
"grad_norm": 0.661119552726637,
"learning_rate": 3.5365010036342245e-05,
"loss": 0.5097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.236103817820549,
"step": 1215,
"valid_targets_mean": 3665.9,
"valid_targets_min": 2115
},
{
"epoch": 2.103448275862069,
"grad_norm": 0.8185562556513293,
"learning_rate": 3.530983023543734e-05,
"loss": 0.5356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31141743063926697,
"step": 1220,
"valid_targets_mean": 3175.2,
"valid_targets_min": 553
},
{
"epoch": 2.1120689655172415,
"grad_norm": 0.637393506264498,
"learning_rate": 3.525436750884863e-05,
"loss": 0.5785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3377242088317871,
"step": 1225,
"valid_targets_mean": 4718.9,
"valid_targets_min": 1464
},
{
"epoch": 2.1206896551724137,
"grad_norm": 0.7000643799771167,
"learning_rate": 3.5198622881527374e-05,
"loss": 0.5361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17588718235492706,
"step": 1230,
"valid_targets_mean": 1794.2,
"valid_targets_min": 634
},
{
"epoch": 2.1293103448275863,
"grad_norm": 0.7836403305595876,
"learning_rate": 3.514259738363436e-05,
"loss": 0.5403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22173136472702026,
"step": 1235,
"valid_targets_mean": 2264.4,
"valid_targets_min": 759
},
{
"epoch": 2.1379310344827585,
"grad_norm": 0.6896222117398101,
"learning_rate": 3.5086292050520855e-05,
"loss": 0.5224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2105882465839386,
"step": 1240,
"valid_targets_mean": 2616.1,
"valid_targets_min": 829
},
{
"epoch": 2.146551724137931,
"grad_norm": 0.5989637638408554,
"learning_rate": 3.502970792270951e-05,
"loss": 0.5352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3733382523059845,
"step": 1245,
"valid_targets_mean": 5749.2,
"valid_targets_min": 943
},
{
"epoch": 2.1551724137931036,
"grad_norm": 0.5854317531631298,
"learning_rate": 3.497284604587508e-05,
"loss": 0.5462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21069422364234924,
"step": 1250,
"valid_targets_mean": 3517.9,
"valid_targets_min": 1692
},
{
"epoch": 2.163793103448276,
"grad_norm": 0.6059368591518353,
"learning_rate": 3.491570747082512e-05,
"loss": 0.5363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3978424668312073,
"step": 1255,
"valid_targets_mean": 5706.0,
"valid_targets_min": 2893
},
{
"epoch": 2.1724137931034484,
"grad_norm": 0.6915074580961807,
"learning_rate": 3.485829325348059e-05,
"loss": 0.5327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25558722019195557,
"step": 1260,
"valid_targets_mean": 3663.6,
"valid_targets_min": 603
},
{
"epoch": 2.1810344827586206,
"grad_norm": 0.6260784283173534,
"learning_rate": 3.4800604454856284e-05,
"loss": 0.5269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34905317425727844,
"step": 1265,
"valid_targets_mean": 5479.1,
"valid_targets_min": 1430
},
{
"epoch": 2.189655172413793,
"grad_norm": 0.8041527550042902,
"learning_rate": 3.47426421410413e-05,
"loss": 0.5285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525642216205597,
"step": 1270,
"valid_targets_mean": 1884.0,
"valid_targets_min": 449
},
{
"epoch": 2.1982758620689653,
"grad_norm": 0.6165577267512379,
"learning_rate": 3.468440738317926e-05,
"loss": 0.5213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24296146631240845,
"step": 1275,
"valid_targets_mean": 3509.9,
"valid_targets_min": 808
},
{
"epoch": 2.206896551724138,
"grad_norm": 0.7388739054714368,
"learning_rate": 3.4625901257448596e-05,
"loss": 0.5153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27573007345199585,
"step": 1280,
"valid_targets_mean": 2770.6,
"valid_targets_min": 1382
},
{
"epoch": 2.2155172413793105,
"grad_norm": 0.7213845700851882,
"learning_rate": 3.4567124845042564e-05,
"loss": 0.5097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23074638843536377,
"step": 1285,
"valid_targets_mean": 2694.5,
"valid_targets_min": 590
},
{
"epoch": 2.2241379310344827,
"grad_norm": 0.7344427687166307,
"learning_rate": 3.4508079232149354e-05,
"loss": 0.531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18814852833747864,
"step": 1290,
"valid_targets_mean": 2153.9,
"valid_targets_min": 384
},
{
"epoch": 2.2327586206896552,
"grad_norm": 0.7193043812909778,
"learning_rate": 3.444876550993198e-05,
"loss": 0.5276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1843530833721161,
"step": 1295,
"valid_targets_mean": 2371.8,
"valid_targets_min": 688
},
{
"epoch": 2.2413793103448274,
"grad_norm": 0.6514805960089244,
"learning_rate": 3.4389184774508105e-05,
"loss": 0.5329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27728837728500366,
"step": 1300,
"valid_targets_mean": 3690.1,
"valid_targets_min": 2078
},
{
"epoch": 2.25,
"grad_norm": 0.7699933360610283,
"learning_rate": 3.43293381269298e-05,
"loss": 0.5288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1803208887577057,
"step": 1305,
"valid_targets_mean": 1974.6,
"valid_targets_min": 679
},
{
"epoch": 2.2586206896551726,
"grad_norm": 0.7015909626972417,
"learning_rate": 3.4269226673163204e-05,
"loss": 0.5561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21470309793949127,
"step": 1310,
"valid_targets_mean": 2602.1,
"valid_targets_min": 520
},
{
"epoch": 2.2672413793103448,
"grad_norm": 0.6252001020266619,
"learning_rate": 3.420885152406805e-05,
"loss": 0.5063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16884250938892365,
"step": 1315,
"valid_targets_mean": 2221.1,
"valid_targets_min": 525
},
{
"epoch": 2.2758620689655173,
"grad_norm": 0.6660044917747885,
"learning_rate": 3.4148213795377194e-05,
"loss": 0.499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23926129937171936,
"step": 1320,
"valid_targets_mean": 3184.8,
"valid_targets_min": 1308
},
{
"epoch": 2.2844827586206895,
"grad_norm": 0.5942881743308523,
"learning_rate": 3.408731460767593e-05,
"loss": 0.5297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2458754926919937,
"step": 1325,
"valid_targets_mean": 3705.9,
"valid_targets_min": 224
},
{
"epoch": 2.293103448275862,
"grad_norm": 0.6559455552008154,
"learning_rate": 3.402615508638134e-05,
"loss": 0.5145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22481057047843933,
"step": 1330,
"valid_targets_mean": 3710.4,
"valid_targets_min": 775
},
{
"epoch": 2.3017241379310347,
"grad_norm": 0.5791109072786359,
"learning_rate": 3.396473636172146e-05,
"loss": 0.5553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3390901982784271,
"step": 1335,
"valid_targets_mean": 5454.2,
"valid_targets_min": 699
},
{
"epoch": 2.310344827586207,
"grad_norm": 0.6528879026655229,
"learning_rate": 3.3903059568714406e-05,
"loss": 0.5262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2803526222705841,
"step": 1340,
"valid_targets_mean": 4691.2,
"valid_targets_min": 1937
},
{
"epoch": 2.3189655172413794,
"grad_norm": 0.7334531238595307,
"learning_rate": 3.384112584714739e-05,
"loss": 0.5669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25998979806900024,
"step": 1345,
"valid_targets_mean": 2414.1,
"valid_targets_min": 872
},
{
"epoch": 2.3275862068965516,
"grad_norm": 0.6706388706657296,
"learning_rate": 3.377893634155568e-05,
"loss": 0.4946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20304179191589355,
"step": 1350,
"valid_targets_mean": 2520.6,
"valid_targets_min": 548
},
{
"epoch": 2.336206896551724,
"grad_norm": 0.6070209292783567,
"learning_rate": 3.371649220120143e-05,
"loss": 0.5372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23858051002025604,
"step": 1355,
"valid_targets_mean": 3398.2,
"valid_targets_min": 1239
},
{
"epoch": 2.344827586206897,
"grad_norm": 0.7403730502951553,
"learning_rate": 3.365379458005243e-05,
"loss": 0.5054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22786666452884674,
"step": 1360,
"valid_targets_mean": 2695.2,
"valid_targets_min": 743
},
{
"epoch": 2.353448275862069,
"grad_norm": 0.6160438267365825,
"learning_rate": 3.35908446367608e-05,
"loss": 0.5121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2835865020751953,
"step": 1365,
"valid_targets_mean": 4868.5,
"valid_targets_min": 2282
},
{
"epoch": 2.3620689655172415,
"grad_norm": 0.7046709820942064,
"learning_rate": 3.35276435346416e-05,
"loss": 0.5285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3344838321208954,
"step": 1370,
"valid_targets_mean": 3689.5,
"valid_targets_min": 827
},
{
"epoch": 2.3706896551724137,
"grad_norm": 0.6216160994750745,
"learning_rate": 3.346419244165127e-05,
"loss": 0.5405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3214781880378723,
"step": 1375,
"valid_targets_mean": 4100.1,
"valid_targets_min": 1151
},
{
"epoch": 2.3793103448275863,
"grad_norm": 0.7168615045877246,
"learning_rate": 3.3400492530366086e-05,
"loss": 0.5204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20914702117443085,
"step": 1380,
"valid_targets_mean": 2650.0,
"valid_targets_min": 1076
},
{
"epoch": 2.3879310344827585,
"grad_norm": 0.5642488910557313,
"learning_rate": 3.333654497796051e-05,
"loss": 0.533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19634991884231567,
"step": 1385,
"valid_targets_mean": 4127.8,
"valid_targets_min": 2108
},
{
"epoch": 2.396551724137931,
"grad_norm": 0.6683303924854348,
"learning_rate": 3.32723509661854e-05,
"loss": 0.5526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20605990290641785,
"step": 1390,
"valid_targets_mean": 2370.1,
"valid_targets_min": 727
},
{
"epoch": 2.405172413793103,
"grad_norm": 0.6217914813865608,
"learning_rate": 3.320791168134617e-05,
"loss": 0.5063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21512621641159058,
"step": 1395,
"valid_targets_mean": 3568.4,
"valid_targets_min": 1538
},
{
"epoch": 2.413793103448276,
"grad_norm": 0.7781917849824482,
"learning_rate": 3.31432283142809e-05,
"loss": 0.5619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29964110255241394,
"step": 1400,
"valid_targets_mean": 2767.4,
"valid_targets_min": 1923
},
{
"epoch": 2.4224137931034484,
"grad_norm": 0.6605249390307784,
"learning_rate": 3.307830206033831e-05,
"loss": 0.4859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29924869537353516,
"step": 1405,
"valid_targets_mean": 3953.2,
"valid_targets_min": 1292
},
{
"epoch": 2.4310344827586206,
"grad_norm": 0.7248729187206819,
"learning_rate": 3.301313411935565e-05,
"loss": 0.5529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2112955003976822,
"step": 1410,
"valid_targets_mean": 3034.6,
"valid_targets_min": 1475
},
{
"epoch": 2.439655172413793,
"grad_norm": 0.7278902760761354,
"learning_rate": 3.294772569563656e-05,
"loss": 0.5258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18192905187606812,
"step": 1415,
"valid_targets_mean": 2044.2,
"valid_targets_min": 601
},
{
"epoch": 2.4482758620689653,
"grad_norm": 0.64996168644576,
"learning_rate": 3.28820779979288e-05,
"loss": 0.5494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32071739435195923,
"step": 1420,
"valid_targets_mean": 4041.8,
"valid_targets_min": 722
},
{
"epoch": 2.456896551724138,
"grad_norm": 0.7663835356371171,
"learning_rate": 3.281619223940192e-05,
"loss": 0.5397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2934093475341797,
"step": 1425,
"valid_targets_mean": 2963.6,
"valid_targets_min": 868
},
{
"epoch": 2.4655172413793105,
"grad_norm": 0.6175608448597791,
"learning_rate": 3.2750069637624826e-05,
"loss": 0.5451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3377595543861389,
"step": 1430,
"valid_targets_mean": 4578.6,
"valid_targets_min": 826
},
{
"epoch": 2.4741379310344827,
"grad_norm": 0.7053303469776532,
"learning_rate": 3.2683711414543295e-05,
"loss": 0.5272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21549789607524872,
"step": 1435,
"valid_targets_mean": 2838.2,
"valid_targets_min": 1878
},
{
"epoch": 2.4827586206896552,
"grad_norm": 0.7720525074341179,
"learning_rate": 3.261711879645737e-05,
"loss": 0.5284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23706737160682678,
"step": 1440,
"valid_targets_mean": 2927.0,
"valid_targets_min": 1586
},
{
"epoch": 2.4913793103448274,
"grad_norm": 0.6610418282529897,
"learning_rate": 3.255029301399873e-05,
"loss": 0.5382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.260223925113678,
"step": 1445,
"valid_targets_mean": 3151.2,
"valid_targets_min": 971
},
{
"epoch": 2.5,
"grad_norm": 0.6761189439890816,
"learning_rate": 3.248323530210793e-05,
"loss": 0.5382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32373419404029846,
"step": 1450,
"valid_targets_mean": 3626.5,
"valid_targets_min": 1237
},
{
"epoch": 2.5086206896551726,
"grad_norm": 0.6059901254993909,
"learning_rate": 3.241594690001157e-05,
"loss": 0.5212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2417319416999817,
"step": 1455,
"valid_targets_mean": 4077.8,
"valid_targets_min": 1227
},
{
"epoch": 2.5172413793103448,
"grad_norm": 0.6563136263005875,
"learning_rate": 3.2348429051199424e-05,
"loss": 0.5293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2823067605495453,
"step": 1460,
"valid_targets_mean": 3091.4,
"valid_targets_min": 1724
},
{
"epoch": 2.5258620689655173,
"grad_norm": 0.7011191203587458,
"learning_rate": 3.228068300340142e-05,
"loss": 0.4991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21909786760807037,
"step": 1465,
"valid_targets_mean": 2642.6,
"valid_targets_min": 333
},
{
"epoch": 2.5344827586206895,
"grad_norm": 0.5963350141222057,
"learning_rate": 3.221271000856462e-05,
"loss": 0.5457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24788910150527954,
"step": 1470,
"valid_targets_mean": 4478.2,
"valid_targets_min": 1019
},
{
"epoch": 2.543103448275862,
"grad_norm": 0.593167616912684,
"learning_rate": 3.214451132283006e-05,
"loss": 0.527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1979059875011444,
"step": 1475,
"valid_targets_mean": 3345.1,
"valid_targets_min": 447
},
{
"epoch": 2.5517241379310347,
"grad_norm": 0.8516404992092461,
"learning_rate": 3.207608820650955e-05,
"loss": 0.5231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16317282617092133,
"step": 1480,
"valid_targets_mean": 1854.1,
"valid_targets_min": 572
},
{
"epoch": 2.560344827586207,
"grad_norm": 0.7011631826201656,
"learning_rate": 3.2007441924062374e-05,
"loss": 0.5337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26514554023742676,
"step": 1485,
"valid_targets_mean": 3083.2,
"valid_targets_min": 1483
},
{
"epoch": 2.5689655172413794,
"grad_norm": 0.6304731407800173,
"learning_rate": 3.193857374407192e-05,
"loss": 0.48,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2470451146364212,
"step": 1490,
"valid_targets_mean": 4148.5,
"valid_targets_min": 1957
},
{
"epoch": 2.5775862068965516,
"grad_norm": 0.6114733267413521,
"learning_rate": 3.186948493922225e-05,
"loss": 0.547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3491957187652588,
"step": 1495,
"valid_targets_mean": 5381.4,
"valid_targets_min": 1451
},
{
"epoch": 2.586206896551724,
"grad_norm": 0.6816944170488414,
"learning_rate": 3.180017678627458e-05,
"loss": 0.5967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2270176112651825,
"step": 1500,
"valid_targets_mean": 3054.8,
"valid_targets_min": 1323
},
{
"epoch": 2.594827586206897,
"grad_norm": 0.7494842689929292,
"learning_rate": 3.173065056604366e-05,
"loss": 0.5136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2226772904396057,
"step": 1505,
"valid_targets_mean": 2615.2,
"valid_targets_min": 1722
},
{
"epoch": 2.603448275862069,
"grad_norm": 0.6433063056386409,
"learning_rate": 3.166090756337415e-05,
"loss": 0.5177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21712681651115417,
"step": 1510,
"valid_targets_mean": 2954.0,
"valid_targets_min": 1400
},
{
"epoch": 2.612068965517241,
"grad_norm": 0.6961184844546833,
"learning_rate": 3.159094906711683e-05,
"loss": 0.5239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3057723343372345,
"step": 1515,
"valid_targets_mean": 3615.5,
"valid_targets_min": 1354
},
{
"epoch": 2.6206896551724137,
"grad_norm": 0.545448810661674,
"learning_rate": 3.15207763701048e-05,
"loss": 0.5392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17520517110824585,
"step": 1520,
"valid_targets_mean": 3273.5,
"valid_targets_min": 810
},
{
"epoch": 2.6293103448275863,
"grad_norm": 0.7398151880436875,
"learning_rate": 3.14503907691296e-05,
"loss": 0.5192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3340669572353363,
"step": 1525,
"valid_targets_mean": 4266.0,
"valid_targets_min": 1420
},
{
"epoch": 2.637931034482759,
"grad_norm": 0.6137448794815791,
"learning_rate": 3.1379793564917235e-05,
"loss": 0.5231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2983524799346924,
"step": 1530,
"valid_targets_mean": 3807.5,
"valid_targets_min": 1186
},
{
"epoch": 2.646551724137931,
"grad_norm": 0.6892239692209475,
"learning_rate": 3.130898606210414e-05,
"loss": 0.5334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3036305010318756,
"step": 1535,
"valid_targets_mean": 3669.1,
"valid_targets_min": 1027
},
{
"epoch": 2.655172413793103,
"grad_norm": 0.6042307659721222,
"learning_rate": 3.1237969569213056e-05,
"loss": 0.5045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24306747317314148,
"step": 1540,
"valid_targets_mean": 4035.2,
"valid_targets_min": 542
},
{
"epoch": 2.663793103448276,
"grad_norm": 0.8334671686011501,
"learning_rate": 3.1166745398628874e-05,
"loss": 0.5805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19789639115333557,
"step": 1545,
"valid_targets_mean": 2123.8,
"valid_targets_min": 1039
},
{
"epoch": 2.6724137931034484,
"grad_norm": 0.6708117196991292,
"learning_rate": 3.109531486657437e-05,
"loss": 0.5227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20612336695194244,
"step": 1550,
"valid_targets_mean": 2896.1,
"valid_targets_min": 525
},
{
"epoch": 2.6810344827586206,
"grad_norm": 0.648789931136324,
"learning_rate": 3.102367929308586e-05,
"loss": 0.4925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2443523108959198,
"step": 1555,
"valid_targets_mean": 3337.5,
"valid_targets_min": 355
},
{
"epoch": 2.689655172413793,
"grad_norm": 0.6629620042366543,
"learning_rate": 3.0951840001988854e-05,
"loss": 0.5205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35953301191329956,
"step": 1560,
"valid_targets_mean": 4085.9,
"valid_targets_min": 1662
},
{
"epoch": 2.6982758620689653,
"grad_norm": 0.6425392266887242,
"learning_rate": 3.0879798320873546e-05,
"loss": 0.5215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3335888683795929,
"step": 1565,
"valid_targets_mean": 4582.8,
"valid_targets_min": 305
},
{
"epoch": 2.706896551724138,
"grad_norm": 0.6788939491162826,
"learning_rate": 3.0807555581070304e-05,
"loss": 0.5386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21099033951759338,
"step": 1570,
"valid_targets_mean": 2514.8,
"valid_targets_min": 379
},
{
"epoch": 2.7155172413793105,
"grad_norm": 0.5663003368589072,
"learning_rate": 3.0735113117625045e-05,
"loss": 0.5191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2197110652923584,
"step": 1575,
"valid_targets_mean": 3289.1,
"valid_targets_min": 1913
},
{
"epoch": 2.7241379310344827,
"grad_norm": 0.6638782454802991,
"learning_rate": 3.0662472269274617e-05,
"loss": 0.5152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2275673747062683,
"step": 1580,
"valid_targets_mean": 2688.1,
"valid_targets_min": 808
},
{
"epoch": 2.7327586206896552,
"grad_norm": 0.6255538446405725,
"learning_rate": 3.058963437842198e-05,
"loss": 0.5289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22095435857772827,
"step": 1585,
"valid_targets_mean": 3796.5,
"valid_targets_min": 278
},
{
"epoch": 2.7413793103448274,
"grad_norm": 0.7320428985273902,
"learning_rate": 3.0516600791111465e-05,
"loss": 0.5589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32439008355140686,
"step": 1590,
"valid_targets_mean": 3684.9,
"valid_targets_min": 1568
},
{
"epoch": 2.75,
"grad_norm": 0.6438464021090996,
"learning_rate": 3.0443372857003857e-05,
"loss": 0.54,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23027420043945312,
"step": 1595,
"valid_targets_mean": 3581.9,
"valid_targets_min": 824
},
{
"epoch": 2.7586206896551726,
"grad_norm": 0.5545857332698958,
"learning_rate": 3.036995192935149e-05,
"loss": 0.5087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14524194598197937,
"step": 1600,
"valid_targets_mean": 2816.8,
"valid_targets_min": 856
},
{
"epoch": 2.7672413793103448,
"grad_norm": 0.5086626682547694,
"learning_rate": 3.029633936497321e-05,
"loss": 0.5171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1898607611656189,
"step": 1605,
"valid_targets_mean": 4273.4,
"valid_targets_min": 1829
},
{
"epoch": 2.7758620689655173,
"grad_norm": 0.6651291467249401,
"learning_rate": 3.0222536524229293e-05,
"loss": 0.4846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34460657835006714,
"step": 1610,
"valid_targets_mean": 4023.6,
"valid_targets_min": 422
},
{
"epoch": 2.7844827586206895,
"grad_norm": 0.6564925258448345,
"learning_rate": 3.0148544770996343e-05,
"loss": 0.5208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18299517035484314,
"step": 1615,
"valid_targets_mean": 2348.9,
"valid_targets_min": 815
},
{
"epoch": 2.793103448275862,
"grad_norm": 0.6070334989595733,
"learning_rate": 3.007436547264207e-05,
"loss": 0.5325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28292137384414673,
"step": 1620,
"valid_targets_mean": 4357.8,
"valid_targets_min": 1053
},
{
"epoch": 2.8017241379310347,
"grad_norm": 0.6572055384794816,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.5248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29250192642211914,
"step": 1625,
"valid_targets_mean": 5173.9,
"valid_targets_min": 2061
},
{
"epoch": 2.810344827586207,
"grad_norm": 0.6925557917291159,
"learning_rate": 2.9925449727344184e-05,
"loss": 0.5264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30762213468551636,
"step": 1630,
"valid_targets_mean": 3761.1,
"valid_targets_min": 1011
},
{
"epoch": 2.8189655172413794,
"grad_norm": 0.6649410248775828,
"learning_rate": 2.985071603236374e-05,
"loss": 0.5271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22346317768096924,
"step": 1635,
"valid_targets_mean": 2541.2,
"valid_targets_min": 464
},
{
"epoch": 2.8275862068965516,
"grad_norm": 0.6368963124979056,
"learning_rate": 2.9775800296137474e-05,
"loss": 0.5056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19894252717494965,
"step": 1640,
"valid_targets_mean": 2954.8,
"valid_targets_min": 507
},
{
"epoch": 2.836206896551724,
"grad_norm": 0.6563286820648637,
"learning_rate": 2.970070390310828e-05,
"loss": 0.5365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22569561004638672,
"step": 1645,
"valid_targets_mean": 3002.4,
"valid_targets_min": 858
},
{
"epoch": 2.844827586206897,
"grad_norm": 0.735343254781571,
"learning_rate": 2.962542824105762e-05,
"loss": 0.5358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2973644733428955,
"step": 1650,
"valid_targets_mean": 4036.9,
"valid_targets_min": 753
},
{
"epoch": 2.853448275862069,
"grad_norm": 0.5751232737303497,
"learning_rate": 2.954997470107982e-05,
"loss": 0.4989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16975465416908264,
"step": 1655,
"valid_targets_mean": 2872.4,
"valid_targets_min": 563
},
{
"epoch": 2.862068965517241,
"grad_norm": 0.7517885308967944,
"learning_rate": 2.947434467755641e-05,
"loss": 0.5731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31603339314460754,
"step": 1660,
"valid_targets_mean": 2926.6,
"valid_targets_min": 1582
},
{
"epoch": 2.8706896551724137,
"grad_norm": 0.6477449192786452,
"learning_rate": 2.9398539568130327e-05,
"loss": 0.5898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31569886207580566,
"step": 1665,
"valid_targets_mean": 2998.9,
"valid_targets_min": 350
},
{
"epoch": 2.8793103448275863,
"grad_norm": 0.6412838960401286,
"learning_rate": 2.9322560773680087e-05,
"loss": 0.4843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672387361526489,
"step": 1670,
"valid_targets_mean": 3486.6,
"valid_targets_min": 464
},
{
"epoch": 2.887931034482759,
"grad_norm": 0.6584277587208057,
"learning_rate": 2.924640969829393e-05,
"loss": 0.5575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27888116240501404,
"step": 1675,
"valid_targets_mean": 3456.2,
"valid_targets_min": 1280
},
{
"epoch": 2.896551724137931,
"grad_norm": 0.6355034785984488,
"learning_rate": 2.9170087749243832e-05,
"loss": 0.5556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2856561541557312,
"step": 1680,
"valid_targets_mean": 4470.8,
"valid_targets_min": 777
},
{
"epoch": 2.905172413793103,
"grad_norm": 0.5522129444874521,
"learning_rate": 2.9093596336959513e-05,
"loss": 0.5217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21474653482437134,
"step": 1685,
"valid_targets_mean": 3683.0,
"valid_targets_min": 556
},
{
"epoch": 2.913793103448276,
"grad_norm": 0.6079117430065913,
"learning_rate": 2.9016936875002377e-05,
"loss": 0.5326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18614447116851807,
"step": 1690,
"valid_targets_mean": 2769.2,
"valid_targets_min": 1703
},
{
"epoch": 2.9224137931034484,
"grad_norm": 0.8154640803310477,
"learning_rate": 2.8940110780039385e-05,
"loss": 0.5368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3220832049846649,
"step": 1695,
"valid_targets_mean": 4347.4,
"valid_targets_min": 455
},
{
"epoch": 2.9310344827586206,
"grad_norm": 0.7008249840337234,
"learning_rate": 2.8863119471816878e-05,
"loss": 0.5359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.307187557220459,
"step": 1700,
"valid_targets_mean": 3782.1,
"valid_targets_min": 1743
},
{
"epoch": 2.939655172413793,
"grad_norm": 1.8383581207079867,
"learning_rate": 2.878596437313434e-05,
"loss": 0.5455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3547545075416565,
"step": 1705,
"valid_targets_mean": 3102.1,
"valid_targets_min": 1146
},
{
"epoch": 2.9482758620689653,
"grad_norm": 0.6890582013953978,
"learning_rate": 2.87086469098181e-05,
"loss": 0.5464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3087565302848816,
"step": 1710,
"valid_targets_mean": 3642.0,
"valid_targets_min": 785
},
{
"epoch": 2.956896551724138,
"grad_norm": 0.6014663654543025,
"learning_rate": 2.863116851069499e-05,
"loss": 0.5198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3157251477241516,
"step": 1715,
"valid_targets_mean": 4566.4,
"valid_targets_min": 1703
},
{
"epoch": 2.9655172413793105,
"grad_norm": 0.6183718750559749,
"learning_rate": 2.855353060756593e-05,
"loss": 0.5583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3171611428260803,
"step": 1720,
"valid_targets_mean": 4044.4,
"valid_targets_min": 921
},
{
"epoch": 2.9741379310344827,
"grad_norm": 0.6770199017058159,
"learning_rate": 2.8475734635179472e-05,
"loss": 0.5231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20549774169921875,
"step": 1725,
"valid_targets_mean": 2707.2,
"valid_targets_min": 786
},
{
"epoch": 2.9827586206896552,
"grad_norm": 0.6267781432228309,
"learning_rate": 2.8397782031205295e-05,
"loss": 0.5278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3000187277793884,
"step": 1730,
"valid_targets_mean": 4574.9,
"valid_targets_min": 382
},
{
"epoch": 2.9913793103448274,
"grad_norm": 0.6597096565482661,
"learning_rate": 2.8319674236207634e-05,
"loss": 0.492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2720503807067871,
"step": 1735,
"valid_targets_mean": 3237.6,
"valid_targets_min": 315
},
{
"epoch": 3.0,
"grad_norm": 0.6370988041102025,
"learning_rate": 2.8241412693618638e-05,
"loss": 0.5817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47008463740348816,
"step": 1740,
"valid_targets_mean": 5323.2,
"valid_targets_min": 791
},
{
"epoch": 3.0086206896551726,
"grad_norm": 0.5006687241913529,
"learning_rate": 2.816299884971173e-05,
"loss": 0.5026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24396368861198425,
"step": 1745,
"valid_targets_mean": 5369.8,
"valid_targets_min": 2674
},
{
"epoch": 3.0172413793103448,
"grad_norm": 0.5939923129308482,
"learning_rate": 2.8084434153574847e-05,
"loss": 0.5129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22303283214569092,
"step": 1750,
"valid_targets_mean": 3715.1,
"valid_targets_min": 1836
},
{
"epoch": 3.0258620689655173,
"grad_norm": 0.7216174616024418,
"learning_rate": 2.8005720057083685e-05,
"loss": 0.5277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28930047154426575,
"step": 1755,
"valid_targets_mean": 3260.1,
"valid_targets_min": 1785
},
{
"epoch": 3.0344827586206895,
"grad_norm": 0.7138077000722072,
"learning_rate": 2.792685801487486e-05,
"loss": 0.5313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21426135301589966,
"step": 1760,
"valid_targets_mean": 2808.0,
"valid_targets_min": 1549
},
{
"epoch": 3.043103448275862,
"grad_norm": 0.6304834277842427,
"learning_rate": 2.7847849484319008e-05,
"loss": 0.469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.240925133228302,
"step": 1765,
"valid_targets_mean": 4177.4,
"valid_targets_min": 1711
},
{
"epoch": 3.0517241379310347,
"grad_norm": 0.7227466624603867,
"learning_rate": 2.7768695925493897e-05,
"loss": 0.5099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26144564151763916,
"step": 1770,
"valid_targets_mean": 3339.5,
"valid_targets_min": 306
},
{
"epoch": 3.060344827586207,
"grad_norm": 0.7157335610062132,
"learning_rate": 2.7689398801157393e-05,
"loss": 0.494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26888376474380493,
"step": 1775,
"valid_targets_mean": 3690.0,
"valid_targets_min": 1804
},
{
"epoch": 3.0689655172413794,
"grad_norm": 0.5782389133302738,
"learning_rate": 2.7609959576720467e-05,
"loss": 0.4676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19823557138442993,
"step": 1780,
"valid_targets_mean": 3715.9,
"valid_targets_min": 505
},
{
"epoch": 3.0775862068965516,
"grad_norm": 0.7773493115682202,
"learning_rate": 2.7530379720220096e-05,
"loss": 0.4946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1992146074771881,
"step": 1785,
"valid_targets_mean": 2262.2,
"valid_targets_min": 663
},
{
"epoch": 3.086206896551724,
"grad_norm": 0.741058590026973,
"learning_rate": 2.7450660702292132e-05,
"loss": 0.4946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29747503995895386,
"step": 1790,
"valid_targets_mean": 3664.2,
"valid_targets_min": 754
},
{
"epoch": 3.0948275862068964,
"grad_norm": 0.6655355159285354,
"learning_rate": 2.7370803996144143e-05,
"loss": 0.5224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30806177854537964,
"step": 1795,
"valid_targets_mean": 4508.5,
"valid_targets_min": 1059
},
{
"epoch": 3.103448275862069,
"grad_norm": 0.7684487595267243,
"learning_rate": 2.7290811077528166e-05,
"loss": 0.5114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24772027134895325,
"step": 1800,
"valid_targets_mean": 2500.2,
"valid_targets_min": 1039
},
{
"epoch": 3.1120689655172415,
"grad_norm": 0.5519635037547266,
"learning_rate": 2.7210683424713447e-05,
"loss": 0.5154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18051207065582275,
"step": 1805,
"valid_targets_mean": 4038.2,
"valid_targets_min": 1334
},
{
"epoch": 3.1206896551724137,
"grad_norm": 0.7459536824641055,
"learning_rate": 2.7130422518459113e-05,
"loss": 0.4894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261766254901886,
"step": 1810,
"valid_targets_mean": 3044.9,
"valid_targets_min": 1218
},
{
"epoch": 3.1293103448275863,
"grad_norm": 0.5779130633158371,
"learning_rate": 2.705002984198684e-05,
"loss": 0.4887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20895667374134064,
"step": 1815,
"valid_targets_mean": 4266.2,
"valid_targets_min": 1510
},
{
"epoch": 3.1379310344827585,
"grad_norm": 0.6672732033247093,
"learning_rate": 2.6969506880953384e-05,
"loss": 0.4987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21796973049640656,
"step": 1820,
"valid_targets_mean": 3656.4,
"valid_targets_min": 1407
},
{
"epoch": 3.146551724137931,
"grad_norm": 0.6777179149459249,
"learning_rate": 2.688885512342318e-05,
"loss": 0.4933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26772722601890564,
"step": 1825,
"valid_targets_mean": 4573.4,
"valid_targets_min": 570
},
{
"epoch": 3.1551724137931036,
"grad_norm": 0.7747681268810057,
"learning_rate": 2.680807605984082e-05,
"loss": 0.503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.354011595249176,
"step": 1830,
"valid_targets_mean": 3500.1,
"valid_targets_min": 877
},
{
"epoch": 3.163793103448276,
"grad_norm": 0.6555975732510367,
"learning_rate": 2.6727171183003502e-05,
"loss": 0.4637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22615736722946167,
"step": 1835,
"valid_targets_mean": 3957.8,
"valid_targets_min": 1602
},
{
"epoch": 3.1724137931034484,
"grad_norm": 0.6815734089237001,
"learning_rate": 2.6646141988033475e-05,
"loss": 0.5291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22214952111244202,
"step": 1840,
"valid_targets_mean": 2964.4,
"valid_targets_min": 781
},
{
"epoch": 3.1810344827586206,
"grad_norm": 0.6380099116738308,
"learning_rate": 2.6564989972350364e-05,
"loss": 0.4798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.229619562625885,
"step": 1845,
"valid_targets_mean": 4561.1,
"valid_targets_min": 1693
},
{
"epoch": 3.189655172413793,
"grad_norm": 0.604404711071115,
"learning_rate": 2.6483716635643535e-05,
"loss": 0.5054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33196941018104553,
"step": 1850,
"valid_targets_mean": 5268.6,
"valid_targets_min": 854
},
{
"epoch": 3.1982758620689653,
"grad_norm": 0.6726535401662077,
"learning_rate": 2.6402323479844364e-05,
"loss": 0.5099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2879241406917572,
"step": 1855,
"valid_targets_mean": 3671.5,
"valid_targets_min": 674
},
{
"epoch": 3.206896551724138,
"grad_norm": 0.6445858526652752,
"learning_rate": 2.6320812009098472e-05,
"loss": 0.4887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1965891420841217,
"step": 1860,
"valid_targets_mean": 4424.1,
"valid_targets_min": 644
},
{
"epoch": 3.2155172413793105,
"grad_norm": 0.7543347211262738,
"learning_rate": 2.6239183729737957e-05,
"loss": 0.5032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20700570940971375,
"step": 1865,
"valid_targets_mean": 3542.0,
"valid_targets_min": 1627
},
{
"epoch": 3.2241379310344827,
"grad_norm": 0.635457218042516,
"learning_rate": 2.6157440150253535e-05,
"loss": 0.4891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22845527529716492,
"step": 1870,
"valid_targets_mean": 3959.0,
"valid_targets_min": 422
},
{
"epoch": 3.2327586206896552,
"grad_norm": 0.7224438201544804,
"learning_rate": 2.6075582781266665e-05,
"loss": 0.4711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23363882303237915,
"step": 1875,
"valid_targets_mean": 3106.1,
"valid_targets_min": 348
},
{
"epoch": 3.2413793103448274,
"grad_norm": 0.7469170275128653,
"learning_rate": 2.5993613135501643e-05,
"loss": 0.526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26454028487205505,
"step": 1880,
"valid_targets_mean": 3685.9,
"valid_targets_min": 1384
},
{
"epoch": 3.25,
"grad_norm": 0.8467283740580998,
"learning_rate": 2.5911532727757625e-05,
"loss": 0.5166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2143116295337677,
"step": 1885,
"valid_targets_mean": 2019.8,
"valid_targets_min": 594
},
{
"epoch": 3.2586206896551726,
"grad_norm": 0.714157813357512,
"learning_rate": 2.582934307488067e-05,
"loss": 0.489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25460219383239746,
"step": 1890,
"valid_targets_mean": 2973.9,
"valid_targets_min": 1539
},
{
"epoch": 3.2672413793103448,
"grad_norm": 0.6119264269910555,
"learning_rate": 2.5747045695735674e-05,
"loss": 0.512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3362063765525818,
"step": 1895,
"valid_targets_mean": 5818.9,
"valid_targets_min": 1128
},
{
"epoch": 3.2758620689655173,
"grad_norm": 0.6722720740574156,
"learning_rate": 2.5664642111178312e-05,
"loss": 0.4917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25751858949661255,
"step": 1900,
"valid_targets_mean": 3154.4,
"valid_targets_min": 274
},
{
"epoch": 3.2844827586206895,
"grad_norm": 0.6899167832115443,
"learning_rate": 2.5582133844026943e-05,
"loss": 0.5095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2338351607322693,
"step": 1905,
"valid_targets_mean": 3443.5,
"valid_targets_min": 815
},
{
"epoch": 3.293103448275862,
"grad_norm": 0.6885008624009163,
"learning_rate": 2.5499522419034462e-05,
"loss": 0.4983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2654280662536621,
"step": 1910,
"valid_targets_mean": 3975.5,
"valid_targets_min": 464
},
{
"epoch": 3.3017241379310347,
"grad_norm": 0.693540405884434,
"learning_rate": 2.5416809362860107e-05,
"loss": 0.4699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2041737139225006,
"step": 1915,
"valid_targets_mean": 3395.4,
"valid_targets_min": 1520
},
{
"epoch": 3.310344827586207,
"grad_norm": 0.6970513975428828,
"learning_rate": 2.5333996204041276e-05,
"loss": 0.4984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3178594708442688,
"step": 1920,
"valid_targets_mean": 3556.8,
"valid_targets_min": 1146
},
{
"epoch": 3.3189655172413794,
"grad_norm": 0.6954967899107553,
"learning_rate": 2.5251084472965257e-05,
"loss": 0.4865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17998085916042328,
"step": 1925,
"valid_targets_mean": 2760.6,
"valid_targets_min": 998
},
{
"epoch": 3.3275862068965516,
"grad_norm": 0.6046125422661831,
"learning_rate": 2.5168075701840948e-05,
"loss": 0.5053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15390408039093018,
"step": 1930,
"valid_targets_mean": 3165.2,
"valid_targets_min": 1413
},
{
"epoch": 3.336206896551724,
"grad_norm": 0.5960966625837508,
"learning_rate": 2.5084971424670568e-05,
"loss": 0.4869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35475805401802063,
"step": 1935,
"valid_targets_mean": 4783.4,
"valid_targets_min": 1444
},
{
"epoch": 3.344827586206897,
"grad_norm": 0.7763661645104593,
"learning_rate": 2.500177317722126e-05,
"loss": 0.5187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23105254769325256,
"step": 1940,
"valid_targets_mean": 2399.2,
"valid_targets_min": 916
},
{
"epoch": 3.353448275862069,
"grad_norm": 0.6779936365212638,
"learning_rate": 2.4918482496996757e-05,
"loss": 0.4934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19377613067626953,
"step": 1945,
"valid_targets_mean": 2806.4,
"valid_targets_min": 728
},
{
"epoch": 3.3620689655172415,
"grad_norm": 0.605208783856609,
"learning_rate": 2.483510092320895e-05,
"loss": 0.475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1888284683227539,
"step": 1950,
"valid_targets_mean": 3616.1,
"valid_targets_min": 1234
},
{
"epoch": 3.3706896551724137,
"grad_norm": 0.6789435419175992,
"learning_rate": 2.4751629996749427e-05,
"loss": 0.5092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2218063771724701,
"step": 1955,
"valid_targets_mean": 3372.0,
"valid_targets_min": 655
},
{
"epoch": 3.3793103448275863,
"grad_norm": 0.7475419933802377,
"learning_rate": 2.4668071260161022e-05,
"loss": 0.5067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542641758918762,
"step": 1960,
"valid_targets_mean": 2348.0,
"valid_targets_min": 1132
},
{
"epoch": 3.3879310344827585,
"grad_norm": 0.7582425874011535,
"learning_rate": 2.4584426257609315e-05,
"loss": 0.5271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34427642822265625,
"step": 1965,
"valid_targets_mean": 3218.0,
"valid_targets_min": 642
},
{
"epoch": 3.396551724137931,
"grad_norm": 0.7337643514205625,
"learning_rate": 2.4500696534854062e-05,
"loss": 0.4802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2051694095134735,
"step": 1970,
"valid_targets_mean": 2417.1,
"valid_targets_min": 367
},
{
"epoch": 3.405172413793103,
"grad_norm": 0.6417616249105758,
"learning_rate": 2.4416883639220647e-05,
"loss": 0.4867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26043596863746643,
"step": 1975,
"valid_targets_mean": 3970.5,
"valid_targets_min": 1043
},
{
"epoch": 3.413793103448276,
"grad_norm": 0.6730591273563613,
"learning_rate": 2.4332989119571506e-05,
"loss": 0.4553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2515748143196106,
"step": 1980,
"valid_targets_mean": 3129.4,
"valid_targets_min": 840
},
{
"epoch": 3.4224137931034484,
"grad_norm": 0.6291444527805404,
"learning_rate": 2.4249014526277473e-05,
"loss": 0.5206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3734513521194458,
"step": 1985,
"valid_targets_mean": 4917.1,
"valid_targets_min": 1643
},
{
"epoch": 3.4310344827586206,
"grad_norm": 0.6094709452717426,
"learning_rate": 2.416496141118915e-05,
"loss": 0.4911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2604672312736511,
"step": 1990,
"valid_targets_mean": 4694.5,
"valid_targets_min": 1146
},
{
"epoch": 3.439655172413793,
"grad_norm": 0.9224302977758335,
"learning_rate": 2.4080831327608224e-05,
"loss": 0.4891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28474128246307373,
"step": 1995,
"valid_targets_mean": 2746.2,
"valid_targets_min": 645
},
{
"epoch": 3.4482758620689653,
"grad_norm": 0.6913692015061919,
"learning_rate": 2.3996625830258742e-05,
"loss": 0.4678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24615857005119324,
"step": 2000,
"valid_targets_mean": 3448.2,
"valid_targets_min": 1630
},
{
"epoch": 3.456896551724138,
"grad_norm": 0.7680712640173568,
"learning_rate": 2.3912346475258424e-05,
"loss": 0.4757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20221805572509766,
"step": 2005,
"valid_targets_mean": 2574.9,
"valid_targets_min": 565
},
{
"epoch": 3.4655172413793105,
"grad_norm": 0.635108180966016,
"learning_rate": 2.3827994820089856e-05,
"loss": 0.5233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32651764154434204,
"step": 2010,
"valid_targets_mean": 4662.1,
"valid_targets_min": 1373
},
{
"epoch": 3.4741379310344827,
"grad_norm": 0.740260789953024,
"learning_rate": 2.3743572423571752e-05,
"loss": 0.5045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.287661612033844,
"step": 2015,
"valid_targets_mean": 3843.0,
"valid_targets_min": 1769
},
{
"epoch": 3.4827586206896552,
"grad_norm": 0.7038105239975521,
"learning_rate": 2.365908084583011e-05,
"loss": 0.4831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31129515171051025,
"step": 2020,
"valid_targets_mean": 4296.4,
"valid_targets_min": 1580
},
{
"epoch": 3.4913793103448274,
"grad_norm": 0.6372501954816124,
"learning_rate": 2.3574521648269406e-05,
"loss": 0.4977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1579384207725525,
"step": 2025,
"valid_targets_mean": 2607.8,
"valid_targets_min": 1195
},
{
"epoch": 3.5,
"grad_norm": 0.618822719912611,
"learning_rate": 2.3489896393543717e-05,
"loss": 0.5425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24836230278015137,
"step": 2030,
"valid_targets_mean": 3427.4,
"valid_targets_min": 1491
},
{
"epoch": 3.5086206896551726,
"grad_norm": 0.6939708126805756,
"learning_rate": 2.340520664552788e-05,
"loss": 0.4841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1540481150150299,
"step": 2035,
"valid_targets_mean": 2188.2,
"valid_targets_min": 853
},
{
"epoch": 3.5172413793103448,
"grad_norm": 0.6632351331782165,
"learning_rate": 2.3320453969288553e-05,
"loss": 0.5268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2977678179740906,
"step": 2040,
"valid_targets_mean": 4092.8,
"valid_targets_min": 1544
},
{
"epoch": 3.5258620689655173,
"grad_norm": 0.7073877534358624,
"learning_rate": 2.32356399310553e-05,
"loss": 0.4762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23784738779067993,
"step": 2045,
"valid_targets_mean": 2905.9,
"valid_targets_min": 1383
},
{
"epoch": 3.5344827586206895,
"grad_norm": 0.6296400085161705,
"learning_rate": 2.3150766098191667e-05,
"loss": 0.5148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32230597734451294,
"step": 2050,
"valid_targets_mean": 5635.5,
"valid_targets_min": 1954
},
{
"epoch": 3.543103448275862,
"grad_norm": 0.6033249092992661,
"learning_rate": 2.3065834039166212e-05,
"loss": 0.4714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18579596281051636,
"step": 2055,
"valid_targets_mean": 3727.8,
"valid_targets_min": 1319
},
{
"epoch": 3.5517241379310347,
"grad_norm": 0.6645454654059848,
"learning_rate": 2.2980845323523487e-05,
"loss": 0.5103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31462427973747253,
"step": 2060,
"valid_targets_mean": 4143.9,
"valid_targets_min": 1388
},
{
"epoch": 3.560344827586207,
"grad_norm": 0.7143907035845465,
"learning_rate": 2.2895801521855096e-05,
"loss": 0.4634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23505531251430511,
"step": 2065,
"valid_targets_mean": 3194.8,
"valid_targets_min": 767
},
{
"epoch": 3.5689655172413794,
"grad_norm": 0.6500578607981675,
"learning_rate": 2.2810704205770587e-05,
"loss": 0.5166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32650500535964966,
"step": 2070,
"valid_targets_mean": 4477.2,
"valid_targets_min": 492
},
{
"epoch": 3.5775862068965516,
"grad_norm": 0.7229860852185133,
"learning_rate": 2.2725554947868495e-05,
"loss": 0.5121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2526986002922058,
"step": 2075,
"valid_targets_mean": 3047.9,
"valid_targets_min": 1887
},
{
"epoch": 3.586206896551724,
"grad_norm": 0.7627338670987832,
"learning_rate": 2.2640355321707218e-05,
"loss": 0.4954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.332661509513855,
"step": 2080,
"valid_targets_mean": 3330.1,
"valid_targets_min": 786
},
{
"epoch": 3.594827586206897,
"grad_norm": 0.6869482734837352,
"learning_rate": 2.2555106901775955e-05,
"loss": 0.5149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26278042793273926,
"step": 2085,
"valid_targets_mean": 3234.6,
"valid_targets_min": 1015
},
{
"epoch": 3.603448275862069,
"grad_norm": 0.718849337496441,
"learning_rate": 2.246981126346564e-05,
"loss": 0.488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1774282157421112,
"step": 2090,
"valid_targets_mean": 2628.5,
"valid_targets_min": 449
},
{
"epoch": 3.612068965517241,
"grad_norm": 0.6200784407794563,
"learning_rate": 2.238446998303977e-05,
"loss": 0.5258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27215301990509033,
"step": 2095,
"valid_targets_mean": 3960.6,
"valid_targets_min": 1863
},
{
"epoch": 3.6206896551724137,
"grad_norm": 0.7332072518118599,
"learning_rate": 2.2299084637605343e-05,
"loss": 0.481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2048092931509018,
"step": 2100,
"valid_targets_mean": 2481.8,
"valid_targets_min": 728
},
{
"epoch": 3.6293103448275863,
"grad_norm": 0.7172691824388733,
"learning_rate": 2.221365680508364e-05,
"loss": 0.4647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23591715097427368,
"step": 2105,
"valid_targets_mean": 2745.5,
"valid_targets_min": 837
},
{
"epoch": 3.637931034482759,
"grad_norm": 0.7339486648404044,
"learning_rate": 2.2128188064181143e-05,
"loss": 0.4893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19370971620082855,
"step": 2110,
"valid_targets_mean": 3371.1,
"valid_targets_min": 1676
},
{
"epoch": 3.646551724137931,
"grad_norm": 0.6893113432210646,
"learning_rate": 2.2042679994360296e-05,
"loss": 0.4478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32415205240249634,
"step": 2115,
"valid_targets_mean": 3909.2,
"valid_targets_min": 1739
},
{
"epoch": 3.655172413793103,
"grad_norm": 0.7281686902973696,
"learning_rate": 2.195713417581033e-05,
"loss": 0.4897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24168765544891357,
"step": 2120,
"valid_targets_mean": 4198.9,
"valid_targets_min": 1165
},
{
"epoch": 3.663793103448276,
"grad_norm": 0.6199759210387455,
"learning_rate": 2.1871552189418113e-05,
"loss": 0.4874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26401397585868835,
"step": 2125,
"valid_targets_mean": 4291.9,
"valid_targets_min": 2534
},
{
"epoch": 3.6724137931034484,
"grad_norm": 0.8452521663580951,
"learning_rate": 2.1785935616738855e-05,
"loss": 0.4733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19978295266628265,
"step": 2130,
"valid_targets_mean": 2012.5,
"valid_targets_min": 603
},
{
"epoch": 3.6810344827586206,
"grad_norm": 0.5985029280720291,
"learning_rate": 2.170028603996695e-05,
"loss": 0.4938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24260295927524567,
"step": 2135,
"valid_targets_mean": 5161.2,
"valid_targets_min": 2410
},
{
"epoch": 3.689655172413793,
"grad_norm": 0.648017450021513,
"learning_rate": 2.161460504190668e-05,
"loss": 0.4949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2743348777294159,
"step": 2140,
"valid_targets_mean": 4066.6,
"valid_targets_min": 2103
},
{
"epoch": 3.6982758620689653,
"grad_norm": 0.5452730933756482,
"learning_rate": 2.1528894205943017e-05,
"loss": 0.5007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28508615493774414,
"step": 2145,
"valid_targets_mean": 5361.5,
"valid_targets_min": 1637
},
{
"epoch": 3.706896551724138,
"grad_norm": 0.6408652868463778,
"learning_rate": 2.1443155116012328e-05,
"loss": 0.5788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25458598136901855,
"step": 2150,
"valid_targets_mean": 3966.1,
"valid_targets_min": 2205
},
{
"epoch": 3.7155172413793105,
"grad_norm": 0.6158141746313681,
"learning_rate": 2.1357389356573098e-05,
"loss": 0.4627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16511517763137817,
"step": 2155,
"valid_targets_mean": 2890.8,
"valid_targets_min": 1528
},
{
"epoch": 3.7241379310344827,
"grad_norm": 0.6024470063685289,
"learning_rate": 2.1271598512576705e-05,
"loss": 0.482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34891843795776367,
"step": 2160,
"valid_targets_mean": 5724.5,
"valid_targets_min": 2872
},
{
"epoch": 3.7327586206896552,
"grad_norm": 0.6510061779600028,
"learning_rate": 2.1185784169438047e-05,
"loss": 0.4756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25346675515174866,
"step": 2165,
"valid_targets_mean": 3543.5,
"valid_targets_min": 1662
},
{
"epoch": 3.7413793103448274,
"grad_norm": 0.6673234066879691,
"learning_rate": 2.1099947913006303e-05,
"loss": 0.4898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3024991452693939,
"step": 2170,
"valid_targets_mean": 4123.0,
"valid_targets_min": 862
},
{
"epoch": 3.75,
"grad_norm": 0.713682007673058,
"learning_rate": 2.1014091329535618e-05,
"loss": 0.5008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28074443340301514,
"step": 2175,
"valid_targets_mean": 3506.8,
"valid_targets_min": 1235
},
{
"epoch": 3.7586206896551726,
"grad_norm": 0.6602595641335219,
"learning_rate": 2.0928216005655762e-05,
"loss": 0.4734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2678144574165344,
"step": 2180,
"valid_targets_mean": 3774.0,
"valid_targets_min": 858
},
{
"epoch": 3.7672413793103448,
"grad_norm": 0.6043947084246732,
"learning_rate": 2.084232352834285e-05,
"loss": 0.4949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.237286776304245,
"step": 2185,
"valid_targets_mean": 4557.8,
"valid_targets_min": 1117
},
{
"epoch": 3.7758620689655173,
"grad_norm": 0.7429037899492916,
"learning_rate": 2.0756415484889975e-05,
"loss": 0.5154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23691049218177795,
"step": 2190,
"valid_targets_mean": 2794.6,
"valid_targets_min": 831
},
{
"epoch": 3.7844827586206895,
"grad_norm": 0.6505918685977937,
"learning_rate": 2.0670493462877897e-05,
"loss": 0.4931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2736482620239258,
"step": 2195,
"valid_targets_mean": 3816.5,
"valid_targets_min": 1517
},
{
"epoch": 3.793103448275862,
"grad_norm": 0.6440464847958695,
"learning_rate": 2.0584559050145706e-05,
"loss": 0.4699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20258024334907532,
"step": 2200,
"valid_targets_mean": 2998.4,
"valid_targets_min": 355
},
{
"epoch": 3.8017241379310347,
"grad_norm": 0.6236608397078807,
"learning_rate": 2.0498613834761462e-05,
"loss": 0.5048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3027684688568115,
"step": 2205,
"valid_targets_mean": 3835.9,
"valid_targets_min": 1036
},
{
"epoch": 3.810344827586207,
"grad_norm": 0.6808291010026204,
"learning_rate": 2.0412659404992862e-05,
"loss": 0.4713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17417572438716888,
"step": 2210,
"valid_targets_mean": 2092.0,
"valid_targets_min": 960
},
{
"epoch": 3.8189655172413794,
"grad_norm": 0.7056179085462992,
"learning_rate": 2.0326697349277893e-05,
"loss": 0.5039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2949260473251343,
"step": 2215,
"valid_targets_mean": 3186.6,
"valid_targets_min": 1249
},
{
"epoch": 3.8275862068965516,
"grad_norm": 0.651368163793838,
"learning_rate": 2.024072925619546e-05,
"loss": 0.4871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24330437183380127,
"step": 2220,
"valid_targets_mean": 3891.6,
"valid_targets_min": 1039
},
{
"epoch": 3.836206896551724,
"grad_norm": 0.7410681072909164,
"learning_rate": 2.0154756714436043e-05,
"loss": 0.4915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2660757899284363,
"step": 2225,
"valid_targets_mean": 3078.1,
"valid_targets_min": 1328
},
{
"epoch": 3.844827586206897,
"grad_norm": 0.7170639487897909,
"learning_rate": 2.006878131277233e-05,
"loss": 0.4991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18728289008140564,
"step": 2230,
"valid_targets_mean": 2276.6,
"valid_targets_min": 999
},
{
"epoch": 3.853448275862069,
"grad_norm": 0.6547821115723866,
"learning_rate": 1.9982804640029864e-05,
"loss": 0.4948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17102737724781036,
"step": 2235,
"valid_targets_mean": 2813.9,
"valid_targets_min": 468
},
{
"epoch": 3.862068965517241,
"grad_norm": 0.8628243763616128,
"learning_rate": 1.989682828505767e-05,
"loss": 0.5214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25767794251441956,
"step": 2240,
"valid_targets_mean": 2402.8,
"valid_targets_min": 1147
},
{
"epoch": 3.8706896551724137,
"grad_norm": 0.6296546190582638,
"learning_rate": 1.9810853836698913e-05,
"loss": 0.4841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32976585626602173,
"step": 2245,
"valid_targets_mean": 4604.4,
"valid_targets_min": 1119
},
{
"epoch": 3.8793103448275863,
"grad_norm": 0.5633331197906519,
"learning_rate": 1.972488288376151e-05,
"loss": 0.5211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2464699000120163,
"step": 2250,
"valid_targets_mean": 4274.8,
"valid_targets_min": 734
},
{
"epoch": 3.887931034482759,
"grad_norm": 0.5908706096835258,
"learning_rate": 1.963891701498879e-05,
"loss": 0.5147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24134039878845215,
"step": 2255,
"valid_targets_mean": 4620.5,
"valid_targets_min": 1978
},
{
"epoch": 3.896551724137931,
"grad_norm": 0.6552321287100807,
"learning_rate": 1.955295781903014e-05,
"loss": 0.4751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21362680196762085,
"step": 2260,
"valid_targets_mean": 3177.8,
"valid_targets_min": 248
},
{
"epoch": 3.905172413793103,
"grad_norm": 0.6877670110487286,
"learning_rate": 1.9467006884411605e-05,
"loss": 0.475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27820611000061035,
"step": 2265,
"valid_targets_mean": 3651.4,
"valid_targets_min": 844
},
{
"epoch": 3.913793103448276,
"grad_norm": 0.7938588084907477,
"learning_rate": 1.9381065799506583e-05,
"loss": 0.4931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19728420674800873,
"step": 2270,
"valid_targets_mean": 3676.1,
"valid_targets_min": 1032
},
{
"epoch": 3.9224137931034484,
"grad_norm": 0.6484184754715151,
"learning_rate": 1.929513615250643e-05,
"loss": 0.4796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930006980895996,
"step": 2275,
"valid_targets_mean": 3896.8,
"valid_targets_min": 560
},
{
"epoch": 3.9310344827586206,
"grad_norm": 0.7110467870098871,
"learning_rate": 1.9209219531391155e-05,
"loss": 0.5081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18151012063026428,
"step": 2280,
"valid_targets_mean": 2306.0,
"valid_targets_min": 1641
},
{
"epoch": 3.939655172413793,
"grad_norm": 0.6470127936020821,
"learning_rate": 1.9123317523900015e-05,
"loss": 0.5244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20861583948135376,
"step": 2285,
"valid_targets_mean": 2988.9,
"valid_targets_min": 927
},
{
"epoch": 3.9482758620689653,
"grad_norm": 0.709579187138778,
"learning_rate": 1.9037431717502253e-05,
"loss": 0.5476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3209431767463684,
"step": 2290,
"valid_targets_mean": 4697.9,
"valid_targets_min": 1726
},
{
"epoch": 3.956896551724138,
"grad_norm": 0.6240167958052882,
"learning_rate": 1.8951563699367673e-05,
"loss": 0.5076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25870320200920105,
"step": 2295,
"valid_targets_mean": 4539.9,
"valid_targets_min": 727
},
{
"epoch": 3.9655172413793105,
"grad_norm": 0.6988806889464962,
"learning_rate": 1.886571505633737e-05,
"loss": 0.4913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23148533701896667,
"step": 2300,
"valid_targets_mean": 3224.5,
"valid_targets_min": 295
},
{
"epoch": 3.9741379310344827,
"grad_norm": 0.7110833448191198,
"learning_rate": 1.8779887374894384e-05,
"loss": 0.4968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3375265896320343,
"step": 2305,
"valid_targets_mean": 3697.4,
"valid_targets_min": 333
},
{
"epoch": 3.9827586206896552,
"grad_norm": 0.7142197646340462,
"learning_rate": 1.8694082241134385e-05,
"loss": 0.4925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31442028284072876,
"step": 2310,
"valid_targets_mean": 4799.8,
"valid_targets_min": 1452
},
{
"epoch": 3.9913793103448274,
"grad_norm": 0.649630590659874,
"learning_rate": 1.8608301240736378e-05,
"loss": 0.484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37650713324546814,
"step": 2315,
"valid_targets_mean": 4964.6,
"valid_targets_min": 1840
},
{
"epoch": 4.0,
"grad_norm": 0.6968453928792222,
"learning_rate": 1.852254595893335e-05,
"loss": 0.5214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32762742042541504,
"step": 2320,
"valid_targets_mean": 3752.6,
"valid_targets_min": 930
},
{
"epoch": 4.008620689655173,
"grad_norm": 0.7291286990476985,
"learning_rate": 1.8436817980483035e-05,
"loss": 0.4788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3126080632209778,
"step": 2325,
"valid_targets_mean": 3247.2,
"valid_targets_min": 1659
},
{
"epoch": 4.017241379310345,
"grad_norm": 0.7057735186382891,
"learning_rate": 1.835111888963859e-05,
"loss": 0.4538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2033781111240387,
"step": 2330,
"valid_targets_mean": 2532.8,
"valid_targets_min": 937
},
{
"epoch": 4.025862068965517,
"grad_norm": 0.6541556624040162,
"learning_rate": 1.8265450270119335e-05,
"loss": 0.4746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3108016550540924,
"step": 2335,
"valid_targets_mean": 4034.9,
"valid_targets_min": 1548
},
{
"epoch": 4.0344827586206895,
"grad_norm": 0.6445427177162534,
"learning_rate": 1.8179813705081468e-05,
"loss": 0.4941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12971869111061096,
"step": 2340,
"valid_targets_mean": 2487.0,
"valid_targets_min": 627
},
{
"epoch": 4.043103448275862,
"grad_norm": 0.7042487745553745,
"learning_rate": 1.8094210777088833e-05,
"loss": 0.505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2815548777580261,
"step": 2345,
"valid_targets_mean": 4024.0,
"valid_targets_min": 2054
},
{
"epoch": 4.051724137931035,
"grad_norm": 0.6020174178834994,
"learning_rate": 1.800864306808367e-05,
"loss": 0.4802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21823859214782715,
"step": 2350,
"valid_targets_mean": 4244.8,
"valid_targets_min": 1761
},
{
"epoch": 4.060344827586207,
"grad_norm": 0.6238354016392303,
"learning_rate": 1.7923112159357344e-05,
"loss": 0.4504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2578839659690857,
"step": 2355,
"valid_targets_mean": 4613.9,
"valid_targets_min": 907
},
{
"epoch": 4.068965517241379,
"grad_norm": 0.7187931969464216,
"learning_rate": 1.783761963152117e-05,
"loss": 0.4586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20894671976566315,
"step": 2360,
"valid_targets_mean": 3244.1,
"valid_targets_min": 1825
},
{
"epoch": 4.077586206896552,
"grad_norm": 0.6994976820358275,
"learning_rate": 1.7752167064477173e-05,
"loss": 0.4528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23919735848903656,
"step": 2365,
"valid_targets_mean": 3916.8,
"valid_targets_min": 1761
},
{
"epoch": 4.086206896551724,
"grad_norm": 0.5850465646262993,
"learning_rate": 1.7666756037388923e-05,
"loss": 0.4525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1654837727546692,
"step": 2370,
"valid_targets_mean": 3629.4,
"valid_targets_min": 447
},
{
"epoch": 4.094827586206897,
"grad_norm": 0.7177392536005954,
"learning_rate": 1.7581388128652315e-05,
"loss": 0.4606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21581028401851654,
"step": 2375,
"valid_targets_mean": 3316.8,
"valid_targets_min": 1135
},
{
"epoch": 4.103448275862069,
"grad_norm": 0.5731165600563709,
"learning_rate": 1.7496064915866414e-05,
"loss": 0.509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3835183382034302,
"step": 2380,
"valid_targets_mean": 6331.9,
"valid_targets_min": 437
},
{
"epoch": 4.112068965517241,
"grad_norm": 0.7698613386016276,
"learning_rate": 1.7410787975804314e-05,
"loss": 0.5003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34291595220565796,
"step": 2385,
"valid_targets_mean": 2412.0,
"valid_targets_min": 447
},
{
"epoch": 4.120689655172414,
"grad_norm": 0.781265529624121,
"learning_rate": 1.732555888438398e-05,
"loss": 0.4557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2012426108121872,
"step": 2390,
"valid_targets_mean": 2611.0,
"valid_targets_min": 663
},
{
"epoch": 4.129310344827586,
"grad_norm": 0.7510692376144248,
"learning_rate": 1.7240379216639136e-05,
"loss": 0.4786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21286329627037048,
"step": 2395,
"valid_targets_mean": 2835.6,
"valid_targets_min": 1229
},
{
"epoch": 4.137931034482759,
"grad_norm": 0.7969516781579605,
"learning_rate": 1.7155250546690173e-05,
"loss": 0.4848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15521761775016785,
"step": 2400,
"valid_targets_mean": 2185.4,
"valid_targets_min": 781
},
{
"epoch": 4.146551724137931,
"grad_norm": 0.7440613379174275,
"learning_rate": 1.707017444771502e-05,
"loss": 0.4606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2337280809879303,
"step": 2405,
"valid_targets_mean": 2963.6,
"valid_targets_min": 500
},
{
"epoch": 4.155172413793103,
"grad_norm": 0.606456216137015,
"learning_rate": 1.6985152491920103e-05,
"loss": 0.4822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23560550808906555,
"step": 2410,
"valid_targets_mean": 4323.4,
"valid_targets_min": 1376
},
{
"epoch": 4.163793103448276,
"grad_norm": 0.7113548099234891,
"learning_rate": 1.690018625051128e-05,
"loss": 0.4629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24127575755119324,
"step": 2415,
"valid_targets_mean": 3512.8,
"valid_targets_min": 546
},
{
"epoch": 4.172413793103448,
"grad_norm": 0.7335560913283429,
"learning_rate": 1.681527729366481e-05,
"loss": 0.5255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.227250874042511,
"step": 2420,
"valid_targets_mean": 3176.8,
"valid_targets_min": 1879
},
{
"epoch": 4.181034482758621,
"grad_norm": 0.6575969011970396,
"learning_rate": 1.673042719049834e-05,
"loss": 0.4494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23015271127223969,
"step": 2425,
"valid_targets_mean": 3656.1,
"valid_targets_min": 1887
},
{
"epoch": 4.189655172413793,
"grad_norm": 0.8112593380488805,
"learning_rate": 1.664563750904188e-05,
"loss": 0.4945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2517668902873993,
"step": 2430,
"valid_targets_mean": 3671.8,
"valid_targets_min": 1683
},
{
"epoch": 4.198275862068965,
"grad_norm": 0.6753752628064544,
"learning_rate": 1.656090981620888e-05,
"loss": 0.4388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25802406668663025,
"step": 2435,
"valid_targets_mean": 3962.8,
"valid_targets_min": 1314
},
{
"epoch": 4.206896551724138,
"grad_norm": 0.7788552162943313,
"learning_rate": 1.64762456777672e-05,
"loss": 0.4838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3255932629108429,
"step": 2440,
"valid_targets_mean": 3356.9,
"valid_targets_min": 727
},
{
"epoch": 4.2155172413793105,
"grad_norm": 0.8393009126080171,
"learning_rate": 1.6391646658310242e-05,
"loss": 0.4838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2931306064128876,
"step": 2445,
"valid_targets_mean": 2868.1,
"valid_targets_min": 1304
},
{
"epoch": 4.224137931034483,
"grad_norm": 0.571986417301678,
"learning_rate": 1.6307114321227996e-05,
"loss": 0.4586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17009538412094116,
"step": 2450,
"valid_targets_mean": 4011.8,
"valid_targets_min": 1762
},
{
"epoch": 4.232758620689655,
"grad_norm": 0.7702861431778673,
"learning_rate": 1.622265022867818e-05,
"loss": 0.4839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.259504109621048,
"step": 2455,
"valid_targets_mean": 3427.9,
"valid_targets_min": 1832
},
{
"epoch": 4.241379310344827,
"grad_norm": 0.5842087243862168,
"learning_rate": 1.6138255941557336e-05,
"loss": 0.4806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24924680590629578,
"step": 2460,
"valid_targets_mean": 5294.4,
"valid_targets_min": 2306
},
{
"epoch": 4.25,
"grad_norm": 0.612414463039784,
"learning_rate": 1.6053933019472003e-05,
"loss": 0.5153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31655654311180115,
"step": 2465,
"valid_targets_mean": 4829.4,
"valid_targets_min": 1225
},
{
"epoch": 4.258620689655173,
"grad_norm": 0.6508360003084009,
"learning_rate": 1.5969683020709902e-05,
"loss": 0.4653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17931914329528809,
"step": 2470,
"valid_targets_mean": 3591.4,
"valid_targets_min": 1719
},
{
"epoch": 4.267241379310345,
"grad_norm": 0.704264317057782,
"learning_rate": 1.5885507502211108e-05,
"loss": 0.4618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20509269833564758,
"step": 2475,
"valid_targets_mean": 3139.9,
"valid_targets_min": 1111
},
{
"epoch": 4.275862068965517,
"grad_norm": 0.6722079858073913,
"learning_rate": 1.5801408019539345e-05,
"loss": 0.4737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22740936279296875,
"step": 2480,
"valid_targets_mean": 3398.4,
"valid_targets_min": 1330
},
{
"epoch": 4.2844827586206895,
"grad_norm": 0.8060161994387373,
"learning_rate": 1.5717386126853156e-05,
"loss": 0.4649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24399414658546448,
"step": 2485,
"valid_targets_mean": 3238.5,
"valid_targets_min": 764
},
{
"epoch": 4.293103448275862,
"grad_norm": 0.6985011079923761,
"learning_rate": 1.5633443376877236e-05,
"loss": 0.4582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16938087344169617,
"step": 2490,
"valid_targets_mean": 2844.6,
"valid_targets_min": 758
},
{
"epoch": 4.301724137931035,
"grad_norm": 0.7439431964854526,
"learning_rate": 1.5549581320873715e-05,
"loss": 0.4437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2602732479572296,
"step": 2495,
"valid_targets_mean": 3250.0,
"valid_targets_min": 703
},
{
"epoch": 4.310344827586207,
"grad_norm": 0.6282633270553464,
"learning_rate": 1.546580150861351e-05,
"loss": 0.4574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25479474663734436,
"step": 2500,
"valid_targets_mean": 4628.0,
"valid_targets_min": 1693
},
{
"epoch": 4.318965517241379,
"grad_norm": 0.8246874265708705,
"learning_rate": 1.5382105488347654e-05,
"loss": 0.4666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22745488584041595,
"step": 2505,
"valid_targets_mean": 1733.8,
"valid_targets_min": 619
},
{
"epoch": 4.327586206896552,
"grad_norm": 0.7846829027462743,
"learning_rate": 1.5298494806778733e-05,
"loss": 0.4657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22082726657390594,
"step": 2510,
"valid_targets_mean": 3654.4,
"valid_targets_min": 1465
},
{
"epoch": 4.336206896551724,
"grad_norm": 0.6296582314989281,
"learning_rate": 1.5214971009032251e-05,
"loss": 0.4521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15524858236312866,
"step": 2515,
"valid_targets_mean": 2274.6,
"valid_targets_min": 1343
},
{
"epoch": 4.344827586206897,
"grad_norm": 0.7560024210938446,
"learning_rate": 1.51315356386281e-05,
"loss": 0.4347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1853024959564209,
"step": 2520,
"valid_targets_mean": 2265.1,
"valid_targets_min": 770
},
{
"epoch": 4.353448275862069,
"grad_norm": 0.7486129314963273,
"learning_rate": 1.5048190237452052e-05,
"loss": 0.46,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26965516805648804,
"step": 2525,
"valid_targets_mean": 3411.0,
"valid_targets_min": 770
},
{
"epoch": 4.362068965517241,
"grad_norm": 0.6807770197203692,
"learning_rate": 1.4964936345727217e-05,
"loss": 0.4841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3339846432209015,
"step": 2530,
"valid_targets_mean": 4331.9,
"valid_targets_min": 1783
},
{
"epoch": 4.370689655172414,
"grad_norm": 0.6803166630329365,
"learning_rate": 1.4881775501985645e-05,
"loss": 0.4546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28594276309013367,
"step": 2535,
"valid_targets_mean": 4092.5,
"valid_targets_min": 1539
},
{
"epoch": 4.379310344827586,
"grad_norm": 0.5757965352729172,
"learning_rate": 1.4798709243039842e-05,
"loss": 0.4644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1932697892189026,
"step": 2540,
"valid_targets_mean": 5489.0,
"valid_targets_min": 1267
},
{
"epoch": 4.387931034482759,
"grad_norm": 0.5942994221260147,
"learning_rate": 1.4715739103954375e-05,
"loss": 0.4508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21481472253799438,
"step": 2545,
"valid_targets_mean": 5184.6,
"valid_targets_min": 1271
},
{
"epoch": 4.396551724137931,
"grad_norm": 0.6178769092364461,
"learning_rate": 1.4632866618017543e-05,
"loss": 0.5295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18912258744239807,
"step": 2550,
"valid_targets_mean": 3871.4,
"valid_targets_min": 1208
},
{
"epoch": 4.405172413793103,
"grad_norm": 0.8134877119006606,
"learning_rate": 1.4550093316712987e-05,
"loss": 0.469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20429262518882751,
"step": 2555,
"valid_targets_mean": 2489.2,
"valid_targets_min": 507
},
{
"epoch": 4.413793103448276,
"grad_norm": 0.5891826115646406,
"learning_rate": 1.4467420729691433e-05,
"loss": 0.4544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17067211866378784,
"step": 2560,
"valid_targets_mean": 3092.2,
"valid_targets_min": 906
},
{
"epoch": 4.422413793103448,
"grad_norm": 0.9293318381152055,
"learning_rate": 1.4384850384742412e-05,
"loss": 0.489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2481684684753418,
"step": 2565,
"valid_targets_mean": 2614.8,
"valid_targets_min": 1022
},
{
"epoch": 4.431034482758621,
"grad_norm": 0.6806302768850274,
"learning_rate": 1.4302383807766003e-05,
"loss": 0.4664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2130582630634308,
"step": 2570,
"valid_targets_mean": 3661.5,
"valid_targets_min": 494
},
{
"epoch": 4.439655172413793,
"grad_norm": 0.697118422325438,
"learning_rate": 1.4220022522744667e-05,
"loss": 0.477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19902461767196655,
"step": 2575,
"valid_targets_mean": 1975.0,
"valid_targets_min": 930
},
{
"epoch": 4.448275862068965,
"grad_norm": 0.7070799859650805,
"learning_rate": 1.4137768051715059e-05,
"loss": 0.484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23186877369880676,
"step": 2580,
"valid_targets_mean": 2672.6,
"valid_targets_min": 853
},
{
"epoch": 4.456896551724138,
"grad_norm": 0.575984761040613,
"learning_rate": 1.4055621914739915e-05,
"loss": 0.4524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1701734960079193,
"step": 2585,
"valid_targets_mean": 4939.8,
"valid_targets_min": 839
},
{
"epoch": 4.4655172413793105,
"grad_norm": 0.7282253361677753,
"learning_rate": 1.3973585629879973e-05,
"loss": 0.5063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23230789601802826,
"step": 2590,
"valid_targets_mean": 2770.1,
"valid_targets_min": 338
},
{
"epoch": 4.474137931034483,
"grad_norm": 0.6912665051596748,
"learning_rate": 1.3891660713165873e-05,
"loss": 0.4468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2850716710090637,
"step": 2595,
"valid_targets_mean": 4440.0,
"valid_targets_min": 2110
},
{
"epoch": 4.482758620689655,
"grad_norm": 0.7127927872180074,
"learning_rate": 1.3809848678570204e-05,
"loss": 0.5011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22266356647014618,
"step": 2600,
"valid_targets_mean": 3722.6,
"valid_targets_min": 476
},
{
"epoch": 4.491379310344827,
"grad_norm": 0.6644441685191089,
"learning_rate": 1.3728151037979468e-05,
"loss": 0.4326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1618672013282776,
"step": 2605,
"valid_targets_mean": 2797.1,
"valid_targets_min": 1354
},
{
"epoch": 4.5,
"grad_norm": 0.5986312130885189,
"learning_rate": 1.3646569301166177e-05,
"loss": 0.5185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28881144523620605,
"step": 2610,
"valid_targets_mean": 5293.5,
"valid_targets_min": 1501
},
{
"epoch": 4.508620689655173,
"grad_norm": 0.6110587897031703,
"learning_rate": 1.3565104975760936e-05,
"loss": 0.4994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2550974488258362,
"step": 2615,
"valid_targets_mean": 3494.4,
"valid_targets_min": 1619
},
{
"epoch": 4.517241379310345,
"grad_norm": 2.095551452059934,
"learning_rate": 1.34837595672246e-05,
"loss": 0.45,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19936276972293854,
"step": 2620,
"valid_targets_mean": 3422.5,
"valid_targets_min": 976
},
{
"epoch": 4.525862068965517,
"grad_norm": 0.8689738516206781,
"learning_rate": 1.3402534578820428e-05,
"loss": 0.4567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20421892404556274,
"step": 2625,
"valid_targets_mean": 2142.2,
"valid_targets_min": 869
},
{
"epoch": 4.5344827586206895,
"grad_norm": 0.7587423675506256,
"learning_rate": 1.3321431511586308e-05,
"loss": 0.4748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26311057806015015,
"step": 2630,
"valid_targets_mean": 3068.2,
"valid_targets_min": 836
},
{
"epoch": 4.543103448275862,
"grad_norm": 0.5919863204622956,
"learning_rate": 1.3240451864307048e-05,
"loss": 0.4819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40301793813705444,
"step": 2635,
"valid_targets_mean": 6527.0,
"valid_targets_min": 1882
},
{
"epoch": 4.551724137931035,
"grad_norm": 0.7394470646381965,
"learning_rate": 1.3159597133486628e-05,
"loss": 0.4704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3109036386013031,
"step": 2640,
"valid_targets_mean": 4317.9,
"valid_targets_min": 332
},
{
"epoch": 4.560344827586206,
"grad_norm": 0.581128140903931,
"learning_rate": 1.3078868813320594e-05,
"loss": 0.4648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20483621954917908,
"step": 2645,
"valid_targets_mean": 4570.8,
"valid_targets_min": 1850
},
{
"epoch": 4.568965517241379,
"grad_norm": 0.6712161614418943,
"learning_rate": 1.2998268395668412e-05,
"loss": 0.4727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14631853997707367,
"step": 2650,
"valid_targets_mean": 2733.5,
"valid_targets_min": 998
},
{
"epoch": 4.577586206896552,
"grad_norm": 0.6468590508784885,
"learning_rate": 1.2917797370025908e-05,
"loss": 0.4805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17968174815177917,
"step": 2655,
"valid_targets_mean": 4648.6,
"valid_targets_min": 1836
},
{
"epoch": 4.586206896551724,
"grad_norm": 0.6418907774726199,
"learning_rate": 1.2837457223497754e-05,
"loss": 0.4638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17467010021209717,
"step": 2660,
"valid_targets_mean": 3575.1,
"valid_targets_min": 1494
},
{
"epoch": 4.594827586206897,
"grad_norm": 0.6893197458456521,
"learning_rate": 1.2757249440769957e-05,
"loss": 0.4872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20580238103866577,
"step": 2665,
"valid_targets_mean": 3706.9,
"valid_targets_min": 916
},
{
"epoch": 4.603448275862069,
"grad_norm": 0.7362191975720149,
"learning_rate": 1.2677175504082452e-05,
"loss": 0.4534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3365599513053894,
"step": 2670,
"valid_targets_mean": 4807.8,
"valid_targets_min": 365
},
{
"epoch": 4.612068965517241,
"grad_norm": 0.6649827629129201,
"learning_rate": 1.2597236893201712e-05,
"loss": 0.4974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2436644583940506,
"step": 2675,
"valid_targets_mean": 3814.6,
"valid_targets_min": 686
},
{
"epoch": 4.620689655172414,
"grad_norm": 0.5922553527915343,
"learning_rate": 1.2517435085393373e-05,
"loss": 0.437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17249786853790283,
"step": 2680,
"valid_targets_mean": 3553.8,
"valid_targets_min": 1067
},
{
"epoch": 4.629310344827586,
"grad_norm": 0.795297876094166,
"learning_rate": 1.2437771555394944e-05,
"loss": 0.4819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24163809418678284,
"step": 2685,
"valid_targets_mean": 2616.9,
"valid_targets_min": 1042
},
{
"epoch": 4.637931034482759,
"grad_norm": 0.7232979961406071,
"learning_rate": 1.2358247775388578e-05,
"loss": 0.4728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24019086360931396,
"step": 2690,
"valid_targets_mean": 3697.1,
"valid_targets_min": 2034
},
{
"epoch": 4.646551724137931,
"grad_norm": 0.7096407435915755,
"learning_rate": 1.227886521497383e-05,
"loss": 0.4479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24640309810638428,
"step": 2695,
"valid_targets_mean": 3368.4,
"valid_targets_min": 298
},
{
"epoch": 4.655172413793103,
"grad_norm": 0.7014687573513457,
"learning_rate": 1.2199625341140533e-05,
"loss": 0.485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2635158896446228,
"step": 2700,
"valid_targets_mean": 3276.6,
"valid_targets_min": 1973
},
{
"epoch": 4.663793103448276,
"grad_norm": 0.6546970206016567,
"learning_rate": 1.2120529618241665e-05,
"loss": 0.4535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31338346004486084,
"step": 2705,
"valid_targets_mean": 6266.4,
"valid_targets_min": 1717
},
{
"epoch": 4.672413793103448,
"grad_norm": 0.6793637217901053,
"learning_rate": 1.2041579507966288e-05,
"loss": 0.4778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24181483685970306,
"step": 2710,
"valid_targets_mean": 3137.2,
"valid_targets_min": 1817
},
{
"epoch": 4.681034482758621,
"grad_norm": 0.6821886337532992,
"learning_rate": 1.1962776469312556e-05,
"loss": 0.4735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2773562967777252,
"step": 2715,
"valid_targets_mean": 4600.2,
"valid_targets_min": 1971
},
{
"epoch": 4.689655172413794,
"grad_norm": 0.74251794560561,
"learning_rate": 1.1884121958560721e-05,
"loss": 0.5042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2979833781719208,
"step": 2720,
"valid_targets_mean": 3467.6,
"valid_targets_min": 299
},
{
"epoch": 4.698275862068965,
"grad_norm": 0.7380207470077343,
"learning_rate": 1.1805617429246254e-05,
"loss": 0.4522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24474026262760162,
"step": 2725,
"valid_targets_mean": 3314.1,
"valid_targets_min": 1689
},
{
"epoch": 4.706896551724138,
"grad_norm": 0.6441690010094415,
"learning_rate": 1.1727264332132978e-05,
"loss": 0.4806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11414848268032074,
"step": 2730,
"valid_targets_mean": 1974.6,
"valid_targets_min": 455
},
{
"epoch": 4.7155172413793105,
"grad_norm": 0.6516620909898261,
"learning_rate": 1.1649064115186216e-05,
"loss": 0.4883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3251435160636902,
"step": 2735,
"valid_targets_mean": 4367.8,
"valid_targets_min": 1572
},
{
"epoch": 4.724137931034483,
"grad_norm": 0.8113136652791311,
"learning_rate": 1.1571018223546095e-05,
"loss": 0.4889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2595599293708801,
"step": 2740,
"valid_targets_mean": 2774.2,
"valid_targets_min": 1540
},
{
"epoch": 4.732758620689655,
"grad_norm": 0.6827835506352863,
"learning_rate": 1.1493128099500806e-05,
"loss": 0.4525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19236114621162415,
"step": 2745,
"valid_targets_mean": 3065.4,
"valid_targets_min": 872
},
{
"epoch": 4.741379310344827,
"grad_norm": 0.6266580967892691,
"learning_rate": 1.1415395182459925e-05,
"loss": 0.4738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2641719579696655,
"step": 2750,
"valid_targets_mean": 4104.9,
"valid_targets_min": 606
},
{
"epoch": 4.75,
"grad_norm": 0.6257424293723131,
"learning_rate": 1.1337820908927891e-05,
"loss": 0.5079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2416507452726364,
"step": 2755,
"valid_targets_mean": 3923.8,
"valid_targets_min": 696
},
{
"epoch": 4.758620689655173,
"grad_norm": 0.805541412851283,
"learning_rate": 1.126040671247738e-05,
"loss": 0.458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27597856521606445,
"step": 2760,
"valid_targets_mean": 2572.5,
"valid_targets_min": 616
},
{
"epoch": 4.767241379310345,
"grad_norm": 0.8497370331969035,
"learning_rate": 1.1183154023722839e-05,
"loss": 0.4596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24853654205799103,
"step": 2765,
"valid_targets_mean": 3065.8,
"valid_targets_min": 503
},
{
"epoch": 4.775862068965517,
"grad_norm": 0.7473644020752989,
"learning_rate": 1.1106064270294068e-05,
"loss": 0.4822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2988268733024597,
"step": 2770,
"valid_targets_mean": 3608.1,
"valid_targets_min": 422
},
{
"epoch": 4.7844827586206895,
"grad_norm": 0.8095234401769938,
"learning_rate": 1.1029138876809818e-05,
"loss": 0.4887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27407869696617126,
"step": 2775,
"valid_targets_mean": 2853.9,
"valid_targets_min": 1394
},
{
"epoch": 4.793103448275862,
"grad_norm": 0.6752834632880041,
"learning_rate": 1.0952379264851464e-05,
"loss": 0.5027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26760053634643555,
"step": 2780,
"valid_targets_mean": 4063.4,
"valid_targets_min": 637
},
{
"epoch": 4.801724137931035,
"grad_norm": 0.544555675768033,
"learning_rate": 1.087578685293674e-05,
"loss": 0.4918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2731075584888458,
"step": 2785,
"valid_targets_mean": 5893.2,
"valid_targets_min": 579
},
{
"epoch": 4.810344827586206,
"grad_norm": 0.7388130196480253,
"learning_rate": 1.0799363056493529e-05,
"loss": 0.475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2854580879211426,
"step": 2790,
"valid_targets_mean": 3466.8,
"valid_targets_min": 1664
},
{
"epoch": 4.818965517241379,
"grad_norm": 0.6272646450147065,
"learning_rate": 1.0723109287833697e-05,
"loss": 0.4575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2139543890953064,
"step": 2795,
"valid_targets_mean": 4144.4,
"valid_targets_min": 2050
},
{
"epoch": 4.827586206896552,
"grad_norm": 0.7794735480091342,
"learning_rate": 1.0647026956126979e-05,
"loss": 0.4628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20534175634384155,
"step": 2800,
"valid_targets_mean": 2368.4,
"valid_targets_min": 464
},
{
"epoch": 4.836206896551724,
"grad_norm": 0.6678653155160964,
"learning_rate": 1.0571117467374972e-05,
"loss": 0.4629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15956327319145203,
"step": 2805,
"valid_targets_mean": 2978.4,
"valid_targets_min": 729
},
{
"epoch": 4.844827586206897,
"grad_norm": 0.5596544836969336,
"learning_rate": 1.0495382224385154e-05,
"loss": 0.5028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28414013981819153,
"step": 2810,
"valid_targets_mean": 5631.0,
"valid_targets_min": 1747
},
{
"epoch": 4.853448275862069,
"grad_norm": 0.6433212251402481,
"learning_rate": 1.0419822626744894e-05,
"loss": 0.4865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21995951235294342,
"step": 2815,
"valid_targets_mean": 3540.8,
"valid_targets_min": 1831
},
{
"epoch": 4.862068965517241,
"grad_norm": 0.625422523116903,
"learning_rate": 1.0344440070795671e-05,
"loss": 0.47,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672995328903198,
"step": 2820,
"valid_targets_mean": 4453.2,
"valid_targets_min": 1359
},
{
"epoch": 4.870689655172414,
"grad_norm": 0.5794212310915364,
"learning_rate": 1.0269235949607223e-05,
"loss": 0.4825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19607986509799957,
"step": 2825,
"valid_targets_mean": 5040.0,
"valid_targets_min": 2426
},
{
"epoch": 4.879310344827586,
"grad_norm": 0.9159213416745643,
"learning_rate": 1.019421165295182e-05,
"loss": 0.4986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16384699940681458,
"step": 2830,
"valid_targets_mean": 2185.4,
"valid_targets_min": 498
},
{
"epoch": 4.887931034482759,
"grad_norm": 0.7706544148632299,
"learning_rate": 1.0119368567278545e-05,
"loss": 0.4774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26055097579956055,
"step": 2835,
"valid_targets_mean": 3275.6,
"valid_targets_min": 538
},
{
"epoch": 4.896551724137931,
"grad_norm": 0.5879710351602947,
"learning_rate": 1.0044708075687746e-05,
"loss": 0.4681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16971173882484436,
"step": 2840,
"valid_targets_mean": 3531.1,
"valid_targets_min": 598
},
{
"epoch": 4.905172413793103,
"grad_norm": 0.5934834566194066,
"learning_rate": 9.97023155790541e-06,
"loss": 0.5148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.217238187789917,
"step": 2845,
"valid_targets_mean": 3915.4,
"valid_targets_min": 978
},
{
"epoch": 4.913793103448276,
"grad_norm": 0.8337575764419852,
"learning_rate": 9.895940390257675e-06,
"loss": 0.4738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27576619386672974,
"step": 2850,
"valid_targets_mean": 2578.9,
"valid_targets_min": 1535
},
{
"epoch": 4.922413793103448,
"grad_norm": 0.588290288880693,
"learning_rate": 9.821835945645426e-06,
"loss": 0.4361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17642898857593536,
"step": 2855,
"valid_targets_mean": 3636.9,
"valid_targets_min": 990
},
{
"epoch": 4.931034482758621,
"grad_norm": 0.7140384238875621,
"learning_rate": 9.747919593518897e-06,
"loss": 0.4873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606832981109619,
"step": 2860,
"valid_targets_mean": 3753.2,
"valid_targets_min": 930
},
{
"epoch": 4.939655172413794,
"grad_norm": 0.6297493613480442,
"learning_rate": 9.674192699852397e-06,
"loss": 0.5279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20206616818904877,
"step": 2865,
"valid_targets_mean": 3818.6,
"valid_targets_min": 2442
},
{
"epoch": 4.948275862068965,
"grad_norm": 0.6437450236124188,
"learning_rate": 9.600656627119e-06,
"loss": 0.4486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28231048583984375,
"step": 2870,
"valid_targets_mean": 5143.2,
"valid_targets_min": 1743
},
{
"epoch": 4.956896551724138,
"grad_norm": 0.7231210514400496,
"learning_rate": 9.52731273426544e-06,
"loss": 0.4665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20072084665298462,
"step": 2875,
"valid_targets_mean": 2665.2,
"valid_targets_min": 1783
},
{
"epoch": 4.9655172413793105,
"grad_norm": 0.7200627267648373,
"learning_rate": 9.454162376686959e-06,
"loss": 0.4669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21553944051265717,
"step": 2880,
"valid_targets_mean": 3167.2,
"valid_targets_min": 1382
},
{
"epoch": 4.974137931034483,
"grad_norm": 0.7048399069586939,
"learning_rate": 9.381206906202268e-06,
"loss": 0.5094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3543662428855896,
"step": 2885,
"valid_targets_mean": 4687.0,
"valid_targets_min": 1536
},
{
"epoch": 4.982758620689655,
"grad_norm": 0.5646407366469018,
"learning_rate": 9.308447671028546e-06,
"loss": 0.5034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24721992015838623,
"step": 2890,
"valid_targets_mean": 5792.9,
"valid_targets_min": 2082
},
{
"epoch": 4.991379310344827,
"grad_norm": 0.8018492929350751,
"learning_rate": 9.235886015756579e-06,
"loss": 0.4382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2554394602775574,
"step": 2895,
"valid_targets_mean": 3645.0,
"valid_targets_min": 864
},
{
"epoch": 5.0,
"grad_norm": 0.7478721695038638,
"learning_rate": 9.163523281325855e-06,
"loss": 0.497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2047863006591797,
"step": 2900,
"valid_targets_mean": 2364.6,
"valid_targets_min": 1117
},
{
"epoch": 5.008620689655173,
"grad_norm": 0.6224544654750317,
"learning_rate": 9.09136080499979e-06,
"loss": 0.4708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23398515582084656,
"step": 2905,
"valid_targets_mean": 3525.2,
"valid_targets_min": 1480
},
{
"epoch": 5.017241379310345,
"grad_norm": 0.6724030509673462,
"learning_rate": 9.019399920341056e-06,
"loss": 0.4449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19100379943847656,
"step": 2910,
"valid_targets_mean": 3215.8,
"valid_targets_min": 433
},
{
"epoch": 5.025862068965517,
"grad_norm": 0.7583214816177382,
"learning_rate": 8.947641957186901e-06,
"loss": 0.4483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19197000563144684,
"step": 2915,
"valid_targets_mean": 2711.9,
"valid_targets_min": 804
},
{
"epoch": 5.0344827586206895,
"grad_norm": 1.654079400156267,
"learning_rate": 8.876088241624581e-06,
"loss": 0.4418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17325645685195923,
"step": 2920,
"valid_targets_mean": 3065.5,
"valid_targets_min": 359
},
{
"epoch": 5.043103448275862,
"grad_norm": 0.5891519901032664,
"learning_rate": 8.804740095966854e-06,
"loss": 0.4805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2441479116678238,
"step": 2925,
"valid_targets_mean": 5050.4,
"valid_targets_min": 1819
},
{
"epoch": 5.051724137931035,
"grad_norm": 0.8278995394082316,
"learning_rate": 8.733598838727559e-06,
"loss": 0.4434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18562006950378418,
"step": 2930,
"valid_targets_mean": 2430.1,
"valid_targets_min": 1811
},
{
"epoch": 5.060344827586207,
"grad_norm": 0.8698667716108178,
"learning_rate": 8.662665784597229e-06,
"loss": 0.4666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3086687922477722,
"step": 2935,
"valid_targets_mean": 4216.1,
"valid_targets_min": 892
},
{
"epoch": 5.068965517241379,
"grad_norm": 0.7016494507760576,
"learning_rate": 8.591942244418787e-06,
"loss": 0.4642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21846792101860046,
"step": 2940,
"valid_targets_mean": 3485.5,
"valid_targets_min": 1529
},
{
"epoch": 5.077586206896552,
"grad_norm": 0.6630898429377045,
"learning_rate": 8.521429525163353e-06,
"loss": 0.4532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2878398001194,
"step": 2945,
"valid_targets_mean": 4316.1,
"valid_targets_min": 625
},
{
"epoch": 5.086206896551724,
"grad_norm": 0.761735138224444,
"learning_rate": 8.451128929906103e-06,
"loss": 0.4497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1884111762046814,
"step": 2950,
"valid_targets_mean": 2733.1,
"valid_targets_min": 1546
},
{
"epoch": 5.094827586206897,
"grad_norm": 0.8339171233338399,
"learning_rate": 8.381041757802104e-06,
"loss": 0.4466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26359814405441284,
"step": 2955,
"valid_targets_mean": 2911.4,
"valid_targets_min": 937
},
{
"epoch": 5.103448275862069,
"grad_norm": 0.6877757737180021,
"learning_rate": 8.311169304062408e-06,
"loss": 0.4559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2356172502040863,
"step": 2960,
"valid_targets_mean": 3584.0,
"valid_targets_min": 1213
},
{
"epoch": 5.112068965517241,
"grad_norm": 0.8051485741023968,
"learning_rate": 8.24151285993005e-06,
"loss": 0.403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16779354214668274,
"step": 2965,
"valid_targets_mean": 2010.1,
"valid_targets_min": 1005
},
{
"epoch": 5.120689655172414,
"grad_norm": 0.6175388631001866,
"learning_rate": 8.172073712656217e-06,
"loss": 0.4595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15900662541389465,
"step": 2970,
"valid_targets_mean": 3262.8,
"valid_targets_min": 1201
},
{
"epoch": 5.129310344827586,
"grad_norm": 0.8481695814337025,
"learning_rate": 8.102853145476443e-06,
"loss": 0.4956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27707868814468384,
"step": 2975,
"valid_targets_mean": 6042.9,
"valid_targets_min": 1837
},
{
"epoch": 5.137931034482759,
"grad_norm": 0.7790714744312073,
"learning_rate": 8.033852437586909e-06,
"loss": 0.4999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4171217978000641,
"step": 2980,
"valid_targets_mean": 4342.9,
"valid_targets_min": 1199
},
{
"epoch": 5.146551724137931,
"grad_norm": 0.7171849773714023,
"learning_rate": 7.965072864120795e-06,
"loss": 0.4707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24280916154384613,
"step": 2985,
"valid_targets_mean": 3208.9,
"valid_targets_min": 1568
},
{
"epoch": 5.155172413793103,
"grad_norm": 0.7268079620351237,
"learning_rate": 7.896515696124703e-06,
"loss": 0.455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24983307719230652,
"step": 2990,
"valid_targets_mean": 3696.2,
"valid_targets_min": 1525
},
{
"epoch": 5.163793103448276,
"grad_norm": 0.7397712005549786,
"learning_rate": 7.828182200535192e-06,
"loss": 0.4805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1951979696750641,
"step": 2995,
"valid_targets_mean": 2562.8,
"valid_targets_min": 593
},
{
"epoch": 5.172413793103448,
"grad_norm": 0.6078078960889772,
"learning_rate": 7.760073640155363e-06,
"loss": 0.4299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15697035193443298,
"step": 3000,
"valid_targets_mean": 3641.9,
"valid_targets_min": 1695
},
{
"epoch": 5.181034482758621,
"grad_norm": 0.6906741782932729,
"learning_rate": 7.6921912736315e-06,
"loss": 0.4592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2528272867202759,
"step": 3005,
"valid_targets_mean": 3960.2,
"valid_targets_min": 569
},
{
"epoch": 5.189655172413793,
"grad_norm": 0.779801729011475,
"learning_rate": 7.624536355429832e-06,
"loss": 0.4482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13327597081661224,
"step": 3010,
"valid_targets_mean": 2014.1,
"valid_targets_min": 595
},
{
"epoch": 5.198275862068965,
"grad_norm": 0.6961265560269253,
"learning_rate": 7.557110135813341e-06,
"loss": 0.4799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25486013293266296,
"step": 3015,
"valid_targets_mean": 3800.1,
"valid_targets_min": 692
},
{
"epoch": 5.206896551724138,
"grad_norm": 0.7485573343568958,
"learning_rate": 7.489913860818662e-06,
"loss": 0.4767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23183771967887878,
"step": 3020,
"valid_targets_mean": 3628.5,
"valid_targets_min": 1680
},
{
"epoch": 5.2155172413793105,
"grad_norm": 0.6081028132914261,
"learning_rate": 7.4229487722330315e-06,
"loss": 0.4706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1672867089509964,
"step": 3025,
"valid_targets_mean": 3773.8,
"valid_targets_min": 1863
},
{
"epoch": 5.224137931034483,
"grad_norm": 0.7129702935758114,
"learning_rate": 7.356216107571399e-06,
"loss": 0.4519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27049562335014343,
"step": 3030,
"valid_targets_mean": 3894.4,
"valid_targets_min": 696
},
{
"epoch": 5.232758620689655,
"grad_norm": 1.0397970965650016,
"learning_rate": 7.289717100053497e-06,
"loss": 0.5137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1450689136981964,
"step": 3035,
"valid_targets_mean": 2030.2,
"valid_targets_min": 498
},
{
"epoch": 5.241379310344827,
"grad_norm": 0.6915057778767586,
"learning_rate": 7.2234529785810645e-06,
"loss": 0.4723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542662024497986,
"step": 3040,
"valid_targets_mean": 3820.6,
"valid_targets_min": 916
},
{
"epoch": 5.25,
"grad_norm": 0.7056302244612103,
"learning_rate": 7.157424967715163e-06,
"loss": 0.4573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13803818821907043,
"step": 3045,
"valid_targets_mean": 2330.0,
"valid_targets_min": 704
},
{
"epoch": 5.258620689655173,
"grad_norm": 0.6185090500671104,
"learning_rate": 7.091634287653526e-06,
"loss": 0.4722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2878566086292267,
"step": 3050,
"valid_targets_mean": 4588.1,
"valid_targets_min": 1677
},
{
"epoch": 5.267241379310345,
"grad_norm": 0.761902630255462,
"learning_rate": 7.026082154208012e-06,
"loss": 0.4416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29359132051467896,
"step": 3055,
"valid_targets_mean": 4224.2,
"valid_targets_min": 1513
},
{
"epoch": 5.275862068965517,
"grad_norm": 0.7844949843129767,
"learning_rate": 6.960769778782133e-06,
"loss": 0.4444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2986701726913452,
"step": 3060,
"valid_targets_mean": 3789.8,
"valid_targets_min": 753
},
{
"epoch": 5.2844827586206895,
"grad_norm": 0.726504265476168,
"learning_rate": 6.89569836834868e-06,
"loss": 0.47,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24666550755500793,
"step": 3065,
"valid_targets_mean": 3141.1,
"valid_targets_min": 890
},
{
"epoch": 5.293103448275862,
"grad_norm": 0.6848726403595511,
"learning_rate": 6.830869125427406e-06,
"loss": 0.4914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35621824860572815,
"step": 3070,
"valid_targets_mean": 3706.6,
"valid_targets_min": 1151
},
{
"epoch": 5.301724137931035,
"grad_norm": 0.7941226544749608,
"learning_rate": 6.766283248062817e-06,
"loss": 0.4605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20678937435150146,
"step": 3075,
"valid_targets_mean": 2429.2,
"valid_targets_min": 795
},
{
"epoch": 5.310344827586207,
"grad_norm": 0.6736650057815443,
"learning_rate": 6.701941929801996e-06,
"loss": 0.4988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25833404064178467,
"step": 3080,
"valid_targets_mean": 4493.0,
"valid_targets_min": 2396
},
{
"epoch": 5.318965517241379,
"grad_norm": 0.7533894846747827,
"learning_rate": 6.637846359672611e-06,
"loss": 0.4833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21882648766040802,
"step": 3085,
"valid_targets_mean": 3435.5,
"valid_targets_min": 1432
},
{
"epoch": 5.327586206896552,
"grad_norm": 0.9917710187118872,
"learning_rate": 6.57399772216089e-06,
"loss": 0.4459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2761511206626892,
"step": 3090,
"valid_targets_mean": 4892.8,
"valid_targets_min": 1290
},
{
"epoch": 5.336206896551724,
"grad_norm": 0.7004668156294833,
"learning_rate": 6.510397197189724e-06,
"loss": 0.5128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20646989345550537,
"step": 3095,
"valid_targets_mean": 3881.2,
"valid_targets_min": 1376
},
{
"epoch": 5.344827586206897,
"grad_norm": 0.6756196982178647,
"learning_rate": 6.447045960096909e-06,
"loss": 0.4487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19709131121635437,
"step": 3100,
"valid_targets_mean": 3093.2,
"valid_targets_min": 760
},
{
"epoch": 5.353448275862069,
"grad_norm": 0.8315120005504095,
"learning_rate": 6.383945181613398e-06,
"loss": 0.4206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2558245360851288,
"step": 3105,
"valid_targets_mean": 3705.8,
"valid_targets_min": 1318
},
{
"epoch": 5.362068965517241,
"grad_norm": 0.7182202828905813,
"learning_rate": 6.32109602784166e-06,
"loss": 0.452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2329225242137909,
"step": 3110,
"valid_targets_mean": 3544.4,
"valid_targets_min": 1795
},
{
"epoch": 5.370689655172414,
"grad_norm": 0.7119685951103023,
"learning_rate": 6.258499660234147e-06,
"loss": 0.4502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15800319612026215,
"step": 3115,
"valid_targets_mean": 3172.1,
"valid_targets_min": 1784
},
{
"epoch": 5.379310344827586,
"grad_norm": 0.7202358371283981,
"learning_rate": 6.196157235571813e-06,
"loss": 0.4635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2982141077518463,
"step": 3120,
"valid_targets_mean": 3674.8,
"valid_targets_min": 357
},
{
"epoch": 5.387931034482759,
"grad_norm": 0.7885867904582534,
"learning_rate": 6.134069905942764e-06,
"loss": 0.4675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30231577157974243,
"step": 3125,
"valid_targets_mean": 3849.5,
"valid_targets_min": 320
},
{
"epoch": 5.396551724137931,
"grad_norm": 0.7181738901551832,
"learning_rate": 6.072238818720919e-06,
"loss": 0.4318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23303094506263733,
"step": 3130,
"valid_targets_mean": 3753.1,
"valid_targets_min": 999
},
{
"epoch": 5.405172413793103,
"grad_norm": 0.593921178442862,
"learning_rate": 6.010665116544858e-06,
"loss": 0.4653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23492135107517242,
"step": 3135,
"valid_targets_mean": 4800.0,
"valid_targets_min": 1120
},
{
"epoch": 5.413793103448276,
"grad_norm": 0.7764310266542166,
"learning_rate": 5.9493499372967e-06,
"loss": 0.4358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.225310817360878,
"step": 3140,
"valid_targets_mean": 2939.2,
"valid_targets_min": 581
},
{
"epoch": 5.422413793103448,
"grad_norm": 0.7323733956463316,
"learning_rate": 5.888294414081024e-06,
"loss": 0.4852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25720715522766113,
"step": 3145,
"valid_targets_mean": 4409.8,
"valid_targets_min": 1989
},
{
"epoch": 5.431034482758621,
"grad_norm": 0.6882597275678037,
"learning_rate": 5.827499675203987e-06,
"loss": 0.421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14771276712417603,
"step": 3150,
"valid_targets_mean": 2556.0,
"valid_targets_min": 1467
},
{
"epoch": 5.439655172413793,
"grad_norm": 0.842854165866408,
"learning_rate": 5.76696684415245e-06,
"loss": 0.4494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25888389348983765,
"step": 3155,
"valid_targets_mean": 3178.9,
"valid_targets_min": 1645
},
{
"epoch": 5.448275862068965,
"grad_norm": 0.6555092034098002,
"learning_rate": 5.706697039573217e-06,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24546992778778076,
"step": 3160,
"valid_targets_mean": 4539.2,
"valid_targets_min": 1857
},
{
"epoch": 5.456896551724138,
"grad_norm": 0.7048492004889653,
"learning_rate": 5.646691375252344e-06,
"loss": 0.4697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22363720834255219,
"step": 3165,
"valid_targets_mean": 3127.9,
"valid_targets_min": 1318
},
{
"epoch": 5.4655172413793105,
"grad_norm": 0.6378803177788848,
"learning_rate": 5.586950960094606e-06,
"loss": 0.4376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21243023872375488,
"step": 3170,
"valid_targets_mean": 4441.9,
"valid_targets_min": 1440
},
{
"epoch": 5.474137931034483,
"grad_norm": 0.7817408980627574,
"learning_rate": 5.527476898102959e-06,
"loss": 0.4443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24490898847579956,
"step": 3175,
"valid_targets_mean": 3144.2,
"valid_targets_min": 333
},
{
"epoch": 5.482758620689655,
"grad_norm": 0.6047332242907153,
"learning_rate": 5.4682702883581395e-06,
"loss": 0.4316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.134861558675766,
"step": 3180,
"valid_targets_mean": 3966.6,
"valid_targets_min": 1314
},
{
"epoch": 5.491379310344827,
"grad_norm": 0.636476438778125,
"learning_rate": 5.40933222499838e-06,
"loss": 0.43,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19472798705101013,
"step": 3185,
"valid_targets_mean": 3977.2,
"valid_targets_min": 812
},
{
"epoch": 5.5,
"grad_norm": 0.6748452817636509,
"learning_rate": 5.350663797199174e-06,
"loss": 0.4697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19321182370185852,
"step": 3190,
"valid_targets_mean": 3625.8,
"valid_targets_min": 1099
},
{
"epoch": 5.508620689655173,
"grad_norm": 0.8353678432176448,
"learning_rate": 5.292266089153149e-06,
"loss": 0.4495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23553451895713806,
"step": 3195,
"valid_targets_mean": 2531.8,
"valid_targets_min": 760
},
{
"epoch": 5.517241379310345,
"grad_norm": 0.5708775355976995,
"learning_rate": 5.234140180050029e-06,
"loss": 0.4726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2230847179889679,
"step": 3200,
"valid_targets_mean": 4267.9,
"valid_targets_min": 455
},
{
"epoch": 5.525862068965517,
"grad_norm": 0.7399173755970399,
"learning_rate": 5.1762871440566935e-06,
"loss": 0.434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1931067705154419,
"step": 3205,
"valid_targets_mean": 3313.6,
"valid_targets_min": 917
},
{
"epoch": 5.5344827586206895,
"grad_norm": 0.7492141521348251,
"learning_rate": 5.118708050297332e-06,
"loss": 0.4385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27809464931488037,
"step": 3210,
"valid_targets_mean": 4113.2,
"valid_targets_min": 1205
},
{
"epoch": 5.543103448275862,
"grad_norm": 0.6827907606565726,
"learning_rate": 5.061403962833669e-06,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17418712377548218,
"step": 3215,
"valid_targets_mean": 3184.0,
"valid_targets_min": 976
},
{
"epoch": 5.551724137931035,
"grad_norm": 0.7028563981123193,
"learning_rate": 5.004375940645314e-06,
"loss": 0.4878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37116700410842896,
"step": 3220,
"valid_targets_mean": 5722.8,
"valid_targets_min": 1655
},
{
"epoch": 5.560344827586206,
"grad_norm": 0.6358136143357161,
"learning_rate": 4.947625037610219e-06,
"loss": 0.5058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26970693469047546,
"step": 3225,
"valid_targets_mean": 5035.5,
"valid_targets_min": 1129
},
{
"epoch": 5.568965517241379,
"grad_norm": 0.79905657590774,
"learning_rate": 4.8911523024851295e-06,
"loss": 0.4967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19400912523269653,
"step": 3230,
"valid_targets_mean": 2246.5,
"valid_targets_min": 385
},
{
"epoch": 5.577586206896552,
"grad_norm": 0.7661307110427259,
"learning_rate": 4.834958778886271e-06,
"loss": 0.4811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3137957453727722,
"step": 3235,
"valid_targets_mean": 3229.9,
"valid_targets_min": 1368
},
{
"epoch": 5.586206896551724,
"grad_norm": 0.6816565028977988,
"learning_rate": 4.779045505270043e-06,
"loss": 0.4576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2541190981864929,
"step": 3240,
"valid_targets_mean": 4194.4,
"valid_targets_min": 563
},
{
"epoch": 5.594827586206897,
"grad_norm": 0.6751608561194854,
"learning_rate": 4.723413514913817e-06,
"loss": 0.4557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17950564622879028,
"step": 3245,
"valid_targets_mean": 2918.8,
"valid_targets_min": 1462
},
{
"epoch": 5.603448275862069,
"grad_norm": 0.7316269694764956,
"learning_rate": 4.66806383589685e-06,
"loss": 0.4765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2735571563243866,
"step": 3250,
"valid_targets_mean": 3391.2,
"valid_targets_min": 644
},
{
"epoch": 5.612068965517241,
"grad_norm": 0.6414697826461783,
"learning_rate": 4.6129974910812855e-06,
"loss": 0.4433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18585994839668274,
"step": 3255,
"valid_targets_mean": 3076.2,
"valid_targets_min": 1818
},
{
"epoch": 5.620689655172414,
"grad_norm": 0.6504910454062405,
"learning_rate": 4.558215498093252e-06,
"loss": 0.4478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2893863916397095,
"step": 3260,
"valid_targets_mean": 5735.8,
"valid_targets_min": 415
},
{
"epoch": 5.629310344827586,
"grad_norm": 0.7196796255916211,
"learning_rate": 4.503718869304063e-06,
"loss": 0.4711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2017214149236679,
"step": 3265,
"valid_targets_mean": 3032.1,
"valid_targets_min": 437
},
{
"epoch": 5.637931034482759,
"grad_norm": 0.8140224360637848,
"learning_rate": 4.449508611811482e-06,
"loss": 0.4655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18502508103847504,
"step": 3270,
"valid_targets_mean": 2054.6,
"valid_targets_min": 897
},
{
"epoch": 5.646551724137931,
"grad_norm": 0.6233804054960342,
"learning_rate": 4.395585727421139e-06,
"loss": 0.4717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23045390844345093,
"step": 3275,
"valid_targets_mean": 4667.6,
"valid_targets_min": 2813
},
{
"epoch": 5.655172413793103,
"grad_norm": 0.7026030856163301,
"learning_rate": 4.341951212628031e-06,
"loss": 0.4861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3447082042694092,
"step": 3280,
"valid_targets_mean": 4856.2,
"valid_targets_min": 1629
},
{
"epoch": 5.663793103448276,
"grad_norm": 0.6809784081813541,
"learning_rate": 4.288606058598048e-06,
"loss": 0.4395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1348533034324646,
"step": 3285,
"valid_targets_mean": 2791.8,
"valid_targets_min": 1492
},
{
"epoch": 5.672413793103448,
"grad_norm": 0.613876392573019,
"learning_rate": 4.235551251149714e-06,
"loss": 0.4666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2379133701324463,
"step": 3290,
"valid_targets_mean": 5035.5,
"valid_targets_min": 714
},
{
"epoch": 5.681034482758621,
"grad_norm": 0.7094539400481058,
"learning_rate": 4.1827877707359474e-06,
"loss": 0.4482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2683733403682709,
"step": 3295,
"valid_targets_mean": 4671.0,
"valid_targets_min": 1056
},
{
"epoch": 5.689655172413794,
"grad_norm": 0.8787456783967276,
"learning_rate": 4.130316592425934e-06,
"loss": 0.4478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19786673784255981,
"step": 3300,
"valid_targets_mean": 2232.8,
"valid_targets_min": 279
},
{
"epoch": 5.698275862068965,
"grad_norm": 0.8502083809636145,
"learning_rate": 4.078138685887125e-06,
"loss": 0.4566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2412954866886139,
"step": 3305,
"valid_targets_mean": 3456.1,
"valid_targets_min": 1128
},
{
"epoch": 5.706896551724138,
"grad_norm": 0.7472679746715507,
"learning_rate": 4.026255015367302e-06,
"loss": 0.4484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23308929800987244,
"step": 3310,
"valid_targets_mean": 3830.0,
"valid_targets_min": 480
},
{
"epoch": 5.7155172413793105,
"grad_norm": 0.75274136107482,
"learning_rate": 3.974666539676774e-06,
"loss": 0.4847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14974159002304077,
"step": 3315,
"valid_targets_mean": 2648.6,
"valid_targets_min": 652
},
{
"epoch": 5.724137931034483,
"grad_norm": 0.5774910463846608,
"learning_rate": 3.923374212170634e-06,
"loss": 0.4978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22366955876350403,
"step": 3320,
"valid_targets_mean": 4939.1,
"valid_targets_min": 1908
},
{
"epoch": 5.732758620689655,
"grad_norm": 0.9389239094558165,
"learning_rate": 3.872378980731168e-06,
"loss": 0.4579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31157776713371277,
"step": 3325,
"valid_targets_mean": 4375.2,
"valid_targets_min": 2092
},
{
"epoch": 5.741379310344827,
"grad_norm": 0.7856183251154304,
"learning_rate": 3.821681787750327e-06,
"loss": 0.4824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2415979951620102,
"step": 3330,
"valid_targets_mean": 3034.4,
"valid_targets_min": 1001
},
{
"epoch": 5.75,
"grad_norm": 0.6251658420467967,
"learning_rate": 3.7712835701122985e-06,
"loss": 0.4581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3360128402709961,
"step": 3335,
"valid_targets_mean": 5729.0,
"valid_targets_min": 1965
},
{
"epoch": 5.758620689655173,
"grad_norm": 0.7503171399314047,
"learning_rate": 3.721185259176223e-06,
"loss": 0.4509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20740580558776855,
"step": 3340,
"valid_targets_mean": 2710.9,
"valid_targets_min": 1147
},
{
"epoch": 5.767241379310345,
"grad_norm": 0.7658794496747393,
"learning_rate": 3.6713877807589503e-06,
"loss": 0.4425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19355687499046326,
"step": 3345,
"valid_targets_mean": 2887.6,
"valid_targets_min": 451
},
{
"epoch": 5.775862068965517,
"grad_norm": 0.6818747673397412,
"learning_rate": 3.621892055117955e-06,
"loss": 0.4548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2165466994047165,
"step": 3350,
"valid_targets_mean": 4357.8,
"valid_targets_min": 1508
},
{
"epoch": 5.7844827586206895,
"grad_norm": 0.576120259663283,
"learning_rate": 3.572698996934303e-06,
"loss": 0.4441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19731038808822632,
"step": 3355,
"valid_targets_mean": 5281.2,
"valid_targets_min": 1702
},
{
"epoch": 5.793103448275862,
"grad_norm": 0.7233735140697485,
"learning_rate": 3.5238095152957906e-06,
"loss": 0.4703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16802190244197845,
"step": 3360,
"valid_targets_mean": 2777.1,
"valid_targets_min": 1009
},
{
"epoch": 5.801724137931035,
"grad_norm": 0.6935810826398939,
"learning_rate": 3.4752245136801065e-06,
"loss": 0.459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20021113753318787,
"step": 3365,
"valid_targets_mean": 3346.2,
"valid_targets_min": 1778
},
{
"epoch": 5.810344827586206,
"grad_norm": 0.6305192634235494,
"learning_rate": 3.4269448899381354e-06,
"loss": 0.4703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24132040143013,
"step": 3370,
"valid_targets_mean": 5659.8,
"valid_targets_min": 468
},
{
"epoch": 5.818965517241379,
"grad_norm": 0.6686341734215869,
"learning_rate": 3.3789715362773955e-06,
"loss": 0.4396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2577729821205139,
"step": 3375,
"valid_targets_mean": 4669.1,
"valid_targets_min": 842
},
{
"epoch": 5.827586206896552,
"grad_norm": 0.5730865976165508,
"learning_rate": 3.3313053392455317e-06,
"loss": 0.4393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2799406051635742,
"step": 3380,
"valid_targets_mean": 5855.2,
"valid_targets_min": 1536
},
{
"epoch": 5.836206896551724,
"grad_norm": 0.6779968652180786,
"learning_rate": 3.2839471797139287e-06,
"loss": 0.441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2712808847427368,
"step": 3385,
"valid_targets_mean": 3816.5,
"valid_targets_min": 1117
},
{
"epoch": 5.844827586206897,
"grad_norm": 0.678758331044749,
"learning_rate": 3.236897932861438e-06,
"loss": 0.4575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1380578577518463,
"step": 3390,
"valid_targets_mean": 2670.1,
"valid_targets_min": 1094
},
{
"epoch": 5.853448275862069,
"grad_norm": 0.6930942013750735,
"learning_rate": 3.190158468158209e-06,
"loss": 0.4717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26487284898757935,
"step": 3395,
"valid_targets_mean": 4868.8,
"valid_targets_min": 1079
},
{
"epoch": 5.862068965517241,
"grad_norm": 0.8138602963483332,
"learning_rate": 3.1437296493496183e-06,
"loss": 0.4437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2084672451019287,
"step": 3400,
"valid_targets_mean": 2761.5,
"valid_targets_min": 1043
},
{
"epoch": 5.870689655172414,
"grad_norm": 0.7005704796522405,
"learning_rate": 3.0976123344402897e-06,
"loss": 0.4103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30806052684783936,
"step": 3405,
"valid_targets_mean": 5424.6,
"valid_targets_min": 1519
},
{
"epoch": 5.879310344827586,
"grad_norm": 0.5581296805550643,
"learning_rate": 3.0518073756782683e-06,
"loss": 0.4627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23483984172344208,
"step": 3410,
"valid_targets_mean": 6492.5,
"valid_targets_min": 370
},
{
"epoch": 5.887931034482759,
"grad_norm": 0.7413985748284263,
"learning_rate": 3.0063156195392685e-06,
"loss": 0.4331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1887524425983429,
"step": 3415,
"valid_targets_mean": 3025.9,
"valid_targets_min": 299
},
{
"epoch": 5.896551724137931,
"grad_norm": 0.7227263047030936,
"learning_rate": 2.9611379067109914e-06,
"loss": 0.448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2441166490316391,
"step": 3420,
"valid_targets_mean": 4610.4,
"valid_targets_min": 837
},
{
"epoch": 5.905172413793103,
"grad_norm": 0.7828328616055023,
"learning_rate": 2.9162750720776366e-06,
"loss": 0.4469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19237752258777618,
"step": 3425,
"valid_targets_mean": 2687.2,
"valid_targets_min": 1850
},
{
"epoch": 5.913793103448276,
"grad_norm": 0.7107936465243866,
"learning_rate": 2.871727944704452e-06,
"loss": 0.4617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1891714334487915,
"step": 3430,
"valid_targets_mean": 3769.1,
"valid_targets_min": 1792
},
{
"epoch": 5.922413793103448,
"grad_norm": 0.7382472128070807,
"learning_rate": 2.8274973478224167e-06,
"loss": 0.4566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17400340735912323,
"step": 3435,
"valid_targets_mean": 2444.0,
"valid_targets_min": 862
},
{
"epoch": 5.931034482758621,
"grad_norm": 0.6571277220139973,
"learning_rate": 2.783584098813006e-06,
"loss": 0.4282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19393205642700195,
"step": 3440,
"valid_targets_mean": 3712.8,
"valid_targets_min": 1681
},
{
"epoch": 5.939655172413794,
"grad_norm": 0.7312043134669541,
"learning_rate": 2.739989009193138e-06,
"loss": 0.4772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2664768099784851,
"step": 3445,
"valid_targets_mean": 5313.1,
"valid_targets_min": 1496
},
{
"epoch": 5.948275862068965,
"grad_norm": 0.7966953008777837,
"learning_rate": 2.6967128846001234e-06,
"loss": 0.4134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16477492451667786,
"step": 3450,
"valid_targets_mean": 2826.6,
"valid_targets_min": 398
},
{
"epoch": 5.956896551724138,
"grad_norm": 0.7505723326591668,
"learning_rate": 2.6537565247768094e-06,
"loss": 0.4649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1759946495294571,
"step": 3455,
"valid_targets_mean": 2627.0,
"valid_targets_min": 328
},
{
"epoch": 5.9655172413793105,
"grad_norm": 0.7730918698032901,
"learning_rate": 2.611120723556775e-06,
"loss": 0.4524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2330639362335205,
"step": 3460,
"valid_targets_mean": 3213.0,
"valid_targets_min": 317
},
{
"epoch": 5.974137931034483,
"grad_norm": 0.6871752561410659,
"learning_rate": 2.568806268849684e-06,
"loss": 0.4427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2211509346961975,
"step": 3465,
"valid_targets_mean": 4685.8,
"valid_targets_min": 358
},
{
"epoch": 5.982758620689655,
"grad_norm": 0.6866564277500524,
"learning_rate": 2.526813942626736e-06,
"loss": 0.4428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20986169576644897,
"step": 3470,
"valid_targets_mean": 4101.9,
"valid_targets_min": 1247
},
{
"epoch": 5.991379310344827,
"grad_norm": 0.6407646096396032,
"learning_rate": 2.4851445209061574e-06,
"loss": 0.4476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18139518797397614,
"step": 3475,
"valid_targets_mean": 3582.2,
"valid_targets_min": 1577
},
{
"epoch": 6.0,
"grad_norm": 0.5858103373326182,
"learning_rate": 2.4437987737389277e-06,
"loss": 0.4322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1381668597459793,
"step": 3480,
"valid_targets_mean": 2870.6,
"valid_targets_min": 1488
},
{
"epoch": 6.008620689655173,
"grad_norm": 0.7740135978527747,
"learning_rate": 2.40277746519451e-06,
"loss": 0.4717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22488614916801453,
"step": 3485,
"valid_targets_mean": 3303.1,
"valid_targets_min": 789
},
{
"epoch": 6.017241379310345,
"grad_norm": 0.6718129793968958,
"learning_rate": 2.362081353346746e-06,
"loss": 0.463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22049200534820557,
"step": 3490,
"valid_targets_mean": 3427.2,
"valid_targets_min": 1670
},
{
"epoch": 6.025862068965517,
"grad_norm": 0.6108999358440294,
"learning_rate": 2.3217111902598298e-06,
"loss": 0.4345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25082069635391235,
"step": 3495,
"valid_targets_mean": 5472.6,
"valid_targets_min": 2368
},
{
"epoch": 6.0344827586206895,
"grad_norm": 0.7142070390712623,
"learning_rate": 2.2816677219744388e-06,
"loss": 0.429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18685954809188843,
"step": 3500,
"valid_targets_mean": 3964.9,
"valid_targets_min": 1503
},
{
"epoch": 6.043103448275862,
"grad_norm": 0.6773698288330054,
"learning_rate": 2.241951688493924e-06,
"loss": 0.4551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644187808036804,
"step": 3505,
"valid_targets_mean": 4625.0,
"valid_targets_min": 1480
},
{
"epoch": 6.051724137931035,
"grad_norm": 0.8091413060885396,
"learning_rate": 2.2025638237706294e-06,
"loss": 0.4631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22907666862010956,
"step": 3510,
"valid_targets_mean": 2675.4,
"valid_targets_min": 1267
},
{
"epoch": 6.060344827586207,
"grad_norm": 0.6849568569146559,
"learning_rate": 2.1635048556923555e-06,
"loss": 0.496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3542017340660095,
"step": 3515,
"valid_targets_mean": 4052.4,
"valid_targets_min": 432
},
{
"epoch": 6.068965517241379,
"grad_norm": 0.676675971064016,
"learning_rate": 2.1247755060688856e-06,
"loss": 0.4691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13447147607803345,
"step": 3520,
"valid_targets_mean": 2988.2,
"valid_targets_min": 1243
},
{
"epoch": 6.077586206896552,
"grad_norm": 0.7520571476765067,
"learning_rate": 2.0863764906186514e-06,
"loss": 0.4516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25384098291397095,
"step": 3525,
"valid_targets_mean": 3574.5,
"valid_targets_min": 1700
},
{
"epoch": 6.086206896551724,
"grad_norm": 0.716713637131033,
"learning_rate": 2.048308518955515e-06,
"loss": 0.4705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3154298663139343,
"step": 3530,
"valid_targets_mean": 5037.4,
"valid_targets_min": 429
},
{
"epoch": 6.094827586206897,
"grad_norm": 0.7694399803659958,
"learning_rate": 2.010572294575641e-06,
"loss": 0.4698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17910689115524292,
"step": 3535,
"valid_targets_mean": 3081.2,
"valid_targets_min": 1551
},
{
"epoch": 6.103448275862069,
"grad_norm": 0.7868404699942033,
"learning_rate": 1.9731685148445168e-06,
"loss": 0.4561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2528718113899231,
"step": 3540,
"valid_targets_mean": 4245.1,
"valid_targets_min": 2071
},
{
"epoch": 6.112068965517241,
"grad_norm": 0.7576280365207806,
"learning_rate": 1.9360978709840304e-06,
"loss": 0.4174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1939217746257782,
"step": 3545,
"valid_targets_mean": 2826.0,
"valid_targets_min": 543
},
{
"epoch": 6.120689655172414,
"grad_norm": 0.717658482106765,
"learning_rate": 1.8993610480597359e-06,
"loss": 0.4367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32581982016563416,
"step": 3550,
"valid_targets_mean": 5192.1,
"valid_targets_min": 1572
},
{
"epoch": 6.129310344827586,
"grad_norm": 0.6379593260805476,
"learning_rate": 1.8629587249681802e-06,
"loss": 0.4901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898372411727905,
"step": 3555,
"valid_targets_mean": 4503.4,
"valid_targets_min": 233
},
{
"epoch": 6.137931034482759,
"grad_norm": 0.8367663752524243,
"learning_rate": 1.8268915744243321e-06,
"loss": 0.4469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21554884314537048,
"step": 3560,
"valid_targets_mean": 2432.1,
"valid_targets_min": 895
},
{
"epoch": 6.146551724137931,
"grad_norm": 0.7054337218833375,
"learning_rate": 1.7911602629491876e-06,
"loss": 0.4659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18869292736053467,
"step": 3565,
"valid_targets_mean": 3975.1,
"valid_targets_min": 470
},
{
"epoch": 6.155172413793103,
"grad_norm": 0.7631519820066042,
"learning_rate": 1.7557654508574339e-06,
"loss": 0.4637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16359178721904755,
"step": 3570,
"valid_targets_mean": 1903.8,
"valid_targets_min": 383
},
{
"epoch": 6.163793103448276,
"grad_norm": 0.7024009414184341,
"learning_rate": 1.7207077922452465e-06,
"loss": 0.4322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18459674715995789,
"step": 3575,
"valid_targets_mean": 3362.8,
"valid_targets_min": 1424
},
{
"epoch": 6.172413793103448,
"grad_norm": 0.77426605189279,
"learning_rate": 1.6859879349782016e-06,
"loss": 0.4596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14893782138824463,
"step": 3580,
"valid_targets_mean": 1882.2,
"valid_targets_min": 710
},
{
"epoch": 6.181034482758621,
"grad_norm": 0.7511156023426865,
"learning_rate": 1.6516065206793142e-06,
"loss": 0.4586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3090694546699524,
"step": 3585,
"valid_targets_mean": 3560.6,
"valid_targets_min": 655
},
{
"epoch": 6.189655172413793,
"grad_norm": 0.7063002930277574,
"learning_rate": 1.6175641847171687e-06,
"loss": 0.4822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2065710723400116,
"step": 3590,
"valid_targets_mean": 3442.1,
"valid_targets_min": 686
},
{
"epoch": 6.198275862068965,
"grad_norm": 0.7527738601886692,
"learning_rate": 1.5838615561941705e-06,
"loss": 0.4457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19831009209156036,
"step": 3595,
"valid_targets_mean": 3206.9,
"valid_targets_min": 305
},
{
"epoch": 6.206896551724138,
"grad_norm": 0.7563126410614768,
"learning_rate": 1.550499257934952e-06,
"loss": 0.4661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2772877514362335,
"step": 3600,
"valid_targets_mean": 3702.5,
"valid_targets_min": 1528
},
{
"epoch": 6.2155172413793105,
"grad_norm": 0.6758864017574707,
"learning_rate": 1.5174779064748246e-06,
"loss": 0.453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3183794617652893,
"step": 3605,
"valid_targets_mean": 5107.1,
"valid_targets_min": 546
},
{
"epoch": 6.224137931034483,
"grad_norm": 0.5562754795731977,
"learning_rate": 1.4847981120484089e-06,
"loss": 0.425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17494836449623108,
"step": 3610,
"valid_targets_mean": 5317.8,
"valid_targets_min": 1689
},
{
"epoch": 6.232758620689655,
"grad_norm": 0.5664500974521548,
"learning_rate": 1.4524604785783548e-06,
"loss": 0.4335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2948354482650757,
"step": 3615,
"valid_targets_mean": 6150.6,
"valid_targets_min": 1373
},
{
"epoch": 6.241379310344827,
"grad_norm": 0.8404985064381851,
"learning_rate": 1.4204656036641717e-06,
"loss": 0.428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2410782277584076,
"step": 3620,
"valid_targets_mean": 2847.4,
"valid_targets_min": 703
},
{
"epoch": 6.25,
"grad_norm": 0.6389203413177802,
"learning_rate": 1.3888140785711945e-06,
"loss": 0.4408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20249323546886444,
"step": 3625,
"valid_targets_mean": 3856.8,
"valid_targets_min": 1831
},
{
"epoch": 6.258620689655173,
"grad_norm": 0.8460556546997163,
"learning_rate": 1.3575064882196398e-06,
"loss": 0.4386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1973244547843933,
"step": 3630,
"valid_targets_mean": 2522.9,
"valid_targets_min": 917
},
{
"epoch": 6.267241379310345,
"grad_norm": 0.7198328827499566,
"learning_rate": 1.326543411173833e-06,
"loss": 0.427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1749674677848816,
"step": 3635,
"valid_targets_mean": 2668.4,
"valid_targets_min": 812
},
{
"epoch": 6.275862068965517,
"grad_norm": 0.7067874613966607,
"learning_rate": 1.295925419631474e-06,
"loss": 0.4557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20972105860710144,
"step": 3640,
"valid_targets_mean": 3294.1,
"valid_targets_min": 1135
},
{
"epoch": 6.2844827586206895,
"grad_norm": 0.737266550604988,
"learning_rate": 1.265653079413094e-06,
"loss": 0.4409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23832815885543823,
"step": 3645,
"valid_targets_mean": 2836.0,
"valid_targets_min": 836
},
{
"epoch": 6.293103448275862,
"grad_norm": 0.7808341732396372,
"learning_rate": 1.2357269499515745e-06,
"loss": 0.4365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26828426122665405,
"step": 3650,
"valid_targets_mean": 3709.5,
"valid_targets_min": 888
},
{
"epoch": 6.301724137931035,
"grad_norm": 0.8072417550739505,
"learning_rate": 1.2061475842818337e-06,
"loss": 0.4984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2538772225379944,
"step": 3655,
"valid_targets_mean": 3380.8,
"valid_targets_min": 647
},
{
"epoch": 6.310344827586207,
"grad_norm": 0.7006576081958799,
"learning_rate": 1.176915529030589e-06,
"loss": 0.4348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29240888357162476,
"step": 3660,
"valid_targets_mean": 4889.4,
"valid_targets_min": 2397
},
{
"epoch": 6.318965517241379,
"grad_norm": 0.7591513606843514,
"learning_rate": 1.1480313244062603e-06,
"loss": 0.45,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28072088956832886,
"step": 3665,
"valid_targets_mean": 3284.6,
"valid_targets_min": 1211
},
{
"epoch": 6.327586206896552,
"grad_norm": 0.6552167771838345,
"learning_rate": 1.1194955041889898e-06,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17346346378326416,
"step": 3670,
"valid_targets_mean": 3683.0,
"valid_targets_min": 1142
},
{
"epoch": 6.336206896551724,
"grad_norm": 0.6798357918420773,
"learning_rate": 1.0913085957207748e-06,
"loss": 0.4396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14828425645828247,
"step": 3675,
"valid_targets_mean": 2677.5,
"valid_targets_min": 571
},
{
"epoch": 6.344827586206897,
"grad_norm": 0.7887644233319003,
"learning_rate": 1.063471119895727e-06,
"loss": 0.4294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.227344810962677,
"step": 3680,
"valid_targets_mean": 3479.6,
"valid_targets_min": 1237
},
{
"epoch": 6.353448275862069,
"grad_norm": 0.8053988429305725,
"learning_rate": 1.0359835911504246e-06,
"loss": 0.4455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19495242834091187,
"step": 3685,
"valid_targets_mean": 3586.6,
"valid_targets_min": 1418
},
{
"epoch": 6.362068965517241,
"grad_norm": 0.8122518920294817,
"learning_rate": 1.0088465174544514e-06,
"loss": 0.4733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2196522206068039,
"step": 3690,
"valid_targets_mean": 2701.8,
"valid_targets_min": 1681
},
{
"epoch": 6.370689655172414,
"grad_norm": 0.753020543651917,
"learning_rate": 9.820604003009614e-07,
"loss": 0.4691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19198468327522278,
"step": 3695,
"valid_targets_mean": 3232.6,
"valid_targets_min": 582
},
{
"epoch": 6.379310344827586,
"grad_norm": 0.7618572578862354,
"learning_rate": 9.556257346974319e-07,
"loss": 0.42,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21314972639083862,
"step": 3700,
"valid_targets_mean": 3102.0,
"valid_targets_min": 839
},
{
"epoch": 6.387931034482759,
"grad_norm": 0.765904355774887,
"learning_rate": 9.295430091565261e-07,
"loss": 0.4612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19799397885799408,
"step": 3705,
"valid_targets_mean": 2865.5,
"valid_targets_min": 1475
},
{
"epoch": 6.396551724137931,
"grad_norm": 0.609585669709035,
"learning_rate": 9.038127056870416e-07,
"loss": 0.4525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21491311490535736,
"step": 3710,
"valid_targets_mean": 5568.1,
"valid_targets_min": 563
},
{
"epoch": 6.405172413793103,
"grad_norm": 0.7690352570878218,
"learning_rate": 8.784352997850277e-07,
"loss": 0.404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20269158482551575,
"step": 3715,
"valid_targets_mean": 4081.6,
"valid_targets_min": 1503
},
{
"epoch": 6.413793103448276,
"grad_norm": 0.7846482935070382,
"learning_rate": 8.534112604249789e-07,
"loss": 0.4087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2106572985649109,
"step": 3720,
"valid_targets_mean": 3615.6,
"valid_targets_min": 348
},
{
"epoch": 6.422413793103448,
"grad_norm": 0.5584770451232427,
"learning_rate": 8.287410500511739e-07,
"loss": 0.4232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2852216362953186,
"step": 3725,
"valid_targets_mean": 7787.0,
"valid_targets_min": 4802
},
{
"epoch": 6.431034482758621,
"grad_norm": 0.6558759014342717,
"learning_rate": 8.044251245691393e-07,
"loss": 0.4837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19151388108730316,
"step": 3730,
"valid_targets_mean": 3860.0,
"valid_targets_min": 1447
},
{
"epoch": 6.439655172413793,
"grad_norm": 0.6171395789005942,
"learning_rate": 7.804639333372077e-07,
"loss": 0.4506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16960985958576202,
"step": 3735,
"valid_targets_mean": 4072.1,
"valid_targets_min": 1878
},
{
"epoch": 6.448275862068965,
"grad_norm": 0.7816495350034629,
"learning_rate": 7.568579191582248e-07,
"loss": 0.423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17788684368133545,
"step": 3740,
"valid_targets_mean": 3884.8,
"valid_targets_min": 1158
},
{
"epoch": 6.456896551724138,
"grad_norm": 0.6529206048125584,
"learning_rate": 7.336075182713708e-07,
"loss": 0.4358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18897415697574615,
"step": 3745,
"valid_targets_mean": 4003.6,
"valid_targets_min": 565
},
{
"epoch": 6.4655172413793105,
"grad_norm": 0.6449389338492015,
"learning_rate": 7.107131603440809e-07,
"loss": 0.4252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2346837818622589,
"step": 3750,
"valid_targets_mean": 5214.0,
"valid_targets_min": 1501
},
{
"epoch": 6.474137931034483,
"grad_norm": 0.7811946298032911,
"learning_rate": 6.881752684641219e-07,
"loss": 0.4527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19682791829109192,
"step": 3755,
"valid_targets_mean": 2777.1,
"valid_targets_min": 645
},
{
"epoch": 6.482758620689655,
"grad_norm": 0.749142145074001,
"learning_rate": 6.659942591317703e-07,
"loss": 0.4234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24652616679668427,
"step": 3760,
"valid_targets_mean": 3532.0,
"valid_targets_min": 497
},
{
"epoch": 6.491379310344827,
"grad_norm": 0.7214616295655278,
"learning_rate": 6.441705422521072e-07,
"loss": 0.4656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21576929092407227,
"step": 3765,
"valid_targets_mean": 3651.8,
"valid_targets_min": 447
},
{
"epoch": 6.5,
"grad_norm": 0.8278176356345619,
"learning_rate": 6.22704521127444e-07,
"loss": 0.4623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2633417844772339,
"step": 3770,
"valid_targets_mean": 4134.5,
"valid_targets_min": 1746
},
{
"epoch": 6.508620689655173,
"grad_norm": 0.7594236851050343,
"learning_rate": 6.015965924498912e-07,
"loss": 0.4218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20567096769809723,
"step": 3775,
"valid_targets_mean": 2847.8,
"valid_targets_min": 1944
},
{
"epoch": 6.517241379310345,
"grad_norm": 0.668955142683864,
"learning_rate": 5.808471462939946e-07,
"loss": 0.5166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2435295730829239,
"step": 3780,
"valid_targets_mean": 4341.1,
"valid_targets_min": 1338
},
{
"epoch": 6.525862068965517,
"grad_norm": 0.7095589321551677,
"learning_rate": 5.604565661095484e-07,
"loss": 0.4735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26538217067718506,
"step": 3785,
"valid_targets_mean": 3807.8,
"valid_targets_min": 1789
},
{
"epoch": 6.5344827586206895,
"grad_norm": 0.8061244528120283,
"learning_rate": 5.404252287145006e-07,
"loss": 0.4308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15442270040512085,
"step": 3790,
"valid_targets_mean": 1825.9,
"valid_targets_min": 649
},
{
"epoch": 6.543103448275862,
"grad_norm": 0.8048087082616983,
"learning_rate": 5.207535042879963e-07,
"loss": 0.4358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24893686175346375,
"step": 3795,
"valid_targets_mean": 2585.2,
"valid_targets_min": 811
},
{
"epoch": 6.551724137931035,
"grad_norm": 0.7251230246204804,
"learning_rate": 5.014417563635276e-07,
"loss": 0.4444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2101002335548401,
"step": 3800,
"valid_targets_mean": 3319.1,
"valid_targets_min": 1090
},
{
"epoch": 6.560344827586206,
"grad_norm": 0.7553348462583848,
"learning_rate": 4.824903418222259e-07,
"loss": 0.4565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1768944263458252,
"step": 3805,
"valid_targets_mean": 2879.6,
"valid_targets_min": 1292
},
{
"epoch": 6.568965517241379,
"grad_norm": 0.6256257986197964,
"learning_rate": 4.638996108862559e-07,
"loss": 0.4851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13639257848262787,
"step": 3810,
"valid_targets_mean": 2789.2,
"valid_targets_min": 1803
},
{
"epoch": 6.577586206896552,
"grad_norm": 0.6782534867126325,
"learning_rate": 4.456699071123538e-07,
"loss": 0.4755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28413069248199463,
"step": 3815,
"valid_targets_mean": 3424.9,
"valid_targets_min": 791
},
{
"epoch": 6.586206896551724,
"grad_norm": 0.8068441567212525,
"learning_rate": 4.2780156738546407e-07,
"loss": 0.4407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23791375756263733,
"step": 3820,
"valid_targets_mean": 3495.1,
"valid_targets_min": 592
},
{
"epoch": 6.594827586206897,
"grad_norm": 0.7618897463733958,
"learning_rate": 4.1029492191253296e-07,
"loss": 0.4332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3005632758140564,
"step": 3825,
"valid_targets_mean": 3915.5,
"valid_targets_min": 756
},
{
"epoch": 6.603448275862069,
"grad_norm": 0.6790164115588616,
"learning_rate": 3.931502942163956e-07,
"loss": 0.4281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24386459589004517,
"step": 3830,
"valid_targets_mean": 4130.9,
"valid_targets_min": 1192
},
{
"epoch": 6.612068965517241,
"grad_norm": 0.6898721639387323,
"learning_rate": 3.763680011297921e-07,
"loss": 0.4393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19996516406536102,
"step": 3835,
"valid_targets_mean": 3800.0,
"valid_targets_min": 1547
},
{
"epoch": 6.620689655172414,
"grad_norm": 0.7915362044920929,
"learning_rate": 3.599483527895231e-07,
"loss": 0.436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1447966992855072,
"step": 3840,
"valid_targets_mean": 2010.4,
"valid_targets_min": 840
},
{
"epoch": 6.629310344827586,
"grad_norm": 0.7086048153772613,
"learning_rate": 3.4389165263071233e-07,
"loss": 0.4355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24716392159461975,
"step": 3845,
"valid_targets_mean": 3861.5,
"valid_targets_min": 1355
},
{
"epoch": 6.637931034482759,
"grad_norm": 0.7407607649314212,
"learning_rate": 3.2819819738119983e-07,
"loss": 0.4424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21087799966335297,
"step": 3850,
"valid_targets_mean": 3448.4,
"valid_targets_min": 1410
},
{
"epoch": 6.646551724137931,
"grad_norm": 0.7862129023418445,
"learning_rate": 3.1286827705605984e-07,
"loss": 0.3987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18787223100662231,
"step": 3855,
"valid_targets_mean": 2740.4,
"valid_targets_min": 1036
},
{
"epoch": 6.655172413793103,
"grad_norm": 0.9583946478618197,
"learning_rate": 2.979021749522448e-07,
"loss": 0.4737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20167484879493713,
"step": 3860,
"valid_targets_mean": 2912.0,
"valid_targets_min": 858
},
{
"epoch": 6.663793103448276,
"grad_norm": 0.7463481814937221,
"learning_rate": 2.833001676433367e-07,
"loss": 0.4301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26120278239250183,
"step": 3865,
"valid_targets_mean": 4619.1,
"valid_targets_min": 1401
},
{
"epoch": 6.672413793103448,
"grad_norm": 0.6642070716787235,
"learning_rate": 2.690625249744572e-07,
"loss": 0.4469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23449347913265228,
"step": 3870,
"valid_targets_mean": 4213.8,
"valid_targets_min": 1849
},
{
"epoch": 6.681034482758621,
"grad_norm": 0.915332604744956,
"learning_rate": 2.551895100572566e-07,
"loss": 0.4496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29583102464675903,
"step": 3875,
"valid_targets_mean": 2902.1,
"valid_targets_min": 1314
},
{
"epoch": 6.689655172413794,
"grad_norm": 0.8360269400695622,
"learning_rate": 2.4168137926506854e-07,
"loss": 0.455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2830885648727417,
"step": 3880,
"valid_targets_mean": 2553.8,
"valid_targets_min": 724
},
{
"epoch": 6.698275862068965,
"grad_norm": 0.6291602674642697,
"learning_rate": 2.2853838222817616e-07,
"loss": 0.4299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1453477144241333,
"step": 3885,
"valid_targets_mean": 3349.6,
"valid_targets_min": 1724
},
{
"epoch": 6.706896551724138,
"grad_norm": 0.6820000274820427,
"learning_rate": 2.1576076182917794e-07,
"loss": 0.4197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21681362390518188,
"step": 3890,
"valid_targets_mean": 3162.0,
"valid_targets_min": 545
},
{
"epoch": 6.7155172413793105,
"grad_norm": 0.7987024941251497,
"learning_rate": 2.0334875419851573e-07,
"loss": 0.4558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1824357658624649,
"step": 3895,
"valid_targets_mean": 2830.0,
"valid_targets_min": 616
},
{
"epoch": 6.724137931034483,
"grad_norm": 0.8215637161827768,
"learning_rate": 1.9130258871011165e-07,
"loss": 0.4713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18571743369102478,
"step": 3900,
"valid_targets_mean": 2641.1,
"valid_targets_min": 1586
},
{
"epoch": 6.732758620689655,
"grad_norm": 0.6581754518761841,
"learning_rate": 1.7962248797711356e-07,
"loss": 0.4888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15917380154132843,
"step": 3905,
"valid_targets_mean": 2697.8,
"valid_targets_min": 1491
},
{
"epoch": 6.741379310344827,
"grad_norm": 0.8997760891262785,
"learning_rate": 1.683086678478074e-07,
"loss": 0.4441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23729611933231354,
"step": 3910,
"valid_targets_mean": 2189.0,
"valid_targets_min": 489
},
{
"epoch": 6.75,
"grad_norm": 0.690128316353554,
"learning_rate": 1.573613374015981e-07,
"loss": 0.4293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21301250159740448,
"step": 3915,
"valid_targets_mean": 3811.6,
"valid_targets_min": 787
},
{
"epoch": 6.758620689655173,
"grad_norm": 0.783312423194326,
"learning_rate": 1.4678069894517033e-07,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18273267149925232,
"step": 3920,
"valid_targets_mean": 2392.5,
"valid_targets_min": 544
},
{
"epoch": 6.767241379310345,
"grad_norm": 0.5708162729229475,
"learning_rate": 1.3656694800873614e-07,
"loss": 0.4403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26748549938201904,
"step": 3925,
"valid_targets_mean": 6344.1,
"valid_targets_min": 2684
},
{
"epoch": 6.775862068965517,
"grad_norm": 0.7851430882153787,
"learning_rate": 1.2672027334242887e-07,
"loss": 0.4679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24374479055404663,
"step": 3930,
"valid_targets_mean": 3370.4,
"valid_targets_min": 1127
},
{
"epoch": 6.7844827586206895,
"grad_norm": 0.8589422933193868,
"learning_rate": 1.1724085691280806e-07,
"loss": 0.4484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15478235483169556,
"step": 3935,
"valid_targets_mean": 1799.1,
"valid_targets_min": 701
},
{
"epoch": 6.793103448275862,
"grad_norm": 0.7017426303676837,
"learning_rate": 1.0812887389950233e-07,
"loss": 0.4769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1417360007762909,
"step": 3940,
"valid_targets_mean": 2816.0,
"valid_targets_min": 394
},
{
"epoch": 6.801724137931035,
"grad_norm": 0.7320585288066113,
"learning_rate": 9.938449269197181e-08,
"loss": 0.4539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23600172996520996,
"step": 3945,
"valid_targets_mean": 3293.9,
"valid_targets_min": 1581
},
{
"epoch": 6.810344827586206,
"grad_norm": 0.7865361114606387,
"learning_rate": 9.100787488639295e-08,
"loss": 0.4737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16835284233093262,
"step": 3950,
"valid_targets_mean": 2500.4,
"valid_targets_min": 1075
},
{
"epoch": 6.818965517241379,
"grad_norm": 0.7598474628110911,
"learning_rate": 8.299917528267198e-08,
"loss": 0.4376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23328222334384918,
"step": 3955,
"valid_targets_mean": 3315.4,
"valid_targets_min": 1230
},
{
"epoch": 6.827586206896552,
"grad_norm": 0.6922186966361085,
"learning_rate": 7.535854188159164e-08,
"loss": 0.4561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22030378878116608,
"step": 3960,
"valid_targets_mean": 4447.1,
"valid_targets_min": 1842
},
{
"epoch": 6.836206896551724,
"grad_norm": 0.7934710758265647,
"learning_rate": 6.808611588206448e-08,
"loss": 0.4398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18129822611808777,
"step": 3965,
"valid_targets_mean": 2330.4,
"valid_targets_min": 696
},
{
"epoch": 6.844827586206897,
"grad_norm": 0.776583820755344,
"learning_rate": 6.11820316785372e-08,
"loss": 0.4452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13943791389465332,
"step": 3970,
"valid_targets_mean": 1962.6,
"valid_targets_min": 479
},
{
"epoch": 6.853448275862069,
"grad_norm": 0.7680731809453211,
"learning_rate": 5.464641685849259e-08,
"loss": 0.4619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3107728958129883,
"step": 3975,
"valid_targets_mean": 3925.5,
"valid_targets_min": 1400
},
{
"epoch": 6.862068965517241,
"grad_norm": 0.769315800681628,
"learning_rate": 4.8479392200100336e-08,
"loss": 0.4535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2647784352302551,
"step": 3980,
"valid_targets_mean": 3176.2,
"valid_targets_min": 450
},
{
"epoch": 6.870689655172414,
"grad_norm": 0.754287459757374,
"learning_rate": 4.268107166998769e-08,
"loss": 0.4386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20756995677947998,
"step": 3985,
"valid_targets_mean": 4493.1,
"valid_targets_min": 1858
},
{
"epoch": 6.879310344827586,
"grad_norm": 0.9099113076711162,
"learning_rate": 3.7251562421123375e-08,
"loss": 0.403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22244426608085632,
"step": 3990,
"valid_targets_mean": 2582.2,
"valid_targets_min": 379
},
{
"epoch": 6.887931034482759,
"grad_norm": 0.6508460492899365,
"learning_rate": 3.219096479084804e-08,
"loss": 0.4508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32543838024139404,
"step": 3995,
"valid_targets_mean": 5302.9,
"valid_targets_min": 1996
},
{
"epoch": 6.896551724137931,
"grad_norm": 0.6718668504076304,
"learning_rate": 2.749937229901134e-08,
"loss": 0.4699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28725236654281616,
"step": 4000,
"valid_targets_mean": 4658.1,
"valid_targets_min": 1064
},
{
"epoch": 6.905172413793103,
"grad_norm": 0.6116223856311377,
"learning_rate": 2.317687164624882e-08,
"loss": 0.4503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.211561381816864,
"step": 4005,
"valid_targets_mean": 5063.1,
"valid_targets_min": 1967
},
{
"epoch": 6.913793103448276,
"grad_norm": 0.8881826270754143,
"learning_rate": 1.9223542712381026e-08,
"loss": 0.459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2072024941444397,
"step": 4010,
"valid_targets_mean": 2485.4,
"valid_targets_min": 615
},
{
"epoch": 6.922413793103448,
"grad_norm": 0.8659801226831524,
"learning_rate": 1.563945855492799e-08,
"loss": 0.4907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39161914587020874,
"step": 4015,
"valid_targets_mean": 3150.6,
"valid_targets_min": 955
},
{
"epoch": 6.931034482758621,
"grad_norm": 0.80563907343615,
"learning_rate": 1.242468540777253e-08,
"loss": 0.4357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18695054948329926,
"step": 4020,
"valid_targets_mean": 2511.8,
"valid_targets_min": 328
},
{
"epoch": 6.939655172413794,
"grad_norm": 0.6738769628962994,
"learning_rate": 9.579282679927915e-09,
"loss": 0.4729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2548571825027466,
"step": 4025,
"valid_targets_mean": 4149.2,
"valid_targets_min": 1536
},
{
"epoch": 6.948275862068965,
"grad_norm": 0.6701279131603821,
"learning_rate": 7.1033029544365085e-09,
"loss": 0.4602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15617677569389343,
"step": 4030,
"valid_targets_mean": 3156.2,
"valid_targets_min": 534
},
{
"epoch": 6.956896551724138,
"grad_norm": 0.7093717573267669,
"learning_rate": 4.996791987410543e-09,
"loss": 0.4497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2574841380119324,
"step": 4035,
"valid_targets_mean": 3534.9,
"valid_targets_min": 524
},
{
"epoch": 6.9655172413793105,
"grad_norm": 0.7332674589011584,
"learning_rate": 3.2597887071750266e-09,
"loss": 0.4585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26754799485206604,
"step": 4040,
"valid_targets_mean": 4100.1,
"valid_targets_min": 656
},
{
"epoch": 6.974137931034483,
"grad_norm": 0.6754420334215917,
"learning_rate": 1.892325213552759e-09,
"loss": 0.4722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21604621410369873,
"step": 4045,
"valid_targets_mean": 3842.0,
"valid_targets_min": 805
},
{
"epoch": 6.982758620689655,
"grad_norm": 0.6285696246936402,
"learning_rate": 8.944267772692527e-10,
"loss": 0.4513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1556059867143631,
"step": 4050,
"valid_targets_mean": 2972.5,
"valid_targets_min": 1132
},
{
"epoch": 6.991379310344827,
"grad_norm": 0.8528056566558939,
"learning_rate": 2.66111839490879e-10,
"loss": 0.4412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22985875606536865,
"step": 4055,
"valid_targets_mean": 2739.5,
"valid_targets_min": 1285
},
{
"epoch": 7.0,
"grad_norm": 0.7150700292512204,
"learning_rate": 7.392011478479787e-12,
"loss": 0.4477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25698769092559814,
"step": 4060,
"valid_targets_mean": 3496.4,
"valid_targets_min": 809
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25698769092559814,
"step": 4060,
"total_flos": 1.0409209055737283e+18,
"train_loss": 0.5224247261221185,
"train_runtime": 35382.8947,
"train_samples_per_second": 1.835,
"train_steps_per_second": 0.115,
"valid_targets_mean": 3496.4,
"valid_targets_min": 809
}
],
"logging_steps": 5,
"max_steps": 4060,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 600,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.0409209055737283e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}