| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 6712, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.005216484089723527, |
| "grad_norm": 11.24254837639787, |
| "learning_rate": 2.3809523809523811e-07, |
| "loss": 0.6831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.352985143661499, |
| "step": 5, |
| "valid_targets_mean": 5016.1, |
| "valid_targets_min": 3449 |
| }, |
| { |
| "epoch": 0.010432968179447054, |
| "grad_norm": 11.232055207273655, |
| "learning_rate": 5.357142857142857e-07, |
| "loss": 0.7003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3600406050682068, |
| "step": 10, |
| "valid_targets_mean": 4135.8, |
| "valid_targets_min": 2157 |
| }, |
| { |
| "epoch": 0.01564945226917058, |
| "grad_norm": 11.366410871408558, |
| "learning_rate": 8.333333333333333e-07, |
| "loss": 0.6785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33216580748558044, |
| "step": 15, |
| "valid_targets_mean": 4791.5, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 0.020865936358894107, |
| "grad_norm": 10.34808092771311, |
| "learning_rate": 1.130952380952381e-06, |
| "loss": 0.6848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3293125033378601, |
| "step": 20, |
| "valid_targets_mean": 5037.9, |
| "valid_targets_min": 2294 |
| }, |
| { |
| "epoch": 0.02608242044861763, |
| "grad_norm": 7.6077329183534355, |
| "learning_rate": 1.4285714285714286e-06, |
| "loss": 0.6608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3203168511390686, |
| "step": 25, |
| "valid_targets_mean": 4165.8, |
| "valid_targets_min": 1328 |
| }, |
| { |
| "epoch": 0.03129890453834116, |
| "grad_norm": 5.405083399889847, |
| "learning_rate": 1.7261904761904764e-06, |
| "loss": 0.6115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2907986044883728, |
| "step": 30, |
| "valid_targets_mean": 5063.2, |
| "valid_targets_min": 2066 |
| }, |
| { |
| "epoch": 0.036515388628064686, |
| "grad_norm": 3.9727593664560845, |
| "learning_rate": 2.023809523809524e-06, |
| "loss": 0.5967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2616725265979767, |
| "step": 35, |
| "valid_targets_mean": 5020.9, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 0.041731872717788214, |
| "grad_norm": 4.2532153338984795, |
| "learning_rate": 2.321428571428572e-06, |
| "loss": 0.5382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24420849978923798, |
| "step": 40, |
| "valid_targets_mean": 3708.5, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 0.046948356807511735, |
| "grad_norm": 2.934457351095903, |
| "learning_rate": 2.6190476190476192e-06, |
| "loss": 0.5187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24222546815872192, |
| "step": 45, |
| "valid_targets_mean": 5127.6, |
| "valid_targets_min": 2067 |
| }, |
| { |
| "epoch": 0.05216484089723526, |
| "grad_norm": 1.8853061847111383, |
| "learning_rate": 2.916666666666667e-06, |
| "loss": 0.5205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.252302885055542, |
| "step": 50, |
| "valid_targets_mean": 4483.6, |
| "valid_targets_min": 2124 |
| }, |
| { |
| "epoch": 0.05738132498695879, |
| "grad_norm": 1.4677384311186294, |
| "learning_rate": 3.2142857142857147e-06, |
| "loss": 0.4809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18407613039016724, |
| "step": 55, |
| "valid_targets_mean": 3567.4, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 0.06259780907668232, |
| "grad_norm": 1.120364963485017, |
| "learning_rate": 3.511904761904762e-06, |
| "loss": 0.4447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22264821827411652, |
| "step": 60, |
| "valid_targets_mean": 3878.1, |
| "valid_targets_min": 1741 |
| }, |
| { |
| "epoch": 0.06781429316640585, |
| "grad_norm": 0.840971856813474, |
| "learning_rate": 3.80952380952381e-06, |
| "loss": 0.4575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23368576169013977, |
| "step": 65, |
| "valid_targets_mean": 5164.6, |
| "valid_targets_min": 2130 |
| }, |
| { |
| "epoch": 0.07303077725612937, |
| "grad_norm": 0.8384789308765538, |
| "learning_rate": 4.107142857142857e-06, |
| "loss": 0.4306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20054024457931519, |
| "step": 70, |
| "valid_targets_mean": 5614.9, |
| "valid_targets_min": 2491 |
| }, |
| { |
| "epoch": 0.0782472613458529, |
| "grad_norm": 0.6385587472558049, |
| "learning_rate": 4.404761904761905e-06, |
| "loss": 0.4176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22027632594108582, |
| "step": 75, |
| "valid_targets_mean": 6077.4, |
| "valid_targets_min": 2913 |
| }, |
| { |
| "epoch": 0.08346374543557643, |
| "grad_norm": 0.6630664582444133, |
| "learning_rate": 4.702380952380953e-06, |
| "loss": 0.4129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19254867732524872, |
| "step": 80, |
| "valid_targets_mean": 3906.9, |
| "valid_targets_min": 2090 |
| }, |
| { |
| "epoch": 0.08868022952529994, |
| "grad_norm": 0.6786403833983912, |
| "learning_rate": 5e-06, |
| "loss": 0.4207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23695020377635956, |
| "step": 85, |
| "valid_targets_mean": 5569.6, |
| "valid_targets_min": 3740 |
| }, |
| { |
| "epoch": 0.09389671361502347, |
| "grad_norm": 0.6184877623015653, |
| "learning_rate": 5.297619047619048e-06, |
| "loss": 0.4219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19551850855350494, |
| "step": 90, |
| "valid_targets_mean": 4397.8, |
| "valid_targets_min": 2423 |
| }, |
| { |
| "epoch": 0.099113197704747, |
| "grad_norm": 0.7103317313757143, |
| "learning_rate": 5.595238095238096e-06, |
| "loss": 0.4175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23150977492332458, |
| "step": 95, |
| "valid_targets_mean": 4499.1, |
| "valid_targets_min": 2100 |
| }, |
| { |
| "epoch": 0.10432968179447052, |
| "grad_norm": 0.6478165702052965, |
| "learning_rate": 5.892857142857144e-06, |
| "loss": 0.3957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18475624918937683, |
| "step": 100, |
| "valid_targets_mean": 3931.0, |
| "valid_targets_min": 1857 |
| }, |
| { |
| "epoch": 0.10954616588419405, |
| "grad_norm": 1.592022317536399, |
| "learning_rate": 6.1904761904761914e-06, |
| "loss": 0.3929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21138747036457062, |
| "step": 105, |
| "valid_targets_mean": 4803.2, |
| "valid_targets_min": 3210 |
| }, |
| { |
| "epoch": 0.11476264997391758, |
| "grad_norm": 0.5508085022135111, |
| "learning_rate": 6.488095238095239e-06, |
| "loss": 0.3684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21324364840984344, |
| "step": 110, |
| "valid_targets_mean": 5535.6, |
| "valid_targets_min": 2106 |
| }, |
| { |
| "epoch": 0.11997913406364111, |
| "grad_norm": 0.6710255867894759, |
| "learning_rate": 6.785714285714287e-06, |
| "loss": 0.3882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21487626433372498, |
| "step": 115, |
| "valid_targets_mean": 5593.4, |
| "valid_targets_min": 3020 |
| }, |
| { |
| "epoch": 0.12519561815336464, |
| "grad_norm": 0.6555896961622583, |
| "learning_rate": 7.083333333333335e-06, |
| "loss": 0.3719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.200883150100708, |
| "step": 120, |
| "valid_targets_mean": 4099.2, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 0.13041210224308816, |
| "grad_norm": 0.6368436071225058, |
| "learning_rate": 7.380952380952382e-06, |
| "loss": 0.3772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2024303674697876, |
| "step": 125, |
| "valid_targets_mean": 4552.5, |
| "valid_targets_min": 2219 |
| }, |
| { |
| "epoch": 0.1356285863328117, |
| "grad_norm": 0.6426147411338267, |
| "learning_rate": 7.67857142857143e-06, |
| "loss": 0.3617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19902446866035461, |
| "step": 130, |
| "valid_targets_mean": 4261.1, |
| "valid_targets_min": 1714 |
| }, |
| { |
| "epoch": 0.14084507042253522, |
| "grad_norm": 0.5425425596699449, |
| "learning_rate": 7.976190476190477e-06, |
| "loss": 0.3637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1794453263282776, |
| "step": 135, |
| "valid_targets_mean": 4941.1, |
| "valid_targets_min": 2717 |
| }, |
| { |
| "epoch": 0.14606155451225875, |
| "grad_norm": 0.6099519495344266, |
| "learning_rate": 8.273809523809523e-06, |
| "loss": 0.3636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20556297898292542, |
| "step": 140, |
| "valid_targets_mean": 5149.0, |
| "valid_targets_min": 2683 |
| }, |
| { |
| "epoch": 0.15127803860198227, |
| "grad_norm": 0.5616784883743269, |
| "learning_rate": 8.571428571428571e-06, |
| "loss": 0.3737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20041660964488983, |
| "step": 145, |
| "valid_targets_mean": 4993.5, |
| "valid_targets_min": 2369 |
| }, |
| { |
| "epoch": 0.1564945226917058, |
| "grad_norm": 0.573865959626073, |
| "learning_rate": 8.869047619047619e-06, |
| "loss": 0.3732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1961544007062912, |
| "step": 150, |
| "valid_targets_mean": 6082.9, |
| "valid_targets_min": 3402 |
| }, |
| { |
| "epoch": 0.16171100678142933, |
| "grad_norm": 0.6318893370099948, |
| "learning_rate": 9.166666666666666e-06, |
| "loss": 0.3748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1895100474357605, |
| "step": 155, |
| "valid_targets_mean": 5077.5, |
| "valid_targets_min": 2645 |
| }, |
| { |
| "epoch": 0.16692749087115286, |
| "grad_norm": 0.62541969323896, |
| "learning_rate": 9.464285714285714e-06, |
| "loss": 0.3582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16339033842086792, |
| "step": 160, |
| "valid_targets_mean": 4114.4, |
| "valid_targets_min": 1777 |
| }, |
| { |
| "epoch": 0.17214397496087636, |
| "grad_norm": 0.5606657840484052, |
| "learning_rate": 9.761904761904762e-06, |
| "loss": 0.3576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15099817514419556, |
| "step": 165, |
| "valid_targets_mean": 5019.4, |
| "valid_targets_min": 2033 |
| }, |
| { |
| "epoch": 0.17736045905059988, |
| "grad_norm": 0.5365733878219655, |
| "learning_rate": 1.005952380952381e-05, |
| "loss": 0.3433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16473634541034698, |
| "step": 170, |
| "valid_targets_mean": 5306.1, |
| "valid_targets_min": 1850 |
| }, |
| { |
| "epoch": 0.1825769431403234, |
| "grad_norm": 0.7029064378668989, |
| "learning_rate": 1.0357142857142859e-05, |
| "loss": 0.3407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17407193779945374, |
| "step": 175, |
| "valid_targets_mean": 4721.5, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 0.18779342723004694, |
| "grad_norm": 0.48456037806978225, |
| "learning_rate": 1.0654761904761905e-05, |
| "loss": 0.3143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16871285438537598, |
| "step": 180, |
| "valid_targets_mean": 5911.6, |
| "valid_targets_min": 3213 |
| }, |
| { |
| "epoch": 0.19300991131977047, |
| "grad_norm": 0.585313639557234, |
| "learning_rate": 1.0952380952380955e-05, |
| "loss": 0.3511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16843539476394653, |
| "step": 185, |
| "valid_targets_mean": 4861.0, |
| "valid_targets_min": 1564 |
| }, |
| { |
| "epoch": 0.198226395409494, |
| "grad_norm": 0.6211861060913116, |
| "learning_rate": 1.125e-05, |
| "loss": 0.3413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20040014386177063, |
| "step": 190, |
| "valid_targets_mean": 5177.6, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 0.20344287949921752, |
| "grad_norm": 0.5808811625651205, |
| "learning_rate": 1.1547619047619047e-05, |
| "loss": 0.3356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14674122631549835, |
| "step": 195, |
| "valid_targets_mean": 4242.0, |
| "valid_targets_min": 1649 |
| }, |
| { |
| "epoch": 0.20865936358894105, |
| "grad_norm": 0.6379936783242135, |
| "learning_rate": 1.1845238095238096e-05, |
| "loss": 0.3501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1750584840774536, |
| "step": 200, |
| "valid_targets_mean": 5140.6, |
| "valid_targets_min": 2976 |
| }, |
| { |
| "epoch": 0.21387584767866458, |
| "grad_norm": 0.6471244895039363, |
| "learning_rate": 1.2142857142857142e-05, |
| "loss": 0.3436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21840491890907288, |
| "step": 205, |
| "valid_targets_mean": 4205.1, |
| "valid_targets_min": 1637 |
| }, |
| { |
| "epoch": 0.2190923317683881, |
| "grad_norm": 0.6649540245139282, |
| "learning_rate": 1.2440476190476192e-05, |
| "loss": 0.3544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17277714610099792, |
| "step": 210, |
| "valid_targets_mean": 3557.8, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 0.22430881585811163, |
| "grad_norm": 0.5805068966151554, |
| "learning_rate": 1.2738095238095238e-05, |
| "loss": 0.3353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1522510051727295, |
| "step": 215, |
| "valid_targets_mean": 5786.1, |
| "valid_targets_min": 4208 |
| }, |
| { |
| "epoch": 0.22952529994783516, |
| "grad_norm": 0.5651854016863527, |
| "learning_rate": 1.3035714285714287e-05, |
| "loss": 0.3381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1737382411956787, |
| "step": 220, |
| "valid_targets_mean": 5721.5, |
| "valid_targets_min": 4956 |
| }, |
| { |
| "epoch": 0.2347417840375587, |
| "grad_norm": 0.5575886336701769, |
| "learning_rate": 1.3333333333333333e-05, |
| "loss": 0.3339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1307171881198883, |
| "step": 225, |
| "valid_targets_mean": 4515.4, |
| "valid_targets_min": 2175 |
| }, |
| { |
| "epoch": 0.23995826812728221, |
| "grad_norm": 0.5292908481239273, |
| "learning_rate": 1.3630952380952383e-05, |
| "loss": 0.3447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17313320934772491, |
| "step": 230, |
| "valid_targets_mean": 6369.9, |
| "valid_targets_min": 2012 |
| }, |
| { |
| "epoch": 0.24517475221700574, |
| "grad_norm": 0.6057809728782292, |
| "learning_rate": 1.3928571428571429e-05, |
| "loss": 0.3379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14974744617938995, |
| "step": 235, |
| "valid_targets_mean": 3524.4, |
| "valid_targets_min": 1512 |
| }, |
| { |
| "epoch": 0.25039123630672927, |
| "grad_norm": 0.5217173574795259, |
| "learning_rate": 1.4226190476190478e-05, |
| "loss": 0.3374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1415945291519165, |
| "step": 240, |
| "valid_targets_mean": 4837.8, |
| "valid_targets_min": 1942 |
| }, |
| { |
| "epoch": 0.2556077203964528, |
| "grad_norm": 0.5804691857168636, |
| "learning_rate": 1.4523809523809524e-05, |
| "loss": 0.3362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14725586771965027, |
| "step": 245, |
| "valid_targets_mean": 4438.8, |
| "valid_targets_min": 2127 |
| }, |
| { |
| "epoch": 0.2608242044861763, |
| "grad_norm": 0.47455922996119354, |
| "learning_rate": 1.4821428571428574e-05, |
| "loss": 0.3158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1384584605693817, |
| "step": 250, |
| "valid_targets_mean": 6362.5, |
| "valid_targets_min": 4182 |
| }, |
| { |
| "epoch": 0.26604068857589985, |
| "grad_norm": 0.5283181886582033, |
| "learning_rate": 1.511904761904762e-05, |
| "loss": 0.3381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14814651012420654, |
| "step": 255, |
| "valid_targets_mean": 5219.5, |
| "valid_targets_min": 1846 |
| }, |
| { |
| "epoch": 0.2712571726656234, |
| "grad_norm": 0.5121560567291197, |
| "learning_rate": 1.5416666666666668e-05, |
| "loss": 0.3339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15080620348453522, |
| "step": 260, |
| "valid_targets_mean": 5809.4, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 0.2764736567553469, |
| "grad_norm": 0.5935465658304162, |
| "learning_rate": 1.5714285714285715e-05, |
| "loss": 0.3154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1419353485107422, |
| "step": 265, |
| "valid_targets_mean": 5533.5, |
| "valid_targets_min": 1370 |
| }, |
| { |
| "epoch": 0.28169014084507044, |
| "grad_norm": 0.5083365742176544, |
| "learning_rate": 1.6011904761904763e-05, |
| "loss": 0.3314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14203351736068726, |
| "step": 270, |
| "valid_targets_mean": 4847.2, |
| "valid_targets_min": 1625 |
| }, |
| { |
| "epoch": 0.28690662493479396, |
| "grad_norm": 0.710129632830787, |
| "learning_rate": 1.630952380952381e-05, |
| "loss": 0.297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13648484647274017, |
| "step": 275, |
| "valid_targets_mean": 5074.6, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 0.2921231090245175, |
| "grad_norm": 0.6543408417526709, |
| "learning_rate": 1.660714285714286e-05, |
| "loss": 0.3253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14508678019046783, |
| "step": 280, |
| "valid_targets_mean": 5268.5, |
| "valid_targets_min": 2041 |
| }, |
| { |
| "epoch": 0.297339593114241, |
| "grad_norm": 0.6418915878980699, |
| "learning_rate": 1.6904761904761906e-05, |
| "loss": 0.3175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18109339475631714, |
| "step": 285, |
| "valid_targets_mean": 4462.6, |
| "valid_targets_min": 2442 |
| }, |
| { |
| "epoch": 0.30255607720396455, |
| "grad_norm": 0.6194921336607193, |
| "learning_rate": 1.7202380952380954e-05, |
| "loss": 0.326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1862541139125824, |
| "step": 290, |
| "valid_targets_mean": 4875.8, |
| "valid_targets_min": 1394 |
| }, |
| { |
| "epoch": 0.3077725612936881, |
| "grad_norm": 0.5319603288677237, |
| "learning_rate": 1.7500000000000002e-05, |
| "loss": 0.317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17491722106933594, |
| "step": 295, |
| "valid_targets_mean": 6071.2, |
| "valid_targets_min": 3280 |
| }, |
| { |
| "epoch": 0.3129890453834116, |
| "grad_norm": 0.6186814249083511, |
| "learning_rate": 1.779761904761905e-05, |
| "loss": 0.3331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18440985679626465, |
| "step": 300, |
| "valid_targets_mean": 5409.8, |
| "valid_targets_min": 2536 |
| }, |
| { |
| "epoch": 0.31820552947313513, |
| "grad_norm": 0.5355216263580986, |
| "learning_rate": 1.8095238095238097e-05, |
| "loss": 0.3151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1482452005147934, |
| "step": 305, |
| "valid_targets_mean": 5292.5, |
| "valid_targets_min": 1908 |
| }, |
| { |
| "epoch": 0.32342201356285866, |
| "grad_norm": 0.6241421491249363, |
| "learning_rate": 1.8392857142857142e-05, |
| "loss": 0.3098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17003270983695984, |
| "step": 310, |
| "valid_targets_mean": 3620.0, |
| "valid_targets_min": 2145 |
| }, |
| { |
| "epoch": 0.3286384976525822, |
| "grad_norm": 0.5381406797781704, |
| "learning_rate": 1.8690476190476193e-05, |
| "loss": 0.321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20382024347782135, |
| "step": 315, |
| "valid_targets_mean": 6635.0, |
| "valid_targets_min": 1875 |
| }, |
| { |
| "epoch": 0.3338549817423057, |
| "grad_norm": 0.5140255577789234, |
| "learning_rate": 1.8988095238095237e-05, |
| "loss": 0.3141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13623102009296417, |
| "step": 320, |
| "valid_targets_mean": 5313.2, |
| "valid_targets_min": 3440 |
| }, |
| { |
| "epoch": 0.33907146583202924, |
| "grad_norm": 0.5490101147993109, |
| "learning_rate": 1.928571428571429e-05, |
| "loss": 0.3098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1648813635110855, |
| "step": 325, |
| "valid_targets_mean": 5498.0, |
| "valid_targets_min": 2695 |
| }, |
| { |
| "epoch": 0.3442879499217527, |
| "grad_norm": 0.5244338139150616, |
| "learning_rate": 1.9583333333333333e-05, |
| "loss": 0.314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14053672552108765, |
| "step": 330, |
| "valid_targets_mean": 4315.6, |
| "valid_targets_min": 1711 |
| }, |
| { |
| "epoch": 0.34950443401147624, |
| "grad_norm": 0.5313860431206892, |
| "learning_rate": 1.9880952380952384e-05, |
| "loss": 0.3021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14705346524715424, |
| "step": 335, |
| "valid_targets_mean": 5682.1, |
| "valid_targets_min": 2366 |
| }, |
| { |
| "epoch": 0.35472091810119977, |
| "grad_norm": 0.5517836053206827, |
| "learning_rate": 2.0178571428571428e-05, |
| "loss": 0.3178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14730581641197205, |
| "step": 340, |
| "valid_targets_mean": 4762.9, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 0.3599374021909233, |
| "grad_norm": 0.5873148919465628, |
| "learning_rate": 2.0476190476190476e-05, |
| "loss": 0.3063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14816001057624817, |
| "step": 345, |
| "valid_targets_mean": 4330.0, |
| "valid_targets_min": 1916 |
| }, |
| { |
| "epoch": 0.3651538862806468, |
| "grad_norm": 0.5868340714087114, |
| "learning_rate": 2.0773809523809527e-05, |
| "loss": 0.3276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15234585106372833, |
| "step": 350, |
| "valid_targets_mean": 4120.2, |
| "valid_targets_min": 2846 |
| }, |
| { |
| "epoch": 0.37037037037037035, |
| "grad_norm": 0.5889924742292431, |
| "learning_rate": 2.1071428571428575e-05, |
| "loss": 0.3054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1578396111726761, |
| "step": 355, |
| "valid_targets_mean": 3943.8, |
| "valid_targets_min": 1624 |
| }, |
| { |
| "epoch": 0.3755868544600939, |
| "grad_norm": 0.5327053695279573, |
| "learning_rate": 2.136904761904762e-05, |
| "loss": 0.318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13582128286361694, |
| "step": 360, |
| "valid_targets_mean": 4614.1, |
| "valid_targets_min": 1073 |
| }, |
| { |
| "epoch": 0.3808033385498174, |
| "grad_norm": 0.5987827349693853, |
| "learning_rate": 2.1666666666666667e-05, |
| "loss": 0.2898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16083483397960663, |
| "step": 365, |
| "valid_targets_mean": 5879.5, |
| "valid_targets_min": 3184 |
| }, |
| { |
| "epoch": 0.38601982263954093, |
| "grad_norm": 0.5399690497041971, |
| "learning_rate": 2.1964285714285718e-05, |
| "loss": 0.3175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14316409826278687, |
| "step": 370, |
| "valid_targets_mean": 5359.6, |
| "valid_targets_min": 2062 |
| }, |
| { |
| "epoch": 0.39123630672926446, |
| "grad_norm": 0.45995926795020464, |
| "learning_rate": 2.2261904761904766e-05, |
| "loss": 0.3078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12717297673225403, |
| "step": 375, |
| "valid_targets_mean": 5594.1, |
| "valid_targets_min": 2426 |
| }, |
| { |
| "epoch": 0.396452790818988, |
| "grad_norm": 0.579643544005563, |
| "learning_rate": 2.255952380952381e-05, |
| "loss": 0.3179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15679344534873962, |
| "step": 380, |
| "valid_targets_mean": 4358.9, |
| "valid_targets_min": 1152 |
| }, |
| { |
| "epoch": 0.4016692749087115, |
| "grad_norm": 0.5444834444148753, |
| "learning_rate": 2.2857142857142858e-05, |
| "loss": 0.3077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1315690577030182, |
| "step": 385, |
| "valid_targets_mean": 4194.0, |
| "valid_targets_min": 2077 |
| }, |
| { |
| "epoch": 0.40688575899843504, |
| "grad_norm": 0.5608144517538177, |
| "learning_rate": 2.315476190476191e-05, |
| "loss": 0.2917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16721805930137634, |
| "step": 390, |
| "valid_targets_mean": 5650.0, |
| "valid_targets_min": 3618 |
| }, |
| { |
| "epoch": 0.41210224308815857, |
| "grad_norm": 0.6559864927637044, |
| "learning_rate": 2.3452380952380957e-05, |
| "loss": 0.3061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18273624777793884, |
| "step": 395, |
| "valid_targets_mean": 4517.8, |
| "valid_targets_min": 1583 |
| }, |
| { |
| "epoch": 0.4173187271778821, |
| "grad_norm": 0.6378535909126191, |
| "learning_rate": 2.375e-05, |
| "loss": 0.3025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16496604681015015, |
| "step": 400, |
| "valid_targets_mean": 5223.9, |
| "valid_targets_min": 1318 |
| }, |
| { |
| "epoch": 0.4225352112676056, |
| "grad_norm": 0.6781104998447693, |
| "learning_rate": 2.404761904761905e-05, |
| "loss": 0.3175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17576375603675842, |
| "step": 405, |
| "valid_targets_mean": 3318.2, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 0.42775169535732915, |
| "grad_norm": 0.5784644184137221, |
| "learning_rate": 2.4345238095238093e-05, |
| "loss": 0.3018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16208800673484802, |
| "step": 410, |
| "valid_targets_mean": 5647.1, |
| "valid_targets_min": 3608 |
| }, |
| { |
| "epoch": 0.4329681794470527, |
| "grad_norm": 0.6573520288389244, |
| "learning_rate": 2.4642857142857145e-05, |
| "loss": 0.3108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17460080981254578, |
| "step": 415, |
| "valid_targets_mean": 4403.0, |
| "valid_targets_min": 2081 |
| }, |
| { |
| "epoch": 0.4381846635367762, |
| "grad_norm": 0.5476098640503447, |
| "learning_rate": 2.4940476190476192e-05, |
| "loss": 0.3039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1501733809709549, |
| "step": 420, |
| "valid_targets_mean": 4802.5, |
| "valid_targets_min": 2261 |
| }, |
| { |
| "epoch": 0.44340114762649974, |
| "grad_norm": 0.5511914866318157, |
| "learning_rate": 2.523809523809524e-05, |
| "loss": 0.284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14066597819328308, |
| "step": 425, |
| "valid_targets_mean": 6033.6, |
| "valid_targets_min": 3444 |
| }, |
| { |
| "epoch": 0.44861763171622326, |
| "grad_norm": 0.5825093311949527, |
| "learning_rate": 2.5535714285714284e-05, |
| "loss": 0.2871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14601226150989532, |
| "step": 430, |
| "valid_targets_mean": 5004.1, |
| "valid_targets_min": 1981 |
| }, |
| { |
| "epoch": 0.4538341158059468, |
| "grad_norm": 0.6225010243591146, |
| "learning_rate": 2.5833333333333336e-05, |
| "loss": 0.3029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14383742213249207, |
| "step": 435, |
| "valid_targets_mean": 5421.5, |
| "valid_targets_min": 2777 |
| }, |
| { |
| "epoch": 0.4590505998956703, |
| "grad_norm": 0.7252997694301736, |
| "learning_rate": 2.6130952380952383e-05, |
| "loss": 0.3038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17696425318717957, |
| "step": 440, |
| "valid_targets_mean": 5086.2, |
| "valid_targets_min": 2096 |
| }, |
| { |
| "epoch": 0.46426708398539385, |
| "grad_norm": 0.6002954989597811, |
| "learning_rate": 2.642857142857143e-05, |
| "loss": 0.3134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1518591344356537, |
| "step": 445, |
| "valid_targets_mean": 4727.5, |
| "valid_targets_min": 2695 |
| }, |
| { |
| "epoch": 0.4694835680751174, |
| "grad_norm": 0.6363078433064229, |
| "learning_rate": 2.6726190476190475e-05, |
| "loss": 0.3026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14227741956710815, |
| "step": 450, |
| "valid_targets_mean": 3842.5, |
| "valid_targets_min": 1852 |
| }, |
| { |
| "epoch": 0.4747000521648409, |
| "grad_norm": 0.6475283887341605, |
| "learning_rate": 2.7023809523809527e-05, |
| "loss": 0.3031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1538422852754593, |
| "step": 455, |
| "valid_targets_mean": 4200.5, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 0.47991653625456443, |
| "grad_norm": 0.6316203448975509, |
| "learning_rate": 2.7321428571428574e-05, |
| "loss": 0.2871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12457837909460068, |
| "step": 460, |
| "valid_targets_mean": 4195.6, |
| "valid_targets_min": 1664 |
| }, |
| { |
| "epoch": 0.48513302034428796, |
| "grad_norm": 0.5453336168892163, |
| "learning_rate": 2.7619047619047622e-05, |
| "loss": 0.2966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14784672856330872, |
| "step": 465, |
| "valid_targets_mean": 5087.2, |
| "valid_targets_min": 1948 |
| }, |
| { |
| "epoch": 0.4903495044340115, |
| "grad_norm": 0.5319864811856899, |
| "learning_rate": 2.7916666666666666e-05, |
| "loss": 0.3105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14754140377044678, |
| "step": 470, |
| "valid_targets_mean": 6058.4, |
| "valid_targets_min": 4615 |
| }, |
| { |
| "epoch": 0.495565988523735, |
| "grad_norm": 0.5747818680084603, |
| "learning_rate": 2.8214285714285718e-05, |
| "loss": 0.297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15875563025474548, |
| "step": 475, |
| "valid_targets_mean": 5760.1, |
| "valid_targets_min": 2787 |
| }, |
| { |
| "epoch": 0.5007824726134585, |
| "grad_norm": 0.537330584769206, |
| "learning_rate": 2.8511904761904765e-05, |
| "loss": 0.2992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13198646903038025, |
| "step": 480, |
| "valid_targets_mean": 5275.2, |
| "valid_targets_min": 3038 |
| }, |
| { |
| "epoch": 0.5059989567031821, |
| "grad_norm": 0.570047820911184, |
| "learning_rate": 2.8809523809523813e-05, |
| "loss": 0.2905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14526161551475525, |
| "step": 485, |
| "valid_targets_mean": 4437.0, |
| "valid_targets_min": 2076 |
| }, |
| { |
| "epoch": 0.5112154407929056, |
| "grad_norm": 0.5424253004654361, |
| "learning_rate": 2.9107142857142857e-05, |
| "loss": 0.2991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13815993070602417, |
| "step": 490, |
| "valid_targets_mean": 4431.6, |
| "valid_targets_min": 1877 |
| }, |
| { |
| "epoch": 0.5164319248826291, |
| "grad_norm": 0.6056196332833156, |
| "learning_rate": 2.940476190476191e-05, |
| "loss": 0.2939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13893744349479675, |
| "step": 495, |
| "valid_targets_mean": 5731.2, |
| "valid_targets_min": 2686 |
| }, |
| { |
| "epoch": 0.5216484089723527, |
| "grad_norm": 0.656594344651998, |
| "learning_rate": 2.9702380952380956e-05, |
| "loss": 0.2919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16237576305866241, |
| "step": 500, |
| "valid_targets_mean": 4444.4, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 0.5268648930620762, |
| "grad_norm": 0.6575613660501014, |
| "learning_rate": 3.0000000000000004e-05, |
| "loss": 0.3041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17889975011348724, |
| "step": 505, |
| "valid_targets_mean": 4299.6, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 0.5320813771517997, |
| "grad_norm": 0.5479096145334218, |
| "learning_rate": 3.029761904761905e-05, |
| "loss": 0.3017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14003689587116241, |
| "step": 510, |
| "valid_targets_mean": 4393.6, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 0.5372978612415232, |
| "grad_norm": 0.5360140658558523, |
| "learning_rate": 3.059523809523809e-05, |
| "loss": 0.2981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12671706080436707, |
| "step": 515, |
| "valid_targets_mean": 4213.6, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 0.5425143453312468, |
| "grad_norm": 0.5819274109832838, |
| "learning_rate": 3.089285714285715e-05, |
| "loss": 0.2809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15547394752502441, |
| "step": 520, |
| "valid_targets_mean": 5292.5, |
| "valid_targets_min": 2411 |
| }, |
| { |
| "epoch": 0.5477308294209703, |
| "grad_norm": 0.6271478607759707, |
| "learning_rate": 3.1190476190476195e-05, |
| "loss": 0.2905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13740107417106628, |
| "step": 525, |
| "valid_targets_mean": 3955.8, |
| "valid_targets_min": 1794 |
| }, |
| { |
| "epoch": 0.5529473135106938, |
| "grad_norm": 0.6144076854065791, |
| "learning_rate": 3.148809523809524e-05, |
| "loss": 0.3015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16323667764663696, |
| "step": 530, |
| "valid_targets_mean": 4617.8, |
| "valid_targets_min": 1360 |
| }, |
| { |
| "epoch": 0.5581637976004173, |
| "grad_norm": 0.5755859874184027, |
| "learning_rate": 3.1785714285714284e-05, |
| "loss": 0.2746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16000992059707642, |
| "step": 535, |
| "valid_targets_mean": 4906.9, |
| "valid_targets_min": 1472 |
| }, |
| { |
| "epoch": 0.5633802816901409, |
| "grad_norm": 0.5841607584218472, |
| "learning_rate": 3.208333333333334e-05, |
| "loss": 0.2917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1828911006450653, |
| "step": 540, |
| "valid_targets_mean": 4911.2, |
| "valid_targets_min": 1598 |
| }, |
| { |
| "epoch": 0.5685967657798644, |
| "grad_norm": 0.6225126753513331, |
| "learning_rate": 3.2380952380952386e-05, |
| "loss": 0.2906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13055923581123352, |
| "step": 545, |
| "valid_targets_mean": 3726.4, |
| "valid_targets_min": 1582 |
| }, |
| { |
| "epoch": 0.5738132498695879, |
| "grad_norm": 0.6692567934262729, |
| "learning_rate": 3.2678571428571434e-05, |
| "loss": 0.2936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15656331181526184, |
| "step": 550, |
| "valid_targets_mean": 4944.5, |
| "valid_targets_min": 2628 |
| }, |
| { |
| "epoch": 0.5790297339593115, |
| "grad_norm": 0.5229234196483743, |
| "learning_rate": 3.2976190476190475e-05, |
| "loss": 0.2877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11388491094112396, |
| "step": 555, |
| "valid_targets_mean": 4577.4, |
| "valid_targets_min": 2796 |
| }, |
| { |
| "epoch": 0.584246218049035, |
| "grad_norm": 0.6005262130280019, |
| "learning_rate": 3.327380952380953e-05, |
| "loss": 0.2899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1324496865272522, |
| "step": 560, |
| "valid_targets_mean": 4016.9, |
| "valid_targets_min": 1753 |
| }, |
| { |
| "epoch": 0.5894627021387585, |
| "grad_norm": 0.5582592039832068, |
| "learning_rate": 3.357142857142858e-05, |
| "loss": 0.2887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16673031449317932, |
| "step": 565, |
| "valid_targets_mean": 4915.5, |
| "valid_targets_min": 3237 |
| }, |
| { |
| "epoch": 0.594679186228482, |
| "grad_norm": 0.5260273166710314, |
| "learning_rate": 3.386904761904762e-05, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1317315697669983, |
| "step": 570, |
| "valid_targets_mean": 5027.9, |
| "valid_targets_min": 1969 |
| }, |
| { |
| "epoch": 0.5998956703182056, |
| "grad_norm": 0.5868369090440616, |
| "learning_rate": 3.4166666666666666e-05, |
| "loss": 0.303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18660710752010345, |
| "step": 575, |
| "valid_targets_mean": 5281.8, |
| "valid_targets_min": 3504 |
| }, |
| { |
| "epoch": 0.6051121544079291, |
| "grad_norm": 0.9504039681858983, |
| "learning_rate": 3.446428571428572e-05, |
| "loss": 0.3099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1338704526424408, |
| "step": 580, |
| "valid_targets_mean": 3767.8, |
| "valid_targets_min": 1589 |
| }, |
| { |
| "epoch": 0.6103286384976526, |
| "grad_norm": 0.5713320017873411, |
| "learning_rate": 3.476190476190477e-05, |
| "loss": 0.2933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1240009069442749, |
| "step": 585, |
| "valid_targets_mean": 3634.8, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 0.6155451225873761, |
| "grad_norm": 0.5766203236737801, |
| "learning_rate": 3.505952380952381e-05, |
| "loss": 0.2891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1292295604944229, |
| "step": 590, |
| "valid_targets_mean": 4069.0, |
| "valid_targets_min": 1502 |
| }, |
| { |
| "epoch": 0.6207616066770997, |
| "grad_norm": 0.509485527289052, |
| "learning_rate": 3.535714285714286e-05, |
| "loss": 0.297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13671892881393433, |
| "step": 595, |
| "valid_targets_mean": 4888.6, |
| "valid_targets_min": 1856 |
| }, |
| { |
| "epoch": 0.6259780907668232, |
| "grad_norm": 0.5632636770642139, |
| "learning_rate": 3.565476190476191e-05, |
| "loss": 0.3065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1881425380706787, |
| "step": 600, |
| "valid_targets_mean": 5378.8, |
| "valid_targets_min": 1564 |
| }, |
| { |
| "epoch": 0.6311945748565467, |
| "grad_norm": 0.551815417531546, |
| "learning_rate": 3.595238095238096e-05, |
| "loss": 0.278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12198884785175323, |
| "step": 605, |
| "valid_targets_mean": 4786.9, |
| "valid_targets_min": 1645 |
| }, |
| { |
| "epoch": 0.6364110589462703, |
| "grad_norm": 0.6064211172693338, |
| "learning_rate": 3.625e-05, |
| "loss": 0.2959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13710130751132965, |
| "step": 610, |
| "valid_targets_mean": 3977.6, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 0.6416275430359938, |
| "grad_norm": 2.843437049352432, |
| "learning_rate": 3.654761904761905e-05, |
| "loss": 0.284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14728930592536926, |
| "step": 615, |
| "valid_targets_mean": 5308.1, |
| "valid_targets_min": 2902 |
| }, |
| { |
| "epoch": 0.6468440271257173, |
| "grad_norm": 0.5212278169545214, |
| "learning_rate": 3.6845238095238096e-05, |
| "loss": 0.2649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11422304809093475, |
| "step": 620, |
| "valid_targets_mean": 4256.2, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 0.6520605112154408, |
| "grad_norm": 0.6069012446608004, |
| "learning_rate": 3.714285714285715e-05, |
| "loss": 0.2857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11972630023956299, |
| "step": 625, |
| "valid_targets_mean": 3628.0, |
| "valid_targets_min": 1473 |
| }, |
| { |
| "epoch": 0.6572769953051644, |
| "grad_norm": 0.5524190052154624, |
| "learning_rate": 3.744047619047619e-05, |
| "loss": 0.2893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14479461312294006, |
| "step": 630, |
| "valid_targets_mean": 5443.0, |
| "valid_targets_min": 1800 |
| }, |
| { |
| "epoch": 0.6624934793948879, |
| "grad_norm": 0.5939914890338424, |
| "learning_rate": 3.773809523809524e-05, |
| "loss": 0.3049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1578492522239685, |
| "step": 635, |
| "valid_targets_mean": 4863.4, |
| "valid_targets_min": 1855 |
| }, |
| { |
| "epoch": 0.6677099634846114, |
| "grad_norm": 0.5991744292599832, |
| "learning_rate": 3.803571428571429e-05, |
| "loss": 0.2922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15006765723228455, |
| "step": 640, |
| "valid_targets_mean": 4413.6, |
| "valid_targets_min": 1766 |
| }, |
| { |
| "epoch": 0.672926447574335, |
| "grad_norm": 0.5457954762595464, |
| "learning_rate": 3.833333333333334e-05, |
| "loss": 0.2793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14794906973838806, |
| "step": 645, |
| "valid_targets_mean": 6368.5, |
| "valid_targets_min": 4418 |
| }, |
| { |
| "epoch": 0.6781429316640585, |
| "grad_norm": 0.5704049215370746, |
| "learning_rate": 3.863095238095238e-05, |
| "loss": 0.306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14829003810882568, |
| "step": 650, |
| "valid_targets_mean": 4605.2, |
| "valid_targets_min": 3205 |
| }, |
| { |
| "epoch": 0.6833594157537819, |
| "grad_norm": 0.6576815095015953, |
| "learning_rate": 3.892857142857143e-05, |
| "loss": 0.2698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12923435866832733, |
| "step": 655, |
| "valid_targets_mean": 5369.6, |
| "valid_targets_min": 3794 |
| }, |
| { |
| "epoch": 0.6885758998435054, |
| "grad_norm": 0.4740614886361887, |
| "learning_rate": 3.922619047619048e-05, |
| "loss": 0.2791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11359081417322159, |
| "step": 660, |
| "valid_targets_mean": 6124.8, |
| "valid_targets_min": 2690 |
| }, |
| { |
| "epoch": 0.693792383933229, |
| "grad_norm": 0.5956200241918845, |
| "learning_rate": 3.9523809523809526e-05, |
| "loss": 0.2876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1414283812046051, |
| "step": 665, |
| "valid_targets_mean": 4818.5, |
| "valid_targets_min": 2155 |
| }, |
| { |
| "epoch": 0.6990088680229525, |
| "grad_norm": 0.5490856058705245, |
| "learning_rate": 3.982142857142857e-05, |
| "loss": 0.2799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13476689159870148, |
| "step": 670, |
| "valid_targets_mean": 4888.8, |
| "valid_targets_min": 2899 |
| }, |
| { |
| "epoch": 0.704225352112676, |
| "grad_norm": 0.5550928220084757, |
| "learning_rate": 3.999998918212333e-05, |
| "loss": 0.3073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.149751678109169, |
| "step": 675, |
| "valid_targets_mean": 4782.4, |
| "valid_targets_min": 1897 |
| }, |
| { |
| "epoch": 0.7094418362023995, |
| "grad_norm": 0.5885239420736949, |
| "learning_rate": 3.999986748114514e-05, |
| "loss": 0.3034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13731074333190918, |
| "step": 680, |
| "valid_targets_mean": 3692.5, |
| "valid_targets_min": 1406 |
| }, |
| { |
| "epoch": 0.7146583202921231, |
| "grad_norm": 0.60321378124438, |
| "learning_rate": 3.99996105576685e-05, |
| "loss": 0.2849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13662073016166687, |
| "step": 685, |
| "valid_targets_mean": 3336.6, |
| "valid_targets_min": 1719 |
| }, |
| { |
| "epoch": 0.7198748043818466, |
| "grad_norm": 0.5236148500487113, |
| "learning_rate": 3.999921841343052e-05, |
| "loss": 0.2636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13473102450370789, |
| "step": 690, |
| "valid_targets_mean": 5899.0, |
| "valid_targets_min": 1893 |
| }, |
| { |
| "epoch": 0.7250912884715701, |
| "grad_norm": 0.5216261505238765, |
| "learning_rate": 3.999869105108254e-05, |
| "loss": 0.2851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.149178609251976, |
| "step": 695, |
| "valid_targets_mean": 6292.6, |
| "valid_targets_min": 2097 |
| }, |
| { |
| "epoch": 0.7303077725612936, |
| "grad_norm": 0.5072205193470503, |
| "learning_rate": 3.9998028474190154e-05, |
| "loss": 0.2949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1225869357585907, |
| "step": 700, |
| "valid_targets_mean": 4711.9, |
| "valid_targets_min": 1274 |
| }, |
| { |
| "epoch": 0.7355242566510172, |
| "grad_norm": 0.5870083608117771, |
| "learning_rate": 3.999723068723316e-05, |
| "loss": 0.2851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16150489449501038, |
| "step": 705, |
| "valid_targets_mean": 3687.8, |
| "valid_targets_min": 1444 |
| }, |
| { |
| "epoch": 0.7407407407407407, |
| "grad_norm": 0.5716499953461907, |
| "learning_rate": 3.9996297695605534e-05, |
| "loss": 0.2802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14318493008613586, |
| "step": 710, |
| "valid_targets_mean": 4756.6, |
| "valid_targets_min": 2589 |
| }, |
| { |
| "epoch": 0.7459572248304642, |
| "grad_norm": 0.5518834028265162, |
| "learning_rate": 3.999522950561537e-05, |
| "loss": 0.271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15709498524665833, |
| "step": 715, |
| "valid_targets_mean": 5477.6, |
| "valid_targets_min": 2652 |
| }, |
| { |
| "epoch": 0.7511737089201878, |
| "grad_norm": 0.5468921565229283, |
| "learning_rate": 3.999402612448491e-05, |
| "loss": 0.2783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13745816051959991, |
| "step": 720, |
| "valid_targets_mean": 5289.8, |
| "valid_targets_min": 1577 |
| }, |
| { |
| "epoch": 0.7563901930099113, |
| "grad_norm": 0.5341399634224744, |
| "learning_rate": 3.99926875603504e-05, |
| "loss": 0.2947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11996178328990936, |
| "step": 725, |
| "valid_targets_mean": 4295.9, |
| "valid_targets_min": 1978 |
| }, |
| { |
| "epoch": 0.7616066770996348, |
| "grad_norm": 0.5370344491067444, |
| "learning_rate": 3.9991213822262105e-05, |
| "loss": 0.2887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12039448320865631, |
| "step": 730, |
| "valid_targets_mean": 4307.6, |
| "valid_targets_min": 1036 |
| }, |
| { |
| "epoch": 0.7668231611893583, |
| "grad_norm": 0.5654025265803629, |
| "learning_rate": 3.9989604920184215e-05, |
| "loss": 0.2888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16871072351932526, |
| "step": 735, |
| "valid_targets_mean": 4641.4, |
| "valid_targets_min": 2175 |
| }, |
| { |
| "epoch": 0.7720396452790819, |
| "grad_norm": 0.5259197078408168, |
| "learning_rate": 3.99878608649948e-05, |
| "loss": 0.3013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13495999574661255, |
| "step": 740, |
| "valid_targets_mean": 4812.6, |
| "valid_targets_min": 2191 |
| }, |
| { |
| "epoch": 0.7772561293688054, |
| "grad_norm": 1.1255799489662346, |
| "learning_rate": 3.9985981668485694e-05, |
| "loss": 0.2835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14621102809906006, |
| "step": 745, |
| "valid_targets_mean": 5571.9, |
| "valid_targets_min": 2454 |
| }, |
| { |
| "epoch": 0.7824726134585289, |
| "grad_norm": 0.6841805332983792, |
| "learning_rate": 3.9983967343362476e-05, |
| "loss": 0.2813, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1594194769859314, |
| "step": 750, |
| "valid_targets_mean": 4458.8, |
| "valid_targets_min": 2398 |
| }, |
| { |
| "epoch": 0.7876890975482524, |
| "grad_norm": 0.5688763680479169, |
| "learning_rate": 3.998181790324434e-05, |
| "loss": 0.2806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11155922710895538, |
| "step": 755, |
| "valid_targets_mean": 5125.8, |
| "valid_targets_min": 1669 |
| }, |
| { |
| "epoch": 0.792905581637976, |
| "grad_norm": 0.5663799770218837, |
| "learning_rate": 3.997953336266402e-05, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13671280443668365, |
| "step": 760, |
| "valid_targets_mean": 4331.0, |
| "valid_targets_min": 1698 |
| }, |
| { |
| "epoch": 0.7981220657276995, |
| "grad_norm": 0.4994161989543307, |
| "learning_rate": 3.997711373706768e-05, |
| "loss": 0.2781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13220706582069397, |
| "step": 765, |
| "valid_targets_mean": 4664.6, |
| "valid_targets_min": 2156 |
| }, |
| { |
| "epoch": 0.803338549817423, |
| "grad_norm": 0.5643131809161603, |
| "learning_rate": 3.997455904281481e-05, |
| "loss": 0.2793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13809676468372345, |
| "step": 770, |
| "valid_targets_mean": 4958.5, |
| "valid_targets_min": 2016 |
| }, |
| { |
| "epoch": 0.8085550339071466, |
| "grad_norm": 0.5300737652935752, |
| "learning_rate": 3.997186929717814e-05, |
| "loss": 0.2683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.130964994430542, |
| "step": 775, |
| "valid_targets_mean": 5666.2, |
| "valid_targets_min": 2116 |
| }, |
| { |
| "epoch": 0.8137715179968701, |
| "grad_norm": 0.8166695055830062, |
| "learning_rate": 3.996904451834349e-05, |
| "loss": 0.2661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1320631504058838, |
| "step": 780, |
| "valid_targets_mean": 5200.8, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 0.8189880020865936, |
| "grad_norm": 0.543142258456127, |
| "learning_rate": 3.9966084725409675e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1417725682258606, |
| "step": 785, |
| "valid_targets_mean": 5192.5, |
| "valid_targets_min": 2511 |
| }, |
| { |
| "epoch": 0.8242044861763171, |
| "grad_norm": 0.5210956540849055, |
| "learning_rate": 3.996298993838836e-05, |
| "loss": 0.2758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15136831998825073, |
| "step": 790, |
| "valid_targets_mean": 5622.9, |
| "valid_targets_min": 1956 |
| }, |
| { |
| "epoch": 0.8294209702660407, |
| "grad_norm": 0.47514344367102546, |
| "learning_rate": 3.995976017820392e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12267716228961945, |
| "step": 795, |
| "valid_targets_mean": 6080.2, |
| "valid_targets_min": 1678 |
| }, |
| { |
| "epoch": 0.8346374543557642, |
| "grad_norm": 0.5198837968552323, |
| "learning_rate": 3.995639546669331e-05, |
| "loss": 0.2574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12230321764945984, |
| "step": 800, |
| "valid_targets_mean": 5335.1, |
| "valid_targets_min": 2366 |
| }, |
| { |
| "epoch": 0.8398539384454877, |
| "grad_norm": 0.5782590386242095, |
| "learning_rate": 3.995289582660593e-05, |
| "loss": 0.3062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12575706839561462, |
| "step": 805, |
| "valid_targets_mean": 4269.2, |
| "valid_targets_min": 1913 |
| }, |
| { |
| "epoch": 0.8450704225352113, |
| "grad_norm": 0.7226163816777547, |
| "learning_rate": 3.9949261281603415e-05, |
| "loss": 0.2887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16310575604438782, |
| "step": 810, |
| "valid_targets_mean": 4868.8, |
| "valid_targets_min": 2549 |
| }, |
| { |
| "epoch": 0.8502869066249348, |
| "grad_norm": 0.5820788067610744, |
| "learning_rate": 3.9945491856259556e-05, |
| "loss": 0.2742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16203533113002777, |
| "step": 815, |
| "valid_targets_mean": 4391.1, |
| "valid_targets_min": 2389 |
| }, |
| { |
| "epoch": 0.8555033907146583, |
| "grad_norm": 0.4808444611294702, |
| "learning_rate": 3.994158757606009e-05, |
| "loss": 0.2689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12435003370046616, |
| "step": 820, |
| "valid_targets_mean": 6628.9, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 0.8607198748043818, |
| "grad_norm": 0.5317205644416775, |
| "learning_rate": 3.993754846740249e-05, |
| "loss": 0.2749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1366286277770996, |
| "step": 825, |
| "valid_targets_mean": 5113.5, |
| "valid_targets_min": 2620 |
| }, |
| { |
| "epoch": 0.8659363588941054, |
| "grad_norm": 0.514616285975049, |
| "learning_rate": 3.9933374557595875e-05, |
| "loss": 0.2726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14324252307415009, |
| "step": 830, |
| "valid_targets_mean": 5052.0, |
| "valid_targets_min": 1822 |
| }, |
| { |
| "epoch": 0.8711528429838289, |
| "grad_norm": 0.5563820422337162, |
| "learning_rate": 3.992906587486076e-05, |
| "loss": 0.2828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14511628448963165, |
| "step": 835, |
| "valid_targets_mean": 5581.1, |
| "valid_targets_min": 1457 |
| }, |
| { |
| "epoch": 0.8763693270735524, |
| "grad_norm": 0.5721077702569866, |
| "learning_rate": 3.992462244832886e-05, |
| "loss": 0.2944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15223796665668488, |
| "step": 840, |
| "valid_targets_mean": 5086.6, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 0.881585811163276, |
| "grad_norm": 0.5725237613771451, |
| "learning_rate": 3.9920044308042956e-05, |
| "loss": 0.2589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10571226477622986, |
| "step": 845, |
| "valid_targets_mean": 3588.8, |
| "valid_targets_min": 1842 |
| }, |
| { |
| "epoch": 0.8868022952529995, |
| "grad_norm": 0.51365646064338, |
| "learning_rate": 3.991533148495662e-05, |
| "loss": 0.2608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13923339545726776, |
| "step": 850, |
| "valid_targets_mean": 5327.6, |
| "valid_targets_min": 1084 |
| }, |
| { |
| "epoch": 0.892018779342723, |
| "grad_norm": 0.5828963561508581, |
| "learning_rate": 3.991048401093405e-05, |
| "loss": 0.2822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13550780713558197, |
| "step": 855, |
| "valid_targets_mean": 4516.8, |
| "valid_targets_min": 1461 |
| }, |
| { |
| "epoch": 0.8972352634324465, |
| "grad_norm": 0.6966096284074984, |
| "learning_rate": 3.990550191874985e-05, |
| "loss": 0.2854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1444419026374817, |
| "step": 860, |
| "valid_targets_mean": 3679.0, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 0.9024517475221701, |
| "grad_norm": 0.5184778153693645, |
| "learning_rate": 3.990038524208878e-05, |
| "loss": 0.2829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1318383663892746, |
| "step": 865, |
| "valid_targets_mean": 4986.8, |
| "valid_targets_min": 1791 |
| }, |
| { |
| "epoch": 0.9076682316118936, |
| "grad_norm": 0.5331023362961945, |
| "learning_rate": 3.9895134015545565e-05, |
| "loss": 0.2651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11663781106472015, |
| "step": 870, |
| "valid_targets_mean": 3661.8, |
| "valid_targets_min": 1949 |
| }, |
| { |
| "epoch": 0.9128847157016171, |
| "grad_norm": 0.5407143848415595, |
| "learning_rate": 3.988974827462464e-05, |
| "loss": 0.2721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13874134421348572, |
| "step": 875, |
| "valid_targets_mean": 5499.4, |
| "valid_targets_min": 2758 |
| }, |
| { |
| "epoch": 0.9181011997913406, |
| "grad_norm": 0.6194812388582897, |
| "learning_rate": 3.98842280557399e-05, |
| "loss": 0.2691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12969379127025604, |
| "step": 880, |
| "valid_targets_mean": 3967.9, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 0.9233176838810642, |
| "grad_norm": 0.5699586459948414, |
| "learning_rate": 3.98785733962145e-05, |
| "loss": 0.279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12774772942066193, |
| "step": 885, |
| "valid_targets_mean": 5061.0, |
| "valid_targets_min": 1507 |
| }, |
| { |
| "epoch": 0.9285341679707877, |
| "grad_norm": 0.5607102394615596, |
| "learning_rate": 3.9872784334280555e-05, |
| "loss": 0.2701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1534000188112259, |
| "step": 890, |
| "valid_targets_mean": 4859.0, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 0.9337506520605112, |
| "grad_norm": 0.5331536557365746, |
| "learning_rate": 3.9866860909078876e-05, |
| "loss": 0.2778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13779212534427643, |
| "step": 895, |
| "valid_targets_mean": 5181.9, |
| "valid_targets_min": 2671 |
| }, |
| { |
| "epoch": 0.9389671361502347, |
| "grad_norm": 0.5238806901596113, |
| "learning_rate": 3.9860803160658756e-05, |
| "loss": 0.2879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17478299140930176, |
| "step": 900, |
| "valid_targets_mean": 5491.2, |
| "valid_targets_min": 2754 |
| }, |
| { |
| "epoch": 0.9441836202399583, |
| "grad_norm": 0.5398420703049978, |
| "learning_rate": 3.985461112997766e-05, |
| "loss": 0.2827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11654013395309448, |
| "step": 905, |
| "valid_targets_mean": 4031.8, |
| "valid_targets_min": 1793 |
| }, |
| { |
| "epoch": 0.9494001043296818, |
| "grad_norm": 0.49304635275161546, |
| "learning_rate": 3.9848284858900955e-05, |
| "loss": 0.2633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.137330561876297, |
| "step": 910, |
| "valid_targets_mean": 5403.9, |
| "valid_targets_min": 2683 |
| }, |
| { |
| "epoch": 0.9546165884194053, |
| "grad_norm": 0.5686775162126456, |
| "learning_rate": 3.984182439020164e-05, |
| "loss": 0.2722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12234842777252197, |
| "step": 915, |
| "valid_targets_mean": 4553.5, |
| "valid_targets_min": 1963 |
| }, |
| { |
| "epoch": 0.9598330725091289, |
| "grad_norm": 0.615897132103767, |
| "learning_rate": 3.9835229767560034e-05, |
| "loss": 0.2682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13465642929077148, |
| "step": 920, |
| "valid_targets_mean": 3425.9, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 0.9650495565988524, |
| "grad_norm": 0.5417221970747348, |
| "learning_rate": 3.982850103556351e-05, |
| "loss": 0.2703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15093615651130676, |
| "step": 925, |
| "valid_targets_mean": 5625.1, |
| "valid_targets_min": 3329 |
| }, |
| { |
| "epoch": 0.9702660406885759, |
| "grad_norm": 0.5082091887909534, |
| "learning_rate": 3.982163823970615e-05, |
| "loss": 0.2841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1644631326198578, |
| "step": 930, |
| "valid_targets_mean": 4725.9, |
| "valid_targets_min": 1249 |
| }, |
| { |
| "epoch": 0.9754825247782994, |
| "grad_norm": 0.5020653386918221, |
| "learning_rate": 3.98146414263885e-05, |
| "loss": 0.2665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16657038033008575, |
| "step": 935, |
| "valid_targets_mean": 5279.6, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 0.980699008868023, |
| "grad_norm": 0.6491733294026691, |
| "learning_rate": 3.980751064291719e-05, |
| "loss": 0.2679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11266623437404633, |
| "step": 940, |
| "valid_targets_mean": 5246.4, |
| "valid_targets_min": 2342 |
| }, |
| { |
| "epoch": 0.9859154929577465, |
| "grad_norm": 0.586745643603928, |
| "learning_rate": 3.980024593750466e-05, |
| "loss": 0.2707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1562008559703827, |
| "step": 945, |
| "valid_targets_mean": 4508.4, |
| "valid_targets_min": 2638 |
| }, |
| { |
| "epoch": 0.99113197704747, |
| "grad_norm": 0.5976427152991887, |
| "learning_rate": 3.979284735926882e-05, |
| "loss": 0.2758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15834422409534454, |
| "step": 950, |
| "valid_targets_mean": 4706.4, |
| "valid_targets_min": 2701 |
| }, |
| { |
| "epoch": 0.9963484611371936, |
| "grad_norm": 0.552931359694199, |
| "learning_rate": 3.978531495823271e-05, |
| "loss": 0.2647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1401374489068985, |
| "step": 955, |
| "valid_targets_mean": 5464.8, |
| "valid_targets_min": 1975 |
| }, |
| { |
| "epoch": 1.0010432968179448, |
| "grad_norm": 0.5555627129782201, |
| "learning_rate": 3.977764878532418e-05, |
| "loss": 0.2699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11594857275485992, |
| "step": 960, |
| "valid_targets_mean": 5819.6, |
| "valid_targets_min": 2150 |
| }, |
| { |
| "epoch": 1.0062597809076683, |
| "grad_norm": 0.621737305129113, |
| "learning_rate": 3.976984889237551e-05, |
| "loss": 0.2868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1225830540060997, |
| "step": 965, |
| "valid_targets_mean": 3963.1, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 1.0114762649973918, |
| "grad_norm": 0.609624728818975, |
| "learning_rate": 3.9761915332123113e-05, |
| "loss": 0.2692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14671842753887177, |
| "step": 970, |
| "valid_targets_mean": 5083.1, |
| "valid_targets_min": 1630 |
| }, |
| { |
| "epoch": 1.0166927490871154, |
| "grad_norm": 0.49609282046376096, |
| "learning_rate": 3.975384815820713e-05, |
| "loss": 0.2667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12384708225727081, |
| "step": 975, |
| "valid_targets_mean": 5693.2, |
| "valid_targets_min": 2773 |
| }, |
| { |
| "epoch": 1.021909233176839, |
| "grad_norm": 0.6954457613343509, |
| "learning_rate": 3.974564742517109e-05, |
| "loss": 0.2838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12282181531190872, |
| "step": 980, |
| "valid_targets_mean": 3497.1, |
| "valid_targets_min": 1946 |
| }, |
| { |
| "epoch": 1.0271257172665624, |
| "grad_norm": 0.6348864007116859, |
| "learning_rate": 3.973731318846155e-05, |
| "loss": 0.2576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1495770364999771, |
| "step": 985, |
| "valid_targets_mean": 4063.0, |
| "valid_targets_min": 1679 |
| }, |
| { |
| "epoch": 1.032342201356286, |
| "grad_norm": 0.482982401425952, |
| "learning_rate": 3.97288455044277e-05, |
| "loss": 0.252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1389351636171341, |
| "step": 990, |
| "valid_targets_mean": 7056.1, |
| "valid_targets_min": 2762 |
| }, |
| { |
| "epoch": 1.0375586854460095, |
| "grad_norm": 0.6245759540283572, |
| "learning_rate": 3.972024443032098e-05, |
| "loss": 0.2542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15486538410186768, |
| "step": 995, |
| "valid_targets_mean": 5081.5, |
| "valid_targets_min": 2001 |
| }, |
| { |
| "epoch": 1.042775169535733, |
| "grad_norm": 0.5572267300723684, |
| "learning_rate": 3.971151002429471e-05, |
| "loss": 0.2665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11726558208465576, |
| "step": 1000, |
| "valid_targets_mean": 3408.6, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 1.0479916536254565, |
| "grad_norm": 0.6297986573579426, |
| "learning_rate": 3.97026423454037e-05, |
| "loss": 0.2643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11347624659538269, |
| "step": 1005, |
| "valid_targets_mean": 4425.0, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 1.05320813771518, |
| "grad_norm": 1.0334220724567058, |
| "learning_rate": 3.969364145360383e-05, |
| "loss": 0.2666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1397000104188919, |
| "step": 1010, |
| "valid_targets_mean": 5443.9, |
| "valid_targets_min": 2683 |
| }, |
| { |
| "epoch": 1.0584246218049036, |
| "grad_norm": 0.5487545829063336, |
| "learning_rate": 3.9684507409751655e-05, |
| "loss": 0.2544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12293633818626404, |
| "step": 1015, |
| "valid_targets_mean": 4722.2, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 1.063641105894627, |
| "grad_norm": 0.5225719855265429, |
| "learning_rate": 3.967524027560401e-05, |
| "loss": 0.264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12677009403705597, |
| "step": 1020, |
| "valid_targets_mean": 5619.6, |
| "valid_targets_min": 3686 |
| }, |
| { |
| "epoch": 1.0688575899843507, |
| "grad_norm": 0.864013546733522, |
| "learning_rate": 3.966584011381753e-05, |
| "loss": 0.2457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1692778766155243, |
| "step": 1025, |
| "valid_targets_mean": 6027.2, |
| "valid_targets_min": 1870 |
| }, |
| { |
| "epoch": 1.074074074074074, |
| "grad_norm": 0.5121362893536919, |
| "learning_rate": 3.965630698794833e-05, |
| "loss": 0.2463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09930215775966644, |
| "step": 1030, |
| "valid_targets_mean": 4419.8, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 1.0792905581637977, |
| "grad_norm": 0.6385093892320182, |
| "learning_rate": 3.964664096245149e-05, |
| "loss": 0.2589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14801526069641113, |
| "step": 1035, |
| "valid_targets_mean": 5311.0, |
| "valid_targets_min": 2371 |
| }, |
| { |
| "epoch": 1.084507042253521, |
| "grad_norm": 0.5519490683028426, |
| "learning_rate": 3.9636842102680635e-05, |
| "loss": 0.2539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13327637314796448, |
| "step": 1040, |
| "valid_targets_mean": 4245.5, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 1.0897235263432448, |
| "grad_norm": 0.5813596168647382, |
| "learning_rate": 3.962691047488754e-05, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15237219631671906, |
| "step": 1045, |
| "valid_targets_mean": 4386.4, |
| "valid_targets_min": 2232 |
| }, |
| { |
| "epoch": 1.094940010432968, |
| "grad_norm": 0.6065188708681333, |
| "learning_rate": 3.9616846146221606e-05, |
| "loss": 0.2645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14218102395534515, |
| "step": 1050, |
| "valid_targets_mean": 3918.5, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 1.1001564945226918, |
| "grad_norm": 0.6071274238740759, |
| "learning_rate": 3.960664918472947e-05, |
| "loss": 0.2562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1331966370344162, |
| "step": 1055, |
| "valid_targets_mean": 4948.6, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 1.1053729786124151, |
| "grad_norm": 0.5810232005672644, |
| "learning_rate": 3.959631965935453e-05, |
| "loss": 0.2633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1407533884048462, |
| "step": 1060, |
| "valid_targets_mean": 4580.9, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 1.1105894627021389, |
| "grad_norm": 0.5631301298626795, |
| "learning_rate": 3.958585763993646e-05, |
| "loss": 0.2469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10973257571458817, |
| "step": 1065, |
| "valid_targets_mean": 5161.8, |
| "valid_targets_min": 2310 |
| }, |
| { |
| "epoch": 1.1158059467918622, |
| "grad_norm": 0.5202732767439506, |
| "learning_rate": 3.9575263197210736e-05, |
| "loss": 0.243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10115311294794083, |
| "step": 1070, |
| "valid_targets_mean": 5175.4, |
| "valid_targets_min": 2177 |
| }, |
| { |
| "epoch": 1.1210224308815857, |
| "grad_norm": 0.5882733680606071, |
| "learning_rate": 3.9564536402808194e-05, |
| "loss": 0.2497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12298896908760071, |
| "step": 1075, |
| "valid_targets_mean": 4286.4, |
| "valid_targets_min": 2060 |
| }, |
| { |
| "epoch": 1.1262389149713092, |
| "grad_norm": 0.5995795533171111, |
| "learning_rate": 3.955367732925451e-05, |
| "loss": 0.2529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12658976018428802, |
| "step": 1080, |
| "valid_targets_mean": 4708.6, |
| "valid_targets_min": 2377 |
| }, |
| { |
| "epoch": 1.131455399061033, |
| "grad_norm": 0.6038080285810509, |
| "learning_rate": 3.954268604996972e-05, |
| "loss": 0.2557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14354118704795837, |
| "step": 1085, |
| "valid_targets_mean": 4013.9, |
| "valid_targets_min": 1598 |
| }, |
| { |
| "epoch": 1.1366718831507563, |
| "grad_norm": 0.5477620531002403, |
| "learning_rate": 3.953156263926773e-05, |
| "loss": 0.2554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15162897109985352, |
| "step": 1090, |
| "valid_targets_mean": 6166.2, |
| "valid_targets_min": 4399 |
| }, |
| { |
| "epoch": 1.14188836724048, |
| "grad_norm": 0.7334723583908891, |
| "learning_rate": 3.952030717235581e-05, |
| "loss": 0.2547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14085112512111664, |
| "step": 1095, |
| "valid_targets_mean": 4769.4, |
| "valid_targets_min": 1678 |
| }, |
| { |
| "epoch": 1.1471048513302033, |
| "grad_norm": 0.5306348893521031, |
| "learning_rate": 3.950891972533408e-05, |
| "loss": 0.2556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13832436501979828, |
| "step": 1100, |
| "valid_targets_mean": 6099.9, |
| "valid_targets_min": 3870 |
| }, |
| { |
| "epoch": 1.1523213354199269, |
| "grad_norm": 0.5449133161144042, |
| "learning_rate": 3.9497400375195e-05, |
| "loss": 0.2686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13858945667743683, |
| "step": 1105, |
| "valid_targets_mean": 5039.5, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 1.1575378195096504, |
| "grad_norm": 0.7632046290203769, |
| "learning_rate": 3.948574919982286e-05, |
| "loss": 0.2704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11112897843122482, |
| "step": 1110, |
| "valid_targets_mean": 3455.1, |
| "valid_targets_min": 1829 |
| }, |
| { |
| "epoch": 1.162754303599374, |
| "grad_norm": 0.49851988432836863, |
| "learning_rate": 3.947396627799322e-05, |
| "loss": 0.2437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11539632827043533, |
| "step": 1115, |
| "valid_targets_mean": 5286.5, |
| "valid_targets_min": 1511 |
| }, |
| { |
| "epoch": 1.1679707876890975, |
| "grad_norm": 0.5024471509769345, |
| "learning_rate": 3.946205168937243e-05, |
| "loss": 0.2516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13856856524944305, |
| "step": 1120, |
| "valid_targets_mean": 4765.1, |
| "valid_targets_min": 1964 |
| }, |
| { |
| "epoch": 1.173187271778821, |
| "grad_norm": 0.5432749443314605, |
| "learning_rate": 3.945000551451703e-05, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1260114163160324, |
| "step": 1125, |
| "valid_targets_mean": 4719.8, |
| "valid_targets_min": 3216 |
| }, |
| { |
| "epoch": 1.1784037558685445, |
| "grad_norm": 0.5347251152463858, |
| "learning_rate": 3.9437827834873265e-05, |
| "loss": 0.245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13661740720272064, |
| "step": 1130, |
| "valid_targets_mean": 5735.2, |
| "valid_targets_min": 2569 |
| }, |
| { |
| "epoch": 1.183620239958268, |
| "grad_norm": 0.5849586970257857, |
| "learning_rate": 3.942551873277649e-05, |
| "loss": 0.2477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13512352108955383, |
| "step": 1135, |
| "valid_targets_mean": 3875.9, |
| "valid_targets_min": 1736 |
| }, |
| { |
| "epoch": 1.1888367240479916, |
| "grad_norm": 0.706188938231076, |
| "learning_rate": 3.941307829145063e-05, |
| "loss": 0.2667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1348978728055954, |
| "step": 1140, |
| "valid_targets_mean": 3433.6, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 1.194053208137715, |
| "grad_norm": 0.5819976508163556, |
| "learning_rate": 3.9400506595007624e-05, |
| "loss": 0.2625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12072448432445526, |
| "step": 1145, |
| "valid_targets_mean": 5552.4, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 1.1992696922274386, |
| "grad_norm": 0.521212706251135, |
| "learning_rate": 3.938780372844685e-05, |
| "loss": 0.2494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12627771496772766, |
| "step": 1150, |
| "valid_targets_mean": 4875.2, |
| "valid_targets_min": 2060 |
| }, |
| { |
| "epoch": 1.2044861763171621, |
| "grad_norm": 0.4991058739569063, |
| "learning_rate": 3.9374969777654535e-05, |
| "loss": 0.2607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11231563240289688, |
| "step": 1155, |
| "valid_targets_mean": 4992.5, |
| "valid_targets_min": 1974 |
| }, |
| { |
| "epoch": 1.2097026604068857, |
| "grad_norm": 0.5866190042090614, |
| "learning_rate": 3.93620048294032e-05, |
| "loss": 0.2547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11389137804508209, |
| "step": 1160, |
| "valid_targets_mean": 6012.9, |
| "valid_targets_min": 2817 |
| }, |
| { |
| "epoch": 1.2149191444966092, |
| "grad_norm": 0.4629469681351049, |
| "learning_rate": 3.9348908971351065e-05, |
| "loss": 0.2572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12433037161827087, |
| "step": 1165, |
| "valid_targets_mean": 4916.2, |
| "valid_targets_min": 2756 |
| }, |
| { |
| "epoch": 1.2201356285863327, |
| "grad_norm": 0.509878580010751, |
| "learning_rate": 3.933568229204145e-05, |
| "loss": 0.2582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10058669745922089, |
| "step": 1170, |
| "valid_targets_mean": 4582.0, |
| "valid_targets_min": 2072 |
| }, |
| { |
| "epoch": 1.2253521126760563, |
| "grad_norm": 0.5073486803677913, |
| "learning_rate": 3.9322324880902177e-05, |
| "loss": 0.2359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14870202541351318, |
| "step": 1175, |
| "valid_targets_mean": 6096.4, |
| "valid_targets_min": 2270 |
| }, |
| { |
| "epoch": 1.2305685967657798, |
| "grad_norm": 0.6612168228167724, |
| "learning_rate": 3.930883682824496e-05, |
| "loss": 0.2596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15461964905261993, |
| "step": 1180, |
| "valid_targets_mean": 4362.9, |
| "valid_targets_min": 3061 |
| }, |
| { |
| "epoch": 1.2357850808555033, |
| "grad_norm": 0.6620573437399087, |
| "learning_rate": 3.929521822526483e-05, |
| "loss": 0.2629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15261363983154297, |
| "step": 1185, |
| "valid_targets_mean": 4584.1, |
| "valid_targets_min": 2628 |
| }, |
| { |
| "epoch": 1.2410015649452268, |
| "grad_norm": 0.4756252268617344, |
| "learning_rate": 3.928146916403946e-05, |
| "loss": 0.2586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12918442487716675, |
| "step": 1190, |
| "valid_targets_mean": 5145.9, |
| "valid_targets_min": 2544 |
| }, |
| { |
| "epoch": 1.2462180490349504, |
| "grad_norm": 0.5674756284095253, |
| "learning_rate": 3.926758973752859e-05, |
| "loss": 0.249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11604364216327667, |
| "step": 1195, |
| "valid_targets_mean": 3338.5, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 1.251434533124674, |
| "grad_norm": 0.6470503790424013, |
| "learning_rate": 3.925358003957338e-05, |
| "loss": 0.2753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12425130605697632, |
| "step": 1200, |
| "valid_targets_mean": 3237.9, |
| "valid_targets_min": 1388 |
| }, |
| { |
| "epoch": 1.2566510172143974, |
| "grad_norm": 0.5160599914067892, |
| "learning_rate": 3.923944016489578e-05, |
| "loss": 0.2637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11762993782758713, |
| "step": 1205, |
| "valid_targets_mean": 4643.5, |
| "valid_targets_min": 1558 |
| }, |
| { |
| "epoch": 1.261867501304121, |
| "grad_norm": 0.6457663474938289, |
| "learning_rate": 3.9225170209097865e-05, |
| "loss": 0.2457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1162123754620552, |
| "step": 1210, |
| "valid_targets_mean": 5133.0, |
| "valid_targets_min": 1571 |
| }, |
| { |
| "epoch": 1.2670839853938445, |
| "grad_norm": 0.5568943712279375, |
| "learning_rate": 3.921077026866125e-05, |
| "loss": 0.2508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14134006202220917, |
| "step": 1215, |
| "valid_targets_mean": 4286.0, |
| "valid_targets_min": 1389 |
| }, |
| { |
| "epoch": 1.272300469483568, |
| "grad_norm": 0.517359055890604, |
| "learning_rate": 3.919624044094636e-05, |
| "loss": 0.2551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11771930754184723, |
| "step": 1220, |
| "valid_targets_mean": 4357.6, |
| "valid_targets_min": 1490 |
| }, |
| { |
| "epoch": 1.2775169535732915, |
| "grad_norm": 0.5454382018602275, |
| "learning_rate": 3.918158082419184e-05, |
| "loss": 0.2562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11294469237327576, |
| "step": 1225, |
| "valid_targets_mean": 3347.9, |
| "valid_targets_min": 1687 |
| }, |
| { |
| "epoch": 1.282733437663015, |
| "grad_norm": 0.6268629083676116, |
| "learning_rate": 3.916679151751383e-05, |
| "loss": 0.2451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13156986236572266, |
| "step": 1230, |
| "valid_targets_mean": 5386.9, |
| "valid_targets_min": 2398 |
| }, |
| { |
| "epoch": 1.2879499217527386, |
| "grad_norm": 0.5152482932661713, |
| "learning_rate": 3.9151872620905356e-05, |
| "loss": 0.2652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12673966586589813, |
| "step": 1235, |
| "valid_targets_mean": 5135.2, |
| "valid_targets_min": 2135 |
| }, |
| { |
| "epoch": 1.2931664058424621, |
| "grad_norm": 0.5279356047844522, |
| "learning_rate": 3.913682423523561e-05, |
| "loss": 0.2452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16639316082000732, |
| "step": 1240, |
| "valid_targets_mean": 5856.9, |
| "valid_targets_min": 2179 |
| }, |
| { |
| "epoch": 1.2983828899321856, |
| "grad_norm": 0.5152996791191741, |
| "learning_rate": 3.912164646224927e-05, |
| "loss": 0.2442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12303348630666733, |
| "step": 1245, |
| "valid_targets_mean": 5895.6, |
| "valid_targets_min": 3347 |
| }, |
| { |
| "epoch": 1.3035993740219092, |
| "grad_norm": 0.5491144223145925, |
| "learning_rate": 3.910633940456585e-05, |
| "loss": 0.2683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11502029746770859, |
| "step": 1250, |
| "valid_targets_mean": 4442.5, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 1.3088158581116327, |
| "grad_norm": 0.48581532743409384, |
| "learning_rate": 3.909090316567896e-05, |
| "loss": 0.251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10068874061107635, |
| "step": 1255, |
| "valid_targets_mean": 4060.6, |
| "valid_targets_min": 1660 |
| }, |
| { |
| "epoch": 1.3140323422013562, |
| "grad_norm": 0.5354120459678681, |
| "learning_rate": 3.9075337849955614e-05, |
| "loss": 0.2695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09602093696594238, |
| "step": 1260, |
| "valid_targets_mean": 3535.4, |
| "valid_targets_min": 1612 |
| }, |
| { |
| "epoch": 1.3192488262910798, |
| "grad_norm": 0.6410666645859446, |
| "learning_rate": 3.905964356263558e-05, |
| "loss": 0.2505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13208051025867462, |
| "step": 1265, |
| "valid_targets_mean": 4003.4, |
| "valid_targets_min": 1629 |
| }, |
| { |
| "epoch": 1.3244653103808033, |
| "grad_norm": 0.5129454984326265, |
| "learning_rate": 3.9043820409830585e-05, |
| "loss": 0.25, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11679510772228241, |
| "step": 1270, |
| "valid_targets_mean": 5320.9, |
| "valid_targets_min": 2200 |
| }, |
| { |
| "epoch": 1.3296817944705268, |
| "grad_norm": 0.5156628308288126, |
| "learning_rate": 3.9027868498523645e-05, |
| "loss": 0.2551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10929737985134125, |
| "step": 1275, |
| "valid_targets_mean": 4530.8, |
| "valid_targets_min": 1509 |
| }, |
| { |
| "epoch": 1.3348982785602503, |
| "grad_norm": 0.46219046923829427, |
| "learning_rate": 3.901178793656836e-05, |
| "loss": 0.2425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10228785872459412, |
| "step": 1280, |
| "valid_targets_mean": 5299.5, |
| "valid_targets_min": 2905 |
| }, |
| { |
| "epoch": 1.3401147626499739, |
| "grad_norm": 0.5341016427474178, |
| "learning_rate": 3.899557883268811e-05, |
| "loss": 0.2561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09990217536687851, |
| "step": 1285, |
| "valid_targets_mean": 4161.8, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 1.3453312467396974, |
| "grad_norm": 0.5979056549754926, |
| "learning_rate": 3.897924129647542e-05, |
| "loss": 0.25, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.149190291762352, |
| "step": 1290, |
| "valid_targets_mean": 4748.6, |
| "valid_targets_min": 1896 |
| }, |
| { |
| "epoch": 1.350547730829421, |
| "grad_norm": 0.4679255872634688, |
| "learning_rate": 3.896277543839114e-05, |
| "loss": 0.249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07849105447530746, |
| "step": 1295, |
| "valid_targets_mean": 4052.5, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 1.3557642149191445, |
| "grad_norm": 0.48873872918678035, |
| "learning_rate": 3.894618136976372e-05, |
| "loss": 0.2499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12221433222293854, |
| "step": 1300, |
| "valid_targets_mean": 6071.9, |
| "valid_targets_min": 3029 |
| }, |
| { |
| "epoch": 1.360980699008868, |
| "grad_norm": 0.5021611507848466, |
| "learning_rate": 3.89294592027885e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11469393223524094, |
| "step": 1305, |
| "valid_targets_mean": 5044.8, |
| "valid_targets_min": 1538 |
| }, |
| { |
| "epoch": 1.3661971830985915, |
| "grad_norm": 0.6851521282855704, |
| "learning_rate": 3.891260905052685e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12349982559680939, |
| "step": 1310, |
| "valid_targets_mean": 4046.6, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 1.371413667188315, |
| "grad_norm": 0.4857351004667739, |
| "learning_rate": 3.8895631026905546e-05, |
| "loss": 0.2407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11351583153009415, |
| "step": 1315, |
| "valid_targets_mean": 4832.2, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 1.3766301512780386, |
| "grad_norm": 0.48743716553823263, |
| "learning_rate": 3.887852524671587e-05, |
| "loss": 0.2513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13305367529392242, |
| "step": 1320, |
| "valid_targets_mean": 4628.4, |
| "valid_targets_min": 3069 |
| }, |
| { |
| "epoch": 1.381846635367762, |
| "grad_norm": 0.5121653531868553, |
| "learning_rate": 3.886129182561291e-05, |
| "loss": 0.2422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13066956400871277, |
| "step": 1325, |
| "valid_targets_mean": 5233.6, |
| "valid_targets_min": 2904 |
| }, |
| { |
| "epoch": 1.3870631194574856, |
| "grad_norm": 0.5334399942963226, |
| "learning_rate": 3.8843930880114745e-05, |
| "loss": 0.2571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13521258533000946, |
| "step": 1330, |
| "valid_targets_mean": 4983.1, |
| "valid_targets_min": 2285 |
| }, |
| { |
| "epoch": 1.3922796035472091, |
| "grad_norm": 0.5364662379844092, |
| "learning_rate": 3.882644252760168e-05, |
| "loss": 0.2535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09757325053215027, |
| "step": 1335, |
| "valid_targets_mean": 5430.8, |
| "valid_targets_min": 1906 |
| }, |
| { |
| "epoch": 1.3974960876369327, |
| "grad_norm": 0.5647185520715633, |
| "learning_rate": 3.8808826886315426e-05, |
| "loss": 0.2587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16115015745162964, |
| "step": 1340, |
| "valid_targets_mean": 5568.1, |
| "valid_targets_min": 3457 |
| }, |
| { |
| "epoch": 1.4027125717266562, |
| "grad_norm": 0.5014826960092932, |
| "learning_rate": 3.8791084075358344e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11483775824308395, |
| "step": 1345, |
| "valid_targets_mean": 4442.0, |
| "valid_targets_min": 2289 |
| }, |
| { |
| "epoch": 1.4079290558163797, |
| "grad_norm": 0.5704838065984214, |
| "learning_rate": 3.8773214214692564e-05, |
| "loss": 0.2584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11861691623926163, |
| "step": 1350, |
| "valid_targets_mean": 4343.2, |
| "valid_targets_min": 1774 |
| }, |
| { |
| "epoch": 1.4131455399061033, |
| "grad_norm": 0.761018845309024, |
| "learning_rate": 3.8755217425139264e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13714927434921265, |
| "step": 1355, |
| "valid_targets_mean": 5168.2, |
| "valid_targets_min": 3425 |
| }, |
| { |
| "epoch": 1.4183620239958268, |
| "grad_norm": 1.0936619935803085, |
| "learning_rate": 3.8737093828377785e-05, |
| "loss": 0.2451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14459095895290375, |
| "step": 1360, |
| "valid_targets_mean": 6778.4, |
| "valid_targets_min": 3605 |
| }, |
| { |
| "epoch": 1.4235785080855503, |
| "grad_norm": 0.7122909792884763, |
| "learning_rate": 3.8718843546944844e-05, |
| "loss": 0.251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13594117760658264, |
| "step": 1365, |
| "valid_targets_mean": 3794.0, |
| "valid_targets_min": 2609 |
| }, |
| { |
| "epoch": 1.4287949921752738, |
| "grad_norm": 0.6457112430833799, |
| "learning_rate": 3.870046670423369e-05, |
| "loss": 0.2721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17264269292354584, |
| "step": 1370, |
| "valid_targets_mean": 5524.8, |
| "valid_targets_min": 2106 |
| }, |
| { |
| "epoch": 1.4340114762649974, |
| "grad_norm": 0.5822348000748305, |
| "learning_rate": 3.868196342449327e-05, |
| "loss": 0.2546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16046279668807983, |
| "step": 1375, |
| "valid_targets_mean": 5263.5, |
| "valid_targets_min": 2182 |
| }, |
| { |
| "epoch": 1.439227960354721, |
| "grad_norm": 0.5455896041089222, |
| "learning_rate": 3.8663333832827415e-05, |
| "loss": 0.2673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12363915145397186, |
| "step": 1380, |
| "valid_targets_mean": 4780.6, |
| "valid_targets_min": 1889 |
| }, |
| { |
| "epoch": 1.4444444444444444, |
| "grad_norm": 0.5204598568724569, |
| "learning_rate": 3.864457805519395e-05, |
| "loss": 0.2577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11119193583726883, |
| "step": 1385, |
| "valid_targets_mean": 4275.2, |
| "valid_targets_min": 1765 |
| }, |
| { |
| "epoch": 1.449660928534168, |
| "grad_norm": 0.5157545561785613, |
| "learning_rate": 3.862569621840385e-05, |
| "loss": 0.2683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10522519052028656, |
| "step": 1390, |
| "valid_targets_mean": 4213.8, |
| "valid_targets_min": 1582 |
| }, |
| { |
| "epoch": 1.4548774126238915, |
| "grad_norm": 0.6264579348760222, |
| "learning_rate": 3.860668845012044e-05, |
| "loss": 0.2742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15325672924518585, |
| "step": 1395, |
| "valid_targets_mean": 3898.5, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 1.460093896713615, |
| "grad_norm": 0.5585909276055782, |
| "learning_rate": 3.8587554878858466e-05, |
| "loss": 0.2552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11405700445175171, |
| "step": 1400, |
| "valid_targets_mean": 3959.1, |
| "valid_targets_min": 2054 |
| }, |
| { |
| "epoch": 1.4653103808033385, |
| "grad_norm": 0.49813932042181147, |
| "learning_rate": 3.8568295633983244e-05, |
| "loss": 0.2457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09434691071510315, |
| "step": 1405, |
| "valid_targets_mean": 3593.0, |
| "valid_targets_min": 1552 |
| }, |
| { |
| "epoch": 1.470526864893062, |
| "grad_norm": 0.6041663662890155, |
| "learning_rate": 3.85489108457098e-05, |
| "loss": 0.2453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1227974146604538, |
| "step": 1410, |
| "valid_targets_mean": 5324.5, |
| "valid_targets_min": 3171 |
| }, |
| { |
| "epoch": 1.4757433489827856, |
| "grad_norm": 0.5406878285872566, |
| "learning_rate": 3.8529400645101984e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16151192784309387, |
| "step": 1415, |
| "valid_targets_mean": 6263.1, |
| "valid_targets_min": 2764 |
| }, |
| { |
| "epoch": 1.4809598330725091, |
| "grad_norm": 0.5238933209978773, |
| "learning_rate": 3.850976516407157e-05, |
| "loss": 0.2525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12694543600082397, |
| "step": 1420, |
| "valid_targets_mean": 4904.8, |
| "valid_targets_min": 3051 |
| }, |
| { |
| "epoch": 1.4861763171622326, |
| "grad_norm": 0.49515325116736575, |
| "learning_rate": 3.8490004535377356e-05, |
| "loss": 0.2558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13720092177391052, |
| "step": 1425, |
| "valid_targets_mean": 4950.0, |
| "valid_targets_min": 1835 |
| }, |
| { |
| "epoch": 1.4913928012519562, |
| "grad_norm": 0.5409120061465099, |
| "learning_rate": 3.8470118892624345e-05, |
| "loss": 0.241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12328615039587021, |
| "step": 1430, |
| "valid_targets_mean": 4782.9, |
| "valid_targets_min": 1710 |
| }, |
| { |
| "epoch": 1.4966092853416797, |
| "grad_norm": 0.5345646077783061, |
| "learning_rate": 3.8450108370262714e-05, |
| "loss": 0.2398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18213754892349243, |
| "step": 1435, |
| "valid_targets_mean": 5736.0, |
| "valid_targets_min": 2259 |
| }, |
| { |
| "epoch": 1.5018257694314032, |
| "grad_norm": 0.5103518853898554, |
| "learning_rate": 3.8429973103587016e-05, |
| "loss": 0.2602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1235252320766449, |
| "step": 1440, |
| "valid_targets_mean": 4339.1, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 1.5070422535211268, |
| "grad_norm": 0.4747786716627152, |
| "learning_rate": 3.840971322873519e-05, |
| "loss": 0.2541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10930084437131882, |
| "step": 1445, |
| "valid_targets_mean": 5637.6, |
| "valid_targets_min": 2409 |
| }, |
| { |
| "epoch": 1.5122587376108503, |
| "grad_norm": 0.5150860304783956, |
| "learning_rate": 3.838932888268771e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14165997505187988, |
| "step": 1450, |
| "valid_targets_mean": 5255.9, |
| "valid_targets_min": 1939 |
| }, |
| { |
| "epoch": 1.5174752217005738, |
| "grad_norm": 0.5198511487212314, |
| "learning_rate": 3.836882020326658e-05, |
| "loss": 0.2425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14433275163173676, |
| "step": 1455, |
| "valid_targets_mean": 5713.9, |
| "valid_targets_min": 2514 |
| }, |
| { |
| "epoch": 1.5226917057902973, |
| "grad_norm": 0.671332298083507, |
| "learning_rate": 3.834818732913448e-05, |
| "loss": 0.2521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14078345894813538, |
| "step": 1460, |
| "valid_targets_mean": 3379.2, |
| "valid_targets_min": 2012 |
| }, |
| { |
| "epoch": 1.5279081898800209, |
| "grad_norm": 0.49013989594302837, |
| "learning_rate": 3.8327430399793754e-05, |
| "loss": 0.2567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11260563135147095, |
| "step": 1465, |
| "valid_targets_mean": 5242.4, |
| "valid_targets_min": 2071 |
| }, |
| { |
| "epoch": 1.5331246739697444, |
| "grad_norm": 0.5364799216625429, |
| "learning_rate": 3.8306549555585536e-05, |
| "loss": 0.2639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09743601083755493, |
| "step": 1470, |
| "valid_targets_mean": 2970.5, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 1.538341158059468, |
| "grad_norm": 0.5204043919051834, |
| "learning_rate": 3.828554493768876e-05, |
| "loss": 0.2388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11134983599185944, |
| "step": 1475, |
| "valid_targets_mean": 4600.8, |
| "valid_targets_min": 1666 |
| }, |
| { |
| "epoch": 1.5435576421491914, |
| "grad_norm": 0.533126954524228, |
| "learning_rate": 3.826441668811921e-05, |
| "loss": 0.2455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12382099032402039, |
| "step": 1480, |
| "valid_targets_mean": 4916.2, |
| "valid_targets_min": 2308 |
| }, |
| { |
| "epoch": 1.548774126238915, |
| "grad_norm": 0.629159424717442, |
| "learning_rate": 3.8243164949728565e-05, |
| "loss": 0.2484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1136583536863327, |
| "step": 1485, |
| "valid_targets_mean": 4257.9, |
| "valid_targets_min": 1824 |
| }, |
| { |
| "epoch": 1.5539906103286385, |
| "grad_norm": 0.5576499245867822, |
| "learning_rate": 3.8221789866203434e-05, |
| "loss": 0.2651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16036765277385712, |
| "step": 1490, |
| "valid_targets_mean": 5219.4, |
| "valid_targets_min": 2558 |
| }, |
| { |
| "epoch": 1.559207094418362, |
| "grad_norm": 0.5011305426689374, |
| "learning_rate": 3.820029158206438e-05, |
| "loss": 0.253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10513623058795929, |
| "step": 1495, |
| "valid_targets_mean": 5296.9, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 1.5644235785080856, |
| "grad_norm": 0.5810044246720123, |
| "learning_rate": 3.817867024266497e-05, |
| "loss": 0.2613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13431760668754578, |
| "step": 1500, |
| "valid_targets_mean": 4602.8, |
| "valid_targets_min": 1710 |
| }, |
| { |
| "epoch": 1.569640062597809, |
| "grad_norm": 0.4619545433317578, |
| "learning_rate": 3.8156925994190735e-05, |
| "loss": 0.247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09452519565820694, |
| "step": 1505, |
| "valid_targets_mean": 5179.8, |
| "valid_targets_min": 2189 |
| }, |
| { |
| "epoch": 1.5748565466875326, |
| "grad_norm": 0.5751374560743624, |
| "learning_rate": 3.813505898365822e-05, |
| "loss": 0.2545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09860014170408249, |
| "step": 1510, |
| "valid_targets_mean": 3707.4, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 1.5800730307772561, |
| "grad_norm": 0.5174007955451221, |
| "learning_rate": 3.8113069358914024e-05, |
| "loss": 0.2574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11332970857620239, |
| "step": 1515, |
| "valid_targets_mean": 5254.5, |
| "valid_targets_min": 1860 |
| }, |
| { |
| "epoch": 1.5852895148669797, |
| "grad_norm": 0.6377777694857345, |
| "learning_rate": 3.80909572686337e-05, |
| "loss": 0.2485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12425677478313446, |
| "step": 1520, |
| "valid_targets_mean": 5519.5, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 1.5905059989567032, |
| "grad_norm": 0.531286078112967, |
| "learning_rate": 3.806872286232086e-05, |
| "loss": 0.2454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10937950015068054, |
| "step": 1525, |
| "valid_targets_mean": 5120.5, |
| "valid_targets_min": 1810 |
| }, |
| { |
| "epoch": 1.5957224830464267, |
| "grad_norm": 0.5064919099325197, |
| "learning_rate": 3.80463662903061e-05, |
| "loss": 0.2737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10155424475669861, |
| "step": 1530, |
| "valid_targets_mean": 5331.2, |
| "valid_targets_min": 1440 |
| }, |
| { |
| "epoch": 1.6009389671361502, |
| "grad_norm": 0.5171512298024863, |
| "learning_rate": 3.802388770374598e-05, |
| "loss": 0.2534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11525417864322662, |
| "step": 1535, |
| "valid_targets_mean": 4886.1, |
| "valid_targets_min": 2724 |
| }, |
| { |
| "epoch": 1.6061554512258738, |
| "grad_norm": 0.5843884031448716, |
| "learning_rate": 3.8001287254622064e-05, |
| "loss": 0.2595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11978837847709656, |
| "step": 1540, |
| "valid_targets_mean": 3578.6, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 1.6113719353155973, |
| "grad_norm": 0.5172038207495926, |
| "learning_rate": 3.797856509573981e-05, |
| "loss": 0.2498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11195925623178482, |
| "step": 1545, |
| "valid_targets_mean": 3779.6, |
| "valid_targets_min": 208 |
| }, |
| { |
| "epoch": 1.6165884194053208, |
| "grad_norm": 0.47122341882486524, |
| "learning_rate": 3.795572138072759e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12011150270700455, |
| "step": 1550, |
| "valid_targets_mean": 6209.4, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 1.6218049034950444, |
| "grad_norm": 0.48927193258845336, |
| "learning_rate": 3.793275626403564e-05, |
| "loss": 0.2569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1319829821586609, |
| "step": 1555, |
| "valid_targets_mean": 5578.1, |
| "valid_targets_min": 2057 |
| }, |
| { |
| "epoch": 1.6270213875847679, |
| "grad_norm": 0.48409051046392965, |
| "learning_rate": 3.790966990093503e-05, |
| "loss": 0.2339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10502097010612488, |
| "step": 1560, |
| "valid_targets_mean": 5231.0, |
| "valid_targets_min": 3204 |
| }, |
| { |
| "epoch": 1.6322378716744914, |
| "grad_norm": 0.5544493076567448, |
| "learning_rate": 3.788646244751654e-05, |
| "loss": 0.2551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12199460715055466, |
| "step": 1565, |
| "valid_targets_mean": 4882.4, |
| "valid_targets_min": 3027 |
| }, |
| { |
| "epoch": 1.637454355764215, |
| "grad_norm": 0.5645954649757362, |
| "learning_rate": 3.7863134060689734e-05, |
| "loss": 0.2521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11990859359502792, |
| "step": 1570, |
| "valid_targets_mean": 3640.4, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 1.6426708398539385, |
| "grad_norm": 0.45622175926885516, |
| "learning_rate": 3.783968489818179e-05, |
| "loss": 0.2474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09329172968864441, |
| "step": 1575, |
| "valid_targets_mean": 5609.4, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 1.647887323943662, |
| "grad_norm": 0.5746045595380861, |
| "learning_rate": 3.781611511853646e-05, |
| "loss": 0.2498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15213215351104736, |
| "step": 1580, |
| "valid_targets_mean": 4927.5, |
| "valid_targets_min": 2514 |
| }, |
| { |
| "epoch": 1.6531038080333855, |
| "grad_norm": 0.4756606852258843, |
| "learning_rate": 3.779242488111304e-05, |
| "loss": 0.2572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09551073610782623, |
| "step": 1585, |
| "valid_targets_mean": 4230.0, |
| "valid_targets_min": 1646 |
| }, |
| { |
| "epoch": 1.658320292123109, |
| "grad_norm": 0.50567057762336, |
| "learning_rate": 3.776861434608524e-05, |
| "loss": 0.2446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12129361927509308, |
| "step": 1590, |
| "valid_targets_mean": 4804.4, |
| "valid_targets_min": 2404 |
| }, |
| { |
| "epoch": 1.6635367762128326, |
| "grad_norm": 0.5017088642180424, |
| "learning_rate": 3.774468367444012e-05, |
| "loss": 0.2381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12084630131721497, |
| "step": 1595, |
| "valid_targets_mean": 4832.0, |
| "valid_targets_min": 2261 |
| }, |
| { |
| "epoch": 1.668753260302556, |
| "grad_norm": 0.5067963445162644, |
| "learning_rate": 3.7720633027977034e-05, |
| "loss": 0.2537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10921032726764679, |
| "step": 1600, |
| "valid_targets_mean": 4878.5, |
| "valid_targets_min": 1522 |
| }, |
| { |
| "epoch": 1.6739697443922796, |
| "grad_norm": 0.5670844609525346, |
| "learning_rate": 3.7696462569306467e-05, |
| "loss": 0.258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11840958148241043, |
| "step": 1605, |
| "valid_targets_mean": 3607.9, |
| "valid_targets_min": 2357 |
| }, |
| { |
| "epoch": 1.6791862284820032, |
| "grad_norm": 0.47359585402114174, |
| "learning_rate": 3.7672172461849e-05, |
| "loss": 0.246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10673607885837555, |
| "step": 1610, |
| "valid_targets_mean": 5604.9, |
| "valid_targets_min": 1862 |
| }, |
| { |
| "epoch": 1.6844027125717267, |
| "grad_norm": 0.48428867641956413, |
| "learning_rate": 3.7647762869834164e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12657439708709717, |
| "step": 1615, |
| "valid_targets_mean": 4580.1, |
| "valid_targets_min": 1450 |
| }, |
| { |
| "epoch": 1.6896191966614502, |
| "grad_norm": 0.5013336800445145, |
| "learning_rate": 3.7623233958299364e-05, |
| "loss": 0.2422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08720278739929199, |
| "step": 1620, |
| "valid_targets_mean": 3723.0, |
| "valid_targets_min": 1383 |
| }, |
| { |
| "epoch": 1.6948356807511737, |
| "grad_norm": 0.5933134524932153, |
| "learning_rate": 3.7598585893088726e-05, |
| "loss": 0.246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14190977811813354, |
| "step": 1625, |
| "valid_targets_mean": 4540.6, |
| "valid_targets_min": 1762 |
| }, |
| { |
| "epoch": 1.7000521648408973, |
| "grad_norm": 1.2127607017517221, |
| "learning_rate": 3.7573818840852004e-05, |
| "loss": 0.2388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1074744164943695, |
| "step": 1630, |
| "valid_targets_mean": 4648.8, |
| "valid_targets_min": 2365 |
| }, |
| { |
| "epoch": 1.7052686489306208, |
| "grad_norm": 0.4752655984423174, |
| "learning_rate": 3.754893296904344e-05, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0906633660197258, |
| "step": 1635, |
| "valid_targets_mean": 4332.1, |
| "valid_targets_min": 1967 |
| }, |
| { |
| "epoch": 1.7104851330203443, |
| "grad_norm": 0.48332414158338666, |
| "learning_rate": 3.752392844592064e-05, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12134155631065369, |
| "step": 1640, |
| "valid_targets_mean": 4402.6, |
| "valid_targets_min": 1857 |
| }, |
| { |
| "epoch": 1.7157016171100679, |
| "grad_norm": 0.5528011425591683, |
| "learning_rate": 3.7498805440543436e-05, |
| "loss": 0.2461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13630694150924683, |
| "step": 1645, |
| "valid_targets_mean": 4838.1, |
| "valid_targets_min": 2858 |
| }, |
| { |
| "epoch": 1.7209181011997914, |
| "grad_norm": 0.539257716336949, |
| "learning_rate": 3.747356412277272e-05, |
| "loss": 0.2536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12012304365634918, |
| "step": 1650, |
| "valid_targets_mean": 5222.1, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 1.726134585289515, |
| "grad_norm": 0.4985928915472987, |
| "learning_rate": 3.744820466326933e-05, |
| "loss": 0.2495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12551480531692505, |
| "step": 1655, |
| "valid_targets_mean": 4609.0, |
| "valid_targets_min": 1461 |
| }, |
| { |
| "epoch": 1.7313510693792384, |
| "grad_norm": 0.48441783157096807, |
| "learning_rate": 3.7422727233492876e-05, |
| "loss": 0.238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15556228160858154, |
| "step": 1660, |
| "valid_targets_mean": 5658.8, |
| "valid_targets_min": 1767 |
| }, |
| { |
| "epoch": 1.736567553468962, |
| "grad_norm": 0.532508856659577, |
| "learning_rate": 3.739713200570058e-05, |
| "loss": 0.2469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10466257482767105, |
| "step": 1665, |
| "valid_targets_mean": 4985.1, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 1.7417840375586855, |
| "grad_norm": 0.5450230060599003, |
| "learning_rate": 3.737141915294612e-05, |
| "loss": 0.2437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10845594108104706, |
| "step": 1670, |
| "valid_targets_mean": 4706.2, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 1.747000521648409, |
| "grad_norm": 0.591198881980741, |
| "learning_rate": 3.734558884907847e-05, |
| "loss": 0.2499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1261470913887024, |
| "step": 1675, |
| "valid_targets_mean": 4374.8, |
| "valid_targets_min": 1659 |
| }, |
| { |
| "epoch": 1.7522170057381325, |
| "grad_norm": 0.4954991221034555, |
| "learning_rate": 3.7319641268740684e-05, |
| "loss": 0.2348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12304702401161194, |
| "step": 1680, |
| "valid_targets_mean": 5559.2, |
| "valid_targets_min": 3116 |
| }, |
| { |
| "epoch": 1.757433489827856, |
| "grad_norm": 0.4523983100902319, |
| "learning_rate": 3.729357658736877e-05, |
| "loss": 0.2363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10654617100954056, |
| "step": 1685, |
| "valid_targets_mean": 5304.4, |
| "valid_targets_min": 2748 |
| }, |
| { |
| "epoch": 1.7626499739175796, |
| "grad_norm": 0.4781303041020441, |
| "learning_rate": 3.7267394981190456e-05, |
| "loss": 0.2524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13260826468467712, |
| "step": 1690, |
| "valid_targets_mean": 5369.8, |
| "valid_targets_min": 2116 |
| }, |
| { |
| "epoch": 1.7678664580073031, |
| "grad_norm": 0.4665938814513094, |
| "learning_rate": 3.724109662722402e-05, |
| "loss": 0.2347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11321903765201569, |
| "step": 1695, |
| "valid_targets_mean": 5622.1, |
| "valid_targets_min": 3314 |
| }, |
| { |
| "epoch": 1.7730829420970267, |
| "grad_norm": 0.563972673121229, |
| "learning_rate": 3.72146817032771e-05, |
| "loss": 0.2539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12348375469446182, |
| "step": 1700, |
| "valid_targets_mean": 4625.1, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 1.77829942618675, |
| "grad_norm": 0.49684534538885133, |
| "learning_rate": 3.718815038794549e-05, |
| "loss": 0.2689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11572001874446869, |
| "step": 1705, |
| "valid_targets_mean": 4280.5, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 1.7835159102764737, |
| "grad_norm": 0.539515924089831, |
| "learning_rate": 3.71615028606119e-05, |
| "loss": 0.2393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1124250739812851, |
| "step": 1710, |
| "valid_targets_mean": 4333.1, |
| "valid_targets_min": 1636 |
| }, |
| { |
| "epoch": 1.788732394366197, |
| "grad_norm": 0.5258087357470302, |
| "learning_rate": 3.713473930144479e-05, |
| "loss": 0.2499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1382165402173996, |
| "step": 1715, |
| "valid_targets_mean": 4965.2, |
| "valid_targets_min": 1416 |
| }, |
| { |
| "epoch": 1.7939488784559208, |
| "grad_norm": 0.5235070365330642, |
| "learning_rate": 3.710785989139713e-05, |
| "loss": 0.261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12338519096374512, |
| "step": 1720, |
| "valid_targets_mean": 4041.2, |
| "valid_targets_min": 1908 |
| }, |
| { |
| "epoch": 1.799165362545644, |
| "grad_norm": 0.5419756293085212, |
| "learning_rate": 3.7080864812205176e-05, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12302734702825546, |
| "step": 1725, |
| "valid_targets_mean": 4363.4, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 1.8043818466353678, |
| "grad_norm": 0.4802544830790868, |
| "learning_rate": 3.705375424638723e-05, |
| "loss": 0.2483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.124026820063591, |
| "step": 1730, |
| "valid_targets_mean": 4707.2, |
| "valid_targets_min": 2589 |
| }, |
| { |
| "epoch": 1.8095983307250911, |
| "grad_norm": 0.48677623141738435, |
| "learning_rate": 3.702652837724244e-05, |
| "loss": 0.2367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13875910639762878, |
| "step": 1735, |
| "valid_targets_mean": 5555.6, |
| "valid_targets_min": 3939 |
| }, |
| { |
| "epoch": 1.8148148148148149, |
| "grad_norm": 0.9516607300521612, |
| "learning_rate": 3.6999187388849517e-05, |
| "loss": 0.248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1442538946866989, |
| "step": 1740, |
| "valid_targets_mean": 4964.8, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 1.8200312989045382, |
| "grad_norm": 0.5283790292684337, |
| "learning_rate": 3.697173146606553e-05, |
| "loss": 0.2605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10957943648099899, |
| "step": 1745, |
| "valid_targets_mean": 3189.6, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 1.825247782994262, |
| "grad_norm": 0.5387767109946204, |
| "learning_rate": 3.694416079452463e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11930787563323975, |
| "step": 1750, |
| "valid_targets_mean": 4071.8, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 1.8304642670839852, |
| "grad_norm": 0.5581490472860003, |
| "learning_rate": 3.6916475560636806e-05, |
| "loss": 0.2542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12916062772274017, |
| "step": 1755, |
| "valid_targets_mean": 4486.4, |
| "valid_targets_min": 1629 |
| }, |
| { |
| "epoch": 1.835680751173709, |
| "grad_norm": 0.5536821065094885, |
| "learning_rate": 3.688867595158663e-05, |
| "loss": 0.2492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14876341819763184, |
| "step": 1760, |
| "valid_targets_mean": 4862.4, |
| "valid_targets_min": 1730 |
| }, |
| { |
| "epoch": 1.8408972352634323, |
| "grad_norm": 0.5843970090001455, |
| "learning_rate": 3.686076215533198e-05, |
| "loss": 0.2569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16234152019023895, |
| "step": 1765, |
| "valid_targets_mean": 5925.6, |
| "valid_targets_min": 3125 |
| }, |
| { |
| "epoch": 1.846113719353156, |
| "grad_norm": 0.6527702228685233, |
| "learning_rate": 3.683273436060275e-05, |
| "loss": 0.255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1514151692390442, |
| "step": 1770, |
| "valid_targets_mean": 3472.9, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 1.8513302034428794, |
| "grad_norm": 0.46388789877785, |
| "learning_rate": 3.680459275689964e-05, |
| "loss": 0.2594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.136823832988739, |
| "step": 1775, |
| "valid_targets_mean": 5753.6, |
| "valid_targets_min": 1458 |
| }, |
| { |
| "epoch": 1.856546687532603, |
| "grad_norm": 0.5332179778953855, |
| "learning_rate": 3.677633753449278e-05, |
| "loss": 0.2395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11068500578403473, |
| "step": 1780, |
| "valid_targets_mean": 5434.1, |
| "valid_targets_min": 3823 |
| }, |
| { |
| "epoch": 1.8617631716223264, |
| "grad_norm": 1.1242798095109956, |
| "learning_rate": 3.674796888442056e-05, |
| "loss": 0.2461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11812400817871094, |
| "step": 1785, |
| "valid_targets_mean": 4917.5, |
| "valid_targets_min": 2439 |
| }, |
| { |
| "epoch": 1.8669796557120502, |
| "grad_norm": 0.5522589864356385, |
| "learning_rate": 3.671948699848822e-05, |
| "loss": 0.2644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11022226512432098, |
| "step": 1790, |
| "valid_targets_mean": 3553.0, |
| "valid_targets_min": 2518 |
| }, |
| { |
| "epoch": 1.8721961398017735, |
| "grad_norm": 0.5586953345582154, |
| "learning_rate": 3.6690892069266624e-05, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12100788950920105, |
| "step": 1795, |
| "valid_targets_mean": 4217.9, |
| "valid_targets_min": 2319 |
| }, |
| { |
| "epoch": 1.8774126238914972, |
| "grad_norm": 0.6245335282858276, |
| "learning_rate": 3.666218429009094e-05, |
| "loss": 0.2395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11601720750331879, |
| "step": 1800, |
| "valid_targets_mean": 4822.2, |
| "valid_targets_min": 1259 |
| }, |
| { |
| "epoch": 1.8826291079812205, |
| "grad_norm": 0.4361533309646699, |
| "learning_rate": 3.6633363855059336e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11116553843021393, |
| "step": 1805, |
| "valid_targets_mean": 6440.9, |
| "valid_targets_min": 2174 |
| }, |
| { |
| "epoch": 1.8878455920709443, |
| "grad_norm": 0.49914721297729236, |
| "learning_rate": 3.6604430959031676e-05, |
| "loss": 0.2626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15305811166763306, |
| "step": 1810, |
| "valid_targets_mean": 4380.8, |
| "valid_targets_min": 1366 |
| }, |
| { |
| "epoch": 1.8930620761606676, |
| "grad_norm": 0.5437652077862022, |
| "learning_rate": 3.6575385797628166e-05, |
| "loss": 0.2403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13775449991226196, |
| "step": 1815, |
| "valid_targets_mean": 5084.4, |
| "valid_targets_min": 2826 |
| }, |
| { |
| "epoch": 1.8982785602503913, |
| "grad_norm": 0.5165100386805054, |
| "learning_rate": 3.654622856722808e-05, |
| "loss": 0.2438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13797417283058167, |
| "step": 1820, |
| "valid_targets_mean": 4657.2, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 1.9034950443401146, |
| "grad_norm": 0.8637494671339646, |
| "learning_rate": 3.651695946496839e-05, |
| "loss": 0.2532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09824159741401672, |
| "step": 1825, |
| "valid_targets_mean": 5041.9, |
| "valid_targets_min": 3198 |
| }, |
| { |
| "epoch": 1.9087115284298384, |
| "grad_norm": 0.45619472777373626, |
| "learning_rate": 3.6487578688742485e-05, |
| "loss": 0.2347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09745252877473831, |
| "step": 1830, |
| "valid_targets_mean": 4831.0, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 1.9139280125195617, |
| "grad_norm": 0.46659452122338013, |
| "learning_rate": 3.6458086437198764e-05, |
| "loss": 0.2343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11686418205499649, |
| "step": 1835, |
| "valid_targets_mean": 5696.5, |
| "valid_targets_min": 1816 |
| }, |
| { |
| "epoch": 1.9191444966092854, |
| "grad_norm": 0.5734880079061442, |
| "learning_rate": 3.642848290973934e-05, |
| "loss": 0.2454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1568131148815155, |
| "step": 1840, |
| "valid_targets_mean": 4659.0, |
| "valid_targets_min": 1469 |
| }, |
| { |
| "epoch": 1.9243609806990087, |
| "grad_norm": 0.4718312237043105, |
| "learning_rate": 3.6398768306518706e-05, |
| "loss": 0.2402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10714077949523926, |
| "step": 1845, |
| "valid_targets_mean": 5023.5, |
| "valid_targets_min": 2130 |
| }, |
| { |
| "epoch": 1.9295774647887325, |
| "grad_norm": 0.5573780363946851, |
| "learning_rate": 3.636894282844233e-05, |
| "loss": 0.2596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1489737182855606, |
| "step": 1850, |
| "valid_targets_mean": 3690.5, |
| "valid_targets_min": 3023 |
| }, |
| { |
| "epoch": 1.9347939488784558, |
| "grad_norm": 0.4695102238444236, |
| "learning_rate": 3.6339006677165316e-05, |
| "loss": 0.232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11228922009468079, |
| "step": 1855, |
| "valid_targets_mean": 5067.9, |
| "valid_targets_min": 1794 |
| }, |
| { |
| "epoch": 1.9400104329681795, |
| "grad_norm": 0.509184552401322, |
| "learning_rate": 3.630896005509108e-05, |
| "loss": 0.2429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12257759273052216, |
| "step": 1860, |
| "valid_targets_mean": 5672.6, |
| "valid_targets_min": 3567 |
| }, |
| { |
| "epoch": 1.9452269170579028, |
| "grad_norm": 0.5624899738669874, |
| "learning_rate": 3.6278803165369926e-05, |
| "loss": 0.2513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10627146065235138, |
| "step": 1865, |
| "valid_targets_mean": 3758.6, |
| "valid_targets_min": 1298 |
| }, |
| { |
| "epoch": 1.9504434011476266, |
| "grad_norm": 0.5845320960330752, |
| "learning_rate": 3.6248536211897715e-05, |
| "loss": 0.2388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1219656765460968, |
| "step": 1870, |
| "valid_targets_mean": 4353.5, |
| "valid_targets_min": 1778 |
| }, |
| { |
| "epoch": 1.95565988523735, |
| "grad_norm": 0.5898029464379284, |
| "learning_rate": 3.621815939931444e-05, |
| "loss": 0.2463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11879602074623108, |
| "step": 1875, |
| "valid_targets_mean": 3925.4, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 1.9608763693270737, |
| "grad_norm": 0.47207322347001124, |
| "learning_rate": 3.6187672933002904e-05, |
| "loss": 0.2377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12292701750993729, |
| "step": 1880, |
| "valid_targets_mean": 5703.8, |
| "valid_targets_min": 3091 |
| }, |
| { |
| "epoch": 1.966092853416797, |
| "grad_norm": 0.49751207176942625, |
| "learning_rate": 3.6157077019087254e-05, |
| "loss": 0.2531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12327823042869568, |
| "step": 1885, |
| "valid_targets_mean": 4978.5, |
| "valid_targets_min": 1778 |
| }, |
| { |
| "epoch": 1.9713093375065207, |
| "grad_norm": 0.5215491471402459, |
| "learning_rate": 3.612637186443169e-05, |
| "loss": 0.2557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13275089859962463, |
| "step": 1890, |
| "valid_targets_mean": 4872.0, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 1.976525821596244, |
| "grad_norm": 0.5480006277598584, |
| "learning_rate": 3.609555767663895e-05, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11053438484668732, |
| "step": 1895, |
| "valid_targets_mean": 6055.5, |
| "valid_targets_min": 2435 |
| }, |
| { |
| "epoch": 1.9817423056859678, |
| "grad_norm": 0.9008272684690406, |
| "learning_rate": 3.6064634664048996e-05, |
| "loss": 0.2581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14233778417110443, |
| "step": 1900, |
| "valid_targets_mean": 3512.8, |
| "valid_targets_min": 1351 |
| }, |
| { |
| "epoch": 1.986958789775691, |
| "grad_norm": 0.6617795177051474, |
| "learning_rate": 3.603360303573757e-05, |
| "loss": 0.2512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1280476152896881, |
| "step": 1905, |
| "valid_targets_mean": 4181.1, |
| "valid_targets_min": 1982 |
| }, |
| { |
| "epoch": 1.9921752738654148, |
| "grad_norm": 0.5497708615752375, |
| "learning_rate": 3.600246300151476e-05, |
| "loss": 0.2405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11217804253101349, |
| "step": 1910, |
| "valid_targets_mean": 4834.0, |
| "valid_targets_min": 1885 |
| }, |
| { |
| "epoch": 1.9973917579551381, |
| "grad_norm": 0.5549717938139402, |
| "learning_rate": 3.597121477192364e-05, |
| "loss": 0.2872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14330707490444183, |
| "step": 1915, |
| "valid_targets_mean": 5543.5, |
| "valid_targets_min": 1502 |
| }, |
| { |
| "epoch": 2.0020865936358896, |
| "grad_norm": 0.5269936041252705, |
| "learning_rate": 3.593985855823878e-05, |
| "loss": 0.2472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10810284316539764, |
| "step": 1920, |
| "valid_targets_mean": 5318.8, |
| "valid_targets_min": 4030 |
| }, |
| { |
| "epoch": 2.007303077725613, |
| "grad_norm": 0.5974233968850137, |
| "learning_rate": 3.590839457246487e-05, |
| "loss": 0.2313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1327662169933319, |
| "step": 1925, |
| "valid_targets_mean": 4653.5, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 2.0125195618153366, |
| "grad_norm": 0.569055358921142, |
| "learning_rate": 3.587682302733527e-05, |
| "loss": 0.2389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15174917876720428, |
| "step": 1930, |
| "valid_targets_mean": 5089.8, |
| "valid_targets_min": 2551 |
| }, |
| { |
| "epoch": 2.01773604590506, |
| "grad_norm": 0.6071785094734595, |
| "learning_rate": 3.584514413631054e-05, |
| "loss": 0.2296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1039377972483635, |
| "step": 1935, |
| "valid_targets_mean": 4698.2, |
| "valid_targets_min": 3511 |
| }, |
| { |
| "epoch": 2.0229525299947837, |
| "grad_norm": 0.7649753469176215, |
| "learning_rate": 3.581335811357703e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1236136332154274, |
| "step": 1940, |
| "valid_targets_mean": 5705.1, |
| "valid_targets_min": 2985 |
| }, |
| { |
| "epoch": 2.028169014084507, |
| "grad_norm": 0.55394336882652, |
| "learning_rate": 3.578146517404546e-05, |
| "loss": 0.2106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11663387715816498, |
| "step": 1945, |
| "valid_targets_mean": 4723.4, |
| "valid_targets_min": 1671 |
| }, |
| { |
| "epoch": 2.0333854981742308, |
| "grad_norm": 0.5082030698850123, |
| "learning_rate": 3.574946553334938e-05, |
| "loss": 0.2225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10076865553855896, |
| "step": 1950, |
| "valid_targets_mean": 4673.2, |
| "valid_targets_min": 2717 |
| }, |
| { |
| "epoch": 2.038601982263954, |
| "grad_norm": 0.5567379435319525, |
| "learning_rate": 3.571735940784381e-05, |
| "loss": 0.2196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1046312004327774, |
| "step": 1955, |
| "valid_targets_mean": 4137.0, |
| "valid_targets_min": 1847 |
| }, |
| { |
| "epoch": 2.043818466353678, |
| "grad_norm": 0.48985358034713516, |
| "learning_rate": 3.5685147014603705e-05, |
| "loss": 0.2186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08953490853309631, |
| "step": 1960, |
| "valid_targets_mean": 5168.4, |
| "valid_targets_min": 3013 |
| }, |
| { |
| "epoch": 2.049034950443401, |
| "grad_norm": 0.571831332261129, |
| "learning_rate": 3.5652828571422536e-05, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10120147466659546, |
| "step": 1965, |
| "valid_targets_mean": 4631.1, |
| "valid_targets_min": 1478 |
| }, |
| { |
| "epoch": 2.054251434533125, |
| "grad_norm": 0.7529034629375903, |
| "learning_rate": 3.5620404296810766e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09623203426599503, |
| "step": 1970, |
| "valid_targets_mean": 4019.8, |
| "valid_targets_min": 1673 |
| }, |
| { |
| "epoch": 2.059467918622848, |
| "grad_norm": 0.5687919001896762, |
| "learning_rate": 3.558787440999442e-05, |
| "loss": 0.2284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11071816086769104, |
| "step": 1975, |
| "valid_targets_mean": 5494.5, |
| "valid_targets_min": 2436 |
| }, |
| { |
| "epoch": 2.064684402712572, |
| "grad_norm": 0.5368577826880351, |
| "learning_rate": 3.55552391309136e-05, |
| "loss": 0.2478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1275230348110199, |
| "step": 1980, |
| "valid_targets_mean": 6043.0, |
| "valid_targets_min": 2155 |
| }, |
| { |
| "epoch": 2.0699008868022952, |
| "grad_norm": 0.5409911221432354, |
| "learning_rate": 3.5522498680220954e-05, |
| "loss": 0.2374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11893551796674728, |
| "step": 1985, |
| "valid_targets_mean": 5916.8, |
| "valid_targets_min": 2004 |
| }, |
| { |
| "epoch": 2.075117370892019, |
| "grad_norm": 0.50408544253174, |
| "learning_rate": 3.5489653279280225e-05, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09793812036514282, |
| "step": 1990, |
| "valid_targets_mean": 5182.1, |
| "valid_targets_min": 2615 |
| }, |
| { |
| "epoch": 2.0803338549817423, |
| "grad_norm": 0.6171549014287283, |
| "learning_rate": 3.545670315016475e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13135838508605957, |
| "step": 1995, |
| "valid_targets_mean": 4706.6, |
| "valid_targets_min": 1718 |
| }, |
| { |
| "epoch": 2.085550339071466, |
| "grad_norm": 0.46573730964278404, |
| "learning_rate": 3.5423648515655934e-05, |
| "loss": 0.211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09348612278699875, |
| "step": 2000, |
| "valid_targets_mean": 5483.9, |
| "valid_targets_min": 3057 |
| }, |
| { |
| "epoch": 2.0907668231611893, |
| "grad_norm": 0.5522490520394556, |
| "learning_rate": 3.539048959924178e-05, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1360378861427307, |
| "step": 2005, |
| "valid_targets_mean": 4643.5, |
| "valid_targets_min": 1534 |
| }, |
| { |
| "epoch": 2.095983307250913, |
| "grad_norm": 0.5474360037399448, |
| "learning_rate": 3.535722662511535e-05, |
| "loss": 0.2258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12546919286251068, |
| "step": 2010, |
| "valid_targets_mean": 4983.0, |
| "valid_targets_min": 1833 |
| }, |
| { |
| "epoch": 2.1011997913406364, |
| "grad_norm": 0.524017047747236, |
| "learning_rate": 3.532385981817326e-05, |
| "loss": 0.2282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09845712780952454, |
| "step": 2015, |
| "valid_targets_mean": 4596.1, |
| "valid_targets_min": 1390 |
| }, |
| { |
| "epoch": 2.10641627543036, |
| "grad_norm": 0.493032897409189, |
| "learning_rate": 3.5290389404014136e-05, |
| "loss": 0.2406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09936146438121796, |
| "step": 2020, |
| "valid_targets_mean": 5361.8, |
| "valid_targets_min": 2427 |
| }, |
| { |
| "epoch": 2.1116327595200834, |
| "grad_norm": 0.48009492015893784, |
| "learning_rate": 3.5256815608937155e-05, |
| "loss": 0.2196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08758233487606049, |
| "step": 2025, |
| "valid_targets_mean": 4458.4, |
| "valid_targets_min": 1363 |
| }, |
| { |
| "epoch": 2.116849243609807, |
| "grad_norm": 0.5338485179025612, |
| "learning_rate": 3.522313865994043e-05, |
| "loss": 0.228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09387579560279846, |
| "step": 2030, |
| "valid_targets_mean": 4182.8, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 2.1220657276995305, |
| "grad_norm": 0.7751541416535409, |
| "learning_rate": 3.518935878471952e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12653851509094238, |
| "step": 2035, |
| "valid_targets_mean": 3748.4, |
| "valid_targets_min": 1312 |
| }, |
| { |
| "epoch": 2.127282211789254, |
| "grad_norm": 0.5172812414306709, |
| "learning_rate": 3.515547621166591e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11102648824453354, |
| "step": 2040, |
| "valid_targets_mean": 5220.8, |
| "valid_targets_min": 2812 |
| }, |
| { |
| "epoch": 2.1324986958789776, |
| "grad_norm": 0.5421914141921881, |
| "learning_rate": 3.5121491169865425e-05, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11301957070827484, |
| "step": 2045, |
| "valid_targets_mean": 5223.4, |
| "valid_targets_min": 2652 |
| }, |
| { |
| "epoch": 2.1377151799687013, |
| "grad_norm": 0.5487760380319388, |
| "learning_rate": 3.508740388909669e-05, |
| "loss": 0.2221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0976884514093399, |
| "step": 2050, |
| "valid_targets_mean": 4488.4, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 2.1429316640584246, |
| "grad_norm": 0.5405842722582158, |
| "learning_rate": 3.505321459982961e-05, |
| "loss": 0.2252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12626048922538757, |
| "step": 2055, |
| "valid_targets_mean": 5094.5, |
| "valid_targets_min": 2013 |
| }, |
| { |
| "epoch": 2.148148148148148, |
| "grad_norm": 0.5246815278254859, |
| "learning_rate": 3.501892353322376e-05, |
| "loss": 0.2137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09376654028892517, |
| "step": 2060, |
| "valid_targets_mean": 4093.5, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 2.1533646322378717, |
| "grad_norm": 0.4251847589281074, |
| "learning_rate": 3.498453092112687e-05, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08616240322589874, |
| "step": 2065, |
| "valid_targets_mean": 4603.5, |
| "valid_targets_min": 2121 |
| }, |
| { |
| "epoch": 2.1585811163275954, |
| "grad_norm": 0.47383850020780094, |
| "learning_rate": 3.495003699607322e-05, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1174222081899643, |
| "step": 2070, |
| "valid_targets_mean": 6127.4, |
| "valid_targets_min": 2805 |
| }, |
| { |
| "epoch": 2.1637976004173187, |
| "grad_norm": 0.47843260960694084, |
| "learning_rate": 3.49154419912821e-05, |
| "loss": 0.2266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10661450028419495, |
| "step": 2075, |
| "valid_targets_mean": 4927.1, |
| "valid_targets_min": 1689 |
| }, |
| { |
| "epoch": 2.169014084507042, |
| "grad_norm": 0.4899763108410606, |
| "learning_rate": 3.48807461406562e-05, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10473626852035522, |
| "step": 2080, |
| "valid_targets_mean": 5954.0, |
| "valid_targets_min": 1628 |
| }, |
| { |
| "epoch": 2.174230568596766, |
| "grad_norm": 0.5388649564403426, |
| "learning_rate": 3.484594967878007e-05, |
| "loss": 0.2267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11704675853252411, |
| "step": 2085, |
| "valid_targets_mean": 5408.0, |
| "valid_targets_min": 3345 |
| }, |
| { |
| "epoch": 2.1794470526864895, |
| "grad_norm": 0.5038235678306854, |
| "learning_rate": 3.481105284091847e-05, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12047860026359558, |
| "step": 2090, |
| "valid_targets_mean": 4923.1, |
| "valid_targets_min": 2056 |
| }, |
| { |
| "epoch": 2.184663536776213, |
| "grad_norm": 0.5218145944948759, |
| "learning_rate": 3.4776055863014864e-05, |
| "loss": 0.2295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10921941697597504, |
| "step": 2095, |
| "valid_targets_mean": 4686.8, |
| "valid_targets_min": 1503 |
| }, |
| { |
| "epoch": 2.189880020865936, |
| "grad_norm": 0.5464581574239525, |
| "learning_rate": 3.474095898168975e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.132952481508255, |
| "step": 2100, |
| "valid_targets_mean": 4852.8, |
| "valid_targets_min": 2843 |
| }, |
| { |
| "epoch": 2.19509650495566, |
| "grad_norm": 0.4939978105645992, |
| "learning_rate": 3.470576243423911e-05, |
| "loss": 0.2379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08919451385736465, |
| "step": 2105, |
| "valid_targets_mean": 4851.6, |
| "valid_targets_min": 1716 |
| }, |
| { |
| "epoch": 2.2003129890453836, |
| "grad_norm": 0.5339982334715729, |
| "learning_rate": 3.467046645863276e-05, |
| "loss": 0.234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12849083542823792, |
| "step": 2110, |
| "valid_targets_mean": 5342.1, |
| "valid_targets_min": 2569 |
| }, |
| { |
| "epoch": 2.205529473135107, |
| "grad_norm": 0.50197354954302, |
| "learning_rate": 3.463507129351279e-05, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11599946022033691, |
| "step": 2115, |
| "valid_targets_mean": 4914.8, |
| "valid_targets_min": 1776 |
| }, |
| { |
| "epoch": 2.2107459572248302, |
| "grad_norm": 0.5788077914862068, |
| "learning_rate": 3.459957717819191e-05, |
| "loss": 0.2334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12925925850868225, |
| "step": 2120, |
| "valid_targets_mean": 3880.0, |
| "valid_targets_min": 1375 |
| }, |
| { |
| "epoch": 2.215962441314554, |
| "grad_norm": 0.46285027634666653, |
| "learning_rate": 3.4563984352651874e-05, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07943163812160492, |
| "step": 2125, |
| "valid_targets_mean": 4488.4, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 2.2211789254042777, |
| "grad_norm": 0.642471074334573, |
| "learning_rate": 3.45282930575418e-05, |
| "loss": 0.2241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09657199680805206, |
| "step": 2130, |
| "valid_targets_mean": 3349.5, |
| "valid_targets_min": 1582 |
| }, |
| { |
| "epoch": 2.226395409494001, |
| "grad_norm": 0.570788848317248, |
| "learning_rate": 3.449250353417661e-05, |
| "loss": 0.244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13143855333328247, |
| "step": 2135, |
| "valid_targets_mean": 4533.5, |
| "valid_targets_min": 1976 |
| }, |
| { |
| "epoch": 2.2316118935837244, |
| "grad_norm": 0.46714669131619335, |
| "learning_rate": 3.445661602453533e-05, |
| "loss": 0.2361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1163138896226883, |
| "step": 2140, |
| "valid_targets_mean": 6082.4, |
| "valid_targets_min": 3087 |
| }, |
| { |
| "epoch": 2.236828377673448, |
| "grad_norm": 0.5587627949228191, |
| "learning_rate": 3.44206307712595e-05, |
| "loss": 0.2246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10658030956983566, |
| "step": 2145, |
| "valid_targets_mean": 5567.4, |
| "valid_targets_min": 1752 |
| }, |
| { |
| "epoch": 2.2420448617631714, |
| "grad_norm": 0.5303710463405483, |
| "learning_rate": 3.4384548017651544e-05, |
| "loss": 0.2214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12135177850723267, |
| "step": 2150, |
| "valid_targets_mean": 4302.0, |
| "valid_targets_min": 1581 |
| }, |
| { |
| "epoch": 2.247261345852895, |
| "grad_norm": 0.5375666300344333, |
| "learning_rate": 3.4348368007673065e-05, |
| "loss": 0.2173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10137631744146347, |
| "step": 2155, |
| "valid_targets_mean": 4868.8, |
| "valid_targets_min": 2466 |
| }, |
| { |
| "epoch": 2.2524778299426185, |
| "grad_norm": 0.4744381052708486, |
| "learning_rate": 3.4312090985943266e-05, |
| "loss": 0.2207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12538987398147583, |
| "step": 2160, |
| "valid_targets_mean": 6205.9, |
| "valid_targets_min": 3568 |
| }, |
| { |
| "epoch": 2.257694314032342, |
| "grad_norm": 0.5048698772755993, |
| "learning_rate": 3.4275717197737234e-05, |
| "loss": 0.2278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13870665431022644, |
| "step": 2165, |
| "valid_targets_mean": 6170.1, |
| "valid_targets_min": 4471 |
| }, |
| { |
| "epoch": 2.262910798122066, |
| "grad_norm": 0.5539634836266141, |
| "learning_rate": 3.423924688898433e-05, |
| "loss": 0.2308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11574719846248627, |
| "step": 2170, |
| "valid_targets_mean": 3427.8, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 2.2681272822117893, |
| "grad_norm": 0.5553833706907942, |
| "learning_rate": 3.420268030626651e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15152722597122192, |
| "step": 2175, |
| "valid_targets_mean": 5756.5, |
| "valid_targets_min": 3664 |
| }, |
| { |
| "epoch": 2.2733437663015126, |
| "grad_norm": 0.5095935579851769, |
| "learning_rate": 3.416601769681663e-05, |
| "loss": 0.2279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11749089509248734, |
| "step": 2180, |
| "valid_targets_mean": 5107.2, |
| "valid_targets_min": 2944 |
| }, |
| { |
| "epoch": 2.2785602503912363, |
| "grad_norm": 0.5234036773875547, |
| "learning_rate": 3.412925930851683e-05, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09326408058404922, |
| "step": 2185, |
| "valid_targets_mean": 4192.4, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 2.28377673448096, |
| "grad_norm": 0.4626305179647282, |
| "learning_rate": 3.40924053898968e-05, |
| "loss": 0.2174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11077827215194702, |
| "step": 2190, |
| "valid_targets_mean": 5611.8, |
| "valid_targets_min": 2071 |
| }, |
| { |
| "epoch": 2.2889932185706834, |
| "grad_norm": 0.4695916370734793, |
| "learning_rate": 3.405545619013214e-05, |
| "loss": 0.2312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09071405231952667, |
| "step": 2195, |
| "valid_targets_mean": 4260.8, |
| "valid_targets_min": 1449 |
| }, |
| { |
| "epoch": 2.2942097026604067, |
| "grad_norm": 0.4893098076374061, |
| "learning_rate": 3.401841195904267e-05, |
| "loss": 0.2244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09764277935028076, |
| "step": 2200, |
| "valid_targets_mean": 5340.1, |
| "valid_targets_min": 1390 |
| }, |
| { |
| "epoch": 2.2994261867501304, |
| "grad_norm": 0.4998943508577529, |
| "learning_rate": 3.398127294709072e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11398491263389587, |
| "step": 2205, |
| "valid_targets_mean": 5257.5, |
| "valid_targets_min": 2999 |
| }, |
| { |
| "epoch": 2.3046426708398537, |
| "grad_norm": 0.6434654135986683, |
| "learning_rate": 3.3944039405379444e-05, |
| "loss": 0.2385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1256795972585678, |
| "step": 2210, |
| "valid_targets_mean": 4567.8, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 2.3098591549295775, |
| "grad_norm": 0.4832895047866086, |
| "learning_rate": 3.390671158565115e-05, |
| "loss": 0.2209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10829693078994751, |
| "step": 2215, |
| "valid_targets_mean": 5266.4, |
| "valid_targets_min": 1833 |
| }, |
| { |
| "epoch": 2.315075639019301, |
| "grad_norm": 0.5197732499257903, |
| "learning_rate": 3.386928974028555e-05, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11667078733444214, |
| "step": 2220, |
| "valid_targets_mean": 4708.9, |
| "valid_targets_min": 2253 |
| }, |
| { |
| "epoch": 2.3202921231090246, |
| "grad_norm": 0.7416911718593487, |
| "learning_rate": 3.3831774122298106e-05, |
| "loss": 0.2312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13515786826610565, |
| "step": 2225, |
| "valid_targets_mean": 4782.2, |
| "valid_targets_min": 2366 |
| }, |
| { |
| "epoch": 2.325508607198748, |
| "grad_norm": 0.5510764958479842, |
| "learning_rate": 3.3794164985338266e-05, |
| "loss": 0.2213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10666011273860931, |
| "step": 2230, |
| "valid_targets_mean": 4350.9, |
| "valid_targets_min": 1540 |
| }, |
| { |
| "epoch": 2.3307250912884716, |
| "grad_norm": 0.5423326354389533, |
| "learning_rate": 3.37564625836878e-05, |
| "loss": 0.2214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10791268199682236, |
| "step": 2235, |
| "valid_targets_mean": 4865.4, |
| "valid_targets_min": 2019 |
| }, |
| { |
| "epoch": 2.335941575378195, |
| "grad_norm": 0.4972937429968323, |
| "learning_rate": 3.3718667172259026e-05, |
| "loss": 0.2316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08703801780939102, |
| "step": 2240, |
| "valid_targets_mean": 2945.8, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 2.3411580594679187, |
| "grad_norm": 0.5383237315751074, |
| "learning_rate": 3.368077900659315e-05, |
| "loss": 0.2285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1342734694480896, |
| "step": 2245, |
| "valid_targets_mean": 5155.4, |
| "valid_targets_min": 2019 |
| }, |
| { |
| "epoch": 2.346374543557642, |
| "grad_norm": 0.514318390379442, |
| "learning_rate": 3.364279834285848e-05, |
| "loss": 0.2185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09559551626443863, |
| "step": 2250, |
| "valid_targets_mean": 5152.1, |
| "valid_targets_min": 976 |
| }, |
| { |
| "epoch": 2.3515910276473657, |
| "grad_norm": 0.4910773560407386, |
| "learning_rate": 3.360472543784875e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10180678218603134, |
| "step": 2255, |
| "valid_targets_mean": 4525.9, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 2.356807511737089, |
| "grad_norm": 0.5174129329847302, |
| "learning_rate": 3.356656054898132e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10733669251203537, |
| "step": 2260, |
| "valid_targets_mean": 5592.4, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 2.3620239958268128, |
| "grad_norm": 0.5954295865676773, |
| "learning_rate": 3.352830393429547e-05, |
| "loss": 0.2318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09375312924385071, |
| "step": 2265, |
| "valid_targets_mean": 3314.8, |
| "valid_targets_min": 1484 |
| }, |
| { |
| "epoch": 2.367240479916536, |
| "grad_norm": 0.5076393805523123, |
| "learning_rate": 3.3489955852450675e-05, |
| "loss": 0.2174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10176807641983032, |
| "step": 2270, |
| "valid_targets_mean": 5248.9, |
| "valid_targets_min": 1404 |
| }, |
| { |
| "epoch": 2.37245696400626, |
| "grad_norm": 0.5436901139551851, |
| "learning_rate": 3.3451516562724834e-05, |
| "loss": 0.2336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11518465727567673, |
| "step": 2275, |
| "valid_targets_mean": 4245.1, |
| "valid_targets_min": 1524 |
| }, |
| { |
| "epoch": 2.377673448095983, |
| "grad_norm": 0.6268421209222852, |
| "learning_rate": 3.341298632501249e-05, |
| "loss": 0.2396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09579107910394669, |
| "step": 2280, |
| "valid_targets_mean": 3428.9, |
| "valid_targets_min": 1678 |
| }, |
| { |
| "epoch": 2.382889932185707, |
| "grad_norm": 0.5315792277064773, |
| "learning_rate": 3.3374365399823134e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11502724140882492, |
| "step": 2285, |
| "valid_targets_mean": 6031.4, |
| "valid_targets_min": 2479 |
| }, |
| { |
| "epoch": 2.38810641627543, |
| "grad_norm": 0.49735017544368204, |
| "learning_rate": 3.3335654048279395e-05, |
| "loss": 0.2378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09845283627510071, |
| "step": 2290, |
| "valid_targets_mean": 4845.5, |
| "valid_targets_min": 2411 |
| }, |
| { |
| "epoch": 2.393322900365154, |
| "grad_norm": 0.5469215023981283, |
| "learning_rate": 3.329685253211528e-05, |
| "loss": 0.2137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11125972121953964, |
| "step": 2295, |
| "valid_targets_mean": 4891.2, |
| "valid_targets_min": 1818 |
| }, |
| { |
| "epoch": 2.3985393844548772, |
| "grad_norm": 0.5596864924707663, |
| "learning_rate": 3.325796111367444e-05, |
| "loss": 0.2152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09879964590072632, |
| "step": 2300, |
| "valid_targets_mean": 4206.2, |
| "valid_targets_min": 1500 |
| }, |
| { |
| "epoch": 2.403755868544601, |
| "grad_norm": 0.653380795920544, |
| "learning_rate": 3.321898005590835e-05, |
| "loss": 0.2241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12416934967041016, |
| "step": 2305, |
| "valid_targets_mean": 6310.6, |
| "valid_targets_min": 1974 |
| }, |
| { |
| "epoch": 2.4089723526343243, |
| "grad_norm": 0.5247996620010477, |
| "learning_rate": 3.317990962237454e-05, |
| "loss": 0.2359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10957548022270203, |
| "step": 2310, |
| "valid_targets_mean": 4463.8, |
| "valid_targets_min": 1607 |
| }, |
| { |
| "epoch": 2.414188836724048, |
| "grad_norm": 0.5196272325888798, |
| "learning_rate": 3.314075007723487e-05, |
| "loss": 0.2107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08740301430225372, |
| "step": 2315, |
| "valid_targets_mean": 4568.4, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 2.4194053208137714, |
| "grad_norm": 0.5008644373074299, |
| "learning_rate": 3.3101501685253657e-05, |
| "loss": 0.2254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11096716672182083, |
| "step": 2320, |
| "valid_targets_mean": 5336.0, |
| "valid_targets_min": 4362 |
| }, |
| { |
| "epoch": 2.424621804903495, |
| "grad_norm": 0.428977239056974, |
| "learning_rate": 3.306216471179594e-05, |
| "loss": 0.2263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08757981657981873, |
| "step": 2325, |
| "valid_targets_mean": 5136.8, |
| "valid_targets_min": 2698 |
| }, |
| { |
| "epoch": 2.4298382889932184, |
| "grad_norm": 0.5202747625384637, |
| "learning_rate": 3.3022739422825686e-05, |
| "loss": 0.2279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13886937499046326, |
| "step": 2330, |
| "valid_targets_mean": 5362.8, |
| "valid_targets_min": 2061 |
| }, |
| { |
| "epoch": 2.435054773082942, |
| "grad_norm": 0.6250715487666877, |
| "learning_rate": 3.2983226084903944e-05, |
| "loss": 0.2283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1500546783208847, |
| "step": 2335, |
| "valid_targets_mean": 4644.6, |
| "valid_targets_min": 2649 |
| }, |
| { |
| "epoch": 2.4402712571726655, |
| "grad_norm": 0.5557503693150626, |
| "learning_rate": 3.294362496518711e-05, |
| "loss": 0.2433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09636768698692322, |
| "step": 2340, |
| "valid_targets_mean": 3254.9, |
| "valid_targets_min": 2193 |
| }, |
| { |
| "epoch": 2.445487741262389, |
| "grad_norm": 0.5881862964624829, |
| "learning_rate": 3.290393633142507e-05, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11908422410488129, |
| "step": 2345, |
| "valid_targets_mean": 3358.6, |
| "valid_targets_min": 1389 |
| }, |
| { |
| "epoch": 2.4507042253521125, |
| "grad_norm": 0.6091244420286501, |
| "learning_rate": 3.286416045195943e-05, |
| "loss": 0.2246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11243793368339539, |
| "step": 2350, |
| "valid_targets_mean": 4268.9, |
| "valid_targets_min": 1955 |
| }, |
| { |
| "epoch": 2.4559207094418363, |
| "grad_norm": 0.48418326756678837, |
| "learning_rate": 3.282429759572164e-05, |
| "loss": 0.2264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10682648420333862, |
| "step": 2355, |
| "valid_targets_mean": 4991.8, |
| "valid_targets_min": 2411 |
| }, |
| { |
| "epoch": 2.4611371935315596, |
| "grad_norm": 0.6154620221091804, |
| "learning_rate": 3.2784348032231245e-05, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14139145612716675, |
| "step": 2360, |
| "valid_targets_mean": 4965.9, |
| "valid_targets_min": 2315 |
| }, |
| { |
| "epoch": 2.4663536776212833, |
| "grad_norm": 0.5385970318526734, |
| "learning_rate": 3.274431203159402e-05, |
| "loss": 0.2352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14069698750972748, |
| "step": 2365, |
| "valid_targets_mean": 4361.8, |
| "valid_targets_min": 1566 |
| }, |
| { |
| "epoch": 2.4715701617110066, |
| "grad_norm": 0.5238156534717102, |
| "learning_rate": 3.270418986450017e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14405012130737305, |
| "step": 2370, |
| "valid_targets_mean": 4839.0, |
| "valid_targets_min": 2308 |
| }, |
| { |
| "epoch": 2.4767866458007304, |
| "grad_norm": 0.5200091388870949, |
| "learning_rate": 3.266398180222247e-05, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11240924149751663, |
| "step": 2375, |
| "valid_targets_mean": 5034.5, |
| "valid_targets_min": 2717 |
| }, |
| { |
| "epoch": 2.4820031298904537, |
| "grad_norm": 0.4730142225715713, |
| "learning_rate": 3.262368811661446e-05, |
| "loss": 0.2166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10924851894378662, |
| "step": 2380, |
| "valid_targets_mean": 5697.5, |
| "valid_targets_min": 3468 |
| }, |
| { |
| "epoch": 2.4872196139801774, |
| "grad_norm": 0.46335257394324575, |
| "learning_rate": 3.2583309080108576e-05, |
| "loss": 0.2277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1245822086930275, |
| "step": 2385, |
| "valid_targets_mean": 6104.1, |
| "valid_targets_min": 2641 |
| }, |
| { |
| "epoch": 2.4924360980699007, |
| "grad_norm": 0.6316903304176071, |
| "learning_rate": 3.254284496571434e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12317271530628204, |
| "step": 2390, |
| "valid_targets_mean": 3770.5, |
| "valid_targets_min": 1728 |
| }, |
| { |
| "epoch": 2.4976525821596245, |
| "grad_norm": 0.5103735358120499, |
| "learning_rate": 3.25022960470165e-05, |
| "loss": 0.2253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11588916182518005, |
| "step": 2395, |
| "valid_targets_mean": 4118.6, |
| "valid_targets_min": 1346 |
| }, |
| { |
| "epoch": 2.502869066249348, |
| "grad_norm": 0.4871119144422768, |
| "learning_rate": 3.246166259817318e-05, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13652253150939941, |
| "step": 2400, |
| "valid_targets_mean": 5047.4, |
| "valid_targets_min": 1612 |
| }, |
| { |
| "epoch": 2.5080855503390715, |
| "grad_norm": 0.4861440062729529, |
| "learning_rate": 3.242094489391402e-05, |
| "loss": 0.2357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10882267355918884, |
| "step": 2405, |
| "valid_targets_mean": 5876.6, |
| "valid_targets_min": 3946 |
| }, |
| { |
| "epoch": 2.513302034428795, |
| "grad_norm": 0.46289868704399717, |
| "learning_rate": 3.238014320953832e-05, |
| "loss": 0.2203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1044938936829567, |
| "step": 2410, |
| "valid_targets_mean": 4208.9, |
| "valid_targets_min": 1687 |
| }, |
| { |
| "epoch": 2.5185185185185186, |
| "grad_norm": 0.5602170615460815, |
| "learning_rate": 3.233925782091322e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12824594974517822, |
| "step": 2415, |
| "valid_targets_mean": 5145.0, |
| "valid_targets_min": 2146 |
| }, |
| { |
| "epoch": 2.523735002608242, |
| "grad_norm": 0.5057079123729123, |
| "learning_rate": 3.229828900447174e-05, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10087256878614426, |
| "step": 2420, |
| "valid_targets_mean": 3804.2, |
| "valid_targets_min": 1705 |
| }, |
| { |
| "epoch": 2.5289514866979657, |
| "grad_norm": 0.4891221057987663, |
| "learning_rate": 3.2257237037211026e-05, |
| "loss": 0.2413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10101897269487381, |
| "step": 2425, |
| "valid_targets_mean": 4812.5, |
| "valid_targets_min": 1906 |
| }, |
| { |
| "epoch": 2.534167970787689, |
| "grad_norm": 0.4800832908969296, |
| "learning_rate": 3.221610219669038e-05, |
| "loss": 0.2407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09936263412237167, |
| "step": 2430, |
| "valid_targets_mean": 5023.1, |
| "valid_targets_min": 2494 |
| }, |
| { |
| "epoch": 2.5393844548774127, |
| "grad_norm": 0.5214332602895505, |
| "learning_rate": 3.2174884761029456e-05, |
| "loss": 0.22, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11070659756660461, |
| "step": 2435, |
| "valid_targets_mean": 3862.4, |
| "valid_targets_min": 1360 |
| }, |
| { |
| "epoch": 2.544600938967136, |
| "grad_norm": 0.4380816528769799, |
| "learning_rate": 3.2133585008906307e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1011088639497757, |
| "step": 2440, |
| "valid_targets_mean": 5430.8, |
| "valid_targets_min": 1446 |
| }, |
| { |
| "epoch": 2.5498174230568598, |
| "grad_norm": 0.46027248912239865, |
| "learning_rate": 3.209220321955559e-05, |
| "loss": 0.2189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10920900106430054, |
| "step": 2445, |
| "valid_targets_mean": 5854.5, |
| "valid_targets_min": 2768 |
| }, |
| { |
| "epoch": 2.555033907146583, |
| "grad_norm": 0.48906639298459353, |
| "learning_rate": 3.205073967276659e-05, |
| "loss": 0.216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10530338436365128, |
| "step": 2450, |
| "valid_targets_mean": 4083.2, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 2.560250391236307, |
| "grad_norm": 0.5144930723935189, |
| "learning_rate": 3.20091946488814e-05, |
| "loss": 0.2208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0825672447681427, |
| "step": 2455, |
| "valid_targets_mean": 3818.4, |
| "valid_targets_min": 1026 |
| }, |
| { |
| "epoch": 2.56546687532603, |
| "grad_norm": 0.4803660050648124, |
| "learning_rate": 3.196756842879297e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10335831344127655, |
| "step": 2460, |
| "valid_targets_mean": 5047.2, |
| "valid_targets_min": 2337 |
| }, |
| { |
| "epoch": 2.570683359415754, |
| "grad_norm": 0.5012910750754004, |
| "learning_rate": 3.1925861293943234e-05, |
| "loss": 0.2352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11575934290885925, |
| "step": 2465, |
| "valid_targets_mean": 5853.1, |
| "valid_targets_min": 2189 |
| }, |
| { |
| "epoch": 2.575899843505477, |
| "grad_norm": 0.4688930376633368, |
| "learning_rate": 3.1884073526321216e-05, |
| "loss": 0.2296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14094386994838715, |
| "step": 2470, |
| "valid_targets_mean": 5949.8, |
| "valid_targets_min": 3518 |
| }, |
| { |
| "epoch": 2.581116327595201, |
| "grad_norm": 0.5088090240154572, |
| "learning_rate": 3.18422054084611e-05, |
| "loss": 0.2066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09743362665176392, |
| "step": 2475, |
| "valid_targets_mean": 4409.0, |
| "valid_targets_min": 1524 |
| }, |
| { |
| "epoch": 2.5863328116849242, |
| "grad_norm": 0.4703303047324992, |
| "learning_rate": 3.180025722344034e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10678398609161377, |
| "step": 2480, |
| "valid_targets_mean": 4728.4, |
| "valid_targets_min": 1598 |
| }, |
| { |
| "epoch": 2.591549295774648, |
| "grad_norm": 0.47593412985692757, |
| "learning_rate": 3.175822925487774e-05, |
| "loss": 0.2173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10073505342006683, |
| "step": 2485, |
| "valid_targets_mean": 4718.8, |
| "valid_targets_min": 3346 |
| }, |
| { |
| "epoch": 2.5967657798643713, |
| "grad_norm": 0.4920218712524974, |
| "learning_rate": 3.171612178693151e-05, |
| "loss": 0.2271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11507917940616608, |
| "step": 2490, |
| "valid_targets_mean": 4916.9, |
| "valid_targets_min": 1860 |
| }, |
| { |
| "epoch": 2.601982263954095, |
| "grad_norm": 0.4704795417511032, |
| "learning_rate": 3.1673935104297414e-05, |
| "loss": 0.2101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1106872484087944, |
| "step": 2495, |
| "valid_targets_mean": 4785.4, |
| "valid_targets_min": 2302 |
| }, |
| { |
| "epoch": 2.6071987480438183, |
| "grad_norm": 0.5091338737668465, |
| "learning_rate": 3.163166949220675e-05, |
| "loss": 0.2233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10870622843503952, |
| "step": 2500, |
| "valid_targets_mean": 4724.8, |
| "valid_targets_min": 2701 |
| }, |
| { |
| "epoch": 2.612415232133542, |
| "grad_norm": 0.5760031101096204, |
| "learning_rate": 3.158932523642451e-05, |
| "loss": 0.2256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11305932700634003, |
| "step": 2505, |
| "valid_targets_mean": 3259.8, |
| "valid_targets_min": 1670 |
| }, |
| { |
| "epoch": 2.6176317162232654, |
| "grad_norm": 0.5586883651231902, |
| "learning_rate": 3.1546902623247385e-05, |
| "loss": 0.2234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11771593242883682, |
| "step": 2510, |
| "valid_targets_mean": 4426.1, |
| "valid_targets_min": 1614 |
| }, |
| { |
| "epoch": 2.622848200312989, |
| "grad_norm": 0.44460060389704, |
| "learning_rate": 3.1504401939501866e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09268401563167572, |
| "step": 2515, |
| "valid_targets_mean": 5090.4, |
| "valid_targets_min": 1438 |
| }, |
| { |
| "epoch": 2.6280646844027125, |
| "grad_norm": 0.5286504269687488, |
| "learning_rate": 3.146182347254228e-05, |
| "loss": 0.2253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09826931357383728, |
| "step": 2520, |
| "valid_targets_mean": 3926.9, |
| "valid_targets_min": 1849 |
| }, |
| { |
| "epoch": 2.633281168492436, |
| "grad_norm": 0.5472063222952046, |
| "learning_rate": 3.141916751024889e-05, |
| "loss": 0.2312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11021539568901062, |
| "step": 2525, |
| "valid_targets_mean": 3473.4, |
| "valid_targets_min": 1142 |
| }, |
| { |
| "epoch": 2.6384976525821595, |
| "grad_norm": 0.5300711810657301, |
| "learning_rate": 3.137643434102588e-05, |
| "loss": 0.2244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10026170313358307, |
| "step": 2530, |
| "valid_targets_mean": 4814.9, |
| "valid_targets_min": 2288 |
| }, |
| { |
| "epoch": 2.6437141366718833, |
| "grad_norm": 1.174712487837169, |
| "learning_rate": 3.1333624253799464e-05, |
| "loss": 0.2283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12371222674846649, |
| "step": 2535, |
| "valid_targets_mean": 4467.4, |
| "valid_targets_min": 2724 |
| }, |
| { |
| "epoch": 2.6489306207616066, |
| "grad_norm": 0.4546709608823972, |
| "learning_rate": 3.1290737538015904e-05, |
| "loss": 0.221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10781063139438629, |
| "step": 2540, |
| "valid_targets_mean": 5799.5, |
| "valid_targets_min": 2347 |
| }, |
| { |
| "epoch": 2.6541471048513303, |
| "grad_norm": 0.5291702687360377, |
| "learning_rate": 3.1247774483639575e-05, |
| "loss": 0.2249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1144791916012764, |
| "step": 2545, |
| "valid_targets_mean": 5432.8, |
| "valid_targets_min": 2682 |
| }, |
| { |
| "epoch": 2.6593635889410536, |
| "grad_norm": 0.5852435107991737, |
| "learning_rate": 3.120473538115096e-05, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1168883740901947, |
| "step": 2550, |
| "valid_targets_mean": 3021.1, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 2.6645800730307774, |
| "grad_norm": 0.47127956576865276, |
| "learning_rate": 3.116162052154476e-05, |
| "loss": 0.2331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11396898329257965, |
| "step": 2555, |
| "valid_targets_mean": 6150.8, |
| "valid_targets_min": 2352 |
| }, |
| { |
| "epoch": 2.6697965571205007, |
| "grad_norm": 0.5677104907261632, |
| "learning_rate": 3.111843019632784e-05, |
| "loss": 0.219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1140974909067154, |
| "step": 2560, |
| "valid_targets_mean": 4371.8, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 2.6750130412102244, |
| "grad_norm": 0.5135047232303005, |
| "learning_rate": 3.1075164697517326e-05, |
| "loss": 0.2321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14363232254981995, |
| "step": 2565, |
| "valid_targets_mean": 4825.5, |
| "valid_targets_min": 1654 |
| }, |
| { |
| "epoch": 2.6802295252999477, |
| "grad_norm": 0.4614751924595173, |
| "learning_rate": 3.10318243176386e-05, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12825116515159607, |
| "step": 2570, |
| "valid_targets_mean": 6663.1, |
| "valid_targets_min": 4549 |
| }, |
| { |
| "epoch": 2.6854460093896715, |
| "grad_norm": 0.4447211391455603, |
| "learning_rate": 3.0988409349723317e-05, |
| "loss": 0.2276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09917019307613373, |
| "step": 2575, |
| "valid_targets_mean": 4940.4, |
| "valid_targets_min": 1874 |
| }, |
| { |
| "epoch": 2.690662493479395, |
| "grad_norm": 0.5923061285468841, |
| "learning_rate": 3.094492008730746e-05, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12513403594493866, |
| "step": 2580, |
| "valid_targets_mean": 4263.1, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 2.6958789775691185, |
| "grad_norm": 0.47124178649015935, |
| "learning_rate": 3.09013568244293e-05, |
| "loss": 0.2184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13531747460365295, |
| "step": 2585, |
| "valid_targets_mean": 5632.5, |
| "valid_targets_min": 3831 |
| }, |
| { |
| "epoch": 2.701095461658842, |
| "grad_norm": 0.5403423623876756, |
| "learning_rate": 3.085771985562745e-05, |
| "loss": 0.2295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12237776815891266, |
| "step": 2590, |
| "valid_targets_mean": 3775.8, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 2.7063119457485656, |
| "grad_norm": 0.5155907110817727, |
| "learning_rate": 3.081400947593887e-05, |
| "loss": 0.2102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13526003062725067, |
| "step": 2595, |
| "valid_targets_mean": 5696.9, |
| "valid_targets_min": 2821 |
| }, |
| { |
| "epoch": 2.711528429838289, |
| "grad_norm": 0.44091513916610836, |
| "learning_rate": 3.077022598089685e-05, |
| "loss": 0.2305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11125567555427551, |
| "step": 2600, |
| "valid_targets_mean": 5083.6, |
| "valid_targets_min": 2907 |
| }, |
| { |
| "epoch": 2.7167449139280127, |
| "grad_norm": 0.4431674084041847, |
| "learning_rate": 3.072636966652904e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09183455258607864, |
| "step": 2605, |
| "valid_targets_mean": 5000.2, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 2.721961398017736, |
| "grad_norm": 0.5143712648136293, |
| "learning_rate": 3.0682440829355416e-05, |
| "loss": 0.1993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.095421701669693, |
| "step": 2610, |
| "valid_targets_mean": 5004.0, |
| "valid_targets_min": 1716 |
| }, |
| { |
| "epoch": 2.7271778821074597, |
| "grad_norm": 0.651128340932718, |
| "learning_rate": 3.06384397663863e-05, |
| "loss": 0.2073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12816166877746582, |
| "step": 2615, |
| "valid_targets_mean": 4944.4, |
| "valid_targets_min": 2675 |
| }, |
| { |
| "epoch": 2.732394366197183, |
| "grad_norm": 0.5121680237262853, |
| "learning_rate": 3.059436677512035e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09256739914417267, |
| "step": 2620, |
| "valid_targets_mean": 5635.0, |
| "valid_targets_min": 1654 |
| }, |
| { |
| "epoch": 2.7376108502869068, |
| "grad_norm": 0.5253930631743816, |
| "learning_rate": 3.055022215354254e-05, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0999249666929245, |
| "step": 2625, |
| "valid_targets_mean": 4448.1, |
| "valid_targets_min": 1759 |
| }, |
| { |
| "epoch": 2.74282733437663, |
| "grad_norm": 0.4665503122808902, |
| "learning_rate": 3.0506006200122154e-05, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0951077789068222, |
| "step": 2630, |
| "valid_targets_mean": 6096.5, |
| "valid_targets_min": 2287 |
| }, |
| { |
| "epoch": 2.748043818466354, |
| "grad_norm": 0.5540067912846297, |
| "learning_rate": 3.0461719213810756e-05, |
| "loss": 0.1946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10958708822727203, |
| "step": 2635, |
| "valid_targets_mean": 4392.0, |
| "valid_targets_min": 1177 |
| }, |
| { |
| "epoch": 2.753260302556077, |
| "grad_norm": 0.5403656845643583, |
| "learning_rate": 3.0417361494040167e-05, |
| "loss": 0.2117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09634451568126678, |
| "step": 2640, |
| "valid_targets_mean": 4302.9, |
| "valid_targets_min": 2000 |
| }, |
| { |
| "epoch": 2.758476786645801, |
| "grad_norm": 0.48890425105030777, |
| "learning_rate": 3.037293334072047e-05, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09244073927402496, |
| "step": 2645, |
| "valid_targets_mean": 4441.4, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 2.763693270735524, |
| "grad_norm": 0.8071588301611544, |
| "learning_rate": 3.0328435054237944e-05, |
| "loss": 0.2111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12001083046197891, |
| "step": 2650, |
| "valid_targets_mean": 5670.4, |
| "valid_targets_min": 3512 |
| }, |
| { |
| "epoch": 2.768909754825248, |
| "grad_norm": 0.5166100506124706, |
| "learning_rate": 3.0283866935453057e-05, |
| "loss": 0.2141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09812520444393158, |
| "step": 2655, |
| "valid_targets_mean": 4672.1, |
| "valid_targets_min": 2182 |
| }, |
| { |
| "epoch": 2.7741262389149712, |
| "grad_norm": 0.5431485751253808, |
| "learning_rate": 3.023922928569843e-05, |
| "loss": 0.2046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08231854438781738, |
| "step": 2660, |
| "valid_targets_mean": 4050.5, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 2.779342723004695, |
| "grad_norm": 0.548024674822343, |
| "learning_rate": 3.019452240677678e-05, |
| "loss": 0.2107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10818839073181152, |
| "step": 2665, |
| "valid_targets_mean": 5073.2, |
| "valid_targets_min": 2784 |
| }, |
| { |
| "epoch": 2.7845592070944183, |
| "grad_norm": 0.45219125259119536, |
| "learning_rate": 3.0149746600958908e-05, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09542427957057953, |
| "step": 2670, |
| "valid_targets_mean": 5374.5, |
| "valid_targets_min": 2643 |
| }, |
| { |
| "epoch": 2.789775691184142, |
| "grad_norm": 0.5237070659230012, |
| "learning_rate": 3.0104902170981633e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12666651606559753, |
| "step": 2675, |
| "valid_targets_mean": 5108.5, |
| "valid_targets_min": 2881 |
| }, |
| { |
| "epoch": 2.7949921752738653, |
| "grad_norm": 0.5623383881117362, |
| "learning_rate": 3.005998942004576e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11492735147476196, |
| "step": 2680, |
| "valid_targets_mean": 4912.5, |
| "valid_targets_min": 1576 |
| }, |
| { |
| "epoch": 2.800208659363589, |
| "grad_norm": 0.4967970451357785, |
| "learning_rate": 3.0015008651814023e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10141061246395111, |
| "step": 2685, |
| "valid_targets_mean": 5782.2, |
| "valid_targets_min": 4685 |
| }, |
| { |
| "epoch": 2.8054251434533124, |
| "grad_norm": 0.5569297331417894, |
| "learning_rate": 2.9969960170409033e-05, |
| "loss": 0.2061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09066125750541687, |
| "step": 2690, |
| "valid_targets_mean": 3822.2, |
| "valid_targets_min": 1107 |
| }, |
| { |
| "epoch": 2.810641627543036, |
| "grad_norm": 0.506000102515865, |
| "learning_rate": 2.9924844280411208e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08468958735466003, |
| "step": 2695, |
| "valid_targets_mean": 4311.0, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 2.8158581116327595, |
| "grad_norm": 0.5017771195620422, |
| "learning_rate": 2.987966128685674e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10154730081558228, |
| "step": 2700, |
| "valid_targets_mean": 5108.1, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 2.821074595722483, |
| "grad_norm": 0.5476798734262958, |
| "learning_rate": 2.9834411495235526e-05, |
| "loss": 0.2133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12037491798400879, |
| "step": 2705, |
| "valid_targets_mean": 5233.4, |
| "valid_targets_min": 2800 |
| }, |
| { |
| "epoch": 2.8262910798122065, |
| "grad_norm": 0.44932035235145384, |
| "learning_rate": 2.9789095211489082e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09355040639638901, |
| "step": 2710, |
| "valid_targets_mean": 5838.6, |
| "valid_targets_min": 3760 |
| }, |
| { |
| "epoch": 2.8315075639019303, |
| "grad_norm": 0.47333389883380045, |
| "learning_rate": 2.9743712742008486e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10253272950649261, |
| "step": 2715, |
| "valid_targets_mean": 4421.9, |
| "valid_targets_min": 2890 |
| }, |
| { |
| "epoch": 2.8367240479916536, |
| "grad_norm": 0.5375950820349465, |
| "learning_rate": 2.9698264393632326e-05, |
| "loss": 0.2026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1102854460477829, |
| "step": 2720, |
| "valid_targets_mean": 4968.8, |
| "valid_targets_min": 2680 |
| }, |
| { |
| "epoch": 2.8419405320813773, |
| "grad_norm": 0.5232020100718042, |
| "learning_rate": 2.9652750473644597e-05, |
| "loss": 0.2235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11462263762950897, |
| "step": 2725, |
| "valid_targets_mean": 4508.1, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 2.8471570161711006, |
| "grad_norm": 0.5091367498962615, |
| "learning_rate": 2.9607171289772635e-05, |
| "loss": 0.2011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.079213947057724, |
| "step": 2730, |
| "valid_targets_mean": 3589.6, |
| "valid_targets_min": 1720 |
| }, |
| { |
| "epoch": 2.8523735002608244, |
| "grad_norm": 0.5643515615874065, |
| "learning_rate": 2.9561527150185035e-05, |
| "loss": 0.2097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1061231940984726, |
| "step": 2735, |
| "valid_targets_mean": 3623.8, |
| "valid_targets_min": 2571 |
| }, |
| { |
| "epoch": 2.8575899843505477, |
| "grad_norm": 0.5613579427983747, |
| "learning_rate": 2.9515818363489582e-05, |
| "loss": 0.1943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11006490886211395, |
| "step": 2740, |
| "valid_targets_mean": 3667.1, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 2.8628064684402714, |
| "grad_norm": 0.5135290693677292, |
| "learning_rate": 2.9470045238731127e-05, |
| "loss": 0.2032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08775778114795685, |
| "step": 2745, |
| "valid_targets_mean": 3874.0, |
| "valid_targets_min": 1796 |
| }, |
| { |
| "epoch": 2.8680229525299947, |
| "grad_norm": 0.5463293762668832, |
| "learning_rate": 2.9424208085389544e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09706106781959534, |
| "step": 2750, |
| "valid_targets_mean": 3911.5, |
| "valid_targets_min": 1673 |
| }, |
| { |
| "epoch": 2.873239436619718, |
| "grad_norm": 0.5183834834422304, |
| "learning_rate": 2.9378307213377603e-05, |
| "loss": 0.2115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08352254331111908, |
| "step": 2755, |
| "valid_targets_mean": 4454.4, |
| "valid_targets_min": 2804 |
| }, |
| { |
| "epoch": 2.878455920709442, |
| "grad_norm": 0.5770424551148836, |
| "learning_rate": 2.93323429330389e-05, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09712273627519608, |
| "step": 2760, |
| "valid_targets_mean": 3493.5, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 2.8836724047991655, |
| "grad_norm": 0.570092751100507, |
| "learning_rate": 2.9286315555145718e-05, |
| "loss": 0.1896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09480474889278412, |
| "step": 2765, |
| "valid_targets_mean": 3264.5, |
| "valid_targets_min": 1352 |
| }, |
| { |
| "epoch": 2.888888888888889, |
| "grad_norm": 0.5805090100880006, |
| "learning_rate": 2.924022539089698e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10904529690742493, |
| "step": 2770, |
| "valid_targets_mean": 3947.9, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 2.894105372978612, |
| "grad_norm": 0.5143467986188817, |
| "learning_rate": 2.9194072751916106e-05, |
| "loss": 0.2109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10561254620552063, |
| "step": 2775, |
| "valid_targets_mean": 4174.1, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 2.899321857068336, |
| "grad_norm": 0.5183144103803144, |
| "learning_rate": 2.914785795024893e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11688891053199768, |
| "step": 2780, |
| "valid_targets_mean": 4901.1, |
| "valid_targets_min": 1730 |
| }, |
| { |
| "epoch": 2.9045383411580596, |
| "grad_norm": 0.46116198229098343, |
| "learning_rate": 2.9101581298361563e-05, |
| "loss": 0.2042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09363597631454468, |
| "step": 2785, |
| "valid_targets_mean": 5823.0, |
| "valid_targets_min": 2244 |
| }, |
| { |
| "epoch": 2.909754825247783, |
| "grad_norm": 0.48816280745048407, |
| "learning_rate": 2.90552431091383e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10668014734983444, |
| "step": 2790, |
| "valid_targets_mean": 5915.4, |
| "valid_targets_min": 3217 |
| }, |
| { |
| "epoch": 2.9149713093375063, |
| "grad_norm": 0.5517023076313732, |
| "learning_rate": 2.9008843695879508e-05, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08863114565610886, |
| "step": 2795, |
| "valid_targets_mean": 3674.1, |
| "valid_targets_min": 2100 |
| }, |
| { |
| "epoch": 2.92018779342723, |
| "grad_norm": 0.5499560039327777, |
| "learning_rate": 2.896238337229949e-05, |
| "loss": 0.2086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09519973397254944, |
| "step": 2800, |
| "valid_targets_mean": 3128.8, |
| "valid_targets_min": 1972 |
| }, |
| { |
| "epoch": 2.9254042775169538, |
| "grad_norm": 0.5069525819334271, |
| "learning_rate": 2.891586245252439e-05, |
| "loss": 0.1961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09028097987174988, |
| "step": 2805, |
| "valid_targets_mean": 3955.2, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 2.930620761606677, |
| "grad_norm": 0.5284167009175657, |
| "learning_rate": 2.886928125109003e-05, |
| "loss": 0.204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09937043488025665, |
| "step": 2810, |
| "valid_targets_mean": 3209.9, |
| "valid_targets_min": 1695 |
| }, |
| { |
| "epoch": 2.9358372456964004, |
| "grad_norm": 0.514428610600362, |
| "learning_rate": 2.882264008293982e-05, |
| "loss": 0.212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09932732582092285, |
| "step": 2815, |
| "valid_targets_mean": 4201.6, |
| "valid_targets_min": 3051 |
| }, |
| { |
| "epoch": 2.941053729786124, |
| "grad_norm": 0.47964295600940404, |
| "learning_rate": 2.8775939263422615e-05, |
| "loss": 0.21, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09465121477842331, |
| "step": 2820, |
| "valid_targets_mean": 4782.0, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 2.946270213875848, |
| "grad_norm": 0.486121904797812, |
| "learning_rate": 2.872917910829059e-05, |
| "loss": 0.2063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08913619071245193, |
| "step": 2825, |
| "valid_targets_mean": 5105.4, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 2.951486697965571, |
| "grad_norm": 0.5131169786296125, |
| "learning_rate": 2.8682359933697075e-05, |
| "loss": 0.2018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11593284457921982, |
| "step": 2830, |
| "valid_targets_mean": 6001.1, |
| "valid_targets_min": 4034 |
| }, |
| { |
| "epoch": 2.9567031820552945, |
| "grad_norm": 0.459211391733568, |
| "learning_rate": 2.863548205619447e-05, |
| "loss": 0.1927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09318007528781891, |
| "step": 2835, |
| "valid_targets_mean": 6029.0, |
| "valid_targets_min": 3253 |
| }, |
| { |
| "epoch": 2.9619196661450182, |
| "grad_norm": 0.4458782331734817, |
| "learning_rate": 2.8588545792732056e-05, |
| "loss": 0.2082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09560025483369827, |
| "step": 2840, |
| "valid_targets_mean": 6000.8, |
| "valid_targets_min": 2719 |
| }, |
| { |
| "epoch": 2.967136150234742, |
| "grad_norm": 0.5232106421625217, |
| "learning_rate": 2.8541551460653875e-05, |
| "loss": 0.2126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10834867507219315, |
| "step": 2845, |
| "valid_targets_mean": 4287.6, |
| "valid_targets_min": 1332 |
| }, |
| { |
| "epoch": 2.9723526343244653, |
| "grad_norm": 0.4928528121504029, |
| "learning_rate": 2.8494499377696586e-05, |
| "loss": 0.2012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10745708644390106, |
| "step": 2850, |
| "valid_targets_mean": 4780.6, |
| "valid_targets_min": 2086 |
| }, |
| { |
| "epoch": 2.9775691184141886, |
| "grad_norm": 0.5418304544270003, |
| "learning_rate": 2.8447389861987295e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11443772912025452, |
| "step": 2855, |
| "valid_targets_mean": 5209.1, |
| "valid_targets_min": 2074 |
| }, |
| { |
| "epoch": 2.9827856025039123, |
| "grad_norm": 0.5349528695072473, |
| "learning_rate": 2.8400223232041456e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0880689024925232, |
| "step": 2860, |
| "valid_targets_mean": 3408.2, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 2.988002086593636, |
| "grad_norm": 0.521180920734931, |
| "learning_rate": 2.835299980676064e-05, |
| "loss": 0.2108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09700939059257507, |
| "step": 2865, |
| "valid_targets_mean": 4068.4, |
| "valid_targets_min": 1601 |
| }, |
| { |
| "epoch": 2.9932185706833594, |
| "grad_norm": 0.5841605140570019, |
| "learning_rate": 2.8305719905430442e-05, |
| "loss": 0.203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09895017743110657, |
| "step": 2870, |
| "valid_targets_mean": 3847.4, |
| "valid_targets_min": 1880 |
| }, |
| { |
| "epoch": 2.9984350547730827, |
| "grad_norm": 0.5340999977183173, |
| "learning_rate": 2.8258383847718306e-05, |
| "loss": 0.2011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0996866226196289, |
| "step": 2875, |
| "valid_targets_mean": 4587.4, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 3.0041731872717787, |
| "grad_norm": 0.5432573380933222, |
| "learning_rate": 2.821099195367135e-05, |
| "loss": 0.2417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10880480706691742, |
| "step": 2880, |
| "valid_targets_mean": 4063.4, |
| "valid_targets_min": 1935 |
| }, |
| { |
| "epoch": 3.0093896713615025, |
| "grad_norm": 0.5098029143065635, |
| "learning_rate": 2.8163544543714216e-05, |
| "loss": 0.2104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1081823781132698, |
| "step": 2885, |
| "valid_targets_mean": 5142.0, |
| "valid_targets_min": 3182 |
| }, |
| { |
| "epoch": 3.014606155451226, |
| "grad_norm": 0.5895808146199872, |
| "learning_rate": 2.811604193864689e-05, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10698902606964111, |
| "step": 2890, |
| "valid_targets_mean": 4254.1, |
| "valid_targets_min": 2355 |
| }, |
| { |
| "epoch": 3.0198226395409495, |
| "grad_norm": 0.5650383200847922, |
| "learning_rate": 2.806848445964255e-05, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11510180681943893, |
| "step": 2895, |
| "valid_targets_mean": 5211.9, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 3.025039123630673, |
| "grad_norm": 0.5046127729418071, |
| "learning_rate": 2.8020872428245382e-05, |
| "loss": 0.2083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10055027157068253, |
| "step": 2900, |
| "valid_targets_mean": 4550.6, |
| "valid_targets_min": 2221 |
| }, |
| { |
| "epoch": 3.0302556077203966, |
| "grad_norm": 0.5143888700198478, |
| "learning_rate": 2.797320616636841e-05, |
| "loss": 0.1997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08974705636501312, |
| "step": 2905, |
| "valid_targets_mean": 4972.5, |
| "valid_targets_min": 1387 |
| }, |
| { |
| "epoch": 3.03547209181012, |
| "grad_norm": 0.5639627901417625, |
| "learning_rate": 2.792548599629132e-05, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1048688143491745, |
| "step": 2910, |
| "valid_targets_mean": 3778.1, |
| "valid_targets_min": 1697 |
| }, |
| { |
| "epoch": 3.0406885758998436, |
| "grad_norm": 0.4911563103950299, |
| "learning_rate": 2.787771224065829e-05, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10737472772598267, |
| "step": 2915, |
| "valid_targets_mean": 5409.1, |
| "valid_targets_min": 1856 |
| }, |
| { |
| "epoch": 3.045905059989567, |
| "grad_norm": 0.5109420202460491, |
| "learning_rate": 2.782988522247578e-05, |
| "loss": 0.1948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07555101811885834, |
| "step": 2920, |
| "valid_targets_mean": 3609.0, |
| "valid_targets_min": 1389 |
| }, |
| { |
| "epoch": 3.0511215440792907, |
| "grad_norm": 0.5698280895875829, |
| "learning_rate": 2.7782005265110375e-05, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1072496846318245, |
| "step": 2925, |
| "valid_targets_mean": 4099.1, |
| "valid_targets_min": 1709 |
| }, |
| { |
| "epoch": 3.056338028169014, |
| "grad_norm": 0.5686178883209573, |
| "learning_rate": 2.7734072692286604e-05, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.098935566842556, |
| "step": 2930, |
| "valid_targets_mean": 4887.2, |
| "valid_targets_min": 2229 |
| }, |
| { |
| "epoch": 3.0615545122587378, |
| "grad_norm": 0.46177160728507305, |
| "learning_rate": 2.768608782808472e-05, |
| "loss": 0.211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11339068412780762, |
| "step": 2935, |
| "valid_targets_mean": 4938.5, |
| "valid_targets_min": 2697 |
| }, |
| { |
| "epoch": 3.066770996348461, |
| "grad_norm": 0.6115771579825644, |
| "learning_rate": 2.763805099693854e-05, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11126293987035751, |
| "step": 2940, |
| "valid_targets_mean": 5077.1, |
| "valid_targets_min": 2709 |
| }, |
| { |
| "epoch": 3.071987480438185, |
| "grad_norm": 0.49981838433460235, |
| "learning_rate": 2.7589962523633218e-05, |
| "loss": 0.1961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10545983910560608, |
| "step": 2945, |
| "valid_targets_mean": 5120.2, |
| "valid_targets_min": 4024 |
| }, |
| { |
| "epoch": 3.077203964527908, |
| "grad_norm": 0.5155139995422544, |
| "learning_rate": 2.75418227333031e-05, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09514853358268738, |
| "step": 2950, |
| "valid_targets_mean": 4197.0, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 3.082420448617632, |
| "grad_norm": 0.5631463806969298, |
| "learning_rate": 2.749363195142947e-05, |
| "loss": 0.2114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11387265473604202, |
| "step": 2955, |
| "valid_targets_mean": 3833.0, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 3.087636932707355, |
| "grad_norm": 0.4798516487742818, |
| "learning_rate": 2.744539050383838e-05, |
| "loss": 0.209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08828402310609818, |
| "step": 2960, |
| "valid_targets_mean": 5108.2, |
| "valid_targets_min": 3763 |
| }, |
| { |
| "epoch": 3.092853416797079, |
| "grad_norm": 0.49935619585933316, |
| "learning_rate": 2.7397098716698463e-05, |
| "loss": 0.2063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0784873217344284, |
| "step": 2965, |
| "valid_targets_mean": 3645.4, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 3.0980699008868022, |
| "grad_norm": 0.5740236186286182, |
| "learning_rate": 2.7348756916518663e-05, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11879893392324448, |
| "step": 2970, |
| "valid_targets_mean": 4630.5, |
| "valid_targets_min": 2337 |
| }, |
| { |
| "epoch": 3.103286384976526, |
| "grad_norm": 0.49720043396949304, |
| "learning_rate": 2.7300365430146117e-05, |
| "loss": 0.1949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09360023587942123, |
| "step": 2975, |
| "valid_targets_mean": 4715.8, |
| "valid_targets_min": 2100 |
| }, |
| { |
| "epoch": 3.1085028690662493, |
| "grad_norm": 0.5748390414549844, |
| "learning_rate": 2.7251924584763867e-05, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08847415447235107, |
| "step": 2980, |
| "valid_targets_mean": 5378.0, |
| "valid_targets_min": 1436 |
| }, |
| { |
| "epoch": 3.113719353155973, |
| "grad_norm": 0.6128159668745522, |
| "learning_rate": 2.7203434707888684e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10356289148330688, |
| "step": 2985, |
| "valid_targets_mean": 4386.2, |
| "valid_targets_min": 1504 |
| }, |
| { |
| "epoch": 3.1189358372456963, |
| "grad_norm": 0.4623396861624209, |
| "learning_rate": 2.7154896127368872e-05, |
| "loss": 0.1941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08556468784809113, |
| "step": 2990, |
| "valid_targets_mean": 4330.9, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 3.12415232133542, |
| "grad_norm": 0.47632641128775954, |
| "learning_rate": 2.7106309171381995e-05, |
| "loss": 0.2206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09726077318191528, |
| "step": 2995, |
| "valid_targets_mean": 5095.5, |
| "valid_targets_min": 2772 |
| }, |
| { |
| "epoch": 3.1293688054251434, |
| "grad_norm": 0.4358985904565822, |
| "learning_rate": 2.705767416843272e-05, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08343064039945602, |
| "step": 3000, |
| "valid_targets_mean": 5686.4, |
| "valid_targets_min": 2232 |
| }, |
| { |
| "epoch": 3.134585289514867, |
| "grad_norm": 0.4662300187644352, |
| "learning_rate": 2.700899144735055e-05, |
| "loss": 0.186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09762425720691681, |
| "step": 3005, |
| "valid_targets_mean": 7094.2, |
| "valid_targets_min": 4216 |
| }, |
| { |
| "epoch": 3.1398017736045905, |
| "grad_norm": 0.572864701842524, |
| "learning_rate": 2.696026133728763e-05, |
| "loss": 0.2054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11816585063934326, |
| "step": 3010, |
| "valid_targets_mean": 4220.5, |
| "valid_targets_min": 1831 |
| }, |
| { |
| "epoch": 3.145018257694314, |
| "grad_norm": 0.6564931432141663, |
| "learning_rate": 2.69114841677165e-05, |
| "loss": 0.201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14300262928009033, |
| "step": 3015, |
| "valid_targets_mean": 4046.2, |
| "valid_targets_min": 2195 |
| }, |
| { |
| "epoch": 3.1502347417840375, |
| "grad_norm": 0.5445913204399667, |
| "learning_rate": 2.6862660268427885e-05, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08168022334575653, |
| "step": 3020, |
| "valid_targets_mean": 3510.5, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 3.1554512258737613, |
| "grad_norm": 0.43119649018053213, |
| "learning_rate": 2.6813789969528454e-05, |
| "loss": 0.2053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09258949756622314, |
| "step": 3025, |
| "valid_targets_mean": 5464.4, |
| "valid_targets_min": 1446 |
| }, |
| { |
| "epoch": 3.1606677099634846, |
| "grad_norm": 0.4836818452699736, |
| "learning_rate": 2.6764873601438588e-05, |
| "loss": 0.2161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09587261825799942, |
| "step": 3030, |
| "valid_targets_mean": 4636.5, |
| "valid_targets_min": 3153 |
| }, |
| { |
| "epoch": 3.1658841940532083, |
| "grad_norm": 0.5586001035995521, |
| "learning_rate": 2.6715911494890163e-05, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10193102061748505, |
| "step": 3035, |
| "valid_targets_mean": 4426.2, |
| "valid_targets_min": 1840 |
| }, |
| { |
| "epoch": 3.1711006781429316, |
| "grad_norm": 0.5283576654998282, |
| "learning_rate": 2.6666903980924284e-05, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0847351923584938, |
| "step": 3040, |
| "valid_targets_mean": 3890.5, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 3.1763171622326554, |
| "grad_norm": 0.5676964469700314, |
| "learning_rate": 2.6617851390889074e-05, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09379324316978455, |
| "step": 3045, |
| "valid_targets_mean": 4143.2, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 3.1815336463223787, |
| "grad_norm": 0.4716476728022729, |
| "learning_rate": 2.6568754056437412e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09522826969623566, |
| "step": 3050, |
| "valid_targets_mean": 5153.1, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 3.1867501304121024, |
| "grad_norm": 0.5416779765838748, |
| "learning_rate": 2.6519612309524727e-05, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1138598769903183, |
| "step": 3055, |
| "valid_targets_mean": 5099.8, |
| "valid_targets_min": 1988 |
| }, |
| { |
| "epoch": 3.1919666145018257, |
| "grad_norm": 0.46628157941186205, |
| "learning_rate": 2.6470426482406688e-05, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09998682886362076, |
| "step": 3060, |
| "valid_targets_mean": 5174.2, |
| "valid_targets_min": 2479 |
| }, |
| { |
| "epoch": 3.1971830985915495, |
| "grad_norm": 0.47981739400067036, |
| "learning_rate": 2.6421196907637036e-05, |
| "loss": 0.2043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12754079699516296, |
| "step": 3065, |
| "valid_targets_mean": 5541.4, |
| "valid_targets_min": 1640 |
| }, |
| { |
| "epoch": 3.202399582681273, |
| "grad_norm": 0.4885126359821133, |
| "learning_rate": 2.6371923918065273e-05, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10627619922161102, |
| "step": 3070, |
| "valid_targets_mean": 5309.2, |
| "valid_targets_min": 2826 |
| }, |
| { |
| "epoch": 3.2076160667709965, |
| "grad_norm": 0.48230793079709744, |
| "learning_rate": 2.6322607846834444e-05, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09124992787837982, |
| "step": 3075, |
| "valid_targets_mean": 5459.0, |
| "valid_targets_min": 1847 |
| }, |
| { |
| "epoch": 3.21283255086072, |
| "grad_norm": 0.4840767198131845, |
| "learning_rate": 2.6273249027378878e-05, |
| "loss": 0.1968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11224304139614105, |
| "step": 3080, |
| "valid_targets_mean": 6000.8, |
| "valid_targets_min": 2293 |
| }, |
| { |
| "epoch": 3.2180490349504436, |
| "grad_norm": 0.5298237383686266, |
| "learning_rate": 2.6223847793421938e-05, |
| "loss": 0.2123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12696264684200287, |
| "step": 3085, |
| "valid_targets_mean": 5593.4, |
| "valid_targets_min": 1575 |
| }, |
| { |
| "epoch": 3.223265519040167, |
| "grad_norm": 0.5203116045231617, |
| "learning_rate": 2.6174404478973746e-05, |
| "loss": 0.2055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1275153011083603, |
| "step": 3090, |
| "valid_targets_mean": 5331.2, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 3.2284820031298906, |
| "grad_norm": 0.5828601869235734, |
| "learning_rate": 2.612491941832894e-05, |
| "loss": 0.208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0915302038192749, |
| "step": 3095, |
| "valid_targets_mean": 4977.4, |
| "valid_targets_min": 2578 |
| }, |
| { |
| "epoch": 3.233698487219614, |
| "grad_norm": 0.5398544671737381, |
| "learning_rate": 2.6075392946064417e-05, |
| "loss": 0.2179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10789971053600311, |
| "step": 3100, |
| "valid_targets_mean": 3956.2, |
| "valid_targets_min": 2939 |
| }, |
| { |
| "epoch": 3.2389149713093377, |
| "grad_norm": 0.4403664580551399, |
| "learning_rate": 2.6025825397037057e-05, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08687441051006317, |
| "step": 3105, |
| "valid_targets_mean": 5205.9, |
| "valid_targets_min": 2809 |
| }, |
| { |
| "epoch": 3.244131455399061, |
| "grad_norm": 0.7045669258986819, |
| "learning_rate": 2.5976217106381477e-05, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10237893462181091, |
| "step": 3110, |
| "valid_targets_mean": 4216.4, |
| "valid_targets_min": 2507 |
| }, |
| { |
| "epoch": 3.2493479394887848, |
| "grad_norm": 0.7939478704963069, |
| "learning_rate": 2.5926568409507754e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10826735943555832, |
| "step": 3115, |
| "valid_targets_mean": 3386.1, |
| "valid_targets_min": 2024 |
| }, |
| { |
| "epoch": 3.254564423578508, |
| "grad_norm": 0.4631710792328562, |
| "learning_rate": 2.587687964209914e-05, |
| "loss": 0.2002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09974386543035507, |
| "step": 3120, |
| "valid_targets_mean": 6154.4, |
| "valid_targets_min": 3831 |
| }, |
| { |
| "epoch": 3.2597809076682314, |
| "grad_norm": 0.6167658223322712, |
| "learning_rate": 2.5827151140109836e-05, |
| "loss": 0.2075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10356143116950989, |
| "step": 3125, |
| "valid_targets_mean": 3086.8, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 3.264997391757955, |
| "grad_norm": 0.4803738947300794, |
| "learning_rate": 2.5777383239762676e-05, |
| "loss": 0.2124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0884963721036911, |
| "step": 3130, |
| "valid_targets_mean": 4174.9, |
| "valid_targets_min": 1509 |
| }, |
| { |
| "epoch": 3.270213875847679, |
| "grad_norm": 0.4983305286310679, |
| "learning_rate": 2.5727576277546888e-05, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10087882727384567, |
| "step": 3135, |
| "valid_targets_mean": 5994.5, |
| "valid_targets_min": 2589 |
| }, |
| { |
| "epoch": 3.275430359937402, |
| "grad_norm": 0.5292682881012424, |
| "learning_rate": 2.5677730590215792e-05, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08946658670902252, |
| "step": 3140, |
| "valid_targets_mean": 4218.1, |
| "valid_targets_min": 2399 |
| }, |
| { |
| "epoch": 3.2806468440271255, |
| "grad_norm": 0.5432813000606039, |
| "learning_rate": 2.5627846514784553e-05, |
| "loss": 0.2126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10207852721214294, |
| "step": 3145, |
| "valid_targets_mean": 4425.6, |
| "valid_targets_min": 1771 |
| }, |
| { |
| "epoch": 3.2858633281168492, |
| "grad_norm": 0.4739180329442054, |
| "learning_rate": 2.5577924388527847e-05, |
| "loss": 0.195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08045230805873871, |
| "step": 3150, |
| "valid_targets_mean": 4412.9, |
| "valid_targets_min": 1902 |
| }, |
| { |
| "epoch": 3.291079812206573, |
| "grad_norm": 0.5129124350976356, |
| "learning_rate": 2.552796454897766e-05, |
| "loss": 0.2085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10335686802864075, |
| "step": 3155, |
| "valid_targets_mean": 4059.5, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 3.2962962962962963, |
| "grad_norm": 0.5048649484725314, |
| "learning_rate": 2.5477967333920942e-05, |
| "loss": 0.2118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08793478459119797, |
| "step": 3160, |
| "valid_targets_mean": 4847.5, |
| "valid_targets_min": 2248 |
| }, |
| { |
| "epoch": 3.3015127803860196, |
| "grad_norm": 0.5096565360116999, |
| "learning_rate": 2.5427933081397357e-05, |
| "loss": 0.1968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09852844476699829, |
| "step": 3165, |
| "valid_targets_mean": 6222.0, |
| "valid_targets_min": 2832 |
| }, |
| { |
| "epoch": 3.3067292644757433, |
| "grad_norm": 0.5524222903071977, |
| "learning_rate": 2.5377862129696966e-05, |
| "loss": 0.2039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09711448103189468, |
| "step": 3170, |
| "valid_targets_mean": 3722.2, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 3.311945748565467, |
| "grad_norm": 0.5010581256335986, |
| "learning_rate": 2.5327754817357974e-05, |
| "loss": 0.2046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11068551242351532, |
| "step": 3175, |
| "valid_targets_mean": 4448.4, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 3.3171622326551904, |
| "grad_norm": 0.5784075536421294, |
| "learning_rate": 2.527761148316443e-05, |
| "loss": 0.2112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11487346887588501, |
| "step": 3180, |
| "valid_targets_mean": 4466.1, |
| "valid_targets_min": 2013 |
| }, |
| { |
| "epoch": 3.3223787167449137, |
| "grad_norm": 0.426680182728146, |
| "learning_rate": 2.522743246614392e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10178497433662415, |
| "step": 3185, |
| "valid_targets_mean": 7223.5, |
| "valid_targets_min": 3311 |
| }, |
| { |
| "epoch": 3.3275952008346374, |
| "grad_norm": 0.49811839249156864, |
| "learning_rate": 2.5177218105565306e-05, |
| "loss": 0.2066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1128610149025917, |
| "step": 3190, |
| "valid_targets_mean": 6292.2, |
| "valid_targets_min": 3554 |
| }, |
| { |
| "epoch": 3.332811684924361, |
| "grad_norm": 0.5078621835027752, |
| "learning_rate": 2.5126968740936386e-05, |
| "loss": 0.2218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08550669997930527, |
| "step": 3195, |
| "valid_targets_mean": 4097.4, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 3.3380281690140845, |
| "grad_norm": 0.45696188434632573, |
| "learning_rate": 2.5076684712001655e-05, |
| "loss": 0.2074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10041764378547668, |
| "step": 3200, |
| "valid_targets_mean": 5978.9, |
| "valid_targets_min": 4028 |
| }, |
| { |
| "epoch": 3.343244653103808, |
| "grad_norm": 0.5543164563658722, |
| "learning_rate": 2.5026366358739963e-05, |
| "loss": 0.2101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09462873637676239, |
| "step": 3205, |
| "valid_targets_mean": 3540.6, |
| "valid_targets_min": 1551 |
| }, |
| { |
| "epoch": 3.3484611371935316, |
| "grad_norm": 0.48975883173543067, |
| "learning_rate": 2.4976014021362236e-05, |
| "loss": 0.2017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09664043039083481, |
| "step": 3210, |
| "valid_targets_mean": 5091.4, |
| "valid_targets_min": 1972 |
| }, |
| { |
| "epoch": 3.3536776212832553, |
| "grad_norm": 0.513525253001271, |
| "learning_rate": 2.492562804030918e-05, |
| "loss": 0.2037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09498007595539093, |
| "step": 3215, |
| "valid_targets_mean": 4646.6, |
| "valid_targets_min": 2783 |
| }, |
| { |
| "epoch": 3.3588941053729786, |
| "grad_norm": 0.45078436201229916, |
| "learning_rate": 2.487520875624895e-05, |
| "loss": 0.1993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08881426602602005, |
| "step": 3220, |
| "valid_targets_mean": 5305.9, |
| "valid_targets_min": 1930 |
| }, |
| { |
| "epoch": 3.364110589462702, |
| "grad_norm": 0.5572321448921217, |
| "learning_rate": 2.48247565100749e-05, |
| "loss": 0.2078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10880579054355621, |
| "step": 3225, |
| "valid_targets_mean": 4563.0, |
| "valid_targets_min": 2926 |
| }, |
| { |
| "epoch": 3.3693270735524257, |
| "grad_norm": 0.45553103261946104, |
| "learning_rate": 2.4774271642903213e-05, |
| "loss": 0.2004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09201472997665405, |
| "step": 3230, |
| "valid_targets_mean": 5588.8, |
| "valid_targets_min": 3122 |
| }, |
| { |
| "epoch": 3.3745435576421494, |
| "grad_norm": 0.5351435584039045, |
| "learning_rate": 2.4723754496070652e-05, |
| "loss": 0.2041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12355613708496094, |
| "step": 3235, |
| "valid_targets_mean": 5921.0, |
| "valid_targets_min": 1685 |
| }, |
| { |
| "epoch": 3.3797600417318727, |
| "grad_norm": 0.525343936043067, |
| "learning_rate": 2.4673205411132218e-05, |
| "loss": 0.2011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08146161586046219, |
| "step": 3240, |
| "valid_targets_mean": 4078.1, |
| "valid_targets_min": 1735 |
| }, |
| { |
| "epoch": 3.384976525821596, |
| "grad_norm": 0.5969585175703439, |
| "learning_rate": 2.462262472985886e-05, |
| "loss": 0.2134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11669494211673737, |
| "step": 3245, |
| "valid_targets_mean": 4652.0, |
| "valid_targets_min": 2152 |
| }, |
| { |
| "epoch": 3.3901930099113198, |
| "grad_norm": 0.4904811094853748, |
| "learning_rate": 2.457201279423514e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09706364572048187, |
| "step": 3250, |
| "valid_targets_mean": 5183.4, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 3.3954094940010435, |
| "grad_norm": 0.48524335395336343, |
| "learning_rate": 2.4521369946456954e-05, |
| "loss": 0.2045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07379470020532608, |
| "step": 3255, |
| "valid_targets_mean": 4762.6, |
| "valid_targets_min": 2958 |
| }, |
| { |
| "epoch": 3.400625978090767, |
| "grad_norm": 0.5190341323172759, |
| "learning_rate": 2.447069652892918e-05, |
| "loss": 0.2049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09849357604980469, |
| "step": 3260, |
| "valid_targets_mean": 4050.6, |
| "valid_targets_min": 1211 |
| }, |
| { |
| "epoch": 3.40584246218049, |
| "grad_norm": 0.5384524430842462, |
| "learning_rate": 2.4419992884263404e-05, |
| "loss": 0.2143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10016826540231705, |
| "step": 3265, |
| "valid_targets_mean": 3539.6, |
| "valid_targets_min": 1561 |
| }, |
| { |
| "epoch": 3.411058946270214, |
| "grad_norm": 0.4839432642617593, |
| "learning_rate": 2.436925935527557e-05, |
| "loss": 0.2053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09900754690170288, |
| "step": 3270, |
| "valid_targets_mean": 5767.1, |
| "valid_targets_min": 2299 |
| }, |
| { |
| "epoch": 3.4162754303599376, |
| "grad_norm": 0.5696481657445573, |
| "learning_rate": 2.4318496284983676e-05, |
| "loss": 0.2198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10886025428771973, |
| "step": 3275, |
| "valid_targets_mean": 3911.4, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 3.421491914449661, |
| "grad_norm": 0.5366826232420506, |
| "learning_rate": 2.4267704016605453e-05, |
| "loss": 0.201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08289587497711182, |
| "step": 3280, |
| "valid_targets_mean": 3652.1, |
| "valid_targets_min": 1364 |
| }, |
| { |
| "epoch": 3.4267083985393842, |
| "grad_norm": 0.44760621004310186, |
| "learning_rate": 2.421688289355606e-05, |
| "loss": 0.1929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08253911137580872, |
| "step": 3285, |
| "valid_targets_mean": 5076.9, |
| "valid_targets_min": 1472 |
| }, |
| { |
| "epoch": 3.431924882629108, |
| "grad_norm": 0.4659646608854954, |
| "learning_rate": 2.4166033259445723e-05, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09929650276899338, |
| "step": 3290, |
| "valid_targets_mean": 5470.1, |
| "valid_targets_min": 1714 |
| }, |
| { |
| "epoch": 3.4371413667188317, |
| "grad_norm": 0.4944754452218446, |
| "learning_rate": 2.4115155458077453e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1077100932598114, |
| "step": 3295, |
| "valid_targets_mean": 6142.6, |
| "valid_targets_min": 4037 |
| }, |
| { |
| "epoch": 3.442357850808555, |
| "grad_norm": 0.522019943595844, |
| "learning_rate": 2.4064249833444702e-05, |
| "loss": 0.21, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10570424795150757, |
| "step": 3300, |
| "valid_targets_mean": 4540.2, |
| "valid_targets_min": 2456 |
| }, |
| { |
| "epoch": 3.4475743348982784, |
| "grad_norm": 0.522378360073098, |
| "learning_rate": 2.401331672972904e-05, |
| "loss": 0.2132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11249788105487823, |
| "step": 3305, |
| "valid_targets_mean": 4124.2, |
| "valid_targets_min": 1964 |
| }, |
| { |
| "epoch": 3.452790818988002, |
| "grad_norm": 0.42580018646073436, |
| "learning_rate": 2.3962356491297814e-05, |
| "loss": 0.1943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07327315956354141, |
| "step": 3310, |
| "valid_targets_mean": 5672.4, |
| "valid_targets_min": 4383 |
| }, |
| { |
| "epoch": 3.458007303077726, |
| "grad_norm": 0.4679885478899873, |
| "learning_rate": 2.391136946270186e-05, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10529530048370361, |
| "step": 3315, |
| "valid_targets_mean": 5588.2, |
| "valid_targets_min": 1455 |
| }, |
| { |
| "epoch": 3.463223787167449, |
| "grad_norm": 0.5281070345011083, |
| "learning_rate": 2.3860355988673122e-05, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09942032396793365, |
| "step": 3320, |
| "valid_targets_mean": 5508.9, |
| "valid_targets_min": 1571 |
| }, |
| { |
| "epoch": 3.4684402712571725, |
| "grad_norm": 0.5745443529023152, |
| "learning_rate": 2.380931641412236e-05, |
| "loss": 0.2117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11996541917324066, |
| "step": 3325, |
| "valid_targets_mean": 5269.0, |
| "valid_targets_min": 2910 |
| }, |
| { |
| "epoch": 3.473656755346896, |
| "grad_norm": 0.5576721588744232, |
| "learning_rate": 2.3758251084136794e-05, |
| "loss": 0.2129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10790915787220001, |
| "step": 3330, |
| "valid_targets_mean": 4009.0, |
| "valid_targets_min": 1859 |
| }, |
| { |
| "epoch": 3.4788732394366195, |
| "grad_norm": 0.4679862459416396, |
| "learning_rate": 2.3707160343977792e-05, |
| "loss": 0.2029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10469825565814972, |
| "step": 3335, |
| "valid_targets_mean": 5888.2, |
| "valid_targets_min": 2404 |
| }, |
| { |
| "epoch": 3.4840897235263433, |
| "grad_norm": 0.49135430552405057, |
| "learning_rate": 2.3656044539078523e-05, |
| "loss": 0.2186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10415101796388626, |
| "step": 3340, |
| "valid_targets_mean": 5754.0, |
| "valid_targets_min": 3117 |
| }, |
| { |
| "epoch": 3.4893062076160666, |
| "grad_norm": 0.49652290425608847, |
| "learning_rate": 2.3604904015041617e-05, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1110752671957016, |
| "step": 3345, |
| "valid_targets_mean": 5765.8, |
| "valid_targets_min": 4411 |
| }, |
| { |
| "epoch": 3.4945226917057903, |
| "grad_norm": 0.5481521868558625, |
| "learning_rate": 2.3553739117636835e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11676967144012451, |
| "step": 3350, |
| "valid_targets_mean": 5643.6, |
| "valid_targets_min": 1626 |
| }, |
| { |
| "epoch": 3.4997391757955136, |
| "grad_norm": 0.5427911383944662, |
| "learning_rate": 2.3502550192798726e-05, |
| "loss": 0.2102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13177376985549927, |
| "step": 3355, |
| "valid_targets_mean": 4822.4, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 3.5049556598852374, |
| "grad_norm": 0.5260980866358562, |
| "learning_rate": 2.345133758662431e-05, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10232182592153549, |
| "step": 3360, |
| "valid_targets_mean": 4270.2, |
| "valid_targets_min": 1748 |
| }, |
| { |
| "epoch": 3.5101721439749607, |
| "grad_norm": 0.46855511810503486, |
| "learning_rate": 2.3400101645370702e-05, |
| "loss": 0.2111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11119550466537476, |
| "step": 3365, |
| "valid_targets_mean": 5504.2, |
| "valid_targets_min": 2764 |
| }, |
| { |
| "epoch": 3.5153886280646844, |
| "grad_norm": 0.5238851262161284, |
| "learning_rate": 2.3348842715452803e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11851681768894196, |
| "step": 3370, |
| "valid_targets_mean": 5526.2, |
| "valid_targets_min": 3314 |
| }, |
| { |
| "epoch": 3.520605112154408, |
| "grad_norm": 0.5351641663094854, |
| "learning_rate": 2.3297561143440932e-05, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10816239565610886, |
| "step": 3375, |
| "valid_targets_mean": 5042.5, |
| "valid_targets_min": 2194 |
| }, |
| { |
| "epoch": 3.5258215962441315, |
| "grad_norm": 0.5418076404930998, |
| "learning_rate": 2.3246257276058507e-05, |
| "loss": 0.2016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10289973020553589, |
| "step": 3380, |
| "valid_targets_mean": 4962.2, |
| "valid_targets_min": 1250 |
| }, |
| { |
| "epoch": 3.531038080333855, |
| "grad_norm": 0.5835177880403055, |
| "learning_rate": 2.3194931460179677e-05, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11193951964378357, |
| "step": 3385, |
| "valid_targets_mean": 4545.5, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 3.5362545644235786, |
| "grad_norm": 0.4409714869921065, |
| "learning_rate": 2.314358404282699e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09257347881793976, |
| "step": 3390, |
| "valid_targets_mean": 5921.9, |
| "valid_targets_min": 4133 |
| }, |
| { |
| "epoch": 3.5414710485133023, |
| "grad_norm": 0.48479378902625975, |
| "learning_rate": 2.309221537116906e-05, |
| "loss": 0.2042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10169748961925507, |
| "step": 3395, |
| "valid_targets_mean": 5093.8, |
| "valid_targets_min": 2127 |
| }, |
| { |
| "epoch": 3.5466875326030256, |
| "grad_norm": 0.4999342137491525, |
| "learning_rate": 2.3040825792518188e-05, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10100770741701126, |
| "step": 3400, |
| "valid_targets_mean": 5618.4, |
| "valid_targets_min": 4602 |
| }, |
| { |
| "epoch": 3.551904016692749, |
| "grad_norm": 0.5798992641647128, |
| "learning_rate": 2.298941565432804e-05, |
| "loss": 0.2135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10427383333444595, |
| "step": 3405, |
| "valid_targets_mean": 4501.9, |
| "valid_targets_min": 2200 |
| }, |
| { |
| "epoch": 3.5571205007824727, |
| "grad_norm": 0.514151979940359, |
| "learning_rate": 2.2937985304191285e-05, |
| "loss": 0.2054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09981776773929596, |
| "step": 3410, |
| "valid_targets_mean": 5144.2, |
| "valid_targets_min": 2434 |
| }, |
| { |
| "epoch": 3.5623369848721964, |
| "grad_norm": 0.49224599352391807, |
| "learning_rate": 2.2886535089837247e-05, |
| "loss": 0.1998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11161879450082779, |
| "step": 3415, |
| "valid_targets_mean": 7394.0, |
| "valid_targets_min": 2984 |
| }, |
| { |
| "epoch": 3.5675534689619197, |
| "grad_norm": 0.5112976626672822, |
| "learning_rate": 2.2835065359129564e-05, |
| "loss": 0.1965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08873531967401505, |
| "step": 3420, |
| "valid_targets_mean": 4770.6, |
| "valid_targets_min": 3574 |
| }, |
| { |
| "epoch": 3.572769953051643, |
| "grad_norm": 0.5368546255179795, |
| "learning_rate": 2.278357646006381e-05, |
| "loss": 0.2066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08348749577999115, |
| "step": 3425, |
| "valid_targets_mean": 4058.6, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 3.5779864371413668, |
| "grad_norm": 0.5130542955157593, |
| "learning_rate": 2.273206874076518e-05, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10261701047420502, |
| "step": 3430, |
| "valid_targets_mean": 5305.4, |
| "valid_targets_min": 3152 |
| }, |
| { |
| "epoch": 3.5832029212310905, |
| "grad_norm": 0.4841718810074, |
| "learning_rate": 2.26805425494861e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09375569969415665, |
| "step": 3435, |
| "valid_targets_mean": 5293.2, |
| "valid_targets_min": 2908 |
| }, |
| { |
| "epoch": 3.588419405320814, |
| "grad_norm": 0.5169121108069523, |
| "learning_rate": 2.26289982346039e-05, |
| "loss": 0.1935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09104648232460022, |
| "step": 3440, |
| "valid_targets_mean": 4429.5, |
| "valid_targets_min": 1439 |
| }, |
| { |
| "epoch": 3.593635889410537, |
| "grad_norm": 0.49322986983878714, |
| "learning_rate": 2.2577436144618438e-05, |
| "loss": 0.1996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09873166680335999, |
| "step": 3445, |
| "valid_targets_mean": 4847.2, |
| "valid_targets_min": 1858 |
| }, |
| { |
| "epoch": 3.598852373500261, |
| "grad_norm": 0.524507361163139, |
| "learning_rate": 2.2525856628149754e-05, |
| "loss": 0.1934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10959742963314056, |
| "step": 3450, |
| "valid_targets_mean": 5337.8, |
| "valid_targets_min": 1515 |
| }, |
| { |
| "epoch": 3.604068857589984, |
| "grad_norm": 0.5038836279165287, |
| "learning_rate": 2.2474260033935718e-05, |
| "loss": 0.1979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09655040502548218, |
| "step": 3455, |
| "valid_targets_mean": 5096.9, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 3.609285341679708, |
| "grad_norm": 0.5434625017319136, |
| "learning_rate": 2.2422646710829653e-05, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11120036989450455, |
| "step": 3460, |
| "valid_targets_mean": 4631.4, |
| "valid_targets_min": 1669 |
| }, |
| { |
| "epoch": 3.6145018257694312, |
| "grad_norm": 0.4643557437705012, |
| "learning_rate": 2.2371017007798005e-05, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1015571653842926, |
| "step": 3465, |
| "valid_targets_mean": 5713.1, |
| "valid_targets_min": 2234 |
| }, |
| { |
| "epoch": 3.619718309859155, |
| "grad_norm": 0.5438936323798786, |
| "learning_rate": 2.231937127391795e-05, |
| "loss": 0.2165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1269652396440506, |
| "step": 3470, |
| "valid_targets_mean": 4342.6, |
| "valid_targets_min": 2144 |
| }, |
| { |
| "epoch": 3.6249347939488783, |
| "grad_norm": 0.5261720551564346, |
| "learning_rate": 2.226770985837507e-05, |
| "loss": 0.2005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10666371881961823, |
| "step": 3475, |
| "valid_targets_mean": 4991.1, |
| "valid_targets_min": 1505 |
| }, |
| { |
| "epoch": 3.630151278038602, |
| "grad_norm": 0.48971826448674355, |
| "learning_rate": 2.2216033110460952e-05, |
| "loss": 0.2105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11108003556728363, |
| "step": 3480, |
| "valid_targets_mean": 5494.9, |
| "valid_targets_min": 2406 |
| }, |
| { |
| "epoch": 3.6353677621283254, |
| "grad_norm": 0.6310033254541642, |
| "learning_rate": 2.216434137957087e-05, |
| "loss": 0.216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14492467045783997, |
| "step": 3485, |
| "valid_targets_mean": 4256.5, |
| "valid_targets_min": 2999 |
| }, |
| { |
| "epoch": 3.640584246218049, |
| "grad_norm": 0.4509439637081253, |
| "learning_rate": 2.2112635015201383e-05, |
| "loss": 0.1947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10062622278928757, |
| "step": 3490, |
| "valid_targets_mean": 4395.6, |
| "valid_targets_min": 2232 |
| }, |
| { |
| "epoch": 3.6458007303077724, |
| "grad_norm": 0.5309888811229617, |
| "learning_rate": 2.2060914366948004e-05, |
| "loss": 0.211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13531291484832764, |
| "step": 3495, |
| "valid_targets_mean": 4848.5, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 3.651017214397496, |
| "grad_norm": 0.49378897883013445, |
| "learning_rate": 2.2009179784502802e-05, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10192813724279404, |
| "step": 3500, |
| "valid_targets_mean": 4548.9, |
| "valid_targets_min": 1422 |
| }, |
| { |
| "epoch": 3.6562336984872195, |
| "grad_norm": 0.4496118679496516, |
| "learning_rate": 2.1957431617652074e-05, |
| "loss": 0.2094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09512370079755783, |
| "step": 3505, |
| "valid_targets_mean": 5200.8, |
| "valid_targets_min": 1777 |
| }, |
| { |
| "epoch": 3.661450182576943, |
| "grad_norm": 0.4627518225433372, |
| "learning_rate": 2.1905670216273967e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10607169568538666, |
| "step": 3510, |
| "valid_targets_mean": 5725.0, |
| "valid_targets_min": 2263 |
| }, |
| { |
| "epoch": 3.6666666666666665, |
| "grad_norm": 0.6142333426220774, |
| "learning_rate": 2.185389593033609e-05, |
| "loss": 0.2087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10711097717285156, |
| "step": 3515, |
| "valid_targets_mean": 3951.2, |
| "valid_targets_min": 2040 |
| }, |
| { |
| "epoch": 3.6718831507563903, |
| "grad_norm": 0.4564859698569454, |
| "learning_rate": 2.1802109109893184e-05, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10178106278181076, |
| "step": 3520, |
| "valid_targets_mean": 5606.4, |
| "valid_targets_min": 1631 |
| }, |
| { |
| "epoch": 3.6770996348461136, |
| "grad_norm": 0.4578707908340693, |
| "learning_rate": 2.1750310105084725e-05, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11136416345834732, |
| "step": 3525, |
| "valid_targets_mean": 7570.0, |
| "valid_targets_min": 2331 |
| }, |
| { |
| "epoch": 3.6823161189358373, |
| "grad_norm": 0.4530824968720263, |
| "learning_rate": 2.1698499266132585e-05, |
| "loss": 0.1963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08735674619674683, |
| "step": 3530, |
| "valid_targets_mean": 4930.5, |
| "valid_targets_min": 2301 |
| }, |
| { |
| "epoch": 3.6875326030255606, |
| "grad_norm": 0.45806092476342786, |
| "learning_rate": 2.164667694333863e-05, |
| "loss": 0.2036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08106125891208649, |
| "step": 3535, |
| "valid_targets_mean": 4889.6, |
| "valid_targets_min": 2107 |
| }, |
| { |
| "epoch": 3.6927490871152844, |
| "grad_norm": 0.5918590421269798, |
| "learning_rate": 2.159484348708239e-05, |
| "loss": 0.2026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11161507666110992, |
| "step": 3540, |
| "valid_targets_mean": 4062.0, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 3.6979655712050077, |
| "grad_norm": 0.509743862744301, |
| "learning_rate": 2.1542999247818653e-05, |
| "loss": 0.2072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12011369317770004, |
| "step": 3545, |
| "valid_targets_mean": 5757.8, |
| "valid_targets_min": 2037 |
| }, |
| { |
| "epoch": 3.7031820552947314, |
| "grad_norm": 0.4753458839491459, |
| "learning_rate": 2.149114457607512e-05, |
| "loss": 0.2068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11911623179912567, |
| "step": 3550, |
| "valid_targets_mean": 5659.5, |
| "valid_targets_min": 3885 |
| }, |
| { |
| "epoch": 3.7083985393844547, |
| "grad_norm": 0.5342061703088573, |
| "learning_rate": 2.1439279822450034e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08299921452999115, |
| "step": 3555, |
| "valid_targets_mean": 3785.2, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 3.7136150234741785, |
| "grad_norm": 0.4727141206820206, |
| "learning_rate": 2.1387405337609787e-05, |
| "loss": 0.2117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11511692404747009, |
| "step": 3560, |
| "valid_targets_mean": 5902.4, |
| "valid_targets_min": 3456 |
| }, |
| { |
| "epoch": 3.718831507563902, |
| "grad_norm": 0.4698992789174544, |
| "learning_rate": 2.1335521472286578e-05, |
| "loss": 0.2119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09991538524627686, |
| "step": 3565, |
| "valid_targets_mean": 5482.8, |
| "valid_targets_min": 2860 |
| }, |
| { |
| "epoch": 3.7240479916536255, |
| "grad_norm": 0.44549155893660347, |
| "learning_rate": 2.1283628577276034e-05, |
| "loss": 0.2057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09587128460407257, |
| "step": 3570, |
| "valid_targets_mean": 6596.9, |
| "valid_targets_min": 5190 |
| }, |
| { |
| "epoch": 3.729264475743349, |
| "grad_norm": 0.5225931871767929, |
| "learning_rate": 2.1231727003434816e-05, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11135206371545792, |
| "step": 3575, |
| "valid_targets_mean": 4997.1, |
| "valid_targets_min": 3775 |
| }, |
| { |
| "epoch": 3.7344809598330726, |
| "grad_norm": 0.5052943373674356, |
| "learning_rate": 2.1179817101678272e-05, |
| "loss": 0.1985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11900711059570312, |
| "step": 3580, |
| "valid_targets_mean": 4403.1, |
| "valid_targets_min": 2023 |
| }, |
| { |
| "epoch": 3.739697443922796, |
| "grad_norm": 0.47991849736021147, |
| "learning_rate": 2.1127899222978064e-05, |
| "loss": 0.2147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10209795087575912, |
| "step": 3585, |
| "valid_targets_mean": 5810.5, |
| "valid_targets_min": 1632 |
| }, |
| { |
| "epoch": 3.7449139280125197, |
| "grad_norm": 0.4664445962766321, |
| "learning_rate": 2.107597371835979e-05, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09806659072637558, |
| "step": 3590, |
| "valid_targets_mean": 4265.9, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 3.750130412102243, |
| "grad_norm": 0.5482988875290883, |
| "learning_rate": 2.1024040938900586e-05, |
| "loss": 0.206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11896420270204544, |
| "step": 3595, |
| "valid_targets_mean": 5041.1, |
| "valid_targets_min": 1875 |
| }, |
| { |
| "epoch": 3.7553468961919667, |
| "grad_norm": 0.5046703560081168, |
| "learning_rate": 2.097210123572679e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10202568769454956, |
| "step": 3600, |
| "valid_targets_mean": 4581.6, |
| "valid_targets_min": 2032 |
| }, |
| { |
| "epoch": 3.76056338028169, |
| "grad_norm": 0.5134332654087025, |
| "learning_rate": 2.092015496001155e-05, |
| "loss": 0.2018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09612300992012024, |
| "step": 3605, |
| "valid_targets_mean": 4159.4, |
| "valid_targets_min": 1893 |
| }, |
| { |
| "epoch": 3.7657798643714138, |
| "grad_norm": 0.49986159400195557, |
| "learning_rate": 2.0868202462972458e-05, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09765844792127609, |
| "step": 3610, |
| "valid_targets_mean": 4365.2, |
| "valid_targets_min": 2086 |
| }, |
| { |
| "epoch": 3.770996348461137, |
| "grad_norm": 0.49759426834449094, |
| "learning_rate": 2.0816244095869157e-05, |
| "loss": 0.2072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10434122383594513, |
| "step": 3615, |
| "valid_targets_mean": 4772.0, |
| "valid_targets_min": 2390 |
| }, |
| { |
| "epoch": 3.776212832550861, |
| "grad_norm": 0.48191796442862084, |
| "learning_rate": 2.0764280210001e-05, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09581761062145233, |
| "step": 3620, |
| "valid_targets_mean": 4700.4, |
| "valid_targets_min": 1854 |
| }, |
| { |
| "epoch": 3.781429316640584, |
| "grad_norm": 0.45651214224663467, |
| "learning_rate": 2.0712311156704624e-05, |
| "loss": 0.2109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11849430203437805, |
| "step": 3625, |
| "valid_targets_mean": 6474.9, |
| "valid_targets_min": 2325 |
| }, |
| { |
| "epoch": 3.786645800730308, |
| "grad_norm": 0.5128768250151106, |
| "learning_rate": 2.066033728735162e-05, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10043670237064362, |
| "step": 3630, |
| "valid_targets_mean": 4569.6, |
| "valid_targets_min": 2703 |
| }, |
| { |
| "epoch": 3.791862284820031, |
| "grad_norm": 0.5205659397746013, |
| "learning_rate": 2.0608358953346146e-05, |
| "loss": 0.2128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12045201659202576, |
| "step": 3635, |
| "valid_targets_mean": 4408.4, |
| "valid_targets_min": 1794 |
| }, |
| { |
| "epoch": 3.797078768909755, |
| "grad_norm": 0.44524938384432866, |
| "learning_rate": 2.0556376506122535e-05, |
| "loss": 0.1951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09781882166862488, |
| "step": 3640, |
| "valid_targets_mean": 5613.9, |
| "valid_targets_min": 2932 |
| }, |
| { |
| "epoch": 3.8022952529994782, |
| "grad_norm": 0.5628102931009461, |
| "learning_rate": 2.0504390297142935e-05, |
| "loss": 0.2073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11225159466266632, |
| "step": 3645, |
| "valid_targets_mean": 5291.5, |
| "valid_targets_min": 3199 |
| }, |
| { |
| "epoch": 3.807511737089202, |
| "grad_norm": 0.48068417775523864, |
| "learning_rate": 2.0452400677894936e-05, |
| "loss": 0.2248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11818863451480865, |
| "step": 3650, |
| "valid_targets_mean": 6005.4, |
| "valid_targets_min": 1832 |
| }, |
| { |
| "epoch": 3.8127282211789253, |
| "grad_norm": 0.4802884620146345, |
| "learning_rate": 2.0400407999889165e-05, |
| "loss": 0.2201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08356926590204239, |
| "step": 3655, |
| "valid_targets_mean": 4897.5, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 3.817944705268649, |
| "grad_norm": 0.4996117329409353, |
| "learning_rate": 2.0348412614656952e-05, |
| "loss": 0.2171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10854753106832504, |
| "step": 3660, |
| "valid_targets_mean": 5317.0, |
| "valid_targets_min": 2965 |
| }, |
| { |
| "epoch": 3.8231611893583723, |
| "grad_norm": 0.4822390374810917, |
| "learning_rate": 2.0296414873747915e-05, |
| "loss": 0.1985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10188714414834976, |
| "step": 3665, |
| "valid_targets_mean": 5403.4, |
| "valid_targets_min": 2299 |
| }, |
| { |
| "epoch": 3.828377673448096, |
| "grad_norm": 0.508619515441862, |
| "learning_rate": 2.0244415128727612e-05, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09003810584545135, |
| "step": 3670, |
| "valid_targets_mean": 4603.9, |
| "valid_targets_min": 2767 |
| }, |
| { |
| "epoch": 3.8335941575378194, |
| "grad_norm": 0.46912333306432125, |
| "learning_rate": 2.0192413731175146e-05, |
| "loss": 0.1942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09568269550800323, |
| "step": 3675, |
| "valid_targets_mean": 5408.6, |
| "valid_targets_min": 1774 |
| }, |
| { |
| "epoch": 3.838810641627543, |
| "grad_norm": 0.5460759203899835, |
| "learning_rate": 2.0140411032680775e-05, |
| "loss": 0.2033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1019095927476883, |
| "step": 3680, |
| "valid_targets_mean": 4524.6, |
| "valid_targets_min": 1596 |
| }, |
| { |
| "epoch": 3.8440271257172665, |
| "grad_norm": 0.4974781466356231, |
| "learning_rate": 2.008840738484359e-05, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10185645520687103, |
| "step": 3685, |
| "valid_targets_mean": 4695.8, |
| "valid_targets_min": 2022 |
| }, |
| { |
| "epoch": 3.84924360980699, |
| "grad_norm": 0.5521100717903332, |
| "learning_rate": 2.0036403139269067e-05, |
| "loss": 0.2043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09987007081508636, |
| "step": 3690, |
| "valid_targets_mean": 4702.2, |
| "valid_targets_min": 1670 |
| }, |
| { |
| "epoch": 3.8544600938967135, |
| "grad_norm": 0.5097492757774731, |
| "learning_rate": 1.998439864756674e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11091513931751251, |
| "step": 3695, |
| "valid_targets_mean": 5430.6, |
| "valid_targets_min": 3621 |
| }, |
| { |
| "epoch": 3.8596765779864373, |
| "grad_norm": 0.5149786258022108, |
| "learning_rate": 1.993239426134781e-05, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12105295807123184, |
| "step": 3700, |
| "valid_targets_mean": 5099.6, |
| "valid_targets_min": 2804 |
| }, |
| { |
| "epoch": 3.8648930620761606, |
| "grad_norm": 0.5485933673253874, |
| "learning_rate": 1.988039033222275e-05, |
| "loss": 0.2159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11051084101200104, |
| "step": 3705, |
| "valid_targets_mean": 4257.6, |
| "valid_targets_min": 2166 |
| }, |
| { |
| "epoch": 3.8701095461658843, |
| "grad_norm": 0.5637753025367358, |
| "learning_rate": 1.982838721179896e-05, |
| "loss": 0.2081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10755988210439682, |
| "step": 3710, |
| "valid_targets_mean": 4024.9, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 3.8753260302556076, |
| "grad_norm": 0.8170415462558644, |
| "learning_rate": 1.9776385251678352e-05, |
| "loss": 0.2035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11058570444583893, |
| "step": 3715, |
| "valid_targets_mean": 4973.9, |
| "valid_targets_min": 2001 |
| }, |
| { |
| "epoch": 3.8805425143453314, |
| "grad_norm": 0.4929423575864892, |
| "learning_rate": 1.9724384803455013e-05, |
| "loss": 0.2095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10546065121889114, |
| "step": 3720, |
| "valid_targets_mean": 4542.1, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 3.8857589984350547, |
| "grad_norm": 0.5979911719291678, |
| "learning_rate": 1.9672386218712794e-05, |
| "loss": 0.212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09815919399261475, |
| "step": 3725, |
| "valid_targets_mean": 4957.8, |
| "valid_targets_min": 2453 |
| }, |
| { |
| "epoch": 3.8909754825247784, |
| "grad_norm": 0.5153570159758912, |
| "learning_rate": 1.962038984902295e-05, |
| "loss": 0.209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10997527837753296, |
| "step": 3730, |
| "valid_targets_mean": 4998.4, |
| "valid_targets_min": 1986 |
| }, |
| { |
| "epoch": 3.8961919666145017, |
| "grad_norm": 0.5593692235819094, |
| "learning_rate": 1.9568396045941766e-05, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10075406730175018, |
| "step": 3735, |
| "valid_targets_mean": 3630.2, |
| "valid_targets_min": 1345 |
| }, |
| { |
| "epoch": 3.9014084507042255, |
| "grad_norm": 0.49266099775399863, |
| "learning_rate": 1.951640516100817e-05, |
| "loss": 0.2156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10078372061252594, |
| "step": 3740, |
| "valid_targets_mean": 4820.2, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 3.906624934793949, |
| "grad_norm": 0.6120689199450674, |
| "learning_rate": 1.9464417545741352e-05, |
| "loss": 0.2086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13580328226089478, |
| "step": 3745, |
| "valid_targets_mean": 4586.2, |
| "valid_targets_min": 1724 |
| }, |
| { |
| "epoch": 3.9118414188836725, |
| "grad_norm": 0.5385939169738648, |
| "learning_rate": 1.941243355163841e-05, |
| "loss": 0.2013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11604689061641693, |
| "step": 3750, |
| "valid_targets_mean": 5049.1, |
| "valid_targets_min": 1586 |
| }, |
| { |
| "epoch": 3.917057902973396, |
| "grad_norm": 0.4701296001393863, |
| "learning_rate": 1.936045353017195e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10644729435443878, |
| "step": 3755, |
| "valid_targets_mean": 4908.4, |
| "valid_targets_min": 2287 |
| }, |
| { |
| "epoch": 3.9222743870631196, |
| "grad_norm": 0.5300256155038029, |
| "learning_rate": 1.9308477832787724e-05, |
| "loss": 0.1942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08712330460548401, |
| "step": 3760, |
| "valid_targets_mean": 4941.6, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 3.927490871152843, |
| "grad_norm": 0.5473484318788164, |
| "learning_rate": 1.9256506810902226e-05, |
| "loss": 0.2118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11402727663516998, |
| "step": 3765, |
| "valid_targets_mean": 4187.4, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 3.9327073552425666, |
| "grad_norm": 0.48275177236367606, |
| "learning_rate": 1.9204540815900368e-05, |
| "loss": 0.2037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10041767358779907, |
| "step": 3770, |
| "valid_targets_mean": 5450.4, |
| "valid_targets_min": 1852 |
| }, |
| { |
| "epoch": 3.93792383933229, |
| "grad_norm": 0.5194319283174178, |
| "learning_rate": 1.915258019913306e-05, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10384313762187958, |
| "step": 3775, |
| "valid_targets_mean": 4937.1, |
| "valid_targets_min": 2276 |
| }, |
| { |
| "epoch": 3.9431403234220137, |
| "grad_norm": 0.5102834439544414, |
| "learning_rate": 1.9100625311914855e-05, |
| "loss": 0.1935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11289326846599579, |
| "step": 3780, |
| "valid_targets_mean": 5011.9, |
| "valid_targets_min": 2077 |
| }, |
| { |
| "epoch": 3.948356807511737, |
| "grad_norm": 0.5188674050207436, |
| "learning_rate": 1.9048676505521552e-05, |
| "loss": 0.208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1049310639500618, |
| "step": 3785, |
| "valid_targets_mean": 4873.9, |
| "valid_targets_min": 2730 |
| }, |
| { |
| "epoch": 3.9535732916014608, |
| "grad_norm": 0.4969938713059937, |
| "learning_rate": 1.8996734131187867e-05, |
| "loss": 0.2011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1003921777009964, |
| "step": 3790, |
| "valid_targets_mean": 4873.9, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 3.958789775691184, |
| "grad_norm": 0.5311902182679525, |
| "learning_rate": 1.894479854010499e-05, |
| "loss": 0.1984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10483424365520477, |
| "step": 3795, |
| "valid_targets_mean": 4369.6, |
| "valid_targets_min": 1711 |
| }, |
| { |
| "epoch": 3.964006259780908, |
| "grad_norm": 0.5333966811645783, |
| "learning_rate": 1.8892870083418272e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09669163823127747, |
| "step": 3800, |
| "valid_targets_mean": 3691.0, |
| "valid_targets_min": 1875 |
| }, |
| { |
| "epoch": 3.969222743870631, |
| "grad_norm": 0.4544249740651942, |
| "learning_rate": 1.8840949112224823e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10293082892894745, |
| "step": 3805, |
| "valid_targets_mean": 5624.8, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 3.974439227960355, |
| "grad_norm": 0.5444361564882776, |
| "learning_rate": 1.8789035977571145e-05, |
| "loss": 0.2042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10902902483940125, |
| "step": 3810, |
| "valid_targets_mean": 4516.5, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 3.979655712050078, |
| "grad_norm": 0.5111837101240407, |
| "learning_rate": 1.873713103045076e-05, |
| "loss": 0.2065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09919290989637375, |
| "step": 3815, |
| "valid_targets_mean": 4874.5, |
| "valid_targets_min": 2037 |
| }, |
| { |
| "epoch": 3.984872196139802, |
| "grad_norm": 0.5541412732399372, |
| "learning_rate": 1.8685234621801803e-05, |
| "loss": 0.2102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1078808456659317, |
| "step": 3820, |
| "valid_targets_mean": 3935.0, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 3.9900886802295252, |
| "grad_norm": 0.5213068337768594, |
| "learning_rate": 1.863334710250471e-05, |
| "loss": 0.2109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11251041293144226, |
| "step": 3825, |
| "valid_targets_mean": 4976.2, |
| "valid_targets_min": 2908 |
| }, |
| { |
| "epoch": 3.995305164319249, |
| "grad_norm": 0.6187092625734034, |
| "learning_rate": 1.858146882337981e-05, |
| "loss": 0.2102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10999973118305206, |
| "step": 3830, |
| "valid_targets_mean": 3286.1, |
| "valid_targets_min": 1397 |
| }, |
| { |
| "epoch": 4.0, |
| "grad_norm": 0.5917940970126754, |
| "learning_rate": 1.852960013518495e-05, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1782897263765335, |
| "step": 3835, |
| "valid_targets_mean": 5665.9, |
| "valid_targets_min": 3034 |
| }, |
| { |
| "epoch": 4.005216484089724, |
| "grad_norm": 0.46607771414324617, |
| "learning_rate": 1.8477741388613132e-05, |
| "loss": 0.1919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09920147061347961, |
| "step": 3840, |
| "valid_targets_mean": 6056.2, |
| "valid_targets_min": 2699 |
| }, |
| { |
| "epoch": 4.010432968179447, |
| "grad_norm": 0.4768192176770827, |
| "learning_rate": 1.8425892934290152e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07980208843946457, |
| "step": 3845, |
| "valid_targets_mean": 4985.4, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 4.01564945226917, |
| "grad_norm": 0.6027113819965128, |
| "learning_rate": 1.8374055122772195e-05, |
| "loss": 0.1825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11384853720664978, |
| "step": 3850, |
| "valid_targets_mean": 4757.9, |
| "valid_targets_min": 2591 |
| }, |
| { |
| "epoch": 4.020865936358894, |
| "grad_norm": 0.6170472555517669, |
| "learning_rate": 1.8322228304543515e-05, |
| "loss": 0.1865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10987308621406555, |
| "step": 3855, |
| "valid_targets_mean": 4566.6, |
| "valid_targets_min": 1568 |
| }, |
| { |
| "epoch": 4.026082420448618, |
| "grad_norm": 0.5361888807617837, |
| "learning_rate": 1.827041283001403e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10329025983810425, |
| "step": 3860, |
| "valid_targets_mean": 6410.9, |
| "valid_targets_min": 2809 |
| }, |
| { |
| "epoch": 4.031298904538341, |
| "grad_norm": 0.5138123234586494, |
| "learning_rate": 1.8218609049516943e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10162970423698425, |
| "step": 3865, |
| "valid_targets_mean": 4866.2, |
| "valid_targets_min": 2589 |
| }, |
| { |
| "epoch": 4.0365153886280645, |
| "grad_norm": 0.629738341072631, |
| "learning_rate": 1.816681731330641e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09866997599601746, |
| "step": 3870, |
| "valid_targets_mean": 3714.9, |
| "valid_targets_min": 1792 |
| }, |
| { |
| "epoch": 4.041731872717788, |
| "grad_norm": 0.5076510284900337, |
| "learning_rate": 1.811503797155516e-05, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08396624028682709, |
| "step": 3875, |
| "valid_targets_mean": 4964.0, |
| "valid_targets_min": 2687 |
| }, |
| { |
| "epoch": 4.046948356807512, |
| "grad_norm": 0.5604202388209889, |
| "learning_rate": 1.8063271374352097e-05, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07950867712497711, |
| "step": 3880, |
| "valid_targets_mean": 4328.1, |
| "valid_targets_min": 2683 |
| }, |
| { |
| "epoch": 4.052164840897235, |
| "grad_norm": 0.5195318213554949, |
| "learning_rate": 1.8011517871699978e-05, |
| "loss": 0.1938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09295456111431122, |
| "step": 3885, |
| "valid_targets_mean": 4763.0, |
| "valid_targets_min": 2191 |
| }, |
| { |
| "epoch": 4.057381324986959, |
| "grad_norm": 0.49574508785301097, |
| "learning_rate": 1.7959777813513015e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08722072839736938, |
| "step": 3890, |
| "valid_targets_mean": 5509.4, |
| "valid_targets_min": 2389 |
| }, |
| { |
| "epoch": 4.062597809076682, |
| "grad_norm": 0.555672291436396, |
| "learning_rate": 1.7908051549614527e-05, |
| "loss": 0.1915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10567817091941833, |
| "step": 3895, |
| "valid_targets_mean": 4166.8, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 4.067814293166406, |
| "grad_norm": 0.576453985393876, |
| "learning_rate": 1.7856339429734557e-05, |
| "loss": 0.1865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10580688714981079, |
| "step": 3900, |
| "valid_targets_mean": 4304.9, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 4.073030777256129, |
| "grad_norm": 0.48395931003632825, |
| "learning_rate": 1.780464180350753e-05, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08282601833343506, |
| "step": 3905, |
| "valid_targets_mean": 5238.0, |
| "valid_targets_min": 1478 |
| }, |
| { |
| "epoch": 4.078247261345853, |
| "grad_norm": 0.4822897854810889, |
| "learning_rate": 1.7752959020469868e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09229675680398941, |
| "step": 3910, |
| "valid_targets_mean": 5155.9, |
| "valid_targets_min": 2004 |
| }, |
| { |
| "epoch": 4.083463745435576, |
| "grad_norm": 0.6181703509272917, |
| "learning_rate": 1.7701291430057653e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10611573606729507, |
| "step": 3915, |
| "valid_targets_mean": 3013.1, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 4.0886802295253, |
| "grad_norm": 0.49745890025257705, |
| "learning_rate": 1.7649639381604207e-05, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08665668964385986, |
| "step": 3920, |
| "valid_targets_mean": 5601.6, |
| "valid_targets_min": 2905 |
| }, |
| { |
| "epoch": 4.093896713615023, |
| "grad_norm": 0.5178774003263724, |
| "learning_rate": 1.759800322433781e-05, |
| "loss": 0.189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1114279106259346, |
| "step": 3925, |
| "valid_targets_mean": 5073.0, |
| "valid_targets_min": 1884 |
| }, |
| { |
| "epoch": 4.099113197704747, |
| "grad_norm": 0.48501226491558996, |
| "learning_rate": 1.7546383307379284e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09173507988452911, |
| "step": 3930, |
| "valid_targets_mean": 5578.1, |
| "valid_targets_min": 1780 |
| }, |
| { |
| "epoch": 4.1043296817944706, |
| "grad_norm": 0.609147488412618, |
| "learning_rate": 1.7494779979739645e-05, |
| "loss": 0.1953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10356195271015167, |
| "step": 3935, |
| "valid_targets_mean": 4226.8, |
| "valid_targets_min": 1939 |
| }, |
| { |
| "epoch": 4.109546165884194, |
| "grad_norm": 0.5526486664927994, |
| "learning_rate": 1.7443193590317756e-05, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08991257846355438, |
| "step": 3940, |
| "valid_targets_mean": 3742.1, |
| "valid_targets_min": 2015 |
| }, |
| { |
| "epoch": 4.114762649973917, |
| "grad_norm": 0.520797455000569, |
| "learning_rate": 1.7391624487897947e-05, |
| "loss": 0.1847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0994281992316246, |
| "step": 3945, |
| "valid_targets_mean": 4919.4, |
| "valid_targets_min": 1876 |
| }, |
| { |
| "epoch": 4.119979134063641, |
| "grad_norm": 0.5815937259094293, |
| "learning_rate": 1.734007302114768e-05, |
| "loss": 0.1896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07230329513549805, |
| "step": 3950, |
| "valid_targets_mean": 3220.5, |
| "valid_targets_min": 1525 |
| }, |
| { |
| "epoch": 4.125195618153365, |
| "grad_norm": 0.498745760416118, |
| "learning_rate": 1.728853953861516e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10175873339176178, |
| "step": 3955, |
| "valid_targets_mean": 5411.1, |
| "valid_targets_min": 3212 |
| }, |
| { |
| "epoch": 4.130412102243088, |
| "grad_norm": 0.48426613600890606, |
| "learning_rate": 1.723702438872701e-05, |
| "loss": 0.1835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07348211109638214, |
| "step": 3960, |
| "valid_targets_mean": 4504.8, |
| "valid_targets_min": 1674 |
| }, |
| { |
| "epoch": 4.135628586332811, |
| "grad_norm": 0.4949250093153264, |
| "learning_rate": 1.718552791978591e-05, |
| "loss": 0.1808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08084411919116974, |
| "step": 3965, |
| "valid_targets_mean": 4177.2, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 4.140845070422535, |
| "grad_norm": 0.5462401892454734, |
| "learning_rate": 1.713405047996822e-05, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08703359961509705, |
| "step": 3970, |
| "valid_targets_mean": 4648.9, |
| "valid_targets_min": 3039 |
| }, |
| { |
| "epoch": 4.146061554512259, |
| "grad_norm": 0.5596781224211703, |
| "learning_rate": 1.7082592417321647e-05, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0826859325170517, |
| "step": 3975, |
| "valid_targets_mean": 4734.5, |
| "valid_targets_min": 1646 |
| }, |
| { |
| "epoch": 4.1512780386019825, |
| "grad_norm": 0.5208769324737493, |
| "learning_rate": 1.7031154079762885e-05, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10567048192024231, |
| "step": 3980, |
| "valid_targets_mean": 6375.9, |
| "valid_targets_min": 3444 |
| }, |
| { |
| "epoch": 4.156494522691705, |
| "grad_norm": 0.46231862393023193, |
| "learning_rate": 1.6979735815075263e-05, |
| "loss": 0.1895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08094746619462967, |
| "step": 3985, |
| "valid_targets_mean": 5711.2, |
| "valid_targets_min": 2724 |
| }, |
| { |
| "epoch": 4.161711006781429, |
| "grad_norm": 0.47782347604207814, |
| "learning_rate": 1.6928337970906406e-05, |
| "loss": 0.1924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10498857498168945, |
| "step": 3990, |
| "valid_targets_mean": 6370.1, |
| "valid_targets_min": 3429 |
| }, |
| { |
| "epoch": 4.166927490871153, |
| "grad_norm": 0.533700092920349, |
| "learning_rate": 1.687696089476585e-05, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09806228429079056, |
| "step": 3995, |
| "valid_targets_mean": 4882.9, |
| "valid_targets_min": 2680 |
| }, |
| { |
| "epoch": 4.172143974960877, |
| "grad_norm": 0.5973811736413226, |
| "learning_rate": 1.6825604934022734e-05, |
| "loss": 0.1898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10948151350021362, |
| "step": 4000, |
| "valid_targets_mean": 4622.4, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 4.1773604590505995, |
| "grad_norm": 0.5839781166361364, |
| "learning_rate": 1.6774270435903423e-05, |
| "loss": 0.1857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09380412101745605, |
| "step": 4005, |
| "valid_targets_mean": 4379.6, |
| "valid_targets_min": 2864 |
| }, |
| { |
| "epoch": 4.182576943140323, |
| "grad_norm": 0.4932464057306441, |
| "learning_rate": 1.6722957747489172e-05, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08225096017122269, |
| "step": 4010, |
| "valid_targets_mean": 5334.0, |
| "valid_targets_min": 1478 |
| }, |
| { |
| "epoch": 4.187793427230047, |
| "grad_norm": 0.5860383161281291, |
| "learning_rate": 1.6671667215713784e-05, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13215795159339905, |
| "step": 4015, |
| "valid_targets_mean": 5308.4, |
| "valid_targets_min": 2775 |
| }, |
| { |
| "epoch": 4.193009911319771, |
| "grad_norm": 0.5247016468745013, |
| "learning_rate": 1.6620399187361226e-05, |
| "loss": 0.19, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09403416514396667, |
| "step": 4020, |
| "valid_targets_mean": 4737.9, |
| "valid_targets_min": 1846 |
| }, |
| { |
| "epoch": 4.198226395409494, |
| "grad_norm": 0.5463858968727039, |
| "learning_rate": 1.656915400906336e-05, |
| "loss": 0.2073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12462165206670761, |
| "step": 4025, |
| "valid_targets_mean": 5254.2, |
| "valid_targets_min": 2690 |
| }, |
| { |
| "epoch": 4.203442879499217, |
| "grad_norm": 0.5437506670021418, |
| "learning_rate": 1.6517932027297525e-05, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10087625682353973, |
| "step": 4030, |
| "valid_targets_mean": 5404.0, |
| "valid_targets_min": 2414 |
| }, |
| { |
| "epoch": 4.208659363588941, |
| "grad_norm": 0.4920007300056477, |
| "learning_rate": 1.6466733588384233e-05, |
| "loss": 0.1941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0758361667394638, |
| "step": 4035, |
| "valid_targets_mean": 4849.0, |
| "valid_targets_min": 2562 |
| }, |
| { |
| "epoch": 4.213875847678665, |
| "grad_norm": 0.5334617341832782, |
| "learning_rate": 1.6415559038484827e-05, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09430640190839767, |
| "step": 4040, |
| "valid_targets_mean": 4943.1, |
| "valid_targets_min": 1510 |
| }, |
| { |
| "epoch": 4.219092331768388, |
| "grad_norm": 0.5275723874222573, |
| "learning_rate": 1.6364408723599116e-05, |
| "loss": 0.1771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09793593734502792, |
| "step": 4045, |
| "valid_targets_mean": 4466.1, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 4.2243088158581115, |
| "grad_norm": 0.5463254998017771, |
| "learning_rate": 1.6313282989563062e-05, |
| "loss": 0.1852, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09902290999889374, |
| "step": 4050, |
| "valid_targets_mean": 5299.5, |
| "valid_targets_min": 2944 |
| }, |
| { |
| "epoch": 4.229525299947835, |
| "grad_norm": 0.5464292051087032, |
| "learning_rate": 1.626218218204643e-05, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08867479115724564, |
| "step": 4055, |
| "valid_targets_mean": 4553.4, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 4.234741784037559, |
| "grad_norm": 0.5750184592559107, |
| "learning_rate": 1.6211106646550455e-05, |
| "loss": 0.1889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08512931317090988, |
| "step": 4060, |
| "valid_targets_mean": 4165.4, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 4.239958268127282, |
| "grad_norm": 0.482544491305686, |
| "learning_rate": 1.616005672840551e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0946473479270935, |
| "step": 4065, |
| "valid_targets_mean": 6244.1, |
| "valid_targets_min": 3696 |
| }, |
| { |
| "epoch": 4.245174752217006, |
| "grad_norm": 0.6441334590686112, |
| "learning_rate": 1.6109032772768736e-05, |
| "loss": 0.2125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12765106558799744, |
| "step": 4070, |
| "valid_targets_mean": 4555.0, |
| "valid_targets_min": 2488 |
| }, |
| { |
| "epoch": 4.250391236306729, |
| "grad_norm": 0.5467731898668896, |
| "learning_rate": 1.6058035124621766e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09254036843776703, |
| "step": 4075, |
| "valid_targets_mean": 4768.2, |
| "valid_targets_min": 1312 |
| }, |
| { |
| "epoch": 4.255607720396453, |
| "grad_norm": 0.5335943285352456, |
| "learning_rate": 1.6007064128768354e-05, |
| "loss": 0.1828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09836730360984802, |
| "step": 4080, |
| "valid_targets_mean": 4161.2, |
| "valid_targets_min": 2358 |
| }, |
| { |
| "epoch": 4.260824204486176, |
| "grad_norm": 0.505854543811336, |
| "learning_rate": 1.5956120129832054e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09282954782247543, |
| "step": 4085, |
| "valid_targets_mean": 5335.9, |
| "valid_targets_min": 2540 |
| }, |
| { |
| "epoch": 4.2660406885759, |
| "grad_norm": 0.5168993888236286, |
| "learning_rate": 1.5905203472253892e-05, |
| "loss": 0.1834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10466302931308746, |
| "step": 4090, |
| "valid_targets_mean": 5806.4, |
| "valid_targets_min": 1544 |
| }, |
| { |
| "epoch": 4.271257172665623, |
| "grad_norm": 0.5570781330788017, |
| "learning_rate": 1.5854314500290025e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08315970003604889, |
| "step": 4095, |
| "valid_targets_mean": 3761.0, |
| "valid_targets_min": 2307 |
| }, |
| { |
| "epoch": 4.276473656755347, |
| "grad_norm": 0.5180539101793878, |
| "learning_rate": 1.580345355800944e-05, |
| "loss": 0.189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10318869352340698, |
| "step": 4100, |
| "valid_targets_mean": 6067.6, |
| "valid_targets_min": 3533 |
| }, |
| { |
| "epoch": 4.28169014084507, |
| "grad_norm": 0.4759566364417453, |
| "learning_rate": 1.5752620989291592e-05, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08804687112569809, |
| "step": 4105, |
| "valid_targets_mean": 5481.1, |
| "valid_targets_min": 2230 |
| }, |
| { |
| "epoch": 4.286906624934794, |
| "grad_norm": 0.6145751936823841, |
| "learning_rate": 1.5701817137824108e-05, |
| "loss": 0.1901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08851298689842224, |
| "step": 4110, |
| "valid_targets_mean": 3818.9, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 4.2921231090245175, |
| "grad_norm": 0.52579025932417, |
| "learning_rate": 1.5651042347100452e-05, |
| "loss": 0.1938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11087971180677414, |
| "step": 4115, |
| "valid_targets_mean": 4957.0, |
| "valid_targets_min": 2571 |
| }, |
| { |
| "epoch": 4.297339593114241, |
| "grad_norm": 0.5076438247402, |
| "learning_rate": 1.5600296960417597e-05, |
| "loss": 0.1877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08762188255786896, |
| "step": 4120, |
| "valid_targets_mean": 4572.0, |
| "valid_targets_min": 2468 |
| }, |
| { |
| "epoch": 4.302556077203964, |
| "grad_norm": 0.5232042525437712, |
| "learning_rate": 1.5549581320873715e-05, |
| "loss": 0.1953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10302773863077164, |
| "step": 4125, |
| "valid_targets_mean": 5525.5, |
| "valid_targets_min": 3418 |
| }, |
| { |
| "epoch": 4.307772561293688, |
| "grad_norm": 0.5084431660923632, |
| "learning_rate": 1.549889577136586e-05, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0906180590391159, |
| "step": 4130, |
| "valid_targets_mean": 4597.6, |
| "valid_targets_min": 2371 |
| }, |
| { |
| "epoch": 4.312989045383412, |
| "grad_norm": 0.5164682116047572, |
| "learning_rate": 1.5448240654587622e-05, |
| "loss": 0.1873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08768324553966522, |
| "step": 4135, |
| "valid_targets_mean": 5027.8, |
| "valid_targets_min": 1861 |
| }, |
| { |
| "epoch": 4.318205529473135, |
| "grad_norm": 0.4705826792702526, |
| "learning_rate": 1.5397616313026853e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0866117849946022, |
| "step": 4140, |
| "valid_targets_mean": 5228.9, |
| "valid_targets_min": 4108 |
| }, |
| { |
| "epoch": 4.323422013562858, |
| "grad_norm": 0.5119602922505897, |
| "learning_rate": 1.5347023088963315e-05, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10736275464296341, |
| "step": 4145, |
| "valid_targets_mean": 4940.8, |
| "valid_targets_min": 2638 |
| }, |
| { |
| "epoch": 4.328638497652582, |
| "grad_norm": 0.5780230067512474, |
| "learning_rate": 1.5296461324466384e-05, |
| "loss": 0.1883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11072811484336853, |
| "step": 4150, |
| "valid_targets_mean": 3822.2, |
| "valid_targets_min": 1490 |
| }, |
| { |
| "epoch": 4.333854981742306, |
| "grad_norm": 0.45976859901606687, |
| "learning_rate": 1.5245931361392727e-05, |
| "loss": 0.1807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09216370433568954, |
| "step": 4155, |
| "valid_targets_mean": 5424.5, |
| "valid_targets_min": 2679 |
| }, |
| { |
| "epoch": 4.3390714658320295, |
| "grad_norm": 0.4822877754433266, |
| "learning_rate": 1.5195433541384009e-05, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09953758120536804, |
| "step": 4160, |
| "valid_targets_mean": 6368.4, |
| "valid_targets_min": 3936 |
| }, |
| { |
| "epoch": 4.344287949921752, |
| "grad_norm": 0.5462791770593632, |
| "learning_rate": 1.514496820586456e-05, |
| "loss": 0.198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11608624458312988, |
| "step": 4165, |
| "valid_targets_mean": 4398.8, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 4.349504434011476, |
| "grad_norm": 0.5280279895369452, |
| "learning_rate": 1.5094535696039067e-05, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08779674768447876, |
| "step": 4170, |
| "valid_targets_mean": 4909.9, |
| "valid_targets_min": 1002 |
| }, |
| { |
| "epoch": 4.3547209181012, |
| "grad_norm": 0.497296131238902, |
| "learning_rate": 1.50441363528903e-05, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08548164367675781, |
| "step": 4175, |
| "valid_targets_mean": 4348.1, |
| "valid_targets_min": 1040 |
| }, |
| { |
| "epoch": 4.359937402190924, |
| "grad_norm": 0.571056849057062, |
| "learning_rate": 1.4993770517176764e-05, |
| "loss": 0.1858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09022928774356842, |
| "step": 4180, |
| "valid_targets_mean": 4375.6, |
| "valid_targets_min": 1328 |
| }, |
| { |
| "epoch": 4.3651538862806465, |
| "grad_norm": 0.552954874618173, |
| "learning_rate": 1.4943438529430428e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11038275063037872, |
| "step": 4185, |
| "valid_targets_mean": 5781.0, |
| "valid_targets_min": 2714 |
| }, |
| { |
| "epoch": 4.37037037037037, |
| "grad_norm": 0.5709690624150761, |
| "learning_rate": 1.4893140729954402e-05, |
| "loss": 0.1796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07892560213804245, |
| "step": 4190, |
| "valid_targets_mean": 3561.4, |
| "valid_targets_min": 1302 |
| }, |
| { |
| "epoch": 4.375586854460094, |
| "grad_norm": 0.46304764562125006, |
| "learning_rate": 1.4842877458820644e-05, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07885998487472534, |
| "step": 4195, |
| "valid_targets_mean": 5008.0, |
| "valid_targets_min": 2734 |
| }, |
| { |
| "epoch": 4.380803338549818, |
| "grad_norm": 0.5489716863526718, |
| "learning_rate": 1.4792649055867668e-05, |
| "loss": 0.206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12214149534702301, |
| "step": 4200, |
| "valid_targets_mean": 5317.6, |
| "valid_targets_min": 3488 |
| }, |
| { |
| "epoch": 4.386019822639541, |
| "grad_norm": 0.5936222854237478, |
| "learning_rate": 1.474245586069822e-05, |
| "loss": 0.1897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10609170794487, |
| "step": 4205, |
| "valid_targets_mean": 3679.5, |
| "valid_targets_min": 1860 |
| }, |
| { |
| "epoch": 4.391236306729264, |
| "grad_norm": 0.8794519825330008, |
| "learning_rate": 1.4692298212677018e-05, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08555130660533905, |
| "step": 4210, |
| "valid_targets_mean": 4084.1, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 4.396452790818988, |
| "grad_norm": 0.5014053800504651, |
| "learning_rate": 1.464217645092843e-05, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10078731179237366, |
| "step": 4215, |
| "valid_targets_mean": 5622.2, |
| "valid_targets_min": 2675 |
| }, |
| { |
| "epoch": 4.401669274908712, |
| "grad_norm": 0.45310896431300557, |
| "learning_rate": 1.4592090914334206e-05, |
| "loss": 0.1913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08208087086677551, |
| "step": 4220, |
| "valid_targets_mean": 5558.6, |
| "valid_targets_min": 2868 |
| }, |
| { |
| "epoch": 4.406885758998435, |
| "grad_norm": 0.49986230812739674, |
| "learning_rate": 1.4542041941531136e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10097955167293549, |
| "step": 4225, |
| "valid_targets_mean": 5447.5, |
| "valid_targets_min": 2116 |
| }, |
| { |
| "epoch": 4.4121022430881585, |
| "grad_norm": 0.5059809184345644, |
| "learning_rate": 1.4492029870908835e-05, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09783491492271423, |
| "step": 4230, |
| "valid_targets_mean": 5252.1, |
| "valid_targets_min": 4056 |
| }, |
| { |
| "epoch": 4.417318727177882, |
| "grad_norm": 0.520314079146309, |
| "learning_rate": 1.4442055040607402e-05, |
| "loss": 0.1825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0887046605348587, |
| "step": 4235, |
| "valid_targets_mean": 4721.4, |
| "valid_targets_min": 2066 |
| }, |
| { |
| "epoch": 4.422535211267606, |
| "grad_norm": 0.6181759123091992, |
| "learning_rate": 1.4392117788515138e-05, |
| "loss": 0.1875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08616556227207184, |
| "step": 4240, |
| "valid_targets_mean": 3734.6, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 4.427751695357329, |
| "grad_norm": 0.4976989934186071, |
| "learning_rate": 1.4342218452266284e-05, |
| "loss": 0.2032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08760233223438263, |
| "step": 4245, |
| "valid_targets_mean": 3873.8, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 4.432968179447053, |
| "grad_norm": 0.5501596884251593, |
| "learning_rate": 1.4292357369238726e-05, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09641134738922119, |
| "step": 4250, |
| "valid_targets_mean": 5268.8, |
| "valid_targets_min": 1951 |
| }, |
| { |
| "epoch": 4.438184663536776, |
| "grad_norm": 0.48594084697619444, |
| "learning_rate": 1.42425348765517e-05, |
| "loss": 0.1804, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08059099316596985, |
| "step": 4255, |
| "valid_targets_mean": 5099.4, |
| "valid_targets_min": 1572 |
| }, |
| { |
| "epoch": 4.4434011476265, |
| "grad_norm": 0.48163357483780256, |
| "learning_rate": 1.4192751311063541e-05, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07465652376413345, |
| "step": 4260, |
| "valid_targets_mean": 4928.2, |
| "valid_targets_min": 1986 |
| }, |
| { |
| "epoch": 4.448617631716223, |
| "grad_norm": 0.5582075282557117, |
| "learning_rate": 1.4143007009369388e-05, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08925212919712067, |
| "step": 4265, |
| "valid_targets_mean": 4252.5, |
| "valid_targets_min": 2466 |
| }, |
| { |
| "epoch": 4.453834115805947, |
| "grad_norm": 0.49782397194604244, |
| "learning_rate": 1.4093302307798906e-05, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08925595879554749, |
| "step": 4270, |
| "valid_targets_mean": 4721.1, |
| "valid_targets_min": 2373 |
| }, |
| { |
| "epoch": 4.45905059989567, |
| "grad_norm": 0.5009132428350149, |
| "learning_rate": 1.4043637542414007e-05, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08160844445228577, |
| "step": 4275, |
| "valid_targets_mean": 3924.8, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 4.464267083985394, |
| "grad_norm": 0.5628054062789214, |
| "learning_rate": 1.399401304900661e-05, |
| "loss": 0.1847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09798973798751831, |
| "step": 4280, |
| "valid_targets_mean": 3923.4, |
| "valid_targets_min": 964 |
| }, |
| { |
| "epoch": 4.469483568075117, |
| "grad_norm": 0.585729577018991, |
| "learning_rate": 1.3944429163096332e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08872173726558685, |
| "step": 4285, |
| "valid_targets_mean": 3880.2, |
| "valid_targets_min": 1583 |
| }, |
| { |
| "epoch": 4.474700052164841, |
| "grad_norm": 0.5760467170898765, |
| "learning_rate": 1.3894886219928247e-05, |
| "loss": 0.1825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09322041273117065, |
| "step": 4290, |
| "valid_targets_mean": 3371.4, |
| "valid_targets_min": 1312 |
| }, |
| { |
| "epoch": 4.4799165362545645, |
| "grad_norm": 0.5291247471161196, |
| "learning_rate": 1.3845384554470596e-05, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08454497158527374, |
| "step": 4295, |
| "valid_targets_mean": 4669.1, |
| "valid_targets_min": 2090 |
| }, |
| { |
| "epoch": 4.485133020344288, |
| "grad_norm": 0.5617399480952876, |
| "learning_rate": 1.3795924501412542e-05, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09035874158143997, |
| "step": 4300, |
| "valid_targets_mean": 4323.1, |
| "valid_targets_min": 1451 |
| }, |
| { |
| "epoch": 4.490349504434011, |
| "grad_norm": 0.5485745370649264, |
| "learning_rate": 1.3746506395161901e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09074965864419937, |
| "step": 4305, |
| "valid_targets_mean": 4551.8, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 4.495565988523735, |
| "grad_norm": 0.5405262796801544, |
| "learning_rate": 1.3697130569842874e-05, |
| "loss": 0.196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10740135610103607, |
| "step": 4310, |
| "valid_targets_mean": 5237.6, |
| "valid_targets_min": 1602 |
| }, |
| { |
| "epoch": 4.500782472613459, |
| "grad_norm": 0.5557849275633413, |
| "learning_rate": 1.3647797359293797e-05, |
| "loss": 0.186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09277792274951935, |
| "step": 4315, |
| "valid_targets_mean": 3707.9, |
| "valid_targets_min": 1389 |
| }, |
| { |
| "epoch": 4.505998956703182, |
| "grad_norm": 0.48870583625018515, |
| "learning_rate": 1.359850709706489e-05, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09530732780694962, |
| "step": 4320, |
| "valid_targets_mean": 5565.2, |
| "valid_targets_min": 4395 |
| }, |
| { |
| "epoch": 4.511215440792905, |
| "grad_norm": 0.5622484777803662, |
| "learning_rate": 1.354926011641596e-05, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08089743554592133, |
| "step": 4325, |
| "valid_targets_mean": 3019.0, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 4.516431924882629, |
| "grad_norm": 0.5542477243808857, |
| "learning_rate": 1.3500056750314215e-05, |
| "loss": 0.1889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09326313436031342, |
| "step": 4330, |
| "valid_targets_mean": 3765.6, |
| "valid_targets_min": 2014 |
| }, |
| { |
| "epoch": 4.521648408972353, |
| "grad_norm": 0.5233146742760183, |
| "learning_rate": 1.345089733143196e-05, |
| "loss": 0.1856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10327020287513733, |
| "step": 4335, |
| "valid_targets_mean": 4620.4, |
| "valid_targets_min": 2016 |
| }, |
| { |
| "epoch": 4.5268648930620765, |
| "grad_norm": 0.4698810059913912, |
| "learning_rate": 1.3401782192144372e-05, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06537723541259766, |
| "step": 4340, |
| "valid_targets_mean": 4914.2, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 4.532081377151799, |
| "grad_norm": 0.4813674546712752, |
| "learning_rate": 1.3352711664527242e-05, |
| "loss": 0.1803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08028852939605713, |
| "step": 4345, |
| "valid_targets_mean": 4774.6, |
| "valid_targets_min": 1768 |
| }, |
| { |
| "epoch": 4.537297861241523, |
| "grad_norm": 0.55463033366809, |
| "learning_rate": 1.3303686080354739e-05, |
| "loss": 0.1941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0880127102136612, |
| "step": 4350, |
| "valid_targets_mean": 3802.6, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 4.542514345331247, |
| "grad_norm": 0.5472619983465714, |
| "learning_rate": 1.3254705771097154e-05, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10948982834815979, |
| "step": 4355, |
| "valid_targets_mean": 4689.6, |
| "valid_targets_min": 2202 |
| }, |
| { |
| "epoch": 4.547730829420971, |
| "grad_norm": 0.5603369394501863, |
| "learning_rate": 1.3205771067918675e-05, |
| "loss": 0.2016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07711246609687805, |
| "step": 4360, |
| "valid_targets_mean": 4079.0, |
| "valid_targets_min": 1105 |
| }, |
| { |
| "epoch": 4.5529473135106935, |
| "grad_norm": 0.5492810122172286, |
| "learning_rate": 1.3156882301675133e-05, |
| "loss": 0.1908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08386009186506271, |
| "step": 4365, |
| "valid_targets_mean": 3945.0, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 4.558163797600417, |
| "grad_norm": 0.4715280247213639, |
| "learning_rate": 1.3108039802911776e-05, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08024720102548599, |
| "step": 4370, |
| "valid_targets_mean": 5053.8, |
| "valid_targets_min": 2785 |
| }, |
| { |
| "epoch": 4.563380281690141, |
| "grad_norm": 0.5877837255800695, |
| "learning_rate": 1.3059243901861024e-05, |
| "loss": 0.1837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09088737517595291, |
| "step": 4375, |
| "valid_targets_mean": 3530.5, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 4.568596765779865, |
| "grad_norm": 0.5176398815331197, |
| "learning_rate": 1.3010494928440248e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09199392050504684, |
| "step": 4380, |
| "valid_targets_mean": 4320.6, |
| "valid_targets_min": 2250 |
| }, |
| { |
| "epoch": 4.573813249869588, |
| "grad_norm": 0.4934780148015792, |
| "learning_rate": 1.2961793212249527e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08720052242279053, |
| "step": 4385, |
| "valid_targets_mean": 4446.1, |
| "valid_targets_min": 2146 |
| }, |
| { |
| "epoch": 4.579029733959311, |
| "grad_norm": 0.4754133828329036, |
| "learning_rate": 1.2913139082569434e-05, |
| "loss": 0.18, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07586514949798584, |
| "step": 4390, |
| "valid_targets_mean": 4668.9, |
| "valid_targets_min": 1697 |
| }, |
| { |
| "epoch": 4.584246218049035, |
| "grad_norm": 0.49030213981053966, |
| "learning_rate": 1.2864532868358799e-05, |
| "loss": 0.1906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08727875351905823, |
| "step": 4395, |
| "valid_targets_mean": 6398.2, |
| "valid_targets_min": 2712 |
| }, |
| { |
| "epoch": 4.589462702138759, |
| "grad_norm": 0.4978857129207338, |
| "learning_rate": 1.2815974898252482e-05, |
| "loss": 0.1788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09104059636592865, |
| "step": 4400, |
| "valid_targets_mean": 5123.6, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 4.594679186228482, |
| "grad_norm": 0.5064315260591452, |
| "learning_rate": 1.2767465500559162e-05, |
| "loss": 0.1903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10585306584835052, |
| "step": 4405, |
| "valid_targets_mean": 5692.2, |
| "valid_targets_min": 1967 |
| }, |
| { |
| "epoch": 4.5998956703182055, |
| "grad_norm": 0.5367081628888567, |
| "learning_rate": 1.271900500325911e-05, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09236375987529755, |
| "step": 4410, |
| "valid_targets_mean": 4742.2, |
| "valid_targets_min": 1586 |
| }, |
| { |
| "epoch": 4.605112154407929, |
| "grad_norm": 0.5758230696012199, |
| "learning_rate": 1.2670593734001972e-05, |
| "loss": 0.1865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09824080020189285, |
| "step": 4415, |
| "valid_targets_mean": 4728.8, |
| "valid_targets_min": 3753 |
| }, |
| { |
| "epoch": 4.610328638497653, |
| "grad_norm": 0.4734993971322568, |
| "learning_rate": 1.2622232020104568e-05, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09226129949092865, |
| "step": 4420, |
| "valid_targets_mean": 5586.2, |
| "valid_targets_min": 2757 |
| }, |
| { |
| "epoch": 4.615545122587376, |
| "grad_norm": 0.4959936805670171, |
| "learning_rate": 1.2573920188548634e-05, |
| "loss": 0.1886, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10080541670322418, |
| "step": 4425, |
| "valid_targets_mean": 5626.9, |
| "valid_targets_min": 3439 |
| }, |
| { |
| "epoch": 4.6207616066771, |
| "grad_norm": 0.5551311601238801, |
| "learning_rate": 1.2525658565978668e-05, |
| "loss": 0.1993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11569254845380783, |
| "step": 4430, |
| "valid_targets_mean": 5708.4, |
| "valid_targets_min": 2079 |
| }, |
| { |
| "epoch": 4.625978090766823, |
| "grad_norm": 0.665499653435843, |
| "learning_rate": 1.2477447478699696e-05, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10402677953243256, |
| "step": 4435, |
| "valid_targets_mean": 3055.1, |
| "valid_targets_min": 1490 |
| }, |
| { |
| "epoch": 4.631194574856547, |
| "grad_norm": 0.6135164109299587, |
| "learning_rate": 1.2429287252675062e-05, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08897197991609573, |
| "step": 4440, |
| "valid_targets_mean": 4009.1, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 4.63641105894627, |
| "grad_norm": 0.6150723224583431, |
| "learning_rate": 1.2381178213524223e-05, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09846167266368866, |
| "step": 4445, |
| "valid_targets_mean": 3743.9, |
| "valid_targets_min": 2535 |
| }, |
| { |
| "epoch": 4.641627543035994, |
| "grad_norm": 0.4603297482, |
| "learning_rate": 1.2333120686520568e-05, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07244417071342468, |
| "step": 4450, |
| "valid_targets_mean": 4653.0, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 4.646844027125717, |
| "grad_norm": 0.5421584576747219, |
| "learning_rate": 1.2285114996589181e-05, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09737575054168701, |
| "step": 4455, |
| "valid_targets_mean": 4780.5, |
| "valid_targets_min": 1596 |
| }, |
| { |
| "epoch": 4.652060511215441, |
| "grad_norm": 0.5306503819722574, |
| "learning_rate": 1.2237161468304681e-05, |
| "loss": 0.1924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1015390157699585, |
| "step": 4460, |
| "valid_targets_mean": 4998.6, |
| "valid_targets_min": 2885 |
| }, |
| { |
| "epoch": 4.657276995305164, |
| "grad_norm": 0.48783463584651493, |
| "learning_rate": 1.218926042588902e-05, |
| "loss": 0.1851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07946668565273285, |
| "step": 4465, |
| "valid_targets_mean": 4776.6, |
| "valid_targets_min": 1922 |
| }, |
| { |
| "epoch": 4.662493479394888, |
| "grad_norm": 0.5305581567223895, |
| "learning_rate": 1.2141412193209274e-05, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09118214249610901, |
| "step": 4470, |
| "valid_targets_mean": 4462.5, |
| "valid_targets_min": 3245 |
| }, |
| { |
| "epoch": 4.6677099634846115, |
| "grad_norm": 0.4768961351208789, |
| "learning_rate": 1.2093617093775458e-05, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08062206208705902, |
| "step": 4475, |
| "valid_targets_mean": 5484.6, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 4.672926447574335, |
| "grad_norm": 0.5063335449476011, |
| "learning_rate": 1.2045875450738352e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07570169866085052, |
| "step": 4480, |
| "valid_targets_mean": 4700.0, |
| "valid_targets_min": 1504 |
| }, |
| { |
| "epoch": 4.678142931664058, |
| "grad_norm": 0.4568648722852648, |
| "learning_rate": 1.199818758688731e-05, |
| "loss": 0.1834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07844646275043488, |
| "step": 4485, |
| "valid_targets_mean": 4799.9, |
| "valid_targets_min": 1221 |
| }, |
| { |
| "epoch": 4.683359415753782, |
| "grad_norm": 0.5085681390429685, |
| "learning_rate": 1.1950553824648077e-05, |
| "loss": 0.1946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11995210498571396, |
| "step": 4490, |
| "valid_targets_mean": 5328.2, |
| "valid_targets_min": 2971 |
| }, |
| { |
| "epoch": 4.688575899843506, |
| "grad_norm": 0.5129356193317287, |
| "learning_rate": 1.1902974486080599e-05, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07197125256061554, |
| "step": 4495, |
| "valid_targets_mean": 3731.9, |
| "valid_targets_min": 2461 |
| }, |
| { |
| "epoch": 4.6937923839332285, |
| "grad_norm": 0.5253442583183974, |
| "learning_rate": 1.1855449892876858e-05, |
| "loss": 0.1953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09587593376636505, |
| "step": 4500, |
| "valid_targets_mean": 5387.5, |
| "valid_targets_min": 3194 |
| }, |
| { |
| "epoch": 4.699008868022952, |
| "grad_norm": 0.5519442551812616, |
| "learning_rate": 1.1807980366358699e-05, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12228633463382721, |
| "step": 4505, |
| "valid_targets_mean": 5418.8, |
| "valid_targets_min": 2167 |
| }, |
| { |
| "epoch": 4.704225352112676, |
| "grad_norm": 0.537327606366864, |
| "learning_rate": 1.1760566227475642e-05, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08802211284637451, |
| "step": 4510, |
| "valid_targets_mean": 4752.1, |
| "valid_targets_min": 1858 |
| }, |
| { |
| "epoch": 4.7094418362024, |
| "grad_norm": 0.5001814385756308, |
| "learning_rate": 1.1713207796802739e-05, |
| "loss": 0.1848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07559408247470856, |
| "step": 4515, |
| "valid_targets_mean": 4547.1, |
| "valid_targets_min": 2084 |
| }, |
| { |
| "epoch": 4.7146583202921235, |
| "grad_norm": 0.6139574218469945, |
| "learning_rate": 1.166590539453837e-05, |
| "loss": 0.2054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0800754651427269, |
| "step": 4520, |
| "valid_targets_mean": 2884.9, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 4.719874804381846, |
| "grad_norm": 0.44098987196857486, |
| "learning_rate": 1.1618659340502104e-05, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07793943583965302, |
| "step": 4525, |
| "valid_targets_mean": 5205.0, |
| "valid_targets_min": 3386 |
| }, |
| { |
| "epoch": 4.72509128847157, |
| "grad_norm": 0.5328520356066797, |
| "learning_rate": 1.157146995413252e-05, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09932157397270203, |
| "step": 4530, |
| "valid_targets_mean": 5007.4, |
| "valid_targets_min": 3180 |
| }, |
| { |
| "epoch": 4.730307772561294, |
| "grad_norm": 0.5714349312818425, |
| "learning_rate": 1.152433755448509e-05, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11112132668495178, |
| "step": 4535, |
| "valid_targets_mean": 4135.0, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 4.735524256651017, |
| "grad_norm": 0.6077934906569697, |
| "learning_rate": 1.1477262460229945e-05, |
| "loss": 0.1896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10875889658927917, |
| "step": 4540, |
| "valid_targets_mean": 4602.1, |
| "valid_targets_min": 2684 |
| }, |
| { |
| "epoch": 4.7407407407407405, |
| "grad_norm": 0.49634424152814044, |
| "learning_rate": 1.143024498964981e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08921676874160767, |
| "step": 4545, |
| "valid_targets_mean": 4846.4, |
| "valid_targets_min": 1671 |
| }, |
| { |
| "epoch": 4.745957224830464, |
| "grad_norm": 0.5484808828375776, |
| "learning_rate": 1.1383285460637766e-05, |
| "loss": 0.1924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08307075500488281, |
| "step": 4550, |
| "valid_targets_mean": 4329.8, |
| "valid_targets_min": 2076 |
| }, |
| { |
| "epoch": 4.751173708920188, |
| "grad_norm": 0.5699100757156194, |
| "learning_rate": 1.1336384190695172e-05, |
| "loss": 0.1889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0887555330991745, |
| "step": 4555, |
| "valid_targets_mean": 4386.0, |
| "valid_targets_min": 2263 |
| }, |
| { |
| "epoch": 4.756390193009912, |
| "grad_norm": 0.6162552932737473, |
| "learning_rate": 1.1289541496929466e-05, |
| "loss": 0.1934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1148238554596901, |
| "step": 4560, |
| "valid_targets_mean": 4499.8, |
| "valid_targets_min": 1708 |
| }, |
| { |
| "epoch": 4.761606677099635, |
| "grad_norm": 0.5482788011589695, |
| "learning_rate": 1.1242757696052044e-05, |
| "loss": 0.1924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12479747831821442, |
| "step": 4565, |
| "valid_targets_mean": 5401.1, |
| "valid_targets_min": 2918 |
| }, |
| { |
| "epoch": 4.766823161189358, |
| "grad_norm": 0.5888332418366768, |
| "learning_rate": 1.1196033104376141e-05, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09170383214950562, |
| "step": 4570, |
| "valid_targets_mean": 3555.5, |
| "valid_targets_min": 1731 |
| }, |
| { |
| "epoch": 4.772039645279082, |
| "grad_norm": 0.5317249435508927, |
| "learning_rate": 1.1149368037814644e-05, |
| "loss": 0.1924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10484310239553452, |
| "step": 4575, |
| "valid_targets_mean": 4555.9, |
| "valid_targets_min": 2096 |
| }, |
| { |
| "epoch": 4.777256129368805, |
| "grad_norm": 0.4799591252187416, |
| "learning_rate": 1.1102762811877974e-05, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08517284691333771, |
| "step": 4580, |
| "valid_targets_mean": 5683.2, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 4.782472613458529, |
| "grad_norm": 0.5368871499454133, |
| "learning_rate": 1.1056217741672e-05, |
| "loss": 0.1835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09460750967264175, |
| "step": 4585, |
| "valid_targets_mean": 4530.9, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 4.7876890975482524, |
| "grad_norm": 0.6264850463625782, |
| "learning_rate": 1.1009733141895823e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1226273775100708, |
| "step": 4590, |
| "valid_targets_mean": 3832.9, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 4.792905581637976, |
| "grad_norm": 0.5854870439324866, |
| "learning_rate": 1.0963309326839708e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09034893661737442, |
| "step": 4595, |
| "valid_targets_mean": 4724.6, |
| "valid_targets_min": 1686 |
| }, |
| { |
| "epoch": 4.7981220657277, |
| "grad_norm": 0.5325653015133102, |
| "learning_rate": 1.0916946610382966e-05, |
| "loss": 0.1859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0999528169631958, |
| "step": 4600, |
| "valid_targets_mean": 4824.1, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 4.803338549817423, |
| "grad_norm": 1.1082587355140117, |
| "learning_rate": 1.0870645305991772e-05, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09996119141578674, |
| "step": 4605, |
| "valid_targets_mean": 3833.6, |
| "valid_targets_min": 2319 |
| }, |
| { |
| "epoch": 4.808555033907147, |
| "grad_norm": 0.5691295113560585, |
| "learning_rate": 1.0824405726717119e-05, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10683897137641907, |
| "step": 4610, |
| "valid_targets_mean": 5273.0, |
| "valid_targets_min": 2815 |
| }, |
| { |
| "epoch": 4.81377151799687, |
| "grad_norm": 0.4870388968066102, |
| "learning_rate": 1.0778228185192639e-05, |
| "loss": 0.1902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10072125494480133, |
| "step": 4615, |
| "valid_targets_mean": 5368.4, |
| "valid_targets_min": 2944 |
| }, |
| { |
| "epoch": 4.818988002086593, |
| "grad_norm": 0.4751385993259293, |
| "learning_rate": 1.0732112993632539e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10202068090438843, |
| "step": 4620, |
| "valid_targets_mean": 6273.8, |
| "valid_targets_min": 3310 |
| }, |
| { |
| "epoch": 4.824204486176317, |
| "grad_norm": 0.5417469989722015, |
| "learning_rate": 1.0686060463829451e-05, |
| "loss": 0.1796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09483262896537781, |
| "step": 4625, |
| "valid_targets_mean": 4831.4, |
| "valid_targets_min": 3176 |
| }, |
| { |
| "epoch": 4.829420970266041, |
| "grad_norm": 0.5340135754400219, |
| "learning_rate": 1.0640070907152342e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08007314801216125, |
| "step": 4630, |
| "valid_targets_mean": 4769.1, |
| "valid_targets_min": 3676 |
| }, |
| { |
| "epoch": 4.834637454355764, |
| "grad_norm": 0.535400223422294, |
| "learning_rate": 1.0594144634544405e-05, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10891067236661911, |
| "step": 4635, |
| "valid_targets_mean": 5453.6, |
| "valid_targets_min": 2466 |
| }, |
| { |
| "epoch": 4.839853938445488, |
| "grad_norm": 0.5421802927843254, |
| "learning_rate": 1.0548281956520978e-05, |
| "loss": 0.1875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10159303992986679, |
| "step": 4640, |
| "valid_targets_mean": 4223.2, |
| "valid_targets_min": 1504 |
| }, |
| { |
| "epoch": 4.845070422535211, |
| "grad_norm": 0.4817463581579997, |
| "learning_rate": 1.0502483183167395e-05, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09178589284420013, |
| "step": 4645, |
| "valid_targets_mean": 5853.9, |
| "valid_targets_min": 3404 |
| }, |
| { |
| "epoch": 4.850286906624935, |
| "grad_norm": 0.4579589936355861, |
| "learning_rate": 1.0456748624136951e-05, |
| "loss": 0.1859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.089797243475914, |
| "step": 4650, |
| "valid_targets_mean": 5684.2, |
| "valid_targets_min": 1831 |
| }, |
| { |
| "epoch": 4.8555033907146585, |
| "grad_norm": 0.5325226015959841, |
| "learning_rate": 1.0411078588648756e-05, |
| "loss": 0.1919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10591491311788559, |
| "step": 4655, |
| "valid_targets_mean": 4545.8, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 4.860719874804381, |
| "grad_norm": 0.5359785835739626, |
| "learning_rate": 1.0365473385485662e-05, |
| "loss": 0.1953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11070498824119568, |
| "step": 4660, |
| "valid_targets_mean": 5118.9, |
| "valid_targets_min": 2572 |
| }, |
| { |
| "epoch": 4.865936358894105, |
| "grad_norm": 0.4681140800466057, |
| "learning_rate": 1.0319933322992206e-05, |
| "loss": 0.1652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06727112829685211, |
| "step": 4665, |
| "valid_targets_mean": 6828.0, |
| "valid_targets_min": 3398 |
| }, |
| { |
| "epoch": 4.871152842983829, |
| "grad_norm": 0.544596415614375, |
| "learning_rate": 1.0274458709072459e-05, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10550592839717865, |
| "step": 4670, |
| "valid_targets_mean": 4509.0, |
| "valid_targets_min": 1603 |
| }, |
| { |
| "epoch": 4.876369327073553, |
| "grad_norm": 0.5211494915877919, |
| "learning_rate": 1.022904985118803e-05, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08883964270353317, |
| "step": 4675, |
| "valid_targets_mean": 4939.5, |
| "valid_targets_min": 2072 |
| }, |
| { |
| "epoch": 4.881585811163276, |
| "grad_norm": 0.5366796706123248, |
| "learning_rate": 1.0183707056355883e-05, |
| "loss": 0.1884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08497545123100281, |
| "step": 4680, |
| "valid_targets_mean": 4657.1, |
| "valid_targets_min": 2882 |
| }, |
| { |
| "epoch": 4.886802295252999, |
| "grad_norm": 0.5538098669256223, |
| "learning_rate": 1.0138430631146372e-05, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09791304171085358, |
| "step": 4685, |
| "valid_targets_mean": 4562.9, |
| "valid_targets_min": 1733 |
| }, |
| { |
| "epoch": 4.892018779342723, |
| "grad_norm": 0.5122227553184248, |
| "learning_rate": 1.009322088168108e-05, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08409063518047333, |
| "step": 4690, |
| "valid_targets_mean": 4454.1, |
| "valid_targets_min": 2488 |
| }, |
| { |
| "epoch": 4.897235263432447, |
| "grad_norm": 0.47515776141982186, |
| "learning_rate": 1.0048078113630806e-05, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09185665845870972, |
| "step": 4695, |
| "valid_targets_mean": 5278.4, |
| "valid_targets_min": 2265 |
| }, |
| { |
| "epoch": 4.90245174752217, |
| "grad_norm": 0.4708229178412286, |
| "learning_rate": 1.0003002632213455e-05, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08610205352306366, |
| "step": 4700, |
| "valid_targets_mean": 5702.5, |
| "valid_targets_min": 1669 |
| }, |
| { |
| "epoch": 4.907668231611893, |
| "grad_norm": 0.5456843140599923, |
| "learning_rate": 9.95799474219202e-06, |
| "loss": 0.1782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08927833288908005, |
| "step": 4705, |
| "valid_targets_mean": 3771.5, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 4.912884715701617, |
| "grad_norm": 0.5304864811688249, |
| "learning_rate": 9.913054747872473e-06, |
| "loss": 0.1861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08944433927536011, |
| "step": 4710, |
| "valid_targets_mean": 3983.1, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 4.918101199791341, |
| "grad_norm": 0.5120679513132991, |
| "learning_rate": 9.868182953101754e-06, |
| "loss": 0.1805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09833677113056183, |
| "step": 4715, |
| "valid_targets_mean": 4892.6, |
| "valid_targets_min": 1868 |
| }, |
| { |
| "epoch": 4.923317683881065, |
| "grad_norm": 0.4740197796982808, |
| "learning_rate": 9.823379661265677e-06, |
| "loss": 0.1858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09384319186210632, |
| "step": 4720, |
| "valid_targets_mean": 5562.9, |
| "valid_targets_min": 1211 |
| }, |
| { |
| "epoch": 4.9285341679707875, |
| "grad_norm": 0.5754044617169406, |
| "learning_rate": 9.778645175286904e-06, |
| "loss": 0.1886, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09790576994419098, |
| "step": 4725, |
| "valid_targets_mean": 3851.1, |
| "valid_targets_min": 2615 |
| }, |
| { |
| "epoch": 4.933750652060511, |
| "grad_norm": 0.5467350049580387, |
| "learning_rate": 9.733979797622874e-06, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08118186891078949, |
| "step": 4730, |
| "valid_targets_mean": 4144.5, |
| "valid_targets_min": 2603 |
| }, |
| { |
| "epoch": 4.938967136150235, |
| "grad_norm": 0.5391696977368485, |
| "learning_rate": 9.689383830263808e-06, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09587861597537994, |
| "step": 4735, |
| "valid_targets_mean": 4530.6, |
| "valid_targets_min": 1367 |
| }, |
| { |
| "epoch": 4.944183620239958, |
| "grad_norm": 0.5053495433942577, |
| "learning_rate": 9.6448575747306e-06, |
| "loss": 0.1873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09295158088207245, |
| "step": 4740, |
| "valid_targets_mean": 5147.0, |
| "valid_targets_min": 2828 |
| }, |
| { |
| "epoch": 4.949400104329682, |
| "grad_norm": 0.5045776281748604, |
| "learning_rate": 9.60040133207281e-06, |
| "loss": 0.1805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10613466799259186, |
| "step": 4745, |
| "valid_targets_mean": 5857.0, |
| "valid_targets_min": 1833 |
| }, |
| { |
| "epoch": 4.954616588419405, |
| "grad_norm": 0.6058619681222275, |
| "learning_rate": 9.556015402866661e-06, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09133664518594742, |
| "step": 4750, |
| "valid_targets_mean": 4276.0, |
| "valid_targets_min": 1717 |
| }, |
| { |
| "epoch": 4.959833072509129, |
| "grad_norm": 0.4959626512225186, |
| "learning_rate": 9.511700087212934e-06, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07980967313051224, |
| "step": 4755, |
| "valid_targets_mean": 5189.9, |
| "valid_targets_min": 1708 |
| }, |
| { |
| "epoch": 4.965049556598853, |
| "grad_norm": 0.48580137728306516, |
| "learning_rate": 9.467455684735015e-06, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09308650344610214, |
| "step": 4760, |
| "valid_targets_mean": 5298.2, |
| "valid_targets_min": 2556 |
| }, |
| { |
| "epoch": 4.970266040688576, |
| "grad_norm": 0.5535867237148877, |
| "learning_rate": 9.423282494576804e-06, |
| "loss": 0.1985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10663655400276184, |
| "step": 4765, |
| "valid_targets_mean": 3930.9, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 4.975482524778299, |
| "grad_norm": 0.4835117585178872, |
| "learning_rate": 9.379180815400753e-06, |
| "loss": 0.1835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08318492770195007, |
| "step": 4770, |
| "valid_targets_mean": 4649.0, |
| "valid_targets_min": 1607 |
| }, |
| { |
| "epoch": 4.980699008868023, |
| "grad_norm": 0.5328360355929028, |
| "learning_rate": 9.33515094538579e-06, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11444680392742157, |
| "step": 4775, |
| "valid_targets_mean": 4569.6, |
| "valid_targets_min": 2494 |
| }, |
| { |
| "epoch": 4.985915492957746, |
| "grad_norm": 2.34205486469549, |
| "learning_rate": 9.291193182225341e-06, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09870575368404388, |
| "step": 4780, |
| "valid_targets_mean": 4542.0, |
| "valid_targets_min": 2048 |
| }, |
| { |
| "epoch": 4.99113197704747, |
| "grad_norm": 0.5444826085311868, |
| "learning_rate": 9.247307823125296e-06, |
| "loss": 0.1827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09969726204872131, |
| "step": 4785, |
| "valid_targets_mean": 4778.9, |
| "valid_targets_min": 2030 |
| }, |
| { |
| "epoch": 4.9963484611371936, |
| "grad_norm": 0.4600774725768868, |
| "learning_rate": 9.203495164802027e-06, |
| "loss": 0.175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08270413428544998, |
| "step": 4790, |
| "valid_targets_mean": 4215.5, |
| "valid_targets_min": 1426 |
| }, |
| { |
| "epoch": 5.001043296817945, |
| "grad_norm": 0.5767089850528268, |
| "learning_rate": 9.159755503480345e-06, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09802889823913574, |
| "step": 4795, |
| "valid_targets_mean": 3765.0, |
| "valid_targets_min": 2046 |
| }, |
| { |
| "epoch": 5.006259780907668, |
| "grad_norm": 0.5088779515908076, |
| "learning_rate": 9.116089134891532e-06, |
| "loss": 0.1824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08812258392572403, |
| "step": 4800, |
| "valid_targets_mean": 4855.0, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 5.011476264997392, |
| "grad_norm": 0.5579258578134513, |
| "learning_rate": 9.072496354271307e-06, |
| "loss": 0.18, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10268765687942505, |
| "step": 4805, |
| "valid_targets_mean": 5290.8, |
| "valid_targets_min": 2498 |
| }, |
| { |
| "epoch": 5.016692749087115, |
| "grad_norm": 0.49026031524788816, |
| "learning_rate": 9.028977456357872e-06, |
| "loss": 0.1696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08821749687194824, |
| "step": 4810, |
| "valid_targets_mean": 4934.0, |
| "valid_targets_min": 2634 |
| }, |
| { |
| "epoch": 5.021909233176839, |
| "grad_norm": 0.5755929497427029, |
| "learning_rate": 8.985532735389873e-06, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09229262173175812, |
| "step": 4815, |
| "valid_targets_mean": 4120.2, |
| "valid_targets_min": 2454 |
| }, |
| { |
| "epoch": 5.027125717266562, |
| "grad_norm": 0.4788832049075145, |
| "learning_rate": 8.942162485104436e-06, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10502435266971588, |
| "step": 4820, |
| "valid_targets_mean": 7206.6, |
| "valid_targets_min": 3051 |
| }, |
| { |
| "epoch": 5.032342201356286, |
| "grad_norm": 0.5452723647928759, |
| "learning_rate": 8.898866998735195e-06, |
| "loss": 0.1844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07429133355617523, |
| "step": 4825, |
| "valid_targets_mean": 5484.9, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 5.037558685446009, |
| "grad_norm": 0.4701185100292731, |
| "learning_rate": 8.85564656901028e-06, |
| "loss": 0.2003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07872854173183441, |
| "step": 4830, |
| "valid_targets_mean": 6550.2, |
| "valid_targets_min": 2823 |
| }, |
| { |
| "epoch": 5.042775169535733, |
| "grad_norm": 0.5136050624625815, |
| "learning_rate": 8.81250148815035e-06, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09415871649980545, |
| "step": 4835, |
| "valid_targets_mean": 5931.8, |
| "valid_targets_min": 3171 |
| }, |
| { |
| "epoch": 5.0479916536254565, |
| "grad_norm": 0.52701581256359, |
| "learning_rate": 8.769432047866608e-06, |
| "loss": 0.1759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09285668283700943, |
| "step": 4840, |
| "valid_targets_mean": 5262.5, |
| "valid_targets_min": 2397 |
| }, |
| { |
| "epoch": 5.05320813771518, |
| "grad_norm": 0.49187753178141813, |
| "learning_rate": 8.72643853935887e-06, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07486429065465927, |
| "step": 4845, |
| "valid_targets_mean": 5657.0, |
| "valid_targets_min": 2807 |
| }, |
| { |
| "epoch": 5.058424621804903, |
| "grad_norm": 0.5222415808875729, |
| "learning_rate": 8.683521253313527e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0767851322889328, |
| "step": 4850, |
| "valid_targets_mean": 5430.5, |
| "valid_targets_min": 1363 |
| }, |
| { |
| "epoch": 5.063641105894627, |
| "grad_norm": 0.5849510322338102, |
| "learning_rate": 8.640680479901648e-06, |
| "loss": 0.1754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1165381669998169, |
| "step": 4855, |
| "valid_targets_mean": 5751.6, |
| "valid_targets_min": 1450 |
| }, |
| { |
| "epoch": 5.068857589984351, |
| "grad_norm": 0.552824844759434, |
| "learning_rate": 8.597916508776958e-06, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08179624378681183, |
| "step": 4860, |
| "valid_targets_mean": 4421.5, |
| "valid_targets_min": 2044 |
| }, |
| { |
| "epoch": 5.074074074074074, |
| "grad_norm": 0.5852806584482265, |
| "learning_rate": 8.55522962907394e-06, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09368069469928741, |
| "step": 4865, |
| "valid_targets_mean": 4771.2, |
| "valid_targets_min": 2303 |
| }, |
| { |
| "epoch": 5.079290558163797, |
| "grad_norm": 0.5656026175754425, |
| "learning_rate": 8.512620129405816e-06, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08062414079904556, |
| "step": 4870, |
| "valid_targets_mean": 4366.1, |
| "valid_targets_min": 1651 |
| }, |
| { |
| "epoch": 5.084507042253521, |
| "grad_norm": 0.6056679184030501, |
| "learning_rate": 8.470088297862669e-06, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.093223437666893, |
| "step": 4875, |
| "valid_targets_mean": 4162.6, |
| "valid_targets_min": 1806 |
| }, |
| { |
| "epoch": 5.089723526343245, |
| "grad_norm": 0.46297603218535177, |
| "learning_rate": 8.427634422009399e-06, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06911472976207733, |
| "step": 4880, |
| "valid_targets_mean": 4408.1, |
| "valid_targets_min": 182 |
| }, |
| { |
| "epoch": 5.0949400104329685, |
| "grad_norm": 0.480165349242614, |
| "learning_rate": 8.385258788883889e-06, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.080543652176857, |
| "step": 4885, |
| "valid_targets_mean": 5390.2, |
| "valid_targets_min": 2339 |
| }, |
| { |
| "epoch": 5.100156494522691, |
| "grad_norm": 0.6187632230317968, |
| "learning_rate": 8.342961684994975e-06, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09540046751499176, |
| "step": 4890, |
| "valid_targets_mean": 4305.9, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 5.105372978612415, |
| "grad_norm": 0.5014931985409201, |
| "learning_rate": 8.300743396320566e-06, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09194246679544449, |
| "step": 4895, |
| "valid_targets_mean": 5965.2, |
| "valid_targets_min": 4203 |
| }, |
| { |
| "epoch": 5.110589462702139, |
| "grad_norm": 0.4761619942669461, |
| "learning_rate": 8.25860420830567e-06, |
| "loss": 0.1843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08677559345960617, |
| "step": 4900, |
| "valid_targets_mean": 6193.1, |
| "valid_targets_min": 2616 |
| }, |
| { |
| "epoch": 5.115805946791863, |
| "grad_norm": 0.5438438081832728, |
| "learning_rate": 8.216544405860482e-06, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07954394817352295, |
| "step": 4905, |
| "valid_targets_mean": 4145.0, |
| "valid_targets_min": 1802 |
| }, |
| { |
| "epoch": 5.1210224308815855, |
| "grad_norm": 0.5844190463597226, |
| "learning_rate": 8.17456427335848e-06, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0916503518819809, |
| "step": 4910, |
| "valid_targets_mean": 4599.1, |
| "valid_targets_min": 3185 |
| }, |
| { |
| "epoch": 5.126238914971309, |
| "grad_norm": 0.4767795377130653, |
| "learning_rate": 8.132664094634452e-06, |
| "loss": 0.1774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07637080550193787, |
| "step": 4915, |
| "valid_targets_mean": 5424.6, |
| "valid_targets_min": 1951 |
| }, |
| { |
| "epoch": 5.131455399061033, |
| "grad_norm": 0.5719534354285207, |
| "learning_rate": 8.090844152982628e-06, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0903482586145401, |
| "step": 4920, |
| "valid_targets_mean": 4490.8, |
| "valid_targets_min": 3336 |
| }, |
| { |
| "epoch": 5.136671883150757, |
| "grad_norm": 0.594228113828102, |
| "learning_rate": 8.049104731154722e-06, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10992646217346191, |
| "step": 4925, |
| "valid_targets_mean": 4066.6, |
| "valid_targets_min": 1850 |
| }, |
| { |
| "epoch": 5.14188836724048, |
| "grad_norm": 0.5393641346325978, |
| "learning_rate": 8.007446111358066e-06, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10360969603061676, |
| "step": 4930, |
| "valid_targets_mean": 5236.2, |
| "valid_targets_min": 1630 |
| }, |
| { |
| "epoch": 5.147104851330203, |
| "grad_norm": 0.8629098322126454, |
| "learning_rate": 7.965868575253632e-06, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08919937908649445, |
| "step": 4935, |
| "valid_targets_mean": 5563.1, |
| "valid_targets_min": 3712 |
| }, |
| { |
| "epoch": 5.152321335419927, |
| "grad_norm": 0.5271937265549865, |
| "learning_rate": 7.92437240395422e-06, |
| "loss": 0.1701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07373526692390442, |
| "step": 4940, |
| "valid_targets_mean": 4110.0, |
| "valid_targets_min": 2084 |
| }, |
| { |
| "epoch": 5.157537819509651, |
| "grad_norm": 0.5319044522991199, |
| "learning_rate": 7.882957878022472e-06, |
| "loss": 0.17, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10028360038995743, |
| "step": 4945, |
| "valid_targets_mean": 4937.0, |
| "valid_targets_min": 1926 |
| }, |
| { |
| "epoch": 5.162754303599374, |
| "grad_norm": 0.5770944750107858, |
| "learning_rate": 7.841625277469043e-06, |
| "loss": 0.176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09501786530017853, |
| "step": 4950, |
| "valid_targets_mean": 4708.1, |
| "valid_targets_min": 1991 |
| }, |
| { |
| "epoch": 5.1679707876890975, |
| "grad_norm": 0.5449691133821197, |
| "learning_rate": 7.800374881750644e-06, |
| "loss": 0.1743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09172935783863068, |
| "step": 4955, |
| "valid_targets_mean": 4663.4, |
| "valid_targets_min": 1223 |
| }, |
| { |
| "epoch": 5.173187271778821, |
| "grad_norm": 0.5307143737733113, |
| "learning_rate": 7.759206969768216e-06, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07758703082799911, |
| "step": 4960, |
| "valid_targets_mean": 4877.8, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 5.178403755868545, |
| "grad_norm": 0.5757575845426983, |
| "learning_rate": 7.718121819864983e-06, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0805349200963974, |
| "step": 4965, |
| "valid_targets_mean": 4184.6, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 5.183620239958268, |
| "grad_norm": 0.5721969021340418, |
| "learning_rate": 7.677119709824635e-06, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07684718072414398, |
| "step": 4970, |
| "valid_targets_mean": 4147.8, |
| "valid_targets_min": 1616 |
| }, |
| { |
| "epoch": 5.188836724047992, |
| "grad_norm": 0.5078691963548261, |
| "learning_rate": 7.636200916869387e-06, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08875864744186401, |
| "step": 4975, |
| "valid_targets_mean": 5011.4, |
| "valid_targets_min": 1036 |
| }, |
| { |
| "epoch": 5.194053208137715, |
| "grad_norm": 0.5524157308543848, |
| "learning_rate": 7.595365717658143e-06, |
| "loss": 0.1844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.083509162068367, |
| "step": 4980, |
| "valid_targets_mean": 4123.9, |
| "valid_targets_min": 1454 |
| }, |
| { |
| "epoch": 5.199269692227439, |
| "grad_norm": 0.51400023936975, |
| "learning_rate": 7.554614388284609e-06, |
| "loss": 0.1851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08999491482973099, |
| "step": 4985, |
| "valid_targets_mean": 4854.6, |
| "valid_targets_min": 2395 |
| }, |
| { |
| "epoch": 5.204486176317162, |
| "grad_norm": 0.5864600154596398, |
| "learning_rate": 7.513947204275453e-06, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09562638401985168, |
| "step": 4990, |
| "valid_targets_mean": 4584.2, |
| "valid_targets_min": 2267 |
| }, |
| { |
| "epoch": 5.209702660406886, |
| "grad_norm": 0.5532188252087719, |
| "learning_rate": 7.473364440588404e-06, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0839436799287796, |
| "step": 4995, |
| "valid_targets_mean": 4932.2, |
| "valid_targets_min": 1548 |
| }, |
| { |
| "epoch": 5.214919144496609, |
| "grad_norm": 0.6299330322378309, |
| "learning_rate": 7.432866371610403e-06, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08354543149471283, |
| "step": 5000, |
| "valid_targets_mean": 4348.8, |
| "valid_targets_min": 1748 |
| }, |
| { |
| "epoch": 5.220135628586333, |
| "grad_norm": 0.4959684289084111, |
| "learning_rate": 7.392453271155786e-06, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08260548859834671, |
| "step": 5005, |
| "valid_targets_mean": 5807.4, |
| "valid_targets_min": 1669 |
| }, |
| { |
| "epoch": 5.225352112676056, |
| "grad_norm": 0.5620999384066929, |
| "learning_rate": 7.352125412464368e-06, |
| "loss": 0.1717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0748911052942276, |
| "step": 5010, |
| "valid_targets_mean": 4590.0, |
| "valid_targets_min": 1848 |
| }, |
| { |
| "epoch": 5.23056859676578, |
| "grad_norm": 0.5581675018957084, |
| "learning_rate": 7.311883068199659e-06, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0873471274971962, |
| "step": 5015, |
| "valid_targets_mean": 4160.9, |
| "valid_targets_min": 1793 |
| }, |
| { |
| "epoch": 5.2357850808555035, |
| "grad_norm": 0.5052128067171061, |
| "learning_rate": 7.271726510446968e-06, |
| "loss": 0.1781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08994010090827942, |
| "step": 5020, |
| "valid_targets_mean": 5267.4, |
| "valid_targets_min": 3135 |
| }, |
| { |
| "epoch": 5.241001564945227, |
| "grad_norm": 0.4877172138308242, |
| "learning_rate": 7.231656010711609e-06, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08713434636592865, |
| "step": 5025, |
| "valid_targets_mean": 5588.8, |
| "valid_targets_min": 3191 |
| }, |
| { |
| "epoch": 5.24621804903495, |
| "grad_norm": 0.5816293543459301, |
| "learning_rate": 7.191671839917025e-06, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09546761214733124, |
| "step": 5030, |
| "valid_targets_mean": 4677.6, |
| "valid_targets_min": 3102 |
| }, |
| { |
| "epoch": 5.251434533124674, |
| "grad_norm": 0.5452525730299029, |
| "learning_rate": 7.15177426840298e-06, |
| "loss": 0.1813, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09644042700529099, |
| "step": 5035, |
| "valid_targets_mean": 5553.9, |
| "valid_targets_min": 2409 |
| }, |
| { |
| "epoch": 5.256651017214398, |
| "grad_norm": 0.5146838047889054, |
| "learning_rate": 7.111963565923723e-06, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08240243792533875, |
| "step": 5040, |
| "valid_targets_mean": 5156.4, |
| "valid_targets_min": 2389 |
| }, |
| { |
| "epoch": 5.261867501304121, |
| "grad_norm": 0.5502902856949233, |
| "learning_rate": 7.07224000164618e-06, |
| "loss": 0.1692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10105292499065399, |
| "step": 5045, |
| "valid_targets_mean": 4615.9, |
| "valid_targets_min": 2221 |
| }, |
| { |
| "epoch": 5.267083985393844, |
| "grad_norm": 0.5516918505283356, |
| "learning_rate": 7.032603844148098e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09628251194953918, |
| "step": 5050, |
| "valid_targets_mean": 5681.5, |
| "valid_targets_min": 3383 |
| }, |
| { |
| "epoch": 5.272300469483568, |
| "grad_norm": 0.5388756000981851, |
| "learning_rate": 6.993055361416281e-06, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09925254434347153, |
| "step": 5055, |
| "valid_targets_mean": 4482.9, |
| "valid_targets_min": 3670 |
| }, |
| { |
| "epoch": 5.277516953573292, |
| "grad_norm": 0.5006488169663625, |
| "learning_rate": 6.953594820844725e-06, |
| "loss": 0.1721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08879800140857697, |
| "step": 5060, |
| "valid_targets_mean": 6420.1, |
| "valid_targets_min": 3558 |
| }, |
| { |
| "epoch": 5.2827334376630155, |
| "grad_norm": 0.5560127327398505, |
| "learning_rate": 6.914222489232834e-06, |
| "loss": 0.1602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0899522602558136, |
| "step": 5065, |
| "valid_targets_mean": 5202.9, |
| "valid_targets_min": 3176 |
| }, |
| { |
| "epoch": 5.287949921752738, |
| "grad_norm": 0.6756236046106081, |
| "learning_rate": 6.874938632783639e-06, |
| "loss": 0.1755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08966085314750671, |
| "step": 5070, |
| "valid_targets_mean": 3571.6, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 5.293166405842462, |
| "grad_norm": 0.5422017060339238, |
| "learning_rate": 6.835743517101947e-06, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08440357446670532, |
| "step": 5075, |
| "valid_targets_mean": 4761.0, |
| "valid_targets_min": 1624 |
| }, |
| { |
| "epoch": 5.298382889932186, |
| "grad_norm": 0.5591333270753611, |
| "learning_rate": 6.796637407192608e-06, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07776360213756561, |
| "step": 5080, |
| "valid_targets_mean": 4593.9, |
| "valid_targets_min": 2015 |
| }, |
| { |
| "epoch": 5.30359937402191, |
| "grad_norm": 0.6151205137047357, |
| "learning_rate": 6.7576205674586405e-06, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0986764132976532, |
| "step": 5085, |
| "valid_targets_mean": 3976.8, |
| "valid_targets_min": 1415 |
| }, |
| { |
| "epoch": 5.3088158581116325, |
| "grad_norm": 0.5539153347512382, |
| "learning_rate": 6.718693261699542e-06, |
| "loss": 0.1739, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08884495496749878, |
| "step": 5090, |
| "valid_targets_mean": 4511.4, |
| "valid_targets_min": 2240 |
| }, |
| { |
| "epoch": 5.314032342201356, |
| "grad_norm": 0.5839635887811082, |
| "learning_rate": 6.679855753109419e-06, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0866798609495163, |
| "step": 5095, |
| "valid_targets_mean": 3695.5, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 5.31924882629108, |
| "grad_norm": 0.524703444091149, |
| "learning_rate": 6.64110830427527e-06, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07154019176959991, |
| "step": 5100, |
| "valid_targets_mean": 4561.2, |
| "valid_targets_min": 2558 |
| }, |
| { |
| "epoch": 5.324465310380804, |
| "grad_norm": 0.5815298167263548, |
| "learning_rate": 6.602451177175162e-06, |
| "loss": 0.1733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08907519280910492, |
| "step": 5105, |
| "valid_targets_mean": 3357.4, |
| "valid_targets_min": 2213 |
| }, |
| { |
| "epoch": 5.329681794470527, |
| "grad_norm": 0.4817977233073812, |
| "learning_rate": 6.563884633176505e-06, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08714839071035385, |
| "step": 5110, |
| "valid_targets_mean": 5580.0, |
| "valid_targets_min": 2439 |
| }, |
| { |
| "epoch": 5.33489827856025, |
| "grad_norm": 0.5242439779801624, |
| "learning_rate": 6.5254089330342366e-06, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07945850491523743, |
| "step": 5115, |
| "valid_targets_mean": 4681.1, |
| "valid_targets_min": 3074 |
| }, |
| { |
| "epoch": 5.340114762649974, |
| "grad_norm": 0.5615047976477149, |
| "learning_rate": 6.487024336889107e-06, |
| "loss": 0.1803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09414586424827576, |
| "step": 5120, |
| "valid_targets_mean": 5437.2, |
| "valid_targets_min": 2212 |
| }, |
| { |
| "epoch": 5.345331246739698, |
| "grad_norm": 0.5258908501065038, |
| "learning_rate": 6.448731104265871e-06, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10087031126022339, |
| "step": 5125, |
| "valid_targets_mean": 5349.8, |
| "valid_targets_min": 2886 |
| }, |
| { |
| "epoch": 5.350547730829421, |
| "grad_norm": 0.5321933147958745, |
| "learning_rate": 6.410529494071596e-06, |
| "loss": 0.176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09096763283014297, |
| "step": 5130, |
| "valid_targets_mean": 5575.4, |
| "valid_targets_min": 1571 |
| }, |
| { |
| "epoch": 5.3557642149191445, |
| "grad_norm": 0.47426003796053384, |
| "learning_rate": 6.372419764593825e-06, |
| "loss": 0.1775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08991380780935287, |
| "step": 5135, |
| "valid_targets_mean": 6106.4, |
| "valid_targets_min": 3744 |
| }, |
| { |
| "epoch": 5.360980699008868, |
| "grad_norm": 0.5301388683550673, |
| "learning_rate": 6.334402173498926e-06, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07810938358306885, |
| "step": 5140, |
| "valid_targets_mean": 4348.8, |
| "valid_targets_min": 2076 |
| }, |
| { |
| "epoch": 5.366197183098592, |
| "grad_norm": 0.5374279733696077, |
| "learning_rate": 6.296476977830272e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08754917979240417, |
| "step": 5145, |
| "valid_targets_mean": 5014.2, |
| "valid_targets_min": 2862 |
| }, |
| { |
| "epoch": 5.371413667188315, |
| "grad_norm": 0.7206731702211141, |
| "learning_rate": 6.2586444340065625e-06, |
| "loss": 0.186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0999416708946228, |
| "step": 5150, |
| "valid_targets_mean": 4403.9, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 5.376630151278039, |
| "grad_norm": 0.47298145612120657, |
| "learning_rate": 6.22090479782004e-06, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07644212245941162, |
| "step": 5155, |
| "valid_targets_mean": 4559.2, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 5.381846635367762, |
| "grad_norm": 0.6183890277166507, |
| "learning_rate": 6.18325832443478e-06, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09842634201049805, |
| "step": 5160, |
| "valid_targets_mean": 4859.1, |
| "valid_targets_min": 3053 |
| }, |
| { |
| "epoch": 5.387063119457486, |
| "grad_norm": 0.5809269936749796, |
| "learning_rate": 6.145705268384996e-06, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08372758328914642, |
| "step": 5165, |
| "valid_targets_mean": 4085.4, |
| "valid_targets_min": 1622 |
| }, |
| { |
| "epoch": 5.392279603547209, |
| "grad_norm": 0.4953269082886467, |
| "learning_rate": 6.108245883573258e-06, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08300064504146576, |
| "step": 5170, |
| "valid_targets_mean": 5048.5, |
| "valid_targets_min": 2023 |
| }, |
| { |
| "epoch": 5.397496087636933, |
| "grad_norm": 0.5175745081691734, |
| "learning_rate": 6.070880423268839e-06, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08488012105226517, |
| "step": 5175, |
| "valid_targets_mean": 5152.5, |
| "valid_targets_min": 3232 |
| }, |
| { |
| "epoch": 5.402712571726656, |
| "grad_norm": 0.5076264348082026, |
| "learning_rate": 6.033609140105949e-06, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07731913775205612, |
| "step": 5180, |
| "valid_targets_mean": 4969.0, |
| "valid_targets_min": 1591 |
| }, |
| { |
| "epoch": 5.40792905581638, |
| "grad_norm": 0.5404816837020461, |
| "learning_rate": 5.996432286082061e-06, |
| "loss": 0.1809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09518995881080627, |
| "step": 5185, |
| "valid_targets_mean": 5947.1, |
| "valid_targets_min": 2923 |
| }, |
| { |
| "epoch": 5.413145539906103, |
| "grad_norm": 0.5159738238694263, |
| "learning_rate": 5.9593501125561885e-06, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07734167575836182, |
| "step": 5190, |
| "valid_targets_mean": 5073.8, |
| "valid_targets_min": 3352 |
| }, |
| { |
| "epoch": 5.418362023995827, |
| "grad_norm": 0.5684634602268366, |
| "learning_rate": 5.922362870247214e-06, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10236285626888275, |
| "step": 5195, |
| "valid_targets_mean": 4632.4, |
| "valid_targets_min": 2124 |
| }, |
| { |
| "epoch": 5.4235785080855505, |
| "grad_norm": 0.5373820991292663, |
| "learning_rate": 5.885470809232143e-06, |
| "loss": 0.1743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07851923257112503, |
| "step": 5200, |
| "valid_targets_mean": 4475.5, |
| "valid_targets_min": 1766 |
| }, |
| { |
| "epoch": 5.428794992175274, |
| "grad_norm": 0.5458806892088824, |
| "learning_rate": 5.8486741789444804e-06, |
| "loss": 0.1735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0888456404209137, |
| "step": 5205, |
| "valid_targets_mean": 4564.1, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 5.434011476264997, |
| "grad_norm": 0.5479391419138662, |
| "learning_rate": 5.8119732281724715e-06, |
| "loss": 0.1674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09237441420555115, |
| "step": 5210, |
| "valid_targets_mean": 5527.6, |
| "valid_targets_min": 2991 |
| }, |
| { |
| "epoch": 5.439227960354721, |
| "grad_norm": 0.5194660932458187, |
| "learning_rate": 5.775368205057488e-06, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07880048453807831, |
| "step": 5215, |
| "valid_targets_mean": 4676.0, |
| "valid_targets_min": 2155 |
| }, |
| { |
| "epoch": 5.444444444444445, |
| "grad_norm": 0.5598013074244899, |
| "learning_rate": 5.738859357092297e-06, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08336806297302246, |
| "step": 5220, |
| "valid_targets_mean": 4326.5, |
| "valid_targets_min": 1821 |
| }, |
| { |
| "epoch": 5.449660928534168, |
| "grad_norm": 0.5747509440158713, |
| "learning_rate": 5.7024469311194095e-06, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0965658500790596, |
| "step": 5225, |
| "valid_targets_mean": 3991.5, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 5.454877412623891, |
| "grad_norm": 0.5983423632567207, |
| "learning_rate": 5.66613117332943e-06, |
| "loss": 0.1802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11357493698596954, |
| "step": 5230, |
| "valid_targets_mean": 5065.5, |
| "valid_targets_min": 3065 |
| }, |
| { |
| "epoch": 5.460093896713615, |
| "grad_norm": 0.5468847755310513, |
| "learning_rate": 5.629912329259355e-06, |
| "loss": 0.1728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09041740000247955, |
| "step": 5235, |
| "valid_targets_mean": 4774.6, |
| "valid_targets_min": 1518 |
| }, |
| { |
| "epoch": 5.465310380803339, |
| "grad_norm": 0.5117526048335445, |
| "learning_rate": 5.593790643790935e-06, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09142474830150604, |
| "step": 5240, |
| "valid_targets_mean": 5328.4, |
| "valid_targets_min": 3105 |
| }, |
| { |
| "epoch": 5.470526864893062, |
| "grad_norm": 0.5251513808853013, |
| "learning_rate": 5.557766361149013e-06, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08423709869384766, |
| "step": 5245, |
| "valid_targets_mean": 4627.4, |
| "valid_targets_min": 2463 |
| }, |
| { |
| "epoch": 5.475743348982785, |
| "grad_norm": 0.5367593742044022, |
| "learning_rate": 5.521839724899887e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08371119946241379, |
| "step": 5250, |
| "valid_targets_mean": 4551.9, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 5.480959833072509, |
| "grad_norm": 0.5999861887031098, |
| "learning_rate": 5.48601097794963e-06, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08510912209749222, |
| "step": 5255, |
| "valid_targets_mean": 3554.6, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 5.486176317162233, |
| "grad_norm": 0.5291638823924313, |
| "learning_rate": 5.450280362542495e-06, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08900319039821625, |
| "step": 5260, |
| "valid_targets_mean": 5461.8, |
| "valid_targets_min": 1675 |
| }, |
| { |
| "epoch": 5.491392801251957, |
| "grad_norm": 0.5538581823082644, |
| "learning_rate": 5.414648120259225e-06, |
| "loss": 0.176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0811634510755539, |
| "step": 5265, |
| "valid_targets_mean": 4332.2, |
| "valid_targets_min": 2098 |
| }, |
| { |
| "epoch": 5.4966092853416795, |
| "grad_norm": 0.6247487880807111, |
| "learning_rate": 5.379114492015467e-06, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1094445213675499, |
| "step": 5270, |
| "valid_targets_mean": 4459.2, |
| "valid_targets_min": 2641 |
| }, |
| { |
| "epoch": 5.501825769431403, |
| "grad_norm": 0.5155655112469832, |
| "learning_rate": 5.343679718060104e-06, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06469831615686417, |
| "step": 5275, |
| "valid_targets_mean": 4931.0, |
| "valid_targets_min": 3162 |
| }, |
| { |
| "epoch": 5.507042253521127, |
| "grad_norm": 0.5920115869396942, |
| "learning_rate": 5.308344037973672e-06, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08934450894594193, |
| "step": 5280, |
| "valid_targets_mean": 4298.9, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 5.51225873761085, |
| "grad_norm": 0.5119002875008457, |
| "learning_rate": 5.2731076906666786e-06, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08615301549434662, |
| "step": 5285, |
| "valid_targets_mean": 4840.4, |
| "valid_targets_min": 1406 |
| }, |
| { |
| "epoch": 5.517475221700574, |
| "grad_norm": 0.5262229363816199, |
| "learning_rate": 5.237970914378068e-06, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09570074081420898, |
| "step": 5290, |
| "valid_targets_mean": 5322.9, |
| "valid_targets_min": 3350 |
| }, |
| { |
| "epoch": 5.522691705790297, |
| "grad_norm": 0.5538227803274636, |
| "learning_rate": 5.202933946673532e-06, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08771003782749176, |
| "step": 5295, |
| "valid_targets_mean": 4497.5, |
| "valid_targets_min": 2001 |
| }, |
| { |
| "epoch": 5.527908189880021, |
| "grad_norm": 0.5502507076068306, |
| "learning_rate": 5.1679970244439695e-06, |
| "loss": 0.1781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07107767462730408, |
| "step": 5300, |
| "valid_targets_mean": 3696.2, |
| "valid_targets_min": 2225 |
| }, |
| { |
| "epoch": 5.533124673969745, |
| "grad_norm": 0.5512386550175091, |
| "learning_rate": 5.13316038390383e-06, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0939207673072815, |
| "step": 5305, |
| "valid_targets_mean": 5463.0, |
| "valid_targets_min": 3574 |
| }, |
| { |
| "epoch": 5.538341158059468, |
| "grad_norm": 0.5278227929504776, |
| "learning_rate": 5.098424260589565e-06, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10499151796102524, |
| "step": 5310, |
| "valid_targets_mean": 5881.4, |
| "valid_targets_min": 3680 |
| }, |
| { |
| "epoch": 5.5435576421491914, |
| "grad_norm": 0.5519375612123985, |
| "learning_rate": 5.063788889357995e-06, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09371333569288254, |
| "step": 5315, |
| "valid_targets_mean": 5093.1, |
| "valid_targets_min": 1624 |
| }, |
| { |
| "epoch": 5.548774126238915, |
| "grad_norm": 0.5716503917543002, |
| "learning_rate": 5.029254504384733e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10242068767547607, |
| "step": 5320, |
| "valid_targets_mean": 4717.9, |
| "valid_targets_min": 2413 |
| }, |
| { |
| "epoch": 5.553990610328638, |
| "grad_norm": 0.5874419944817311, |
| "learning_rate": 4.9948213391626325e-06, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10250916332006454, |
| "step": 5325, |
| "valid_targets_mean": 4346.5, |
| "valid_targets_min": 2439 |
| }, |
| { |
| "epoch": 5.559207094418362, |
| "grad_norm": 0.5504381846725983, |
| "learning_rate": 4.960489626500153e-06, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07717075943946838, |
| "step": 5330, |
| "valid_targets_mean": 4242.8, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 5.5644235785080856, |
| "grad_norm": 0.5146939011973244, |
| "learning_rate": 4.926259598519851e-06, |
| "loss": 0.1774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06690868735313416, |
| "step": 5335, |
| "valid_targets_mean": 4106.6, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 5.569640062597809, |
| "grad_norm": 0.5505646821539498, |
| "learning_rate": 4.892131486656733e-06, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08535034954547882, |
| "step": 5340, |
| "valid_targets_mean": 5032.8, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 5.574856546687533, |
| "grad_norm": 0.529809183401811, |
| "learning_rate": 4.858105521656768e-06, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08789815753698349, |
| "step": 5345, |
| "valid_targets_mean": 5742.9, |
| "valid_targets_min": 3928 |
| }, |
| { |
| "epoch": 5.580073030777256, |
| "grad_norm": 0.5370726178638763, |
| "learning_rate": 4.824181933575272e-06, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10115206241607666, |
| "step": 5350, |
| "valid_targets_mean": 5713.5, |
| "valid_targets_min": 1421 |
| }, |
| { |
| "epoch": 5.58528951486698, |
| "grad_norm": 0.5569605856751727, |
| "learning_rate": 4.790360951775392e-06, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09263263642787933, |
| "step": 5355, |
| "valid_targets_mean": 5239.4, |
| "valid_targets_min": 2056 |
| }, |
| { |
| "epoch": 5.590505998956703, |
| "grad_norm": 0.5455568305099259, |
| "learning_rate": 4.756642804926517e-06, |
| "loss": 0.17, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09849033504724503, |
| "step": 5360, |
| "valid_targets_mean": 5447.1, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 5.595722483046426, |
| "grad_norm": 0.6272566838215045, |
| "learning_rate": 4.7230277210027685e-06, |
| "loss": 0.1827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09728604555130005, |
| "step": 5365, |
| "valid_targets_mean": 3810.0, |
| "valid_targets_min": 2077 |
| }, |
| { |
| "epoch": 5.60093896713615, |
| "grad_norm": 0.4949180746326753, |
| "learning_rate": 4.689515927281427e-06, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07689865678548813, |
| "step": 5370, |
| "valid_targets_mean": 5535.0, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 5.606155451225874, |
| "grad_norm": 0.521391228466892, |
| "learning_rate": 4.6561076503414235e-06, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07850983738899231, |
| "step": 5375, |
| "valid_targets_mean": 4991.0, |
| "valid_targets_min": 2411 |
| }, |
| { |
| "epoch": 5.6113719353155975, |
| "grad_norm": 0.5047705118028566, |
| "learning_rate": 4.622803116061789e-06, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08694680035114288, |
| "step": 5380, |
| "valid_targets_mean": 5849.4, |
| "valid_targets_min": 3531 |
| }, |
| { |
| "epoch": 5.616588419405321, |
| "grad_norm": 0.535962737554241, |
| "learning_rate": 4.589602549620127e-06, |
| "loss": 0.1733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09452635049819946, |
| "step": 5385, |
| "valid_targets_mean": 5429.2, |
| "valid_targets_min": 3055 |
| }, |
| { |
| "epoch": 5.621804903495044, |
| "grad_norm": 0.5852505700527569, |
| "learning_rate": 4.556506175491097e-06, |
| "loss": 0.1809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08648938685655594, |
| "step": 5390, |
| "valid_targets_mean": 4766.6, |
| "valid_targets_min": 2003 |
| }, |
| { |
| "epoch": 5.627021387584768, |
| "grad_norm": 0.5898102688979189, |
| "learning_rate": 4.523514217444918e-06, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11465403437614441, |
| "step": 5395, |
| "valid_targets_mean": 5365.4, |
| "valid_targets_min": 1202 |
| }, |
| { |
| "epoch": 5.632237871674492, |
| "grad_norm": 0.5229012788505973, |
| "learning_rate": 4.490626898545805e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07465511560440063, |
| "step": 5400, |
| "valid_targets_mean": 4374.1, |
| "valid_targets_min": 1664 |
| }, |
| { |
| "epoch": 5.6374543557642145, |
| "grad_norm": 0.5409442222602789, |
| "learning_rate": 4.4578444411505005e-06, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08053886890411377, |
| "step": 5405, |
| "valid_targets_mean": 5253.8, |
| "valid_targets_min": 2479 |
| }, |
| { |
| "epoch": 5.642670839853938, |
| "grad_norm": 0.5285523050183011, |
| "learning_rate": 4.425167066906777e-06, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07296570390462875, |
| "step": 5410, |
| "valid_targets_mean": 4937.6, |
| "valid_targets_min": 3123 |
| }, |
| { |
| "epoch": 5.647887323943662, |
| "grad_norm": 0.5416239529994494, |
| "learning_rate": 4.392594996751891e-06, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09565962851047516, |
| "step": 5415, |
| "valid_targets_mean": 5340.2, |
| "valid_targets_min": 3983 |
| }, |
| { |
| "epoch": 5.653103808033386, |
| "grad_norm": 0.5311968413285663, |
| "learning_rate": 4.360128450911154e-06, |
| "loss": 0.1806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0871681272983551, |
| "step": 5420, |
| "valid_targets_mean": 5207.1, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 5.6583202921231095, |
| "grad_norm": 0.507054671436209, |
| "learning_rate": 4.3277676488963775e-06, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08645960688591003, |
| "step": 5425, |
| "valid_targets_mean": 5039.8, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 5.663536776212832, |
| "grad_norm": 0.568306365639052, |
| "learning_rate": 4.295512809504447e-06, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08979377150535583, |
| "step": 5430, |
| "valid_targets_mean": 5396.4, |
| "valid_targets_min": 1649 |
| }, |
| { |
| "epoch": 5.668753260302556, |
| "grad_norm": 0.5130604318115416, |
| "learning_rate": 4.263364150815803e-06, |
| "loss": 0.1782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06490998715162277, |
| "step": 5435, |
| "valid_targets_mean": 3744.5, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 5.67396974439228, |
| "grad_norm": 0.5692022571266344, |
| "learning_rate": 4.231321890192981e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10590483248233795, |
| "step": 5440, |
| "valid_targets_mean": 4565.5, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 5.679186228482003, |
| "grad_norm": 0.5957273632676808, |
| "learning_rate": 4.19938624427914e-06, |
| "loss": 0.1665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08738480508327484, |
| "step": 5445, |
| "valid_targets_mean": 4124.2, |
| "valid_targets_min": 2426 |
| }, |
| { |
| "epoch": 5.6844027125717265, |
| "grad_norm": 0.5059513068357104, |
| "learning_rate": 4.167557428996611e-06, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09112801402807236, |
| "step": 5450, |
| "valid_targets_mean": 4731.6, |
| "valid_targets_min": 2194 |
| }, |
| { |
| "epoch": 5.68961919666145, |
| "grad_norm": 0.5693590655270471, |
| "learning_rate": 4.135835659545406e-06, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09921035915613174, |
| "step": 5455, |
| "valid_targets_mean": 4494.1, |
| "valid_targets_min": 1559 |
| }, |
| { |
| "epoch": 5.694835680751174, |
| "grad_norm": 0.5024039878747486, |
| "learning_rate": 4.104221150401806e-06, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10560700297355652, |
| "step": 5460, |
| "valid_targets_mean": 6348.4, |
| "valid_targets_min": 1947 |
| }, |
| { |
| "epoch": 5.700052164840898, |
| "grad_norm": 0.4650548652863463, |
| "learning_rate": 4.072714115316863e-06, |
| "loss": 0.1643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06292714923620224, |
| "step": 5465, |
| "valid_targets_mean": 5174.2, |
| "valid_targets_min": 1897 |
| }, |
| { |
| "epoch": 5.705268648930621, |
| "grad_norm": 0.4486459885321795, |
| "learning_rate": 4.041314767314983e-06, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07271754741668701, |
| "step": 5470, |
| "valid_targets_mean": 5976.1, |
| "valid_targets_min": 2077 |
| }, |
| { |
| "epoch": 5.710485133020344, |
| "grad_norm": 0.5938653009407587, |
| "learning_rate": 4.010023318692502e-06, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09291598200798035, |
| "step": 5475, |
| "valid_targets_mean": 3675.5, |
| "valid_targets_min": 1525 |
| }, |
| { |
| "epoch": 5.715701617110068, |
| "grad_norm": 0.5328052077536234, |
| "learning_rate": 3.978839981016203e-06, |
| "loss": 0.1805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10603446513414383, |
| "step": 5480, |
| "valid_targets_mean": 5534.8, |
| "valid_targets_min": 1353 |
| }, |
| { |
| "epoch": 5.720918101199791, |
| "grad_norm": 0.5222740838976995, |
| "learning_rate": 3.947764965121934e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07417292892932892, |
| "step": 5485, |
| "valid_targets_mean": 4324.2, |
| "valid_targets_min": 1883 |
| }, |
| { |
| "epoch": 5.726134585289515, |
| "grad_norm": 0.5901115757033547, |
| "learning_rate": 3.916798481113144e-06, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09025438129901886, |
| "step": 5490, |
| "valid_targets_mean": 3641.8, |
| "valid_targets_min": 1759 |
| }, |
| { |
| "epoch": 5.731351069379238, |
| "grad_norm": 0.5857376932555667, |
| "learning_rate": 3.885940738359492e-06, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0782744288444519, |
| "step": 5495, |
| "valid_targets_mean": 3576.2, |
| "valid_targets_min": 1538 |
| }, |
| { |
| "epoch": 5.736567553468962, |
| "grad_norm": 0.47645456542263637, |
| "learning_rate": 3.855191945495405e-06, |
| "loss": 0.1721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0868457555770874, |
| "step": 5500, |
| "valid_targets_mean": 5765.2, |
| "valid_targets_min": 1375 |
| }, |
| { |
| "epoch": 5.741784037558686, |
| "grad_norm": 0.5236361251793296, |
| "learning_rate": 3.824552310418703e-06, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06546823680400848, |
| "step": 5505, |
| "valid_targets_mean": 5086.6, |
| "valid_targets_min": 2965 |
| }, |
| { |
| "epoch": 5.747000521648409, |
| "grad_norm": 0.5091732574059794, |
| "learning_rate": 3.794022040289147e-06, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07745197415351868, |
| "step": 5510, |
| "valid_targets_mean": 5054.1, |
| "valid_targets_min": 2306 |
| }, |
| { |
| "epoch": 5.7522170057381325, |
| "grad_norm": 0.46441623103319934, |
| "learning_rate": 3.763601341527088e-06, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07298596203327179, |
| "step": 5515, |
| "valid_targets_mean": 5433.0, |
| "valid_targets_min": 1438 |
| }, |
| { |
| "epoch": 5.757433489827856, |
| "grad_norm": 0.49641591292243104, |
| "learning_rate": 3.733290419812019e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08252263814210892, |
| "step": 5520, |
| "valid_targets_mean": 5315.5, |
| "valid_targets_min": 1678 |
| }, |
| { |
| "epoch": 5.762649973917579, |
| "grad_norm": 0.6789379381663515, |
| "learning_rate": 3.7030894800812365e-06, |
| "loss": 0.1828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10934539139270782, |
| "step": 5525, |
| "valid_targets_mean": 4483.8, |
| "valid_targets_min": 1772 |
| }, |
| { |
| "epoch": 5.767866458007303, |
| "grad_norm": 0.5423814329508395, |
| "learning_rate": 3.672998726528414e-06, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11362475156784058, |
| "step": 5530, |
| "valid_targets_mean": 5748.1, |
| "valid_targets_min": 2177 |
| }, |
| { |
| "epoch": 5.773082942097027, |
| "grad_norm": 0.5489625563953952, |
| "learning_rate": 3.6430183626022574e-06, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09776196628808975, |
| "step": 5535, |
| "valid_targets_mean": 6000.1, |
| "valid_targets_min": 3982 |
| }, |
| { |
| "epoch": 5.77829942618675, |
| "grad_norm": 0.6233184110121164, |
| "learning_rate": 3.613148591005071e-06, |
| "loss": 0.1693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08113294094800949, |
| "step": 5540, |
| "valid_targets_mean": 4493.1, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 5.783515910276473, |
| "grad_norm": 0.4822987640375631, |
| "learning_rate": 3.5833896136914705e-06, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07164439558982849, |
| "step": 5545, |
| "valid_targets_mean": 5387.6, |
| "valid_targets_min": 2047 |
| }, |
| { |
| "epoch": 5.788732394366197, |
| "grad_norm": 0.4749912986402253, |
| "learning_rate": 3.553741631866938e-06, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09115122258663177, |
| "step": 5550, |
| "valid_targets_mean": 6122.4, |
| "valid_targets_min": 2286 |
| }, |
| { |
| "epoch": 5.793948878455921, |
| "grad_norm": 0.5946909865400563, |
| "learning_rate": 3.524204845986523e-06, |
| "loss": 0.1792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08981865644454956, |
| "step": 5555, |
| "valid_targets_mean": 4332.4, |
| "valid_targets_min": 1866 |
| }, |
| { |
| "epoch": 5.7991653625456445, |
| "grad_norm": 0.4981777296421743, |
| "learning_rate": 3.494779455753443e-06, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07500408589839935, |
| "step": 5560, |
| "valid_targets_mean": 4568.4, |
| "valid_targets_min": 2141 |
| }, |
| { |
| "epoch": 5.804381846635367, |
| "grad_norm": 0.6142734821840982, |
| "learning_rate": 3.4654656601177482e-06, |
| "loss": 0.1844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10738922655582428, |
| "step": 5565, |
| "valid_targets_mean": 3865.8, |
| "valid_targets_min": 1623 |
| }, |
| { |
| "epoch": 5.809598330725091, |
| "grad_norm": 0.6888133941635042, |
| "learning_rate": 3.4362636572749984e-06, |
| "loss": 0.177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09062996506690979, |
| "step": 5570, |
| "valid_targets_mean": 4535.8, |
| "valid_targets_min": 1079 |
| }, |
| { |
| "epoch": 5.814814814814815, |
| "grad_norm": 0.5144938987206906, |
| "learning_rate": 3.4071736446648805e-06, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08362233638763428, |
| "step": 5575, |
| "valid_targets_mean": 5688.2, |
| "valid_targets_min": 1588 |
| }, |
| { |
| "epoch": 5.820031298904539, |
| "grad_norm": 0.55001093740802, |
| "learning_rate": 3.3781958189699183e-06, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10185902565717697, |
| "step": 5580, |
| "valid_targets_mean": 5194.5, |
| "valid_targets_min": 2848 |
| }, |
| { |
| "epoch": 5.8252477829942615, |
| "grad_norm": 0.5048679008418444, |
| "learning_rate": 3.3493303761141016e-06, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08554618060588837, |
| "step": 5585, |
| "valid_targets_mean": 6494.1, |
| "valid_targets_min": 2608 |
| }, |
| { |
| "epoch": 5.830464267083985, |
| "grad_norm": 0.5470595580590045, |
| "learning_rate": 3.320577511261589e-06, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09496854245662689, |
| "step": 5590, |
| "valid_targets_mean": 5576.2, |
| "valid_targets_min": 3507 |
| }, |
| { |
| "epoch": 5.835680751173709, |
| "grad_norm": 0.52994182216623, |
| "learning_rate": 3.291937418815376e-06, |
| "loss": 0.1743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08456946909427643, |
| "step": 5595, |
| "valid_targets_mean": 3731.2, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 5.840897235263433, |
| "grad_norm": 0.5798170124783152, |
| "learning_rate": 3.2634102924159982e-06, |
| "loss": 0.1674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10535246133804321, |
| "step": 5600, |
| "valid_targets_mean": 4603.9, |
| "valid_targets_min": 1345 |
| }, |
| { |
| "epoch": 5.846113719353156, |
| "grad_norm": 0.5136604632732348, |
| "learning_rate": 3.2349963249401894e-06, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08853639662265778, |
| "step": 5605, |
| "valid_targets_mean": 5272.5, |
| "valid_targets_min": 2097 |
| }, |
| { |
| "epoch": 5.851330203442879, |
| "grad_norm": 0.5423322037998392, |
| "learning_rate": 3.2066957084996163e-06, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1070578321814537, |
| "step": 5610, |
| "valid_targets_mean": 5331.8, |
| "valid_targets_min": 3613 |
| }, |
| { |
| "epoch": 5.856546687532603, |
| "grad_norm": 0.5064494433132412, |
| "learning_rate": 3.178508634439539e-06, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07132753729820251, |
| "step": 5615, |
| "valid_targets_mean": 4434.9, |
| "valid_targets_min": 1705 |
| }, |
| { |
| "epoch": 5.861763171622327, |
| "grad_norm": 0.5051160365914387, |
| "learning_rate": 3.150435293337557e-06, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07303132116794586, |
| "step": 5620, |
| "valid_targets_mean": 4491.8, |
| "valid_targets_min": 1976 |
| }, |
| { |
| "epoch": 5.86697965571205, |
| "grad_norm": 0.5606453533642057, |
| "learning_rate": 3.1224758750022934e-06, |
| "loss": 0.174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06995655596256256, |
| "step": 5625, |
| "valid_targets_mean": 4081.4, |
| "valid_targets_min": 1896 |
| }, |
| { |
| "epoch": 5.8721961398017735, |
| "grad_norm": 0.5653178986022215, |
| "learning_rate": 3.0946305684721145e-06, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09811203926801682, |
| "step": 5630, |
| "valid_targets_mean": 5245.2, |
| "valid_targets_min": 1947 |
| }, |
| { |
| "epoch": 5.877412623891497, |
| "grad_norm": 0.5252545759785076, |
| "learning_rate": 3.066899562013872e-06, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07529449462890625, |
| "step": 5635, |
| "valid_targets_mean": 3975.2, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 5.882629107981221, |
| "grad_norm": 0.5433632880437022, |
| "learning_rate": 3.0392830431216037e-06, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07809676975011826, |
| "step": 5640, |
| "valid_targets_mean": 4935.0, |
| "valid_targets_min": 1503 |
| }, |
| { |
| "epoch": 5.887845592070944, |
| "grad_norm": 0.5289957385883606, |
| "learning_rate": 3.01178119851528e-06, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08336209505796432, |
| "step": 5645, |
| "valid_targets_mean": 4886.6, |
| "valid_targets_min": 1800 |
| }, |
| { |
| "epoch": 5.893062076160668, |
| "grad_norm": 0.5575156548605359, |
| "learning_rate": 2.9843942141395365e-06, |
| "loss": 0.1765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0846119076013565, |
| "step": 5650, |
| "valid_targets_mean": 3872.9, |
| "valid_targets_min": 1389 |
| }, |
| { |
| "epoch": 5.898278560250391, |
| "grad_norm": 0.5878385442301363, |
| "learning_rate": 2.9571222751624317e-06, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09252753853797913, |
| "step": 5655, |
| "valid_targets_mean": 4209.4, |
| "valid_targets_min": 2028 |
| }, |
| { |
| "epoch": 5.903495044340115, |
| "grad_norm": 0.551111216455573, |
| "learning_rate": 2.9299655659741622e-06, |
| "loss": 0.1804, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09265060722827911, |
| "step": 5660, |
| "valid_targets_mean": 4456.5, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 5.908711528429838, |
| "grad_norm": 0.5820990540633043, |
| "learning_rate": 2.9029242701858606e-06, |
| "loss": 0.1897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08701181411743164, |
| "step": 5665, |
| "valid_targets_mean": 4254.0, |
| "valid_targets_min": 2724 |
| }, |
| { |
| "epoch": 5.913928012519562, |
| "grad_norm": 0.5226092777050476, |
| "learning_rate": 2.8759985706283068e-06, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08515148609876633, |
| "step": 5670, |
| "valid_targets_mean": 4590.4, |
| "valid_targets_min": 2366 |
| }, |
| { |
| "epoch": 5.919144496609285, |
| "grad_norm": 0.5971219829568228, |
| "learning_rate": 2.8491886493507313e-06, |
| "loss": 0.1711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10314597189426422, |
| "step": 5675, |
| "valid_targets_mean": 4606.9, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 5.924360980699009, |
| "grad_norm": 0.5665002869239318, |
| "learning_rate": 2.8224946876195593e-06, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08449500799179077, |
| "step": 5680, |
| "valid_targets_mean": 4555.5, |
| "valid_targets_min": 1272 |
| }, |
| { |
| "epoch": 5.929577464788732, |
| "grad_norm": 0.6007551768138341, |
| "learning_rate": 2.795916865917201e-06, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.100425586104393, |
| "step": 5685, |
| "valid_targets_mean": 4430.6, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 5.934793948878456, |
| "grad_norm": 0.5553678028748384, |
| "learning_rate": 2.7694553639408163e-06, |
| "loss": 0.1733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09645190834999084, |
| "step": 5690, |
| "valid_targets_mean": 5136.9, |
| "valid_targets_min": 2097 |
| }, |
| { |
| "epoch": 5.9400104329681795, |
| "grad_norm": 0.5350257692219152, |
| "learning_rate": 2.7431103606011113e-06, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07542605698108673, |
| "step": 5695, |
| "valid_targets_mean": 4592.1, |
| "valid_targets_min": 2235 |
| }, |
| { |
| "epoch": 5.945226917057903, |
| "grad_norm": 0.5370749848123485, |
| "learning_rate": 2.71688203402112e-06, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10020209103822708, |
| "step": 5700, |
| "valid_targets_mean": 4956.2, |
| "valid_targets_min": 2666 |
| }, |
| { |
| "epoch": 5.950443401147626, |
| "grad_norm": 0.5616035739838323, |
| "learning_rate": 2.690770561535019e-06, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1056441217660904, |
| "step": 5705, |
| "valid_targets_mean": 5587.0, |
| "valid_targets_min": 3696 |
| }, |
| { |
| "epoch": 5.95565988523735, |
| "grad_norm": 0.505396409620737, |
| "learning_rate": 2.664776119686896e-06, |
| "loss": 0.1632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06738579273223877, |
| "step": 5710, |
| "valid_targets_mean": 4772.8, |
| "valid_targets_min": 1612 |
| }, |
| { |
| "epoch": 5.960876369327074, |
| "grad_norm": 0.558148133432388, |
| "learning_rate": 2.6388988842295947e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08058644086122513, |
| "step": 5715, |
| "valid_targets_mean": 3943.5, |
| "valid_targets_min": 1629 |
| }, |
| { |
| "epoch": 5.966092853416797, |
| "grad_norm": 0.49142281395227094, |
| "learning_rate": 2.6131390301234927e-06, |
| "loss": 0.1774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08975610136985779, |
| "step": 5720, |
| "valid_targets_mean": 6229.9, |
| "valid_targets_min": 3962 |
| }, |
| { |
| "epoch": 5.97130933750652, |
| "grad_norm": 0.5127563839312393, |
| "learning_rate": 2.587496731535326e-06, |
| "loss": 0.1782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08209004998207092, |
| "step": 5725, |
| "valid_targets_mean": 5349.5, |
| "valid_targets_min": 3091 |
| }, |
| { |
| "epoch": 5.976525821596244, |
| "grad_norm": 0.5870781435714937, |
| "learning_rate": 2.561972161837041e-06, |
| "loss": 0.177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09318692982196808, |
| "step": 5730, |
| "valid_targets_mean": 4410.8, |
| "valid_targets_min": 2042 |
| }, |
| { |
| "epoch": 5.981742305685968, |
| "grad_norm": 0.5331167201677213, |
| "learning_rate": 2.536565493604575e-06, |
| "loss": 0.1869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11014723777770996, |
| "step": 5735, |
| "valid_targets_mean": 6198.2, |
| "valid_targets_min": 4202 |
| }, |
| { |
| "epoch": 5.9869587897756915, |
| "grad_norm": 0.5217330036417076, |
| "learning_rate": 2.511276898616737e-06, |
| "loss": 0.1545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09141227602958679, |
| "step": 5740, |
| "valid_targets_mean": 5061.2, |
| "valid_targets_min": 1855 |
| }, |
| { |
| "epoch": 5.992175273865414, |
| "grad_norm": 0.7628287327814164, |
| "learning_rate": 2.4861065478539925e-06, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09051162749528885, |
| "step": 5745, |
| "valid_targets_mean": 4572.0, |
| "valid_targets_min": 2408 |
| }, |
| { |
| "epoch": 5.997391757955138, |
| "grad_norm": 0.5412099702884833, |
| "learning_rate": 2.4610546114973666e-06, |
| "loss": 0.1696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08535590022802353, |
| "step": 5750, |
| "valid_targets_mean": 4914.4, |
| "valid_targets_min": 2299 |
| }, |
| { |
| "epoch": 6.002086593635889, |
| "grad_norm": 0.5666885471819875, |
| "learning_rate": 2.4361212589272488e-06, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09032214432954788, |
| "step": 5755, |
| "valid_targets_mean": 3914.6, |
| "valid_targets_min": 1557 |
| }, |
| { |
| "epoch": 6.007303077725613, |
| "grad_norm": 0.6348974302582981, |
| "learning_rate": 2.41130665872227e-06, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09823325276374817, |
| "step": 5760, |
| "valid_targets_mean": 3898.2, |
| "valid_targets_min": 2288 |
| }, |
| { |
| "epoch": 6.012519561815337, |
| "grad_norm": 0.5197451846846918, |
| "learning_rate": 2.3866109786581484e-06, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08300504088401794, |
| "step": 5765, |
| "valid_targets_mean": 5492.9, |
| "valid_targets_min": 2909 |
| }, |
| { |
| "epoch": 6.01773604590506, |
| "grad_norm": 0.5408708311715636, |
| "learning_rate": 2.3620343857065776e-06, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09408125281333923, |
| "step": 5770, |
| "valid_targets_mean": 5499.2, |
| "valid_targets_min": 2076 |
| }, |
| { |
| "epoch": 6.022952529994783, |
| "grad_norm": 0.5192312881257993, |
| "learning_rate": 2.3375770460340654e-06, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06746099889278412, |
| "step": 5775, |
| "valid_targets_mean": 3975.4, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 6.028169014084507, |
| "grad_norm": 0.5604784350505317, |
| "learning_rate": 2.313239125000841e-06, |
| "loss": 0.1653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07895144820213318, |
| "step": 5780, |
| "valid_targets_mean": 5031.9, |
| "valid_targets_min": 1614 |
| }, |
| { |
| "epoch": 6.033385498174231, |
| "grad_norm": 0.6306239061423632, |
| "learning_rate": 2.2890207871597192e-06, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0700065940618515, |
| "step": 5785, |
| "valid_targets_mean": 4056.4, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 6.0386019822639545, |
| "grad_norm": 0.5089884137450019, |
| "learning_rate": 2.2649221962549905e-06, |
| "loss": 0.1735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07413844764232635, |
| "step": 5790, |
| "valid_targets_mean": 3877.6, |
| "valid_targets_min": 1967 |
| }, |
| { |
| "epoch": 6.043818466353677, |
| "grad_norm": 0.5490139284297806, |
| "learning_rate": 2.2409435152213123e-06, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07719350606203079, |
| "step": 5795, |
| "valid_targets_mean": 4704.6, |
| "valid_targets_min": 1875 |
| }, |
| { |
| "epoch": 6.049034950443401, |
| "grad_norm": 0.5200749426838338, |
| "learning_rate": 2.217084906182629e-06, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09560975432395935, |
| "step": 5800, |
| "valid_targets_mean": 4587.0, |
| "valid_targets_min": 2004 |
| }, |
| { |
| "epoch": 6.054251434533125, |
| "grad_norm": 0.5279382480355144, |
| "learning_rate": 2.1933465304510394e-06, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07469984143972397, |
| "step": 5805, |
| "valid_targets_mean": 4616.1, |
| "valid_targets_min": 2787 |
| }, |
| { |
| "epoch": 6.059467918622849, |
| "grad_norm": 0.5220287099547348, |
| "learning_rate": 2.1697285485257245e-06, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08868516981601715, |
| "step": 5810, |
| "valid_targets_mean": 5075.2, |
| "valid_targets_min": 2445 |
| }, |
| { |
| "epoch": 6.0646844027125715, |
| "grad_norm": 0.46278683097215284, |
| "learning_rate": 2.1462311200918816e-06, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08032315969467163, |
| "step": 5815, |
| "valid_targets_mean": 6912.1, |
| "valid_targets_min": 4191 |
| }, |
| { |
| "epoch": 6.069900886802295, |
| "grad_norm": 0.5398578125617447, |
| "learning_rate": 2.122854404019601e-06, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08614116907119751, |
| "step": 5820, |
| "valid_targets_mean": 5010.5, |
| "valid_targets_min": 1165 |
| }, |
| { |
| "epoch": 6.075117370892019, |
| "grad_norm": 0.5510448083868443, |
| "learning_rate": 2.0995985583628366e-06, |
| "loss": 0.1685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08615755289793015, |
| "step": 5825, |
| "valid_targets_mean": 4735.5, |
| "valid_targets_min": 2360 |
| }, |
| { |
| "epoch": 6.080333854981743, |
| "grad_norm": 0.5286206981684528, |
| "learning_rate": 2.076463740358299e-06, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07922375202178955, |
| "step": 5830, |
| "valid_targets_mean": 4719.9, |
| "valid_targets_min": 1278 |
| }, |
| { |
| "epoch": 6.085550339071466, |
| "grad_norm": 0.542601600303056, |
| "learning_rate": 2.053450106424426e-06, |
| "loss": 0.1687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09550304710865021, |
| "step": 5835, |
| "valid_targets_mean": 5393.1, |
| "valid_targets_min": 2149 |
| }, |
| { |
| "epoch": 6.090766823161189, |
| "grad_norm": 0.5306422592987686, |
| "learning_rate": 2.030557812160301e-06, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07130551338195801, |
| "step": 5840, |
| "valid_targets_mean": 5550.6, |
| "valid_targets_min": 2537 |
| }, |
| { |
| "epoch": 6.095983307250913, |
| "grad_norm": 0.5524670056940677, |
| "learning_rate": 2.0077870123446107e-06, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09660788625478745, |
| "step": 5845, |
| "valid_targets_mean": 5510.6, |
| "valid_targets_min": 3218 |
| }, |
| { |
| "epoch": 6.101199791340637, |
| "grad_norm": 0.6028201350072254, |
| "learning_rate": 1.985137860934594e-06, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0916367769241333, |
| "step": 5850, |
| "valid_targets_mean": 4280.0, |
| "valid_targets_min": 2785 |
| }, |
| { |
| "epoch": 6.10641627543036, |
| "grad_norm": 0.6232053815595153, |
| "learning_rate": 1.962610511065013e-06, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10127604007720947, |
| "step": 5855, |
| "valid_targets_mean": 4280.5, |
| "valid_targets_min": 2726 |
| }, |
| { |
| "epoch": 6.1116327595200834, |
| "grad_norm": 0.619280822162956, |
| "learning_rate": 1.940205115047098e-06, |
| "loss": 0.1805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12848986685276031, |
| "step": 5860, |
| "valid_targets_mean": 4106.4, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 6.116849243609807, |
| "grad_norm": 0.5292656123250503, |
| "learning_rate": 1.917921824367539e-06, |
| "loss": 0.1609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08275945484638214, |
| "step": 5865, |
| "valid_targets_mean": 4719.5, |
| "valid_targets_min": 1832 |
| }, |
| { |
| "epoch": 6.122065727699531, |
| "grad_norm": 0.5288161525038574, |
| "learning_rate": 1.8957607896874419e-06, |
| "loss": 0.1709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08273669332265854, |
| "step": 5870, |
| "valid_targets_mean": 5099.6, |
| "valid_targets_min": 3109 |
| }, |
| { |
| "epoch": 6.127282211789254, |
| "grad_norm": 0.5663131444928124, |
| "learning_rate": 1.8737221608413314e-06, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07949776947498322, |
| "step": 5875, |
| "valid_targets_mean": 4202.1, |
| "valid_targets_min": 1950 |
| }, |
| { |
| "epoch": 6.132498695878978, |
| "grad_norm": 0.5866117096283481, |
| "learning_rate": 1.8518060868361099e-06, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07808201014995575, |
| "step": 5880, |
| "valid_targets_mean": 4536.1, |
| "valid_targets_min": 2511 |
| }, |
| { |
| "epoch": 6.137715179968701, |
| "grad_norm": 0.5630696018312298, |
| "learning_rate": 1.8300127158500714e-06, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09297695755958557, |
| "step": 5885, |
| "valid_targets_mean": 4877.8, |
| "valid_targets_min": 1476 |
| }, |
| { |
| "epoch": 6.142931664058425, |
| "grad_norm": 0.5508892680415837, |
| "learning_rate": 1.8083421952319047e-06, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08836787194013596, |
| "step": 5890, |
| "valid_targets_mean": 4473.0, |
| "valid_targets_min": 1981 |
| }, |
| { |
| "epoch": 6.148148148148148, |
| "grad_norm": 0.4665790269124101, |
| "learning_rate": 1.786794671499672e-06, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08136850595474243, |
| "step": 5895, |
| "valid_targets_mean": 6519.1, |
| "valid_targets_min": 2308 |
| }, |
| { |
| "epoch": 6.153364632237872, |
| "grad_norm": 0.5891418596351246, |
| "learning_rate": 1.7653702903398384e-06, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0934087485074997, |
| "step": 5900, |
| "valid_targets_mean": 5352.8, |
| "valid_targets_min": 3204 |
| }, |
| { |
| "epoch": 6.158581116327595, |
| "grad_norm": 0.5608103296545519, |
| "learning_rate": 1.7440691966062816e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08997437357902527, |
| "step": 5905, |
| "valid_targets_mean": 4794.9, |
| "valid_targets_min": 2556 |
| }, |
| { |
| "epoch": 6.163797600417318, |
| "grad_norm": 0.5098134796184438, |
| "learning_rate": 1.722891534319313e-06, |
| "loss": 0.1603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06943631917238235, |
| "step": 5910, |
| "valid_targets_mean": 4535.1, |
| "valid_targets_min": 1853 |
| }, |
| { |
| "epoch": 6.169014084507042, |
| "grad_norm": 0.526164578027781, |
| "learning_rate": 1.7018374466646981e-06, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07023682445287704, |
| "step": 5915, |
| "valid_targets_mean": 3967.6, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 6.174230568596766, |
| "grad_norm": 0.457588070414583, |
| "learning_rate": 1.6809070759927015e-06, |
| "loss": 0.1776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0662381500005722, |
| "step": 5920, |
| "valid_targets_mean": 5071.5, |
| "valid_targets_min": 1691 |
| }, |
| { |
| "epoch": 6.1794470526864895, |
| "grad_norm": 0.5283325738816248, |
| "learning_rate": 1.6601005638171065e-06, |
| "loss": 0.1685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07992766052484512, |
| "step": 5925, |
| "valid_targets_mean": 4880.5, |
| "valid_targets_min": 1822 |
| }, |
| { |
| "epoch": 6.184663536776213, |
| "grad_norm": 0.5747524763800537, |
| "learning_rate": 1.639418050814281e-06, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08078983426094055, |
| "step": 5930, |
| "valid_targets_mean": 4498.0, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 6.189880020865936, |
| "grad_norm": 0.6198787612885583, |
| "learning_rate": 1.6188596768221976e-06, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08396267890930176, |
| "step": 5935, |
| "valid_targets_mean": 4227.2, |
| "valid_targets_min": 2318 |
| }, |
| { |
| "epoch": 6.19509650495566, |
| "grad_norm": 0.5888969905988224, |
| "learning_rate": 1.5984255808395198e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07747550308704376, |
| "step": 5940, |
| "valid_targets_mean": 3874.4, |
| "valid_targets_min": 2695 |
| }, |
| { |
| "epoch": 6.200312989045384, |
| "grad_norm": 0.6054536148347041, |
| "learning_rate": 1.5781159010246306e-06, |
| "loss": 0.1752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08089844882488251, |
| "step": 5945, |
| "valid_targets_mean": 4071.9, |
| "valid_targets_min": 2128 |
| }, |
| { |
| "epoch": 6.2055294731351065, |
| "grad_norm": 0.5858727701096971, |
| "learning_rate": 1.557930774694727e-06, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08756640553474426, |
| "step": 5950, |
| "valid_targets_mean": 4455.8, |
| "valid_targets_min": 1541 |
| }, |
| { |
| "epoch": 6.21074595722483, |
| "grad_norm": 0.5025857589454156, |
| "learning_rate": 1.5378703383248694e-06, |
| "loss": 0.1588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06149665266275406, |
| "step": 5955, |
| "valid_targets_mean": 4103.9, |
| "valid_targets_min": 2589 |
| }, |
| { |
| "epoch": 6.215962441314554, |
| "grad_norm": 0.5378682703982972, |
| "learning_rate": 1.5179347275470812e-06, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07153839617967606, |
| "step": 5960, |
| "valid_targets_mean": 4121.4, |
| "valid_targets_min": 2355 |
| }, |
| { |
| "epoch": 6.221178925404278, |
| "grad_norm": 0.5349205613738541, |
| "learning_rate": 1.4981240771494032e-06, |
| "loss": 0.1709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08590535074472427, |
| "step": 5965, |
| "valid_targets_mean": 5365.2, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 6.2263954094940015, |
| "grad_norm": 0.5325294007196091, |
| "learning_rate": 1.4784385210750052e-06, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08586692810058594, |
| "step": 5970, |
| "valid_targets_mean": 5268.0, |
| "valid_targets_min": 2695 |
| }, |
| { |
| "epoch": 6.231611893583724, |
| "grad_norm": 0.4855600868655522, |
| "learning_rate": 1.458878192421278e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08848752081394196, |
| "step": 5975, |
| "valid_targets_mean": 6680.2, |
| "valid_targets_min": 4403 |
| }, |
| { |
| "epoch": 6.236828377673448, |
| "grad_norm": 0.6015572517875324, |
| "learning_rate": 1.4394432234389167e-06, |
| "loss": 0.1812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09191454201936722, |
| "step": 5980, |
| "valid_targets_mean": 4356.5, |
| "valid_targets_min": 1719 |
| }, |
| { |
| "epoch": 6.242044861763172, |
| "grad_norm": 0.4402990787358173, |
| "learning_rate": 1.4201337455310537e-06, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06941086053848267, |
| "step": 5985, |
| "valid_targets_mean": 6787.0, |
| "valid_targets_min": 2317 |
| }, |
| { |
| "epoch": 6.247261345852895, |
| "grad_norm": 0.5872346587921095, |
| "learning_rate": 1.4009498892523388e-06, |
| "loss": 0.1653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08713740855455399, |
| "step": 5990, |
| "valid_targets_mean": 3955.1, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 6.2524778299426185, |
| "grad_norm": 0.5316055760875934, |
| "learning_rate": 1.3818917843080848e-06, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09362940490245819, |
| "step": 5995, |
| "valid_targets_mean": 5888.6, |
| "valid_targets_min": 2046 |
| }, |
| { |
| "epoch": 6.257694314032342, |
| "grad_norm": 0.5763307643943745, |
| "learning_rate": 1.3629595595533673e-06, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09008698165416718, |
| "step": 6000, |
| "valid_targets_mean": 4186.6, |
| "valid_targets_min": 2044 |
| }, |
| { |
| "epoch": 6.262910798122066, |
| "grad_norm": 0.49631777502298174, |
| "learning_rate": 1.3441533429921804e-06, |
| "loss": 0.1717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08558864891529083, |
| "step": 6005, |
| "valid_targets_mean": 6150.6, |
| "valid_targets_min": 1425 |
| }, |
| { |
| "epoch": 6.26812728221179, |
| "grad_norm": 0.542934183154514, |
| "learning_rate": 1.3254732617765375e-06, |
| "loss": 0.1665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0806925892829895, |
| "step": 6010, |
| "valid_targets_mean": 5129.9, |
| "valid_targets_min": 1893 |
| }, |
| { |
| "epoch": 6.273343766301513, |
| "grad_norm": 0.597025228662152, |
| "learning_rate": 1.3069194422056454e-06, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09697069227695465, |
| "step": 6015, |
| "valid_targets_mean": 4211.5, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 6.278560250391236, |
| "grad_norm": 0.568551323103317, |
| "learning_rate": 1.2884920097250197e-06, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08361931890249252, |
| "step": 6020, |
| "valid_targets_mean": 3935.1, |
| "valid_targets_min": 1387 |
| }, |
| { |
| "epoch": 6.28377673448096, |
| "grad_norm": 0.5386832032057025, |
| "learning_rate": 1.2701910889256651e-06, |
| "loss": 0.1669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07516301423311234, |
| "step": 6025, |
| "valid_targets_mean": 4690.6, |
| "valid_targets_min": 1490 |
| }, |
| { |
| "epoch": 6.288993218570683, |
| "grad_norm": 0.5096384905174148, |
| "learning_rate": 1.2520168035432102e-06, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06578829884529114, |
| "step": 6030, |
| "valid_targets_mean": 4611.1, |
| "valid_targets_min": 3188 |
| }, |
| { |
| "epoch": 6.294209702660407, |
| "grad_norm": 0.5078443664032133, |
| "learning_rate": 1.2339692764570853e-06, |
| "loss": 0.1652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08106677234172821, |
| "step": 6035, |
| "valid_targets_mean": 5301.2, |
| "valid_targets_min": 2076 |
| }, |
| { |
| "epoch": 6.29942618675013, |
| "grad_norm": 0.6013232433244711, |
| "learning_rate": 1.2160486296896834e-06, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08288998156785965, |
| "step": 6040, |
| "valid_targets_mean": 3733.9, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 6.304642670839854, |
| "grad_norm": 0.5419758577541648, |
| "learning_rate": 1.198254984405538e-06, |
| "loss": 0.1806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09677646309137344, |
| "step": 6045, |
| "valid_targets_mean": 4574.4, |
| "valid_targets_min": 2195 |
| }, |
| { |
| "epoch": 6.309859154929577, |
| "grad_norm": 0.5446277500236966, |
| "learning_rate": 1.1805884609105012e-06, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09340253472328186, |
| "step": 6050, |
| "valid_targets_mean": 4646.2, |
| "valid_targets_min": 1737 |
| }, |
| { |
| "epoch": 6.315075639019301, |
| "grad_norm": 0.5243574814276308, |
| "learning_rate": 1.1630491786509457e-06, |
| "loss": 0.1594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07701204717159271, |
| "step": 6055, |
| "valid_targets_mean": 5141.8, |
| "valid_targets_min": 2266 |
| }, |
| { |
| "epoch": 6.3202921231090246, |
| "grad_norm": 0.6435320951413327, |
| "learning_rate": 1.1456372562129281e-06, |
| "loss": 0.1614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08175545930862427, |
| "step": 6060, |
| "valid_targets_mean": 5562.0, |
| "valid_targets_min": 1603 |
| }, |
| { |
| "epoch": 6.325508607198748, |
| "grad_norm": 0.5265813662985552, |
| "learning_rate": 1.1283528113214114e-06, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08022892475128174, |
| "step": 6065, |
| "valid_targets_mean": 4575.2, |
| "valid_targets_min": 208 |
| }, |
| { |
| "epoch": 6.330725091288471, |
| "grad_norm": 0.5119238855169547, |
| "learning_rate": 1.1111959608394662e-06, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.061150819063186646, |
| "step": 6070, |
| "valid_targets_mean": 4400.9, |
| "valid_targets_min": 2043 |
| }, |
| { |
| "epoch": 6.335941575378195, |
| "grad_norm": 0.5238475909765726, |
| "learning_rate": 1.094166820767464e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07575885951519012, |
| "step": 6075, |
| "valid_targets_mean": 5175.4, |
| "valid_targets_min": 2431 |
| }, |
| { |
| "epoch": 6.341158059467919, |
| "grad_norm": 0.5587142799014, |
| "learning_rate": 1.0772655062423176e-06, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07077431678771973, |
| "step": 6080, |
| "valid_targets_mean": 4443.2, |
| "valid_targets_min": 1914 |
| }, |
| { |
| "epoch": 6.346374543557642, |
| "grad_norm": 0.612857706137813, |
| "learning_rate": 1.0604921315366767e-06, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08608610928058624, |
| "step": 6085, |
| "valid_targets_mean": 4559.0, |
| "valid_targets_min": 1757 |
| }, |
| { |
| "epoch": 6.351591027647365, |
| "grad_norm": 0.6670742752657252, |
| "learning_rate": 1.0438468100581823e-06, |
| "loss": 0.1899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11555208265781403, |
| "step": 6090, |
| "valid_targets_mean": 3916.6, |
| "valid_targets_min": 2320 |
| }, |
| { |
| "epoch": 6.356807511737089, |
| "grad_norm": 0.5332052239349687, |
| "learning_rate": 1.027329654348672e-06, |
| "loss": 0.161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06971243023872375, |
| "step": 6095, |
| "valid_targets_mean": 3657.0, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 6.362023995826813, |
| "grad_norm": 0.5501198346395842, |
| "learning_rate": 1.01094077608344e-06, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09527956694364548, |
| "step": 6100, |
| "valid_targets_mean": 5293.6, |
| "valid_targets_min": 1475 |
| }, |
| { |
| "epoch": 6.3672404799165365, |
| "grad_norm": 0.7035339378264363, |
| "learning_rate": 9.946802860704706e-07, |
| "loss": 0.1792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0827580913901329, |
| "step": 6105, |
| "valid_targets_mean": 4001.9, |
| "valid_targets_min": 1451 |
| }, |
| { |
| "epoch": 6.372456964006259, |
| "grad_norm": 0.493625895550495, |
| "learning_rate": 9.785482942497037e-07, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07613112032413483, |
| "step": 6110, |
| "valid_targets_mean": 4524.5, |
| "valid_targets_min": 1899 |
| }, |
| { |
| "epoch": 6.377673448095983, |
| "grad_norm": 0.5241022319748064, |
| "learning_rate": 9.625449096922667e-07, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09136146306991577, |
| "step": 6115, |
| "valid_targets_mean": 5662.6, |
| "valid_targets_min": 3728 |
| }, |
| { |
| "epoch": 6.382889932185707, |
| "grad_norm": 1.0353966703876931, |
| "learning_rate": 9.466702405997674e-07, |
| "loss": 0.1716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.067151740193367, |
| "step": 6120, |
| "valid_targets_mean": 3555.2, |
| "valid_targets_min": 1302 |
| }, |
| { |
| "epoch": 6.388106416275431, |
| "grad_norm": 0.5746423268370077, |
| "learning_rate": 9.309243943035295e-07, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09859921038150787, |
| "step": 6125, |
| "valid_targets_mean": 4599.2, |
| "valid_targets_min": 3171 |
| }, |
| { |
| "epoch": 6.3933229003651535, |
| "grad_norm": 0.6544515306472833, |
| "learning_rate": 9.153074772638937e-07, |
| "loss": 0.1706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.096698097884655, |
| "step": 6130, |
| "valid_targets_mean": 4089.5, |
| "valid_targets_min": 1654 |
| }, |
| { |
| "epoch": 6.398539384454877, |
| "grad_norm": 0.5566676155158136, |
| "learning_rate": 8.99819595069491e-07, |
| "loss": 0.1716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1017160415649414, |
| "step": 6135, |
| "valid_targets_mean": 5410.6, |
| "valid_targets_min": 1624 |
| }, |
| { |
| "epoch": 6.403755868544601, |
| "grad_norm": 0.5230990896861292, |
| "learning_rate": 8.844608524365172e-07, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08459442108869553, |
| "step": 6140, |
| "valid_targets_mean": 5277.2, |
| "valid_targets_min": 2523 |
| }, |
| { |
| "epoch": 6.408972352634325, |
| "grad_norm": 0.5274707382276024, |
| "learning_rate": 8.692313532080443e-07, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07985209673643112, |
| "step": 6145, |
| "valid_targets_mean": 5341.5, |
| "valid_targets_min": 2441 |
| }, |
| { |
| "epoch": 6.414188836724048, |
| "grad_norm": 0.5416031184874927, |
| "learning_rate": 8.54131200353292e-07, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08388903737068176, |
| "step": 6150, |
| "valid_targets_mean": 5301.2, |
| "valid_targets_min": 1152 |
| }, |
| { |
| "epoch": 6.419405320813771, |
| "grad_norm": 0.5391134609004025, |
| "learning_rate": 8.391604959669619e-07, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07807138562202454, |
| "step": 6155, |
| "valid_targets_mean": 4546.0, |
| "valid_targets_min": 1655 |
| }, |
| { |
| "epoch": 6.424621804903495, |
| "grad_norm": 0.4960672468122204, |
| "learning_rate": 8.243193412685246e-07, |
| "loss": 0.1591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07477937638759613, |
| "step": 6160, |
| "valid_targets_mean": 5704.6, |
| "valid_targets_min": 3157 |
| }, |
| { |
| "epoch": 6.429838288993219, |
| "grad_norm": 0.5500642984629969, |
| "learning_rate": 8.096078366015514e-07, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0865449458360672, |
| "step": 6165, |
| "valid_targets_mean": 5272.1, |
| "valid_targets_min": 2280 |
| }, |
| { |
| "epoch": 6.435054773082942, |
| "grad_norm": 0.4982969915490319, |
| "learning_rate": 7.950260814330169e-07, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07472272962331772, |
| "step": 6170, |
| "valid_targets_mean": 4460.2, |
| "valid_targets_min": 1878 |
| }, |
| { |
| "epoch": 6.4402712571726655, |
| "grad_norm": 0.5341667921203153, |
| "learning_rate": 7.805741743526441e-07, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0895976796746254, |
| "step": 6175, |
| "valid_targets_mean": 5404.6, |
| "valid_targets_min": 2367 |
| }, |
| { |
| "epoch": 6.445487741262389, |
| "grad_norm": 0.5492125654290198, |
| "learning_rate": 7.662522130722294e-07, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07540404051542282, |
| "step": 6180, |
| "valid_targets_mean": 4739.1, |
| "valid_targets_min": 1735 |
| }, |
| { |
| "epoch": 6.450704225352113, |
| "grad_norm": 0.5358545190242257, |
| "learning_rate": 7.520602944249855e-07, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10180626064538956, |
| "step": 6185, |
| "valid_targets_mean": 5684.0, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 6.455920709441836, |
| "grad_norm": 0.5091791636322476, |
| "learning_rate": 7.379985143648815e-07, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.058316584676504135, |
| "step": 6190, |
| "valid_targets_mean": 4836.5, |
| "valid_targets_min": 1569 |
| }, |
| { |
| "epoch": 6.46113719353156, |
| "grad_norm": 0.5586442466521836, |
| "learning_rate": 7.240669679660017e-07, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09539739787578583, |
| "step": 6195, |
| "valid_targets_mean": 5895.9, |
| "valid_targets_min": 3541 |
| }, |
| { |
| "epoch": 6.466353677621283, |
| "grad_norm": 0.5006232216627376, |
| "learning_rate": 7.102657494218879e-07, |
| "loss": 0.1663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06938563287258148, |
| "step": 6200, |
| "valid_targets_mean": 4634.5, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 6.471570161711007, |
| "grad_norm": 0.5546239126291488, |
| "learning_rate": 6.965949520449311e-07, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0821041464805603, |
| "step": 6205, |
| "valid_targets_mean": 5086.8, |
| "valid_targets_min": 1856 |
| }, |
| { |
| "epoch": 6.47678664580073, |
| "grad_norm": 0.4910903623028209, |
| "learning_rate": 6.830546682657035e-07, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07834288477897644, |
| "step": 6210, |
| "valid_targets_mean": 5048.6, |
| "valid_targets_min": 2940 |
| }, |
| { |
| "epoch": 6.482003129890454, |
| "grad_norm": 0.554755174369064, |
| "learning_rate": 6.696449896323698e-07, |
| "loss": 0.1581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08156804740428925, |
| "step": 6215, |
| "valid_targets_mean": 4262.4, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 6.487219613980177, |
| "grad_norm": 0.5793166829491566, |
| "learning_rate": 6.563660068100408e-07, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08402011543512344, |
| "step": 6220, |
| "valid_targets_mean": 3359.8, |
| "valid_targets_min": 1691 |
| }, |
| { |
| "epoch": 6.492436098069901, |
| "grad_norm": 0.5586393784517392, |
| "learning_rate": 6.432178095801678e-07, |
| "loss": 0.1594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09661173820495605, |
| "step": 6225, |
| "valid_targets_mean": 4351.2, |
| "valid_targets_min": 2666 |
| }, |
| { |
| "epoch": 6.497652582159624, |
| "grad_norm": 0.5716779271221131, |
| "learning_rate": 6.302004868399514e-07, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07923077046871185, |
| "step": 6230, |
| "valid_targets_mean": 3839.8, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 6.502869066249348, |
| "grad_norm": 0.5753569634982648, |
| "learning_rate": 6.173141266017113e-07, |
| "loss": 0.1638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07147848606109619, |
| "step": 6235, |
| "valid_targets_mean": 3394.2, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 6.5080855503390715, |
| "grad_norm": 0.5245411730700712, |
| "learning_rate": 6.045588159923266e-07, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08123113214969635, |
| "step": 6240, |
| "valid_targets_mean": 5400.9, |
| "valid_targets_min": 3096 |
| }, |
| { |
| "epoch": 6.513302034428795, |
| "grad_norm": 0.5374981308134168, |
| "learning_rate": 5.919346412526117e-07, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08702099323272705, |
| "step": 6245, |
| "valid_targets_mean": 5240.4, |
| "valid_targets_min": 1771 |
| }, |
| { |
| "epoch": 6.518518518518518, |
| "grad_norm": 0.5926256551419858, |
| "learning_rate": 5.794416877367526e-07, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07396068423986435, |
| "step": 6250, |
| "valid_targets_mean": 3938.5, |
| "valid_targets_min": 2393 |
| }, |
| { |
| "epoch": 6.523735002608242, |
| "grad_norm": 0.5130895160388712, |
| "learning_rate": 5.670800399117316e-07, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08972735702991486, |
| "step": 6255, |
| "valid_targets_mean": 5926.8, |
| "valid_targets_min": 2193 |
| }, |
| { |
| "epoch": 6.528951486697966, |
| "grad_norm": 0.6837534994812857, |
| "learning_rate": 5.548497813567455e-07, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09018000960350037, |
| "step": 6260, |
| "valid_targets_mean": 4145.4, |
| "valid_targets_min": 2124 |
| }, |
| { |
| "epoch": 6.534167970787689, |
| "grad_norm": 0.5858320399320168, |
| "learning_rate": 5.427509947626486e-07, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06871044635772705, |
| "step": 6265, |
| "valid_targets_mean": 4609.0, |
| "valid_targets_min": 1686 |
| }, |
| { |
| "epoch": 6.539384454877412, |
| "grad_norm": 0.9369134981527133, |
| "learning_rate": 5.307837619313949e-07, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09468284249305725, |
| "step": 6270, |
| "valid_targets_mean": 4776.0, |
| "valid_targets_min": 1565 |
| }, |
| { |
| "epoch": 6.544600938967136, |
| "grad_norm": 0.4906643606770716, |
| "learning_rate": 5.189481637754679e-07, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06301077455282211, |
| "step": 6275, |
| "valid_targets_mean": 4904.9, |
| "valid_targets_min": 2530 |
| }, |
| { |
| "epoch": 6.54981742305686, |
| "grad_norm": 0.5299721524580903, |
| "learning_rate": 5.072442803173649e-07, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0912301167845726, |
| "step": 6280, |
| "valid_targets_mean": 4950.5, |
| "valid_targets_min": 1084 |
| }, |
| { |
| "epoch": 6.5550339071465835, |
| "grad_norm": 0.6255622891103191, |
| "learning_rate": 4.956721906890228e-07, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09659097343683243, |
| "step": 6285, |
| "valid_targets_mean": 4950.6, |
| "valid_targets_min": 1533 |
| }, |
| { |
| "epoch": 6.560250391236306, |
| "grad_norm": 0.6174968011521565, |
| "learning_rate": 4.842319731313016e-07, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10585039108991623, |
| "step": 6290, |
| "valid_targets_mean": 4290.8, |
| "valid_targets_min": 1528 |
| }, |
| { |
| "epoch": 6.56546687532603, |
| "grad_norm": 0.5861852083749461, |
| "learning_rate": 4.729237049934621e-07, |
| "loss": 0.1682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08830663561820984, |
| "step": 6295, |
| "valid_targets_mean": 4821.6, |
| "valid_targets_min": 1612 |
| }, |
| { |
| "epoch": 6.570683359415754, |
| "grad_norm": 0.5463462106108242, |
| "learning_rate": 4.6174746273261793e-07, |
| "loss": 0.1708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08798755705356598, |
| "step": 6300, |
| "valid_targets_mean": 4962.6, |
| "valid_targets_min": 1741 |
| }, |
| { |
| "epoch": 6.575899843505478, |
| "grad_norm": 0.5532379866364969, |
| "learning_rate": 4.507033219132395e-07, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07625909149646759, |
| "step": 6305, |
| "valid_targets_mean": 4648.1, |
| "valid_targets_min": 2171 |
| }, |
| { |
| "epoch": 6.5811163275952005, |
| "grad_norm": 0.5065410208057752, |
| "learning_rate": 4.3979135720664035e-07, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06727365404367447, |
| "step": 6310, |
| "valid_targets_mean": 5517.6, |
| "valid_targets_min": 2833 |
| }, |
| { |
| "epoch": 6.586332811684924, |
| "grad_norm": 0.5493744454932743, |
| "learning_rate": 4.2901164239046443e-07, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09966464340686798, |
| "step": 6315, |
| "valid_targets_mean": 5292.9, |
| "valid_targets_min": 3144 |
| }, |
| { |
| "epoch": 6.591549295774648, |
| "grad_norm": 0.5761969297622763, |
| "learning_rate": 4.1836425034819106e-07, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08473914861679077, |
| "step": 6320, |
| "valid_targets_mean": 4597.6, |
| "valid_targets_min": 2802 |
| }, |
| { |
| "epoch": 6.596765779864372, |
| "grad_norm": 0.7363640904744337, |
| "learning_rate": 4.078492530686506e-07, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08203506469726562, |
| "step": 6325, |
| "valid_targets_mean": 3774.4, |
| "valid_targets_min": 1338 |
| }, |
| { |
| "epoch": 6.601982263954095, |
| "grad_norm": 0.5094006763949639, |
| "learning_rate": 3.9746672164551856e-07, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07795064151287079, |
| "step": 6330, |
| "valid_targets_mean": 5433.5, |
| "valid_targets_min": 1882 |
| }, |
| { |
| "epoch": 6.607198748043818, |
| "grad_norm": 0.6061614255410304, |
| "learning_rate": 3.872167262768578e-07, |
| "loss": 0.1717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07970091700553894, |
| "step": 6335, |
| "valid_targets_mean": 4424.8, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 6.612415232133542, |
| "grad_norm": 0.505158025715867, |
| "learning_rate": 3.7709933626461916e-07, |
| "loss": 0.1641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07546493411064148, |
| "step": 6340, |
| "valid_targets_mean": 4831.2, |
| "valid_targets_min": 2092 |
| }, |
| { |
| "epoch": 6.617631716223266, |
| "grad_norm": 0.48956541874495973, |
| "learning_rate": 3.671146200142017e-07, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08042104542255402, |
| "step": 6345, |
| "valid_targets_mean": 6330.6, |
| "valid_targets_min": 3720 |
| }, |
| { |
| "epoch": 6.622848200312989, |
| "grad_norm": 0.552499065585299, |
| "learning_rate": 3.5726264503396e-07, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0773078203201294, |
| "step": 6350, |
| "valid_targets_mean": 4676.6, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 6.6280646844027125, |
| "grad_norm": 0.5241665236185439, |
| "learning_rate": 3.475434779347731e-07, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08315479755401611, |
| "step": 6355, |
| "valid_targets_mean": 4854.5, |
| "valid_targets_min": 2492 |
| }, |
| { |
| "epoch": 6.633281168492436, |
| "grad_norm": 0.5229494178000254, |
| "learning_rate": 3.3795718442957593e-07, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07639910280704498, |
| "step": 6360, |
| "valid_targets_mean": 4369.9, |
| "valid_targets_min": 2310 |
| }, |
| { |
| "epoch": 6.63849765258216, |
| "grad_norm": 0.6365838431533449, |
| "learning_rate": 3.2850382933292903e-07, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06544691324234009, |
| "step": 6365, |
| "valid_targets_mean": 4716.8, |
| "valid_targets_min": 1774 |
| }, |
| { |
| "epoch": 6.643714136671883, |
| "grad_norm": 0.6078803116735846, |
| "learning_rate": 3.1918347656056946e-07, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08977963775396347, |
| "step": 6370, |
| "valid_targets_mean": 4123.0, |
| "valid_targets_min": 2271 |
| }, |
| { |
| "epoch": 6.648930620761607, |
| "grad_norm": 0.5502228136170516, |
| "learning_rate": 3.0999618912898267e-07, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08217453956604004, |
| "step": 6375, |
| "valid_targets_mean": 5216.9, |
| "valid_targets_min": 2267 |
| }, |
| { |
| "epoch": 6.65414710485133, |
| "grad_norm": 0.4903820521932893, |
| "learning_rate": 3.009420291549825e-07, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07962026447057724, |
| "step": 6380, |
| "valid_targets_mean": 6445.1, |
| "valid_targets_min": 1973 |
| }, |
| { |
| "epoch": 6.659363588941054, |
| "grad_norm": 0.6635091094279434, |
| "learning_rate": 2.9202105785527623e-07, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10168874263763428, |
| "step": 6385, |
| "valid_targets_mean": 3914.8, |
| "valid_targets_min": 2387 |
| }, |
| { |
| "epoch": 6.664580073030777, |
| "grad_norm": 0.5674026350366216, |
| "learning_rate": 2.8323333554606923e-07, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09658002853393555, |
| "step": 6390, |
| "valid_targets_mean": 5366.6, |
| "valid_targets_min": 2041 |
| }, |
| { |
| "epoch": 6.669796557120501, |
| "grad_norm": 0.5317292589938676, |
| "learning_rate": 2.745789216426387e-07, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07777095586061478, |
| "step": 6395, |
| "valid_targets_mean": 4769.0, |
| "valid_targets_min": 2111 |
| }, |
| { |
| "epoch": 6.675013041210224, |
| "grad_norm": 0.6203666831879747, |
| "learning_rate": 2.660578746589515e-07, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09512919187545776, |
| "step": 6400, |
| "valid_targets_mean": 4147.4, |
| "valid_targets_min": 1817 |
| }, |
| { |
| "epoch": 6.680229525299948, |
| "grad_norm": 0.6113606882976234, |
| "learning_rate": 2.5767025220724717e-07, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10862178355455399, |
| "step": 6405, |
| "valid_targets_mean": 5514.9, |
| "valid_targets_min": 2444 |
| }, |
| { |
| "epoch": 6.685446009389671, |
| "grad_norm": 0.5684941882814628, |
| "learning_rate": 2.4941611099766896e-07, |
| "loss": 0.1701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07307954132556915, |
| "step": 6410, |
| "valid_targets_mean": 4531.8, |
| "valid_targets_min": 1787 |
| }, |
| { |
| "epoch": 6.690662493479395, |
| "grad_norm": 0.5125407630567089, |
| "learning_rate": 2.4129550683786194e-07, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07515746355056763, |
| "step": 6415, |
| "valid_targets_mean": 4874.9, |
| "valid_targets_min": 2187 |
| }, |
| { |
| "epoch": 6.6958789775691185, |
| "grad_norm": 0.5153495108176748, |
| "learning_rate": 2.3330849463261363e-07, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0719965398311615, |
| "step": 6420, |
| "valid_targets_mean": 3854.9, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 6.701095461658842, |
| "grad_norm": 0.5176861251483592, |
| "learning_rate": 2.2545512838346716e-07, |
| "loss": 0.158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06797109544277191, |
| "step": 6425, |
| "valid_targets_mean": 4365.1, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 6.706311945748565, |
| "grad_norm": 0.559817981189732, |
| "learning_rate": 2.1773546118836418e-07, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0822562575340271, |
| "step": 6430, |
| "valid_targets_mean": 4119.1, |
| "valid_targets_min": 1455 |
| }, |
| { |
| "epoch": 6.711528429838289, |
| "grad_norm": 0.5474882365834455, |
| "learning_rate": 2.1014954524128493e-07, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08481225371360779, |
| "step": 6435, |
| "valid_targets_mean": 5039.8, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 6.716744913928013, |
| "grad_norm": 0.5086535693869745, |
| "learning_rate": 2.0269743183189528e-07, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0783454105257988, |
| "step": 6440, |
| "valid_targets_mean": 4745.6, |
| "valid_targets_min": 1473 |
| }, |
| { |
| "epoch": 6.721961398017736, |
| "grad_norm": 0.5080116207115293, |
| "learning_rate": 1.9537917134520023e-07, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.068985216319561, |
| "step": 6445, |
| "valid_targets_mean": 4546.9, |
| "valid_targets_min": 3249 |
| }, |
| { |
| "epoch": 6.727177882107459, |
| "grad_norm": 0.5495255536817283, |
| "learning_rate": 1.881948132611977e-07, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06369595229625702, |
| "step": 6450, |
| "valid_targets_mean": 3474.2, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 6.732394366197183, |
| "grad_norm": 0.5994488137520114, |
| "learning_rate": 1.811444061545542e-07, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08287137746810913, |
| "step": 6455, |
| "valid_targets_mean": 4944.2, |
| "valid_targets_min": 2391 |
| }, |
| { |
| "epoch": 6.737610850286907, |
| "grad_norm": 0.5126567683176668, |
| "learning_rate": 1.7422799769426736e-07, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.061244308948516846, |
| "step": 6460, |
| "valid_targets_mean": 3977.2, |
| "valid_targets_min": 2516 |
| }, |
| { |
| "epoch": 6.7428273343766305, |
| "grad_norm": 0.5831515070930245, |
| "learning_rate": 1.674456346433506e-07, |
| "loss": 0.1716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08915935456752777, |
| "step": 6465, |
| "valid_targets_mean": 4809.4, |
| "valid_targets_min": 2022 |
| }, |
| { |
| "epoch": 6.748043818466353, |
| "grad_norm": 0.5730307050297281, |
| "learning_rate": 1.607973628585091e-07, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08513954281806946, |
| "step": 6470, |
| "valid_targets_mean": 4412.6, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 6.753260302556077, |
| "grad_norm": 0.5790497202571583, |
| "learning_rate": 1.542832272898398e-07, |
| "loss": 0.1771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09173041582107544, |
| "step": 6475, |
| "valid_targets_mean": 4468.9, |
| "valid_targets_min": 1852 |
| }, |
| { |
| "epoch": 6.758476786645801, |
| "grad_norm": 0.5159289857385856, |
| "learning_rate": 1.4790327198051624e-07, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07732409238815308, |
| "step": 6480, |
| "valid_targets_mean": 4268.2, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 6.763693270735525, |
| "grad_norm": 0.5261496459131189, |
| "learning_rate": 1.416575400664999e-07, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08644157648086548, |
| "step": 6485, |
| "valid_targets_mean": 5388.8, |
| "valid_targets_min": 2127 |
| }, |
| { |
| "epoch": 6.7689097548252475, |
| "grad_norm": 0.5229503599641532, |
| "learning_rate": 1.3554607377624263e-07, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07498866319656372, |
| "step": 6490, |
| "valid_targets_mean": 4785.5, |
| "valid_targets_min": 2022 |
| }, |
| { |
| "epoch": 6.774126238914971, |
| "grad_norm": 0.5073924620034521, |
| "learning_rate": 1.295689144304091e-07, |
| "loss": 0.1626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07597608864307404, |
| "step": 6495, |
| "valid_targets_mean": 5095.1, |
| "valid_targets_min": 1500 |
| }, |
| { |
| "epoch": 6.779342723004695, |
| "grad_norm": 0.5742958458442429, |
| "learning_rate": 1.237261024415881e-07, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08016721159219742, |
| "step": 6500, |
| "valid_targets_mean": 4903.2, |
| "valid_targets_min": 2192 |
| }, |
| { |
| "epoch": 6.784559207094419, |
| "grad_norm": 0.5634137025390458, |
| "learning_rate": 1.1801767731401958e-07, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0954822227358818, |
| "step": 6505, |
| "valid_targets_mean": 4574.5, |
| "valid_targets_min": 1753 |
| }, |
| { |
| "epoch": 6.789775691184142, |
| "grad_norm": 0.568993442444071, |
| "learning_rate": 1.1244367764333464e-07, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10571624338626862, |
| "step": 6510, |
| "valid_targets_mean": 5754.6, |
| "valid_targets_min": 3334 |
| }, |
| { |
| "epoch": 6.794992175273865, |
| "grad_norm": 0.5520081151531104, |
| "learning_rate": 1.0700414111629365e-07, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09768638759851456, |
| "step": 6515, |
| "valid_targets_mean": 3943.8, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 6.800208659363589, |
| "grad_norm": 0.5760719080774065, |
| "learning_rate": 1.0169910451052422e-07, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07405383884906769, |
| "step": 6520, |
| "valid_targets_mean": 4556.4, |
| "valid_targets_min": 1193 |
| }, |
| { |
| "epoch": 6.805425143453313, |
| "grad_norm": 0.4978196958326634, |
| "learning_rate": 9.652860369428141e-08, |
| "loss": 0.1725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0769326388835907, |
| "step": 6525, |
| "valid_targets_mean": 5648.2, |
| "valid_targets_min": 3140 |
| }, |
| { |
| "epoch": 6.810641627543036, |
| "grad_norm": 0.6255097736995268, |
| "learning_rate": 9.149267362619895e-08, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09469383209943771, |
| "step": 6530, |
| "valid_targets_mean": 5004.4, |
| "valid_targets_min": 1876 |
| }, |
| { |
| "epoch": 6.8158581116327595, |
| "grad_norm": 0.5891644536704017, |
| "learning_rate": 8.659134835504956e-08, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1021219789981842, |
| "step": 6535, |
| "valid_targets_mean": 4905.6, |
| "valid_targets_min": 2000 |
| }, |
| { |
| "epoch": 6.821074595722483, |
| "grad_norm": 0.5525031252703527, |
| "learning_rate": 8.18246610195339e-08, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08424567431211472, |
| "step": 6540, |
| "valid_targets_mean": 4678.4, |
| "valid_targets_min": 1207 |
| }, |
| { |
| "epoch": 6.826291079812207, |
| "grad_norm": 0.5791393289700533, |
| "learning_rate": 7.719264384802527e-08, |
| "loss": 0.1574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07773526012897491, |
| "step": 6545, |
| "valid_targets_mean": 4099.8, |
| "valid_targets_min": 1625 |
| }, |
| { |
| "epoch": 6.83150756390193, |
| "grad_norm": 0.5161030337927414, |
| "learning_rate": 7.269532815838532e-08, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08431129157543182, |
| "step": 6550, |
| "valid_targets_mean": 5410.5, |
| "valid_targets_min": 2155 |
| }, |
| { |
| "epoch": 6.836724047991654, |
| "grad_norm": 0.490060135511807, |
| "learning_rate": 6.833274435772196e-08, |
| "loss": 0.1583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06826452910900116, |
| "step": 6555, |
| "valid_targets_mean": 5077.6, |
| "valid_targets_min": 2890 |
| }, |
| { |
| "epoch": 6.841940532081377, |
| "grad_norm": 0.6084355470618008, |
| "learning_rate": 6.410492194220963e-08, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09635565429925919, |
| "step": 6560, |
| "valid_targets_mean": 4256.8, |
| "valid_targets_min": 1858 |
| }, |
| { |
| "epoch": 6.847157016171101, |
| "grad_norm": 0.5464942429975727, |
| "learning_rate": 6.001188949687153e-08, |
| "loss": 0.1641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0908285453915596, |
| "step": 6565, |
| "valid_targets_mean": 4766.1, |
| "valid_targets_min": 2251 |
| }, |
| { |
| "epoch": 6.852373500260824, |
| "grad_norm": 0.5324427723013748, |
| "learning_rate": 5.6053674695395463e-08, |
| "loss": 0.1609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07651311159133911, |
| "step": 6570, |
| "valid_targets_mean": 4681.2, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 6.857589984350548, |
| "grad_norm": 0.5316025405834288, |
| "learning_rate": 5.22303042999428e-08, |
| "loss": 0.1834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09243462979793549, |
| "step": 6575, |
| "valid_targets_mean": 5462.0, |
| "valid_targets_min": 2448 |
| }, |
| { |
| "epoch": 6.862806468440271, |
| "grad_norm": 0.5548110954612004, |
| "learning_rate": 4.8541804160968655e-08, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08866509795188904, |
| "step": 6580, |
| "valid_targets_mean": 4857.0, |
| "valid_targets_min": 2369 |
| }, |
| { |
| "epoch": 6.868022952529994, |
| "grad_norm": 0.6056436002002238, |
| "learning_rate": 4.498819921705089e-08, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08769193291664124, |
| "step": 6585, |
| "valid_targets_mean": 4305.8, |
| "valid_targets_min": 2471 |
| }, |
| { |
| "epoch": 6.873239436619718, |
| "grad_norm": 0.6181972867280068, |
| "learning_rate": 4.15695134947125e-08, |
| "loss": 0.1626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09733624756336212, |
| "step": 6590, |
| "valid_targets_mean": 3868.6, |
| "valid_targets_min": 1982 |
| }, |
| { |
| "epoch": 6.878455920709442, |
| "grad_norm": 0.5205648849887881, |
| "learning_rate": 3.8285770108272836e-08, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08204355835914612, |
| "step": 6595, |
| "valid_targets_mean": 5234.4, |
| "valid_targets_min": 2231 |
| }, |
| { |
| "epoch": 6.8836724047991655, |
| "grad_norm": 0.5328299359281365, |
| "learning_rate": 3.5136991259672183e-08, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06707605719566345, |
| "step": 6600, |
| "valid_targets_mean": 5658.4, |
| "valid_targets_min": 1472 |
| }, |
| { |
| "epoch": 6.888888888888889, |
| "grad_norm": 0.5526066203448274, |
| "learning_rate": 3.212319823834298e-08, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12305822968482971, |
| "step": 6605, |
| "valid_targets_mean": 4908.1, |
| "valid_targets_min": 1847 |
| }, |
| { |
| "epoch": 6.894105372978612, |
| "grad_norm": 0.48472299525783724, |
| "learning_rate": 2.9244411421049946e-08, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0804297924041748, |
| "step": 6610, |
| "valid_targets_mean": 4955.9, |
| "valid_targets_min": 2223 |
| }, |
| { |
| "epoch": 6.899321857068336, |
| "grad_norm": 0.491359095042733, |
| "learning_rate": 2.6500650271759077e-08, |
| "loss": 0.1669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0729602798819542, |
| "step": 6615, |
| "valid_targets_mean": 5261.2, |
| "valid_targets_min": 2934 |
| }, |
| { |
| "epoch": 6.90453834115806, |
| "grad_norm": 0.5105255246216366, |
| "learning_rate": 2.3891933341506636e-08, |
| "loss": 0.1593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07847601920366287, |
| "step": 6620, |
| "valid_targets_mean": 5682.6, |
| "valid_targets_min": 2283 |
| }, |
| { |
| "epoch": 6.9097548252477825, |
| "grad_norm": 0.5651999326941914, |
| "learning_rate": 2.1418278268270365e-08, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08119011670351028, |
| "step": 6625, |
| "valid_targets_mean": 5365.1, |
| "valid_targets_min": 2328 |
| }, |
| { |
| "epoch": 6.914971309337506, |
| "grad_norm": 0.4752856662151638, |
| "learning_rate": 1.907970177684737e-08, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07210240513086319, |
| "step": 6630, |
| "valid_targets_mean": 6072.9, |
| "valid_targets_min": 3350 |
| }, |
| { |
| "epoch": 6.92018779342723, |
| "grad_norm": 0.536334628512583, |
| "learning_rate": 1.687621967875863e-08, |
| "loss": 0.1792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08057719469070435, |
| "step": 6635, |
| "valid_targets_mean": 5156.0, |
| "valid_targets_min": 2835 |
| }, |
| { |
| "epoch": 6.925404277516954, |
| "grad_norm": 0.5605009892985632, |
| "learning_rate": 1.4807846872113563e-08, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08201783895492554, |
| "step": 6640, |
| "valid_targets_mean": 4241.5, |
| "valid_targets_min": 2650 |
| }, |
| { |
| "epoch": 6.9306207616066775, |
| "grad_norm": 0.5315249799499744, |
| "learning_rate": 1.2874597341534512e-08, |
| "loss": 0.1716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08200040459632874, |
| "step": 6645, |
| "valid_targets_mean": 4877.6, |
| "valid_targets_min": 2332 |
| }, |
| { |
| "epoch": 6.9358372456964, |
| "grad_norm": 0.6271880493962537, |
| "learning_rate": 1.1076484158047962e-08, |
| "loss": 0.1653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11016195267438889, |
| "step": 6650, |
| "valid_targets_mean": 4848.4, |
| "valid_targets_min": 2185 |
| }, |
| { |
| "epoch": 6.941053729786124, |
| "grad_norm": 0.4985270702899821, |
| "learning_rate": 9.413519479004596e-09, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06930582225322723, |
| "step": 6655, |
| "valid_targets_mean": 5042.6, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 6.946270213875848, |
| "grad_norm": 0.5376613750357377, |
| "learning_rate": 7.885714547990475e-09, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07879330217838287, |
| "step": 6660, |
| "valid_targets_mean": 5642.0, |
| "valid_targets_min": 1683 |
| }, |
| { |
| "epoch": 6.951486697965571, |
| "grad_norm": 0.6210626987569594, |
| "learning_rate": 6.493079694753768e-09, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08401305973529816, |
| "step": 6665, |
| "valid_targets_mean": 4189.1, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 6.9567031820552945, |
| "grad_norm": 0.6346567450751912, |
| "learning_rate": 5.235624335133693e-09, |
| "loss": 0.17, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11028879135847092, |
| "step": 6670, |
| "valid_targets_mean": 4331.8, |
| "valid_targets_min": 1737 |
| }, |
| { |
| "epoch": 6.961919666145018, |
| "grad_norm": 0.5399427080559815, |
| "learning_rate": 4.113356971002791e-09, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06442070007324219, |
| "step": 6675, |
| "valid_targets_mean": 3822.8, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 6.967136150234742, |
| "grad_norm": 0.5544017097545518, |
| "learning_rate": 3.126285190195866e-09, |
| "loss": 0.1602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.061635371297597885, |
| "step": 6680, |
| "valid_targets_mean": 3973.4, |
| "valid_targets_min": 229 |
| }, |
| { |
| "epoch": 6.972352634324466, |
| "grad_norm": 0.5098397885779282, |
| "learning_rate": 2.2744156664766813e-09, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08478450775146484, |
| "step": 6685, |
| "valid_targets_mean": 4589.8, |
| "valid_targets_min": 1221 |
| }, |
| { |
| "epoch": 6.977569118414189, |
| "grad_norm": 0.5411222657320197, |
| "learning_rate": 1.5577541594802293e-09, |
| "loss": 0.1663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10507169365882874, |
| "step": 6690, |
| "valid_targets_mean": 6228.5, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 6.982785602503912, |
| "grad_norm": 0.5713424510280001, |
| "learning_rate": 9.7630551467498e-10, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08130859583616257, |
| "step": 6695, |
| "valid_targets_mean": 4436.1, |
| "valid_targets_min": 1928 |
| }, |
| { |
| "epoch": 6.988002086593636, |
| "grad_norm": 0.49450624264968135, |
| "learning_rate": 5.300736633317982e-10, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07469873875379562, |
| "step": 6700, |
| "valid_targets_mean": 5284.1, |
| "valid_targets_min": 1889 |
| }, |
| { |
| "epoch": 6.993218570683359, |
| "grad_norm": 0.8620431386424838, |
| "learning_rate": 2.1906162250395768e-10, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08396423608064651, |
| "step": 6705, |
| "valid_targets_mean": 5400.6, |
| "valid_targets_min": 1757 |
| }, |
| { |
| "epoch": 6.998435054773083, |
| "grad_norm": 0.5780156319377473, |
| "learning_rate": 4.3271494996055544e-11, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0954805314540863, |
| "step": 6710, |
| "valid_targets_mean": 4702.2, |
| "valid_targets_min": 3222 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14267900586128235, |
| "step": 6712, |
| "total_flos": 3.0948342577517036e+18, |
| "train_loss": 0.11350778881926644, |
| "train_runtime": 136690.7198, |
| "train_samples_per_second": 0.785, |
| "train_steps_per_second": 0.049, |
| "valid_targets_mean": 6167.6, |
| "valid_targets_min": 3936 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 6713, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 200, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": false |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 3.0948342577517036e+18, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|