| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 5.0, |
| "eval_steps": 500, |
| "global_step": 4940, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.005063291139240506, |
| "grad_norm": 4.609051043616223, |
| "learning_rate": 3.238866396761134e-07, |
| "loss": 0.5035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25989317893981934, |
| "step": 5, |
| "valid_targets_mean": 3288.2, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 0.010126582278481013, |
| "grad_norm": 3.6056753367980687, |
| "learning_rate": 7.287449392712551e-07, |
| "loss": 0.4979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23132257163524628, |
| "step": 10, |
| "valid_targets_mean": 4994.0, |
| "valid_targets_min": 1103 |
| }, |
| { |
| "epoch": 0.015189873417721518, |
| "grad_norm": 3.75046312941662, |
| "learning_rate": 1.133603238866397e-06, |
| "loss": 0.5107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23433995246887207, |
| "step": 15, |
| "valid_targets_mean": 4084.1, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 0.020253164556962026, |
| "grad_norm": 4.009323566522028, |
| "learning_rate": 1.5384615384615387e-06, |
| "loss": 0.4757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19289864599704742, |
| "step": 20, |
| "valid_targets_mean": 4351.0, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 0.02531645569620253, |
| "grad_norm": 3.857687726883038, |
| "learning_rate": 1.9433198380566803e-06, |
| "loss": 0.4795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25582650303840637, |
| "step": 25, |
| "valid_targets_mean": 4894.1, |
| "valid_targets_min": 1784 |
| }, |
| { |
| "epoch": 0.030379746835443037, |
| "grad_norm": 2.431783748480512, |
| "learning_rate": 2.348178137651822e-06, |
| "loss": 0.4538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21279120445251465, |
| "step": 30, |
| "valid_targets_mean": 4872.4, |
| "valid_targets_min": 1107 |
| }, |
| { |
| "epoch": 0.035443037974683546, |
| "grad_norm": 2.0913610531108153, |
| "learning_rate": 2.7530364372469636e-06, |
| "loss": 0.4576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21099823713302612, |
| "step": 35, |
| "valid_targets_mean": 4177.9, |
| "valid_targets_min": 1173 |
| }, |
| { |
| "epoch": 0.04050632911392405, |
| "grad_norm": 2.1267526423567826, |
| "learning_rate": 3.157894736842105e-06, |
| "loss": 0.4362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21998053789138794, |
| "step": 40, |
| "valid_targets_mean": 5318.6, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 0.04556962025316456, |
| "grad_norm": 1.8229308674567508, |
| "learning_rate": 3.562753036437247e-06, |
| "loss": 0.4107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21922659873962402, |
| "step": 45, |
| "valid_targets_mean": 3793.9, |
| "valid_targets_min": 1470 |
| }, |
| { |
| "epoch": 0.05063291139240506, |
| "grad_norm": 1.1764023018227465, |
| "learning_rate": 3.967611336032389e-06, |
| "loss": 0.3992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1912367194890976, |
| "step": 50, |
| "valid_targets_mean": 4403.0, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 0.05569620253164557, |
| "grad_norm": 1.0017414517719199, |
| "learning_rate": 4.372469635627531e-06, |
| "loss": 0.3867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19108061492443085, |
| "step": 55, |
| "valid_targets_mean": 4060.0, |
| "valid_targets_min": 1137 |
| }, |
| { |
| "epoch": 0.060759493670886074, |
| "grad_norm": 0.7507852394561627, |
| "learning_rate": 4.7773279352226725e-06, |
| "loss": 0.3841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16387608647346497, |
| "step": 60, |
| "valid_targets_mean": 4424.5, |
| "valid_targets_min": 1409 |
| }, |
| { |
| "epoch": 0.06582278481012659, |
| "grad_norm": 0.557594133353884, |
| "learning_rate": 5.1821862348178145e-06, |
| "loss": 0.3711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16386422514915466, |
| "step": 65, |
| "valid_targets_mean": 3916.2, |
| "valid_targets_min": 1045 |
| }, |
| { |
| "epoch": 0.07088607594936709, |
| "grad_norm": 0.421043632829371, |
| "learning_rate": 5.5870445344129565e-06, |
| "loss": 0.3875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19452455639839172, |
| "step": 70, |
| "valid_targets_mean": 5656.6, |
| "valid_targets_min": 1746 |
| }, |
| { |
| "epoch": 0.0759493670886076, |
| "grad_norm": 0.41166529544187236, |
| "learning_rate": 5.991902834008098e-06, |
| "loss": 0.3747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2017640769481659, |
| "step": 75, |
| "valid_targets_mean": 5565.6, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 0.0810126582278481, |
| "grad_norm": 0.37589937170078513, |
| "learning_rate": 6.39676113360324e-06, |
| "loss": 0.3707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13995295763015747, |
| "step": 80, |
| "valid_targets_mean": 3588.8, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 0.08607594936708861, |
| "grad_norm": 0.3714038081964425, |
| "learning_rate": 6.801619433198381e-06, |
| "loss": 0.3691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21744906902313232, |
| "step": 85, |
| "valid_targets_mean": 5115.6, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 0.09113924050632911, |
| "grad_norm": 0.34597741271059124, |
| "learning_rate": 7.206477732793523e-06, |
| "loss": 0.3564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17021265625953674, |
| "step": 90, |
| "valid_targets_mean": 5033.3, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 0.09620253164556962, |
| "grad_norm": 0.3172791695402959, |
| "learning_rate": 7.611336032388664e-06, |
| "loss": 0.3739, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16697894036769867, |
| "step": 95, |
| "valid_targets_mean": 5135.7, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 0.10126582278481013, |
| "grad_norm": 0.3605571673212477, |
| "learning_rate": 8.016194331983806e-06, |
| "loss": 0.3609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17649498581886292, |
| "step": 100, |
| "valid_targets_mean": 4052.9, |
| "valid_targets_min": 1407 |
| }, |
| { |
| "epoch": 0.10632911392405063, |
| "grad_norm": 0.3126393081213533, |
| "learning_rate": 8.421052631578948e-06, |
| "loss": 0.3512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14957275986671448, |
| "step": 105, |
| "valid_targets_mean": 4704.9, |
| "valid_targets_min": 1914 |
| }, |
| { |
| "epoch": 0.11139240506329114, |
| "grad_norm": 0.3531313178759686, |
| "learning_rate": 8.82591093117409e-06, |
| "loss": 0.3726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16743913292884827, |
| "step": 110, |
| "valid_targets_mean": 3947.0, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 0.11645569620253164, |
| "grad_norm": 0.361312795641348, |
| "learning_rate": 9.230769230769232e-06, |
| "loss": 0.3633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1453179121017456, |
| "step": 115, |
| "valid_targets_mean": 2979.1, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 0.12151898734177215, |
| "grad_norm": 0.3118010440427671, |
| "learning_rate": 9.635627530364373e-06, |
| "loss": 0.3533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1923716962337494, |
| "step": 120, |
| "valid_targets_mean": 5371.9, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 0.12658227848101267, |
| "grad_norm": 0.35948459926380516, |
| "learning_rate": 1.0040485829959515e-05, |
| "loss": 0.348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2048473060131073, |
| "step": 125, |
| "valid_targets_mean": 4750.8, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 0.13164556962025317, |
| "grad_norm": 0.31537572490184773, |
| "learning_rate": 1.0445344129554658e-05, |
| "loss": 0.3713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20135825872421265, |
| "step": 130, |
| "valid_targets_mean": 4831.9, |
| "valid_targets_min": 1663 |
| }, |
| { |
| "epoch": 0.13670886075949368, |
| "grad_norm": 0.36436085249069955, |
| "learning_rate": 1.0850202429149799e-05, |
| "loss": 0.3511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21216928958892822, |
| "step": 135, |
| "valid_targets_mean": 4523.4, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 0.14177215189873418, |
| "grad_norm": 0.3366824015027373, |
| "learning_rate": 1.1255060728744939e-05, |
| "loss": 0.3567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17111346125602722, |
| "step": 140, |
| "valid_targets_mean": 3792.1, |
| "valid_targets_min": 1100 |
| }, |
| { |
| "epoch": 0.1468354430379747, |
| "grad_norm": 0.35533807007148477, |
| "learning_rate": 1.1659919028340081e-05, |
| "loss": 0.3589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1642487645149231, |
| "step": 145, |
| "valid_targets_mean": 4016.7, |
| "valid_targets_min": 1556 |
| }, |
| { |
| "epoch": 0.1518987341772152, |
| "grad_norm": 0.31790675871917146, |
| "learning_rate": 1.2064777327935225e-05, |
| "loss": 0.3429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.197759211063385, |
| "step": 150, |
| "valid_targets_mean": 5829.0, |
| "valid_targets_min": 1509 |
| }, |
| { |
| "epoch": 0.1569620253164557, |
| "grad_norm": 0.32375174058174566, |
| "learning_rate": 1.2469635627530365e-05, |
| "loss": 0.3571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1860826313495636, |
| "step": 155, |
| "valid_targets_mean": 4697.8, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 0.1620253164556962, |
| "grad_norm": 0.971603737593077, |
| "learning_rate": 1.2874493927125507e-05, |
| "loss": 0.3655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2078309953212738, |
| "step": 160, |
| "valid_targets_mean": 5384.2, |
| "valid_targets_min": 1144 |
| }, |
| { |
| "epoch": 0.1670886075949367, |
| "grad_norm": 0.47966039195161064, |
| "learning_rate": 1.327935222672065e-05, |
| "loss": 0.3588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18700364232063293, |
| "step": 165, |
| "valid_targets_mean": 4719.9, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 0.17215189873417722, |
| "grad_norm": 0.2955436571363374, |
| "learning_rate": 1.3684210526315791e-05, |
| "loss": 0.3413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16040512919425964, |
| "step": 170, |
| "valid_targets_mean": 5175.4, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 0.17721518987341772, |
| "grad_norm": 0.2909056024011537, |
| "learning_rate": 1.4089068825910932e-05, |
| "loss": 0.3611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14239881932735443, |
| "step": 175, |
| "valid_targets_mean": 4601.9, |
| "valid_targets_min": 1236 |
| }, |
| { |
| "epoch": 0.18227848101265823, |
| "grad_norm": 0.3684074269197893, |
| "learning_rate": 1.4493927125506074e-05, |
| "loss": 0.3607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17205636203289032, |
| "step": 180, |
| "valid_targets_mean": 3363.9, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 0.18734177215189873, |
| "grad_norm": 0.2978543096994537, |
| "learning_rate": 1.4898785425101216e-05, |
| "loss": 0.3606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1950611174106598, |
| "step": 185, |
| "valid_targets_mean": 5937.9, |
| "valid_targets_min": 1368 |
| }, |
| { |
| "epoch": 0.19240506329113924, |
| "grad_norm": 0.30414263404359004, |
| "learning_rate": 1.5303643724696356e-05, |
| "loss": 0.3478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18548183143138885, |
| "step": 190, |
| "valid_targets_mean": 5815.7, |
| "valid_targets_min": 1087 |
| }, |
| { |
| "epoch": 0.19746835443037974, |
| "grad_norm": 0.3751151244554016, |
| "learning_rate": 1.5708502024291498e-05, |
| "loss": 0.3638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2703745365142822, |
| "step": 195, |
| "valid_targets_mean": 5632.3, |
| "valid_targets_min": 1444 |
| }, |
| { |
| "epoch": 0.20253164556962025, |
| "grad_norm": 0.3183245241372493, |
| "learning_rate": 1.6113360323886644e-05, |
| "loss": 0.3597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15712594985961914, |
| "step": 200, |
| "valid_targets_mean": 4035.7, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 0.20759493670886076, |
| "grad_norm": 0.3632627857891178, |
| "learning_rate": 1.6518218623481782e-05, |
| "loss": 0.3525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17240820825099945, |
| "step": 205, |
| "valid_targets_mean": 4021.2, |
| "valid_targets_min": 1114 |
| }, |
| { |
| "epoch": 0.21265822784810126, |
| "grad_norm": 0.34057034041346584, |
| "learning_rate": 1.6923076923076924e-05, |
| "loss": 0.3621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22665713727474213, |
| "step": 210, |
| "valid_targets_mean": 5157.8, |
| "valid_targets_min": 1706 |
| }, |
| { |
| "epoch": 0.21772151898734177, |
| "grad_norm": 0.32892662546524415, |
| "learning_rate": 1.7327935222672066e-05, |
| "loss": 0.3516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1358383297920227, |
| "step": 215, |
| "valid_targets_mean": 3612.9, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 0.22278481012658227, |
| "grad_norm": 0.3323805458845017, |
| "learning_rate": 1.7732793522267208e-05, |
| "loss": 0.3405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14480899274349213, |
| "step": 220, |
| "valid_targets_mean": 6220.1, |
| "valid_targets_min": 1090 |
| }, |
| { |
| "epoch": 0.22784810126582278, |
| "grad_norm": 0.2969456771010524, |
| "learning_rate": 1.813765182186235e-05, |
| "loss": 0.345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16806533932685852, |
| "step": 225, |
| "valid_targets_mean": 5594.2, |
| "valid_targets_min": 1290 |
| }, |
| { |
| "epoch": 0.23291139240506328, |
| "grad_norm": 0.35442807757680916, |
| "learning_rate": 1.8542510121457492e-05, |
| "loss": 0.3466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20088203251361847, |
| "step": 230, |
| "valid_targets_mean": 4364.5, |
| "valid_targets_min": 1537 |
| }, |
| { |
| "epoch": 0.2379746835443038, |
| "grad_norm": 0.32766837251688363, |
| "learning_rate": 1.894736842105263e-05, |
| "loss": 0.3597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12136702239513397, |
| "step": 235, |
| "valid_targets_mean": 2704.7, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 0.2430379746835443, |
| "grad_norm": 0.3298038015043137, |
| "learning_rate": 1.9352226720647776e-05, |
| "loss": 0.3312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17166192829608917, |
| "step": 240, |
| "valid_targets_mean": 4605.7, |
| "valid_targets_min": 1445 |
| }, |
| { |
| "epoch": 0.2481012658227848, |
| "grad_norm": 0.2811058024334916, |
| "learning_rate": 1.9757085020242915e-05, |
| "loss": 0.3647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17767693102359772, |
| "step": 245, |
| "valid_targets_mean": 5949.4, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 0.25316455696202533, |
| "grad_norm": 0.3238895469625763, |
| "learning_rate": 2.016194331983806e-05, |
| "loss": 0.3542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1756962537765503, |
| "step": 250, |
| "valid_targets_mean": 4702.4, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 0.2582278481012658, |
| "grad_norm": 0.30654096002239845, |
| "learning_rate": 2.05668016194332e-05, |
| "loss": 0.3556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18253913521766663, |
| "step": 255, |
| "valid_targets_mean": 5601.0, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 0.26329113924050634, |
| "grad_norm": 0.33818696625352207, |
| "learning_rate": 2.097165991902834e-05, |
| "loss": 0.3604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20197951793670654, |
| "step": 260, |
| "valid_targets_mean": 4999.4, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 0.2683544303797468, |
| "grad_norm": 0.3221593835641881, |
| "learning_rate": 2.1376518218623487e-05, |
| "loss": 0.3356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1421291083097458, |
| "step": 265, |
| "valid_targets_mean": 3732.8, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 0.27341772151898736, |
| "grad_norm": 0.3467001085595146, |
| "learning_rate": 2.1781376518218625e-05, |
| "loss": 0.3541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19689059257507324, |
| "step": 270, |
| "valid_targets_mean": 4544.8, |
| "valid_targets_min": 1627 |
| }, |
| { |
| "epoch": 0.27848101265822783, |
| "grad_norm": 0.3893966405259359, |
| "learning_rate": 2.2186234817813767e-05, |
| "loss": 0.3502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17629346251487732, |
| "step": 275, |
| "valid_targets_mean": 3116.6, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 0.28354430379746837, |
| "grad_norm": 0.34248011251805455, |
| "learning_rate": 2.2591093117408906e-05, |
| "loss": 0.3517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1394365131855011, |
| "step": 280, |
| "valid_targets_mean": 3400.1, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 0.28860759493670884, |
| "grad_norm": 0.34292015860444375, |
| "learning_rate": 2.299595141700405e-05, |
| "loss": 0.3441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18773144483566284, |
| "step": 285, |
| "valid_targets_mean": 4286.1, |
| "valid_targets_min": 1425 |
| }, |
| { |
| "epoch": 0.2936708860759494, |
| "grad_norm": 0.3527832328000518, |
| "learning_rate": 2.3400809716599193e-05, |
| "loss": 0.3441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18093225359916687, |
| "step": 290, |
| "valid_targets_mean": 4568.9, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 0.29873417721518986, |
| "grad_norm": 0.3222755455970598, |
| "learning_rate": 2.3805668016194332e-05, |
| "loss": 0.3363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13850252330303192, |
| "step": 295, |
| "valid_targets_mean": 3603.9, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 0.3037974683544304, |
| "grad_norm": 0.3081645393207173, |
| "learning_rate": 2.4210526315789474e-05, |
| "loss": 0.3523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1911936104297638, |
| "step": 300, |
| "valid_targets_mean": 6009.3, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 0.30886075949367087, |
| "grad_norm": 0.29187368241351513, |
| "learning_rate": 2.461538461538462e-05, |
| "loss": 0.3484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17911839485168457, |
| "step": 305, |
| "valid_targets_mean": 7036.5, |
| "valid_targets_min": 1310 |
| }, |
| { |
| "epoch": 0.3139240506329114, |
| "grad_norm": 0.49985981352299386, |
| "learning_rate": 2.5020242914979758e-05, |
| "loss": 0.3363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16296392679214478, |
| "step": 310, |
| "valid_targets_mean": 3887.8, |
| "valid_targets_min": 1192 |
| }, |
| { |
| "epoch": 0.3189873417721519, |
| "grad_norm": 0.38261294484090613, |
| "learning_rate": 2.54251012145749e-05, |
| "loss": 0.3454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15782615542411804, |
| "step": 315, |
| "valid_targets_mean": 3376.2, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 0.3240506329113924, |
| "grad_norm": 0.45061664130339874, |
| "learning_rate": 2.5829959514170046e-05, |
| "loss": 0.3502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1975603699684143, |
| "step": 320, |
| "valid_targets_mean": 5570.6, |
| "valid_targets_min": 1866 |
| }, |
| { |
| "epoch": 0.3291139240506329, |
| "grad_norm": 0.3182602149268292, |
| "learning_rate": 2.6234817813765184e-05, |
| "loss": 0.3351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14342699944972992, |
| "step": 325, |
| "valid_targets_mean": 3784.2, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 0.3341772151898734, |
| "grad_norm": 0.3254644437199896, |
| "learning_rate": 2.6639676113360326e-05, |
| "loss": 0.3501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16729095578193665, |
| "step": 330, |
| "valid_targets_mean": 3966.9, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 0.3392405063291139, |
| "grad_norm": 0.32206841245268697, |
| "learning_rate": 2.704453441295547e-05, |
| "loss": 0.3476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1826034039258957, |
| "step": 335, |
| "valid_targets_mean": 4157.9, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 0.34430379746835443, |
| "grad_norm": 0.3602273548100487, |
| "learning_rate": 2.744939271255061e-05, |
| "loss": 0.3625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2222571074962616, |
| "step": 340, |
| "valid_targets_mean": 4895.1, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 0.3493670886075949, |
| "grad_norm": 0.3392767743330912, |
| "learning_rate": 2.7854251012145752e-05, |
| "loss": 0.3455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13851270079612732, |
| "step": 345, |
| "valid_targets_mean": 3250.4, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 0.35443037974683544, |
| "grad_norm": 0.32803869222957094, |
| "learning_rate": 2.825910931174089e-05, |
| "loss": 0.362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18585026264190674, |
| "step": 350, |
| "valid_targets_mean": 4607.0, |
| "valid_targets_min": 1164 |
| }, |
| { |
| "epoch": 0.3594936708860759, |
| "grad_norm": 0.2960837838285842, |
| "learning_rate": 2.8663967611336033e-05, |
| "loss": 0.3539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23394142091274261, |
| "step": 355, |
| "valid_targets_mean": 8210.9, |
| "valid_targets_min": 1637 |
| }, |
| { |
| "epoch": 0.36455696202531646, |
| "grad_norm": 0.3694811833098562, |
| "learning_rate": 2.906882591093118e-05, |
| "loss": 0.3468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16552570462226868, |
| "step": 360, |
| "valid_targets_mean": 2960.9, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 0.369620253164557, |
| "grad_norm": 0.31999701209701786, |
| "learning_rate": 2.9473684210526317e-05, |
| "loss": 0.3466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16295602917671204, |
| "step": 365, |
| "valid_targets_mean": 3841.0, |
| "valid_targets_min": 1068 |
| }, |
| { |
| "epoch": 0.37468354430379747, |
| "grad_norm": 0.29571436256727346, |
| "learning_rate": 2.987854251012146e-05, |
| "loss": 0.3567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19385173916816711, |
| "step": 370, |
| "valid_targets_mean": 5434.1, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 0.379746835443038, |
| "grad_norm": 0.2794237498150064, |
| "learning_rate": 3.0283400809716605e-05, |
| "loss": 0.3384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17324280738830566, |
| "step": 375, |
| "valid_targets_mean": 6533.0, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 0.3848101265822785, |
| "grad_norm": 0.46097531086569304, |
| "learning_rate": 3.068825910931174e-05, |
| "loss": 0.3441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1612202525138855, |
| "step": 380, |
| "valid_targets_mean": 4019.0, |
| "valid_targets_min": 1578 |
| }, |
| { |
| "epoch": 0.389873417721519, |
| "grad_norm": 0.33386509179906093, |
| "learning_rate": 3.1093117408906885e-05, |
| "loss": 0.3495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14520494639873505, |
| "step": 385, |
| "valid_targets_mean": 3415.9, |
| "valid_targets_min": 1118 |
| }, |
| { |
| "epoch": 0.3949367088607595, |
| "grad_norm": 0.3319526543378725, |
| "learning_rate": 3.149797570850203e-05, |
| "loss": 0.3487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1795864999294281, |
| "step": 390, |
| "valid_targets_mean": 4239.8, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 0.4, |
| "grad_norm": 0.3406949335779596, |
| "learning_rate": 3.190283400809717e-05, |
| "loss": 0.3384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16871468722820282, |
| "step": 395, |
| "valid_targets_mean": 3474.5, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 0.4050632911392405, |
| "grad_norm": 0.36838681719013816, |
| "learning_rate": 3.230769230769231e-05, |
| "loss": 0.3522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1932060271501541, |
| "step": 400, |
| "valid_targets_mean": 3488.6, |
| "valid_targets_min": 1164 |
| }, |
| { |
| "epoch": 0.41012658227848103, |
| "grad_norm": 0.35042164458126773, |
| "learning_rate": 3.271255060728745e-05, |
| "loss": 0.3588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17853647470474243, |
| "step": 405, |
| "valid_targets_mean": 3956.2, |
| "valid_targets_min": 1293 |
| }, |
| { |
| "epoch": 0.4151898734177215, |
| "grad_norm": 0.3489327841744588, |
| "learning_rate": 3.311740890688259e-05, |
| "loss": 0.3585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16795890033245087, |
| "step": 410, |
| "valid_targets_mean": 3783.9, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 0.42025316455696204, |
| "grad_norm": 0.3454446525690692, |
| "learning_rate": 3.352226720647774e-05, |
| "loss": 0.3516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2117060422897339, |
| "step": 415, |
| "valid_targets_mean": 4945.9, |
| "valid_targets_min": 1096 |
| }, |
| { |
| "epoch": 0.4253164556962025, |
| "grad_norm": 0.3098825126338765, |
| "learning_rate": 3.3927125506072876e-05, |
| "loss": 0.3574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20046228170394897, |
| "step": 420, |
| "valid_targets_mean": 6020.4, |
| "valid_targets_min": 1220 |
| }, |
| { |
| "epoch": 0.43037974683544306, |
| "grad_norm": 0.37532962252838115, |
| "learning_rate": 3.433198380566802e-05, |
| "loss": 0.3467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1575276255607605, |
| "step": 425, |
| "valid_targets_mean": 3148.8, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 0.43544303797468353, |
| "grad_norm": 0.41731233709453813, |
| "learning_rate": 3.473684210526316e-05, |
| "loss": 0.3536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18151873350143433, |
| "step": 430, |
| "valid_targets_mean": 4121.1, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 0.44050632911392407, |
| "grad_norm": 0.2834549547224196, |
| "learning_rate": 3.51417004048583e-05, |
| "loss": 0.3347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21482950448989868, |
| "step": 435, |
| "valid_targets_mean": 7190.4, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 0.44556962025316454, |
| "grad_norm": 0.30073688146062255, |
| "learning_rate": 3.5546558704453444e-05, |
| "loss": 0.3511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1362500786781311, |
| "step": 440, |
| "valid_targets_mean": 4360.6, |
| "valid_targets_min": 1118 |
| }, |
| { |
| "epoch": 0.4506329113924051, |
| "grad_norm": 0.3750594432228394, |
| "learning_rate": 3.595141700404859e-05, |
| "loss": 0.3531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20675930380821228, |
| "step": 445, |
| "valid_targets_mean": 4531.2, |
| "valid_targets_min": 1680 |
| }, |
| { |
| "epoch": 0.45569620253164556, |
| "grad_norm": 0.3568782095433956, |
| "learning_rate": 3.635627530364373e-05, |
| "loss": 0.3454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17187099158763885, |
| "step": 450, |
| "valid_targets_mean": 4279.3, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 0.4607594936708861, |
| "grad_norm": 0.31010973542926373, |
| "learning_rate": 3.676113360323887e-05, |
| "loss": 0.349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1888793706893921, |
| "step": 455, |
| "valid_targets_mean": 5464.9, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 0.46582278481012657, |
| "grad_norm": 0.30672819186326156, |
| "learning_rate": 3.716599190283401e-05, |
| "loss": 0.3369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19805072247982025, |
| "step": 460, |
| "valid_targets_mean": 5570.1, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 0.4708860759493671, |
| "grad_norm": 0.33237701694635524, |
| "learning_rate": 3.757085020242915e-05, |
| "loss": 0.3443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17327673733234406, |
| "step": 465, |
| "valid_targets_mean": 4441.7, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 0.4759493670886076, |
| "grad_norm": 0.3157269440092307, |
| "learning_rate": 3.7975708502024296e-05, |
| "loss": 0.3523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2036791741847992, |
| "step": 470, |
| "valid_targets_mean": 5480.2, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 0.4810126582278481, |
| "grad_norm": 0.3385448591385259, |
| "learning_rate": 3.8380566801619435e-05, |
| "loss": 0.3254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18548253178596497, |
| "step": 475, |
| "valid_targets_mean": 5158.2, |
| "valid_targets_min": 1322 |
| }, |
| { |
| "epoch": 0.4860759493670886, |
| "grad_norm": 0.3229813339259753, |
| "learning_rate": 3.878542510121458e-05, |
| "loss": 0.3539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19486048817634583, |
| "step": 480, |
| "valid_targets_mean": 5207.5, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 0.4911392405063291, |
| "grad_norm": 0.39888632177896866, |
| "learning_rate": 3.919028340080972e-05, |
| "loss": 0.3367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15041330456733704, |
| "step": 485, |
| "valid_targets_mean": 2910.4, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 0.4962025316455696, |
| "grad_norm": 0.3216838457166851, |
| "learning_rate": 3.959514170040486e-05, |
| "loss": 0.3535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18031927943229675, |
| "step": 490, |
| "valid_targets_mean": 5146.9, |
| "valid_targets_min": 1318 |
| }, |
| { |
| "epoch": 0.5012658227848101, |
| "grad_norm": 0.3463812343689675, |
| "learning_rate": 4e-05, |
| "loss": 0.3538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13655783236026764, |
| "step": 495, |
| "valid_targets_mean": 3592.6, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 0.5063291139240507, |
| "grad_norm": 0.36468197040198047, |
| "learning_rate": 3.999987517534179e-05, |
| "loss": 0.3298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17994073033332825, |
| "step": 500, |
| "valid_targets_mean": 3419.4, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 0.5113924050632911, |
| "grad_norm": 0.3123011360513197, |
| "learning_rate": 3.999950070292526e-05, |
| "loss": 0.3514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13850685954093933, |
| "step": 505, |
| "valid_targets_mean": 4406.6, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 0.5164556962025316, |
| "grad_norm": 0.3110207165348701, |
| "learning_rate": 3.9998876587424764e-05, |
| "loss": 0.3437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13691280782222748, |
| "step": 510, |
| "valid_targets_mean": 4396.4, |
| "valid_targets_min": 1417 |
| }, |
| { |
| "epoch": 0.5215189873417722, |
| "grad_norm": 0.32363025722531935, |
| "learning_rate": 3.99980028366308e-05, |
| "loss": 0.3569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24637667834758759, |
| "step": 515, |
| "valid_targets_mean": 5892.6, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 0.5265822784810127, |
| "grad_norm": 0.3650846632854969, |
| "learning_rate": 3.999687946144992e-05, |
| "loss": 0.3581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18719391524791718, |
| "step": 520, |
| "valid_targets_mean": 4166.3, |
| "valid_targets_min": 1384 |
| }, |
| { |
| "epoch": 0.5316455696202531, |
| "grad_norm": 0.380513757297641, |
| "learning_rate": 3.999550647590464e-05, |
| "loss": 0.3508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21175450086593628, |
| "step": 525, |
| "valid_targets_mean": 3908.1, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 0.5367088607594936, |
| "grad_norm": 0.3303089638050748, |
| "learning_rate": 3.9993883897133174e-05, |
| "loss": 0.3344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1324310302734375, |
| "step": 530, |
| "valid_targets_mean": 3035.0, |
| "valid_targets_min": 1176 |
| }, |
| { |
| "epoch": 0.5417721518987342, |
| "grad_norm": 0.3065345335498946, |
| "learning_rate": 3.9992011745389335e-05, |
| "loss": 0.3564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18349391222000122, |
| "step": 535, |
| "valid_targets_mean": 5569.8, |
| "valid_targets_min": 1419 |
| }, |
| { |
| "epoch": 0.5468354430379747, |
| "grad_norm": 0.3593697878507127, |
| "learning_rate": 3.998989004404217e-05, |
| "loss": 0.3477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1619454324245453, |
| "step": 540, |
| "valid_targets_mean": 3932.5, |
| "valid_targets_min": 1196 |
| }, |
| { |
| "epoch": 0.5518987341772152, |
| "grad_norm": 0.25234558053757633, |
| "learning_rate": 3.998751881957576e-05, |
| "loss": 0.3363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16338235139846802, |
| "step": 545, |
| "valid_targets_mean": 5379.0, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 0.5569620253164557, |
| "grad_norm": 0.3445664068863559, |
| "learning_rate": 3.998489810158883e-05, |
| "loss": 0.3475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1785704791545868, |
| "step": 550, |
| "valid_targets_mean": 3962.2, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 0.5620253164556962, |
| "grad_norm": 0.3556936347323425, |
| "learning_rate": 3.99820279227944e-05, |
| "loss": 0.3345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18062683939933777, |
| "step": 555, |
| "valid_targets_mean": 4593.2, |
| "valid_targets_min": 1615 |
| }, |
| { |
| "epoch": 0.5670886075949367, |
| "grad_norm": 0.3792686598578621, |
| "learning_rate": 3.997890831901938e-05, |
| "loss": 0.3413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19577497243881226, |
| "step": 560, |
| "valid_targets_mean": 4658.2, |
| "valid_targets_min": 1474 |
| }, |
| { |
| "epoch": 0.5721518987341773, |
| "grad_norm": 0.32913492636939423, |
| "learning_rate": 3.9975539329204116e-05, |
| "loss": 0.3387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17351575195789337, |
| "step": 565, |
| "valid_targets_mean": 4210.6, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 0.5772151898734177, |
| "grad_norm": 0.296950123523885, |
| "learning_rate": 3.9971920995401905e-05, |
| "loss": 0.3443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20880410075187683, |
| "step": 570, |
| "valid_targets_mean": 6590.1, |
| "valid_targets_min": 1899 |
| }, |
| { |
| "epoch": 0.5822784810126582, |
| "grad_norm": 0.34173998557875557, |
| "learning_rate": 3.996805336277848e-05, |
| "loss": 0.3508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1291336864233017, |
| "step": 575, |
| "valid_targets_mean": 4007.8, |
| "valid_targets_min": 1380 |
| }, |
| { |
| "epoch": 0.5873417721518988, |
| "grad_norm": 0.30049566187413324, |
| "learning_rate": 3.996393647961143e-05, |
| "loss": 0.34, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13710632920265198, |
| "step": 580, |
| "valid_targets_mean": 4320.4, |
| "valid_targets_min": 1110 |
| }, |
| { |
| "epoch": 0.5924050632911393, |
| "grad_norm": 0.3451273067980245, |
| "learning_rate": 3.995957039728962e-05, |
| "loss": 0.3456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18673017621040344, |
| "step": 585, |
| "valid_targets_mean": 4318.7, |
| "valid_targets_min": 1318 |
| }, |
| { |
| "epoch": 0.5974683544303797, |
| "grad_norm": 0.3248655593711836, |
| "learning_rate": 3.9954955170312504e-05, |
| "loss": 0.335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15301413834095, |
| "step": 590, |
| "valid_targets_mean": 4103.9, |
| "valid_targets_min": 1260 |
| }, |
| { |
| "epoch": 0.6025316455696202, |
| "grad_norm": 0.3874469407061254, |
| "learning_rate": 3.995009085628951e-05, |
| "loss": 0.3417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17825846374034882, |
| "step": 595, |
| "valid_targets_mean": 3280.8, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 0.6075949367088608, |
| "grad_norm": 0.32514023580791557, |
| "learning_rate": 3.994497751593927e-05, |
| "loss": 0.3417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17784975469112396, |
| "step": 600, |
| "valid_targets_mean": 4897.2, |
| "valid_targets_min": 1343 |
| }, |
| { |
| "epoch": 0.6126582278481013, |
| "grad_norm": 0.32015309031323297, |
| "learning_rate": 3.9939615213088865e-05, |
| "loss": 0.3461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1702687293291092, |
| "step": 605, |
| "valid_targets_mean": 5160.1, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 0.6177215189873417, |
| "grad_norm": 0.29531423820767827, |
| "learning_rate": 3.993400401467308e-05, |
| "loss": 0.362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1590127795934677, |
| "step": 610, |
| "valid_targets_mean": 5178.2, |
| "valid_targets_min": 1187 |
| }, |
| { |
| "epoch": 0.6227848101265823, |
| "grad_norm": 0.30956228742996816, |
| "learning_rate": 3.992814399073349e-05, |
| "loss": 0.3358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1777225136756897, |
| "step": 615, |
| "valid_targets_mean": 5224.1, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 0.6278481012658228, |
| "grad_norm": 0.2946569197224124, |
| "learning_rate": 3.992203521441765e-05, |
| "loss": 0.3566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16454584896564484, |
| "step": 620, |
| "valid_targets_mean": 5873.6, |
| "valid_targets_min": 1522 |
| }, |
| { |
| "epoch": 0.6329113924050633, |
| "grad_norm": 0.3566548256792116, |
| "learning_rate": 3.991567776197815e-05, |
| "loss": 0.3423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1757839322090149, |
| "step": 625, |
| "valid_targets_mean": 5280.0, |
| "valid_targets_min": 1179 |
| }, |
| { |
| "epoch": 0.6379746835443038, |
| "grad_norm": 0.34702302453822725, |
| "learning_rate": 3.990907171277168e-05, |
| "loss": 0.3406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16491375863552094, |
| "step": 630, |
| "valid_targets_mean": 3738.1, |
| "valid_targets_min": 1437 |
| }, |
| { |
| "epoch": 0.6430379746835443, |
| "grad_norm": 0.3122025130697409, |
| "learning_rate": 3.990221714925802e-05, |
| "loss": 0.3425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19272474944591522, |
| "step": 635, |
| "valid_targets_mean": 5090.6, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 0.6481012658227848, |
| "grad_norm": 0.3289259973223097, |
| "learning_rate": 3.989511415699901e-05, |
| "loss": 0.3492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21416299045085907, |
| "step": 640, |
| "valid_targets_mean": 5687.4, |
| "valid_targets_min": 1558 |
| }, |
| { |
| "epoch": 0.6531645569620254, |
| "grad_norm": 0.31628182785649794, |
| "learning_rate": 3.988776282465752e-05, |
| "loss": 0.3472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16229850053787231, |
| "step": 645, |
| "valid_targets_mean": 5641.7, |
| "valid_targets_min": 1228 |
| }, |
| { |
| "epoch": 0.6582278481012658, |
| "grad_norm": 0.32370069272186214, |
| "learning_rate": 3.9880163243996314e-05, |
| "loss": 0.3439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1790936440229416, |
| "step": 650, |
| "valid_targets_mean": 4757.5, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 0.6632911392405063, |
| "grad_norm": 0.331462646919884, |
| "learning_rate": 3.9872315509876885e-05, |
| "loss": 0.3465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2034873068332672, |
| "step": 655, |
| "valid_targets_mean": 6825.2, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 0.6683544303797468, |
| "grad_norm": 0.2773031962593845, |
| "learning_rate": 3.986421972025831e-05, |
| "loss": 0.3362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13872382044792175, |
| "step": 660, |
| "valid_targets_mean": 5178.6, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 0.6734177215189874, |
| "grad_norm": 0.3282605048208077, |
| "learning_rate": 3.9855875976196e-05, |
| "loss": 0.3336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1442852020263672, |
| "step": 665, |
| "valid_targets_mean": 3767.0, |
| "valid_targets_min": 1309 |
| }, |
| { |
| "epoch": 0.6784810126582278, |
| "grad_norm": 0.5817158484637879, |
| "learning_rate": 3.984728438184047e-05, |
| "loss": 0.348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1867026388645172, |
| "step": 670, |
| "valid_targets_mean": 4197.3, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 0.6835443037974683, |
| "grad_norm": 0.3539656970185502, |
| "learning_rate": 3.9838445044435997e-05, |
| "loss": 0.3543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16187211871147156, |
| "step": 675, |
| "valid_targets_mean": 4067.3, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 0.6886075949367089, |
| "grad_norm": 0.33229865798563013, |
| "learning_rate": 3.9829358074319295e-05, |
| "loss": 0.343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17157503962516785, |
| "step": 680, |
| "valid_targets_mean": 4686.7, |
| "valid_targets_min": 1496 |
| }, |
| { |
| "epoch": 0.6936708860759494, |
| "grad_norm": 0.2791093667927135, |
| "learning_rate": 3.982002358491817e-05, |
| "loss": 0.3385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1936018466949463, |
| "step": 685, |
| "valid_targets_mean": 6395.1, |
| "valid_targets_min": 1038 |
| }, |
| { |
| "epoch": 0.6987341772151898, |
| "grad_norm": 0.3350209099910488, |
| "learning_rate": 3.981044169275006e-05, |
| "loss": 0.3363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1778436303138733, |
| "step": 690, |
| "valid_targets_mean": 4567.5, |
| "valid_targets_min": 1080 |
| }, |
| { |
| "epoch": 0.7037974683544304, |
| "grad_norm": 0.3531099254353881, |
| "learning_rate": 3.9800612517420626e-05, |
| "loss": 0.3469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16938315331935883, |
| "step": 695, |
| "valid_targets_mean": 3896.1, |
| "valid_targets_min": 1641 |
| }, |
| { |
| "epoch": 0.7088607594936709, |
| "grad_norm": 0.318049795345604, |
| "learning_rate": 3.979053618162219e-05, |
| "loss": 0.3564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1946740746498108, |
| "step": 700, |
| "valid_targets_mean": 5408.9, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 0.7139240506329114, |
| "grad_norm": 0.3320763821369659, |
| "learning_rate": 3.978021281113228e-05, |
| "loss": 0.3393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17016340792179108, |
| "step": 705, |
| "valid_targets_mean": 4967.0, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 0.7189873417721518, |
| "grad_norm": 0.2847828838514781, |
| "learning_rate": 3.9769642534812e-05, |
| "loss": 0.3414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1707335114479065, |
| "step": 710, |
| "valid_targets_mean": 6450.3, |
| "valid_targets_min": 1014 |
| }, |
| { |
| "epoch": 0.7240506329113924, |
| "grad_norm": 0.3321384385821899, |
| "learning_rate": 3.9758825484604494e-05, |
| "loss": 0.3447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1961357295513153, |
| "step": 715, |
| "valid_targets_mean": 4652.9, |
| "valid_targets_min": 1387 |
| }, |
| { |
| "epoch": 0.7291139240506329, |
| "grad_norm": 0.3032184720855355, |
| "learning_rate": 3.9747761795533194e-05, |
| "loss": 0.3451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1426798403263092, |
| "step": 720, |
| "valid_targets_mean": 6012.8, |
| "valid_targets_min": 1966 |
| }, |
| { |
| "epoch": 0.7341772151898734, |
| "grad_norm": 0.3448777606898466, |
| "learning_rate": 3.973645160570023e-05, |
| "loss": 0.3546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1586744487285614, |
| "step": 725, |
| "valid_targets_mean": 4090.4, |
| "valid_targets_min": 1678 |
| }, |
| { |
| "epoch": 0.739240506329114, |
| "grad_norm": 0.3156506831386379, |
| "learning_rate": 3.9724895056284665e-05, |
| "loss": 0.3376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1619202196598053, |
| "step": 730, |
| "valid_targets_mean": 4218.2, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 0.7443037974683544, |
| "grad_norm": 0.35504669537877936, |
| "learning_rate": 3.971309229154072e-05, |
| "loss": 0.3336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21181583404541016, |
| "step": 735, |
| "valid_targets_mean": 4926.1, |
| "valid_targets_min": 1207 |
| }, |
| { |
| "epoch": 0.7493670886075949, |
| "grad_norm": 0.3201734939222349, |
| "learning_rate": 3.9701043458796015e-05, |
| "loss": 0.3356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22177475690841675, |
| "step": 740, |
| "valid_targets_mean": 6330.8, |
| "valid_targets_min": 1448 |
| }, |
| { |
| "epoch": 0.7544303797468355, |
| "grad_norm": 0.3323013925433624, |
| "learning_rate": 3.9688748708449686e-05, |
| "loss": 0.3383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15360356867313385, |
| "step": 745, |
| "valid_targets_mean": 4397.9, |
| "valid_targets_min": 1528 |
| }, |
| { |
| "epoch": 0.759493670886076, |
| "grad_norm": 0.2700426394697059, |
| "learning_rate": 3.967620819397053e-05, |
| "loss": 0.3308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15975482761859894, |
| "step": 750, |
| "valid_targets_mean": 5138.0, |
| "valid_targets_min": 1494 |
| }, |
| { |
| "epoch": 0.7645569620253164, |
| "grad_norm": 0.32491869195537754, |
| "learning_rate": 3.9663422071895103e-05, |
| "loss": 0.3534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1329491138458252, |
| "step": 755, |
| "valid_targets_mean": 3496.6, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 0.769620253164557, |
| "grad_norm": 0.30201583766650153, |
| "learning_rate": 3.965039050182573e-05, |
| "loss": 0.3444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17797686159610748, |
| "step": 760, |
| "valid_targets_mean": 5996.1, |
| "valid_targets_min": 1405 |
| }, |
| { |
| "epoch": 0.7746835443037975, |
| "grad_norm": 0.28815946203036474, |
| "learning_rate": 3.963711364642854e-05, |
| "loss": 0.3397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19754289090633392, |
| "step": 765, |
| "valid_targets_mean": 6895.8, |
| "valid_targets_min": 1767 |
| }, |
| { |
| "epoch": 0.779746835443038, |
| "grad_norm": 0.3154202174762482, |
| "learning_rate": 3.9623591671431416e-05, |
| "loss": 0.355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18379993736743927, |
| "step": 770, |
| "valid_targets_mean": 5009.2, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 0.7848101265822784, |
| "grad_norm": 0.3575700176888927, |
| "learning_rate": 3.960982474562196e-05, |
| "loss": 0.3389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17523907124996185, |
| "step": 775, |
| "valid_targets_mean": 4694.8, |
| "valid_targets_min": 1661 |
| }, |
| { |
| "epoch": 0.789873417721519, |
| "grad_norm": 0.3310517991000096, |
| "learning_rate": 3.959581304084536e-05, |
| "loss": 0.345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1610376238822937, |
| "step": 780, |
| "valid_targets_mean": 4332.1, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 0.7949367088607595, |
| "grad_norm": 0.31363025202931233, |
| "learning_rate": 3.958155673200223e-05, |
| "loss": 0.3547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2106252908706665, |
| "step": 785, |
| "valid_targets_mean": 5876.1, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 0.8, |
| "grad_norm": 0.2999707270623021, |
| "learning_rate": 3.956705599704645e-05, |
| "loss": 0.3307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19507791101932526, |
| "step": 790, |
| "valid_targets_mean": 5528.2, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 0.8050632911392405, |
| "grad_norm": 0.34798398865892316, |
| "learning_rate": 3.9552311016982964e-05, |
| "loss": 0.3301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1592869609594345, |
| "step": 795, |
| "valid_targets_mean": 3994.4, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 0.810126582278481, |
| "grad_norm": 0.3486093165843197, |
| "learning_rate": 3.953732197586549e-05, |
| "loss": 0.3299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14387521147727966, |
| "step": 800, |
| "valid_targets_mean": 3136.8, |
| "valid_targets_min": 969 |
| }, |
| { |
| "epoch": 0.8151898734177215, |
| "grad_norm": 0.34294729405636676, |
| "learning_rate": 3.952208906079419e-05, |
| "loss": 0.339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14744120836257935, |
| "step": 805, |
| "valid_targets_mean": 3541.7, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 0.8202531645569621, |
| "grad_norm": 0.29811481034198406, |
| "learning_rate": 3.950661246191344e-05, |
| "loss": 0.3327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20451560616493225, |
| "step": 810, |
| "valid_targets_mean": 5959.1, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 0.8253164556962025, |
| "grad_norm": 0.29859308801266926, |
| "learning_rate": 3.949089237240933e-05, |
| "loss": 0.3261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17102043330669403, |
| "step": 815, |
| "valid_targets_mean": 5425.9, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 0.830379746835443, |
| "grad_norm": 0.33822208957438105, |
| "learning_rate": 3.947492898850736e-05, |
| "loss": 0.3379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12047713249921799, |
| "step": 820, |
| "valid_targets_mean": 2989.9, |
| "valid_targets_min": 1525 |
| }, |
| { |
| "epoch": 0.8354430379746836, |
| "grad_norm": 0.30589016543655284, |
| "learning_rate": 3.94587225094699e-05, |
| "loss": 0.3466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16248869895935059, |
| "step": 825, |
| "valid_targets_mean": 4684.8, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 0.8405063291139241, |
| "grad_norm": 0.2936931469479608, |
| "learning_rate": 3.94422731375938e-05, |
| "loss": 0.3185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12211855500936508, |
| "step": 830, |
| "valid_targets_mean": 3796.8, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 0.8455696202531645, |
| "grad_norm": 0.37559686297102585, |
| "learning_rate": 3.9425581078207764e-05, |
| "loss": 0.3532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12265650928020477, |
| "step": 835, |
| "valid_targets_mean": 2870.8, |
| "valid_targets_min": 1300 |
| }, |
| { |
| "epoch": 0.850632911392405, |
| "grad_norm": 0.35124796916797185, |
| "learning_rate": 3.940864653966985e-05, |
| "loss": 0.3336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1492408812046051, |
| "step": 840, |
| "valid_targets_mean": 3748.4, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 0.8556962025316456, |
| "grad_norm": 0.3196010195709303, |
| "learning_rate": 3.939146973336487e-05, |
| "loss": 0.3411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21070614457130432, |
| "step": 845, |
| "valid_targets_mean": 5815.2, |
| "valid_targets_min": 1741 |
| }, |
| { |
| "epoch": 0.8607594936708861, |
| "grad_norm": 0.278654689286952, |
| "learning_rate": 3.937405087370171e-05, |
| "loss": 0.3373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16281408071517944, |
| "step": 850, |
| "valid_targets_mean": 6301.6, |
| "valid_targets_min": 1867 |
| }, |
| { |
| "epoch": 0.8658227848101265, |
| "grad_norm": 0.32174716361043904, |
| "learning_rate": 3.9356390178110694e-05, |
| "loss": 0.346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11544165015220642, |
| "step": 855, |
| "valid_targets_mean": 3471.2, |
| "valid_targets_min": 1247 |
| }, |
| { |
| "epoch": 0.8708860759493671, |
| "grad_norm": 0.31597886690897176, |
| "learning_rate": 3.9338487867040855e-05, |
| "loss": 0.3514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1751353144645691, |
| "step": 860, |
| "valid_targets_mean": 4752.5, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 0.8759493670886076, |
| "grad_norm": 0.3376382881344058, |
| "learning_rate": 3.9320344163957177e-05, |
| "loss": 0.3505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1628148853778839, |
| "step": 865, |
| "valid_targets_mean": 4121.5, |
| "valid_targets_min": 1412 |
| }, |
| { |
| "epoch": 0.8810126582278481, |
| "grad_norm": 0.3174487269237297, |
| "learning_rate": 3.9301959295337816e-05, |
| "loss": 0.3381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19904953241348267, |
| "step": 870, |
| "valid_targets_mean": 6095.4, |
| "valid_targets_min": 1694 |
| }, |
| { |
| "epoch": 0.8860759493670886, |
| "grad_norm": 0.29589750599326486, |
| "learning_rate": 3.928333349067125e-05, |
| "loss": 0.3319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22740904986858368, |
| "step": 875, |
| "valid_targets_mean": 6433.5, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 0.8911392405063291, |
| "grad_norm": 0.28879537949688816, |
| "learning_rate": 3.926446698245347e-05, |
| "loss": 0.3262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1922253668308258, |
| "step": 880, |
| "valid_targets_mean": 5540.3, |
| "valid_targets_min": 1526 |
| }, |
| { |
| "epoch": 0.8962025316455696, |
| "grad_norm": 0.3183527697451739, |
| "learning_rate": 3.924536000618501e-05, |
| "loss": 0.3435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1510843187570572, |
| "step": 885, |
| "valid_targets_mean": 4520.7, |
| "valid_targets_min": 1446 |
| }, |
| { |
| "epoch": 0.9012658227848102, |
| "grad_norm": 0.3190560534322978, |
| "learning_rate": 3.922601280036805e-05, |
| "loss": 0.328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19017574191093445, |
| "step": 890, |
| "valid_targets_mean": 4967.6, |
| "valid_targets_min": 1199 |
| }, |
| { |
| "epoch": 0.9063291139240506, |
| "grad_norm": 0.4456031002758009, |
| "learning_rate": 3.920642560650343e-05, |
| "loss": 0.3351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22871103882789612, |
| "step": 895, |
| "valid_targets_mean": 5971.6, |
| "valid_targets_min": 1331 |
| }, |
| { |
| "epoch": 0.9113924050632911, |
| "grad_norm": 0.30090137054069316, |
| "learning_rate": 3.918659866908762e-05, |
| "loss": 0.3296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15791599452495575, |
| "step": 900, |
| "valid_targets_mean": 5456.4, |
| "valid_targets_min": 1469 |
| }, |
| { |
| "epoch": 0.9164556962025316, |
| "grad_norm": 0.33133512730966574, |
| "learning_rate": 3.9166532235609695e-05, |
| "loss": 0.3397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21240505576133728, |
| "step": 905, |
| "valid_targets_mean": 5933.7, |
| "valid_targets_min": 1591 |
| }, |
| { |
| "epoch": 0.9215189873417722, |
| "grad_norm": 0.3573450052442163, |
| "learning_rate": 3.914622655654822e-05, |
| "loss": 0.3434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13716688752174377, |
| "step": 910, |
| "valid_targets_mean": 5188.8, |
| "valid_targets_min": 1591 |
| }, |
| { |
| "epoch": 0.9265822784810127, |
| "grad_norm": 0.3538932529953643, |
| "learning_rate": 3.912568188536814e-05, |
| "loss": 0.3537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16137436032295227, |
| "step": 915, |
| "valid_targets_mean": 3634.4, |
| "valid_targets_min": 1339 |
| }, |
| { |
| "epoch": 0.9316455696202531, |
| "grad_norm": 0.3208113773796828, |
| "learning_rate": 3.910489847851761e-05, |
| "loss": 0.3444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17828276753425598, |
| "step": 920, |
| "valid_targets_mean": 4550.2, |
| "valid_targets_min": 1178 |
| }, |
| { |
| "epoch": 0.9367088607594937, |
| "grad_norm": 0.3094131187909477, |
| "learning_rate": 3.908387659542481e-05, |
| "loss": 0.3457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14312776923179626, |
| "step": 925, |
| "valid_targets_mean": 4335.3, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 0.9417721518987342, |
| "grad_norm": 0.33010185993106733, |
| "learning_rate": 3.9062616498494656e-05, |
| "loss": 0.3354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17049264907836914, |
| "step": 930, |
| "valid_targets_mean": 3559.0, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 0.9468354430379747, |
| "grad_norm": 0.3152672156222691, |
| "learning_rate": 3.904111845310559e-05, |
| "loss": 0.3347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16469566524028778, |
| "step": 935, |
| "valid_targets_mean": 4357.5, |
| "valid_targets_min": 1218 |
| }, |
| { |
| "epoch": 0.9518987341772152, |
| "grad_norm": 0.3201518158080734, |
| "learning_rate": 3.901938272760623e-05, |
| "loss": 0.3452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1640382707118988, |
| "step": 940, |
| "valid_targets_mean": 4409.8, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 0.9569620253164557, |
| "grad_norm": 0.3422558014341276, |
| "learning_rate": 3.899740959331204e-05, |
| "loss": 0.3411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14299672842025757, |
| "step": 945, |
| "valid_targets_mean": 3149.9, |
| "valid_targets_min": 866 |
| }, |
| { |
| "epoch": 0.9620253164556962, |
| "grad_norm": 0.3039490414348751, |
| "learning_rate": 3.897519932450189e-05, |
| "loss": 0.3421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14147335290908813, |
| "step": 950, |
| "valid_targets_mean": 4333.5, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 0.9670886075949368, |
| "grad_norm": 0.3264243877990281, |
| "learning_rate": 3.8952752198414716e-05, |
| "loss": 0.3515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17327773571014404, |
| "step": 955, |
| "valid_targets_mean": 4177.0, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 0.9721518987341772, |
| "grad_norm": 0.3108694369949979, |
| "learning_rate": 3.893006849524601e-05, |
| "loss": 0.3335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16756384074687958, |
| "step": 960, |
| "valid_targets_mean": 4619.9, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 0.9772151898734177, |
| "grad_norm": 0.3448421182167878, |
| "learning_rate": 3.890714849814431e-05, |
| "loss": 0.343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15267406404018402, |
| "step": 965, |
| "valid_targets_mean": 4085.4, |
| "valid_targets_min": 1188 |
| }, |
| { |
| "epoch": 0.9822784810126582, |
| "grad_norm": 0.30352124369356204, |
| "learning_rate": 3.8883992493207696e-05, |
| "loss": 0.3489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2034776359796524, |
| "step": 970, |
| "valid_targets_mean": 5403.8, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 0.9873417721518988, |
| "grad_norm": 0.2876598919430634, |
| "learning_rate": 3.8860600769480215e-05, |
| "loss": 0.3446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17782637476921082, |
| "step": 975, |
| "valid_targets_mean": 5421.9, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 0.9924050632911392, |
| "grad_norm": 0.33380559486032607, |
| "learning_rate": 3.883697361894825e-05, |
| "loss": 0.3439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2117309868335724, |
| "step": 980, |
| "valid_targets_mean": 4499.0, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 0.9974683544303797, |
| "grad_norm": 0.3618917728963476, |
| "learning_rate": 3.881311133653691e-05, |
| "loss": 0.3412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16749724745750427, |
| "step": 985, |
| "valid_targets_mean": 3879.4, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 1.0020253164556963, |
| "grad_norm": 0.3195092960965727, |
| "learning_rate": 3.878901422010632e-05, |
| "loss": 0.3347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21217718720436096, |
| "step": 990, |
| "valid_targets_mean": 6226.9, |
| "valid_targets_min": 1827 |
| }, |
| { |
| "epoch": 1.0070886075949368, |
| "grad_norm": 0.32404855006530575, |
| "learning_rate": 3.87646825704479e-05, |
| "loss": 0.3259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1381339430809021, |
| "step": 995, |
| "valid_targets_mean": 3916.4, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 1.0121518987341773, |
| "grad_norm": 0.3141166003779331, |
| "learning_rate": 3.874011669128065e-05, |
| "loss": 0.3446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1709311306476593, |
| "step": 1000, |
| "valid_targets_mean": 4634.4, |
| "valid_targets_min": 1322 |
| }, |
| { |
| "epoch": 1.0172151898734176, |
| "grad_norm": 0.33255131568231555, |
| "learning_rate": 3.871531688924731e-05, |
| "loss": 0.3176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11075881123542786, |
| "step": 1005, |
| "valid_targets_mean": 2777.5, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 1.0222784810126582, |
| "grad_norm": 0.3551119238834457, |
| "learning_rate": 3.8690283473910555e-05, |
| "loss": 0.3343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18998833000659943, |
| "step": 1010, |
| "valid_targets_mean": 5065.8, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 1.0273417721518987, |
| "grad_norm": 0.36295431013252033, |
| "learning_rate": 3.866501675774914e-05, |
| "loss": 0.3282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1773543804883957, |
| "step": 1015, |
| "valid_targets_mean": 3819.9, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 1.0324050632911392, |
| "grad_norm": 0.33540491774621956, |
| "learning_rate": 3.8639517056153997e-05, |
| "loss": 0.3362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16152143478393555, |
| "step": 1020, |
| "valid_targets_mean": 4223.1, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 1.0374683544303798, |
| "grad_norm": 0.32077100355601573, |
| "learning_rate": 3.8613784687424275e-05, |
| "loss": 0.3378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19795547425746918, |
| "step": 1025, |
| "valid_targets_mean": 5295.2, |
| "valid_targets_min": 1496 |
| }, |
| { |
| "epoch": 1.0425316455696203, |
| "grad_norm": 0.3216906551189178, |
| "learning_rate": 3.858781997276337e-05, |
| "loss": 0.3318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16188682615756989, |
| "step": 1030, |
| "valid_targets_mean": 5138.4, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 1.0475949367088608, |
| "grad_norm": 0.4486889227248024, |
| "learning_rate": 3.856162323627497e-05, |
| "loss": 0.3251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09634960442781448, |
| "step": 1035, |
| "valid_targets_mean": 3724.6, |
| "valid_targets_min": 934 |
| }, |
| { |
| "epoch": 1.0526582278481014, |
| "grad_norm": 0.2934117207565638, |
| "learning_rate": 3.8535194804958924e-05, |
| "loss": 0.3367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1526038944721222, |
| "step": 1040, |
| "valid_targets_mean": 4829.0, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 1.0577215189873417, |
| "grad_norm": 0.2931878952686227, |
| "learning_rate": 3.8508535008707236e-05, |
| "loss": 0.346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20354345440864563, |
| "step": 1045, |
| "valid_targets_mean": 6153.3, |
| "valid_targets_min": 1336 |
| }, |
| { |
| "epoch": 1.0627848101265822, |
| "grad_norm": 0.322713813844516, |
| "learning_rate": 3.848164418029989e-05, |
| "loss": 0.3364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1375882625579834, |
| "step": 1050, |
| "valid_targets_mean": 4300.9, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 1.0678481012658227, |
| "grad_norm": 0.31096701689662554, |
| "learning_rate": 3.845452265540074e-05, |
| "loss": 0.3296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1565578281879425, |
| "step": 1055, |
| "valid_targets_mean": 4115.1, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 1.0729113924050633, |
| "grad_norm": 0.31792661099154035, |
| "learning_rate": 3.842717077255329e-05, |
| "loss": 0.3265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18725517392158508, |
| "step": 1060, |
| "valid_targets_mean": 5399.2, |
| "valid_targets_min": 1440 |
| }, |
| { |
| "epoch": 1.0779746835443038, |
| "grad_norm": 0.2966357451403385, |
| "learning_rate": 3.839958887317649e-05, |
| "loss": 0.3267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1931026577949524, |
| "step": 1065, |
| "valid_targets_mean": 6788.4, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 1.0830379746835443, |
| "grad_norm": 0.32526509145376603, |
| "learning_rate": 3.837177730156045e-05, |
| "loss": 0.3283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18849416077136993, |
| "step": 1070, |
| "valid_targets_mean": 5493.9, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 1.0881012658227849, |
| "grad_norm": 0.3176994766517001, |
| "learning_rate": 3.834373640486216e-05, |
| "loss": 0.329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13460056483745575, |
| "step": 1075, |
| "valid_targets_mean": 3655.2, |
| "valid_targets_min": 1173 |
| }, |
| { |
| "epoch": 1.0931645569620254, |
| "grad_norm": 0.3802547345823635, |
| "learning_rate": 3.8315466533101154e-05, |
| "loss": 0.3191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1390688419342041, |
| "step": 1080, |
| "valid_targets_mean": 3724.8, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 1.0982278481012657, |
| "grad_norm": 0.30409901587440336, |
| "learning_rate": 3.828696803915515e-05, |
| "loss": 0.3295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19093772768974304, |
| "step": 1085, |
| "valid_targets_mean": 5509.2, |
| "valid_targets_min": 1316 |
| }, |
| { |
| "epoch": 1.1032911392405063, |
| "grad_norm": 0.31857188574561196, |
| "learning_rate": 3.8258241278755613e-05, |
| "loss": 0.3259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18015238642692566, |
| "step": 1090, |
| "valid_targets_mean": 5178.9, |
| "valid_targets_min": 1381 |
| }, |
| { |
| "epoch": 1.1083544303797468, |
| "grad_norm": 0.32050011818280044, |
| "learning_rate": 3.8229286610483356e-05, |
| "loss": 0.3233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18884283304214478, |
| "step": 1095, |
| "valid_targets_mean": 5116.2, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 1.1134177215189873, |
| "grad_norm": 0.3113272756450795, |
| "learning_rate": 3.820010439576403e-05, |
| "loss": 0.3164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16775749623775482, |
| "step": 1100, |
| "valid_targets_mean": 4514.6, |
| "valid_targets_min": 1605 |
| }, |
| { |
| "epoch": 1.1184810126582279, |
| "grad_norm": 0.33153340730169845, |
| "learning_rate": 3.817069499886364e-05, |
| "loss": 0.3196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12046626210212708, |
| "step": 1105, |
| "valid_targets_mean": 3291.4, |
| "valid_targets_min": 962 |
| }, |
| { |
| "epoch": 1.1235443037974684, |
| "grad_norm": 0.3013874756589958, |
| "learning_rate": 3.814105878688397e-05, |
| "loss": 0.3325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16391009092330933, |
| "step": 1110, |
| "valid_targets_mean": 6036.4, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 1.128607594936709, |
| "grad_norm": 0.331804851918644, |
| "learning_rate": 3.8111196129758025e-05, |
| "loss": 0.3281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1217694953083992, |
| "step": 1115, |
| "valid_targets_mean": 2960.4, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 1.1336708860759495, |
| "grad_norm": 0.35058089757688515, |
| "learning_rate": 3.808110740024541e-05, |
| "loss": 0.3189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18976081907749176, |
| "step": 1120, |
| "valid_targets_mean": 4311.5, |
| "valid_targets_min": 1573 |
| }, |
| { |
| "epoch": 1.13873417721519, |
| "grad_norm": 0.2598654453403866, |
| "learning_rate": 3.8050792973927654e-05, |
| "loss": 0.3227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16648131608963013, |
| "step": 1125, |
| "valid_targets_mean": 6690.9, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 1.1437974683544303, |
| "grad_norm": 0.36580297380970445, |
| "learning_rate": 3.8020253229203555e-05, |
| "loss": 0.327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.173434779047966, |
| "step": 1130, |
| "valid_targets_mean": 3429.3, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 1.1488607594936708, |
| "grad_norm": 0.3170699501916741, |
| "learning_rate": 3.798948854728441e-05, |
| "loss": 0.3303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12679925560951233, |
| "step": 1135, |
| "valid_targets_mean": 3721.6, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 1.1539240506329114, |
| "grad_norm": 0.3315048726728199, |
| "learning_rate": 3.7958499312189344e-05, |
| "loss": 0.3389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11187270283699036, |
| "step": 1140, |
| "valid_targets_mean": 3303.8, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 1.158987341772152, |
| "grad_norm": 0.2969536976332786, |
| "learning_rate": 3.792728591074041e-05, |
| "loss": 0.3199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11002499610185623, |
| "step": 1145, |
| "valid_targets_mean": 4168.6, |
| "valid_targets_min": 1316 |
| }, |
| { |
| "epoch": 1.1640506329113924, |
| "grad_norm": 0.29906816062312314, |
| "learning_rate": 3.7895848732557815e-05, |
| "loss": 0.3329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1309490203857422, |
| "step": 1150, |
| "valid_targets_mean": 4264.5, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 1.169113924050633, |
| "grad_norm": 0.3373393294160328, |
| "learning_rate": 3.786418817005507e-05, |
| "loss": 0.3299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16449810564517975, |
| "step": 1155, |
| "valid_targets_mean": 4430.1, |
| "valid_targets_min": 1548 |
| }, |
| { |
| "epoch": 1.1741772151898735, |
| "grad_norm": 0.31814918332777564, |
| "learning_rate": 3.783230461843406e-05, |
| "loss": 0.3211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1603396236896515, |
| "step": 1160, |
| "valid_targets_mean": 4611.4, |
| "valid_targets_min": 1192 |
| }, |
| { |
| "epoch": 1.1792405063291138, |
| "grad_norm": 0.37957067548492934, |
| "learning_rate": 3.7800198475680136e-05, |
| "loss": 0.3264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09246158599853516, |
| "step": 1165, |
| "valid_targets_mean": 2677.1, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 1.1843037974683543, |
| "grad_norm": 0.3094282166752189, |
| "learning_rate": 3.776787014255712e-05, |
| "loss": 0.3292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1497591733932495, |
| "step": 1170, |
| "valid_targets_mean": 4014.9, |
| "valid_targets_min": 1510 |
| }, |
| { |
| "epoch": 1.1893670886075949, |
| "grad_norm": 0.35082198305199175, |
| "learning_rate": 3.773532002260233e-05, |
| "loss": 0.3276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1902400553226471, |
| "step": 1175, |
| "valid_targets_mean": 4051.2, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 1.1944303797468354, |
| "grad_norm": 0.3363300235759021, |
| "learning_rate": 3.770254852212152e-05, |
| "loss": 0.3236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1484481394290924, |
| "step": 1180, |
| "valid_targets_mean": 4022.1, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 1.199493670886076, |
| "grad_norm": 0.2959219712023686, |
| "learning_rate": 3.766955605018384e-05, |
| "loss": 0.3197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17988604307174683, |
| "step": 1185, |
| "valid_targets_mean": 5788.9, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 1.2045569620253165, |
| "grad_norm": 0.30513862700761135, |
| "learning_rate": 3.7636343018616675e-05, |
| "loss": 0.3243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.162398099899292, |
| "step": 1190, |
| "valid_targets_mean": 4152.4, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 1.209620253164557, |
| "grad_norm": 0.3256099867852839, |
| "learning_rate": 3.7602909842000565e-05, |
| "loss": 0.3255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1604665219783783, |
| "step": 1195, |
| "valid_targets_mean": 4510.4, |
| "valid_targets_min": 1107 |
| }, |
| { |
| "epoch": 1.2146835443037975, |
| "grad_norm": 0.31652452857276137, |
| "learning_rate": 3.7569256937663995e-05, |
| "loss": 0.3228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11722761392593384, |
| "step": 1200, |
| "valid_targets_mean": 3867.2, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 1.219746835443038, |
| "grad_norm": 0.3570058144248121, |
| "learning_rate": 3.753538472567819e-05, |
| "loss": 0.3343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.132009819149971, |
| "step": 1205, |
| "valid_targets_mean": 3776.8, |
| "valid_targets_min": 1444 |
| }, |
| { |
| "epoch": 1.2248101265822784, |
| "grad_norm": 0.3253492095946553, |
| "learning_rate": 3.750129362885188e-05, |
| "loss": 0.3491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20971378684043884, |
| "step": 1210, |
| "valid_targets_mean": 5854.2, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 1.229873417721519, |
| "grad_norm": 0.31813799271358817, |
| "learning_rate": 3.7466984072726014e-05, |
| "loss": 0.3278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14392566680908203, |
| "step": 1215, |
| "valid_targets_mean": 4255.3, |
| "valid_targets_min": 1377 |
| }, |
| { |
| "epoch": 1.2349367088607595, |
| "grad_norm": 0.3161090773410782, |
| "learning_rate": 3.743245648556845e-05, |
| "loss": 0.333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15600383281707764, |
| "step": 1220, |
| "valid_targets_mean": 4627.6, |
| "valid_targets_min": 1186 |
| }, |
| { |
| "epoch": 1.24, |
| "grad_norm": 0.3383098606932185, |
| "learning_rate": 3.739771129836863e-05, |
| "loss": 0.3106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15630879998207092, |
| "step": 1225, |
| "valid_targets_mean": 3907.4, |
| "valid_targets_min": 1318 |
| }, |
| { |
| "epoch": 1.2450632911392405, |
| "grad_norm": 0.380311170159032, |
| "learning_rate": 3.736274894483215e-05, |
| "loss": 0.3443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17396849393844604, |
| "step": 1230, |
| "valid_targets_mean": 3654.8, |
| "valid_targets_min": 1228 |
| }, |
| { |
| "epoch": 1.250126582278481, |
| "grad_norm": 0.29633634831203143, |
| "learning_rate": 3.7327569861375404e-05, |
| "loss": 0.3368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20720690488815308, |
| "step": 1235, |
| "valid_targets_mean": 6698.7, |
| "valid_targets_min": 1554 |
| }, |
| { |
| "epoch": 1.2551898734177216, |
| "grad_norm": 0.32181581382324975, |
| "learning_rate": 3.729217448712009e-05, |
| "loss": 0.31, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15546496212482452, |
| "step": 1240, |
| "valid_targets_mean": 4598.5, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 1.260253164556962, |
| "grad_norm": 0.2876370801591027, |
| "learning_rate": 3.725656326388776e-05, |
| "loss": 0.312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12497955560684204, |
| "step": 1245, |
| "valid_targets_mean": 4425.2, |
| "valid_targets_min": 1167 |
| }, |
| { |
| "epoch": 1.2653164556962024, |
| "grad_norm": 0.3193054610028216, |
| "learning_rate": 3.722073663619429e-05, |
| "loss": 0.3268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15073925256729126, |
| "step": 1250, |
| "valid_targets_mean": 4511.2, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 1.270379746835443, |
| "grad_norm": 0.39145813292181675, |
| "learning_rate": 3.718469505124434e-05, |
| "loss": 0.3246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15670371055603027, |
| "step": 1255, |
| "valid_targets_mean": 4593.4, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 1.2754430379746835, |
| "grad_norm": 0.3007158793143366, |
| "learning_rate": 3.714843895892576e-05, |
| "loss": 0.332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14526674151420593, |
| "step": 1260, |
| "valid_targets_mean": 4201.2, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 1.280506329113924, |
| "grad_norm": 0.3431473760602178, |
| "learning_rate": 3.7111968811803985e-05, |
| "loss": 0.3374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11407409608364105, |
| "step": 1265, |
| "valid_targets_mean": 2609.9, |
| "valid_targets_min": 1008 |
| }, |
| { |
| "epoch": 1.2855696202531646, |
| "grad_norm": 0.31430226120597105, |
| "learning_rate": 3.7075285065116376e-05, |
| "loss": 0.3255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21788525581359863, |
| "step": 1270, |
| "valid_targets_mean": 5227.1, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 1.290632911392405, |
| "grad_norm": 0.2942207875130029, |
| "learning_rate": 3.703838817676654e-05, |
| "loss": 0.3248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16078102588653564, |
| "step": 1275, |
| "valid_targets_mean": 5179.4, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 1.2956962025316456, |
| "grad_norm": 0.33801133523700155, |
| "learning_rate": 3.7001278607318646e-05, |
| "loss": 0.3293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13204364478588104, |
| "step": 1280, |
| "valid_targets_mean": 3593.9, |
| "valid_targets_min": 1351 |
| }, |
| { |
| "epoch": 1.3007594936708862, |
| "grad_norm": 0.36194997437445076, |
| "learning_rate": 3.696395681999161e-05, |
| "loss": 0.3315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15205729007720947, |
| "step": 1285, |
| "valid_targets_mean": 3709.8, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 1.3058227848101267, |
| "grad_norm": 0.37635182260044775, |
| "learning_rate": 3.692642328065337e-05, |
| "loss": 0.3373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12143959850072861, |
| "step": 1290, |
| "valid_targets_mean": 3222.8, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 1.310886075949367, |
| "grad_norm": 0.3080355652465348, |
| "learning_rate": 3.688867845781506e-05, |
| "loss": 0.327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14508505165576935, |
| "step": 1295, |
| "valid_targets_mean": 3859.7, |
| "valid_targets_min": 1113 |
| }, |
| { |
| "epoch": 1.3159493670886075, |
| "grad_norm": 0.3439159780043492, |
| "learning_rate": 3.685072282262511e-05, |
| "loss": 0.3302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14666421711444855, |
| "step": 1300, |
| "valid_targets_mean": 3587.8, |
| "valid_targets_min": 1142 |
| }, |
| { |
| "epoch": 1.321012658227848, |
| "grad_norm": 0.30506292484752023, |
| "learning_rate": 3.6812556848863474e-05, |
| "loss": 0.3253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15456736087799072, |
| "step": 1305, |
| "valid_targets_mean": 3908.8, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 1.3260759493670886, |
| "grad_norm": 0.32896698136778196, |
| "learning_rate": 3.6774181012935595e-05, |
| "loss": 0.3302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14750021696090698, |
| "step": 1310, |
| "valid_targets_mean": 3579.4, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 1.3311392405063291, |
| "grad_norm": 0.3494681443588045, |
| "learning_rate": 3.673559579386653e-05, |
| "loss": 0.3329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16966864466667175, |
| "step": 1315, |
| "valid_targets_mean": 3639.5, |
| "valid_targets_min": 1136 |
| }, |
| { |
| "epoch": 1.3362025316455697, |
| "grad_norm": 0.3191056529939702, |
| "learning_rate": 3.6696801673294984e-05, |
| "loss": 0.3274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2022847682237625, |
| "step": 1320, |
| "valid_targets_mean": 6126.2, |
| "valid_targets_min": 1760 |
| }, |
| { |
| "epoch": 1.34126582278481, |
| "grad_norm": 0.40439808049151743, |
| "learning_rate": 3.665779913546721e-05, |
| "loss": 0.3207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1815149486064911, |
| "step": 1325, |
| "valid_targets_mean": 3929.4, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 1.3463291139240505, |
| "grad_norm": 0.29566683990417303, |
| "learning_rate": 3.6618588667231064e-05, |
| "loss": 0.3244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1440686285495758, |
| "step": 1330, |
| "valid_targets_mean": 4236.4, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 1.351392405063291, |
| "grad_norm": 0.3344359616665295, |
| "learning_rate": 3.6579170758029885e-05, |
| "loss": 0.324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15648147463798523, |
| "step": 1335, |
| "valid_targets_mean": 3588.6, |
| "valid_targets_min": 1635 |
| }, |
| { |
| "epoch": 1.3564556962025316, |
| "grad_norm": 0.2879031761545053, |
| "learning_rate": 3.653954589989637e-05, |
| "loss": 0.3215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16395555436611176, |
| "step": 1340, |
| "valid_targets_mean": 4903.5, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 1.3615189873417721, |
| "grad_norm": 0.3076034430138629, |
| "learning_rate": 3.649971458744645e-05, |
| "loss": 0.3332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14920540153980255, |
| "step": 1345, |
| "valid_targets_mean": 4404.3, |
| "valid_targets_min": 1479 |
| }, |
| { |
| "epoch": 1.3665822784810127, |
| "grad_norm": 0.37728920822736073, |
| "learning_rate": 3.645967731787313e-05, |
| "loss": 0.3273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16919684410095215, |
| "step": 1350, |
| "valid_targets_mean": 3916.3, |
| "valid_targets_min": 1491 |
| }, |
| { |
| "epoch": 1.3716455696202532, |
| "grad_norm": 0.2944205665752948, |
| "learning_rate": 3.641943459094026e-05, |
| "loss": 0.32, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20011773705482483, |
| "step": 1355, |
| "valid_targets_mean": 6104.8, |
| "valid_targets_min": 1110 |
| }, |
| { |
| "epoch": 1.3767088607594937, |
| "grad_norm": 0.31998862065193057, |
| "learning_rate": 3.63789869089763e-05, |
| "loss": 0.3281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17156195640563965, |
| "step": 1360, |
| "valid_targets_mean": 4435.9, |
| "valid_targets_min": 1056 |
| }, |
| { |
| "epoch": 1.3817721518987343, |
| "grad_norm": 0.3359058600132148, |
| "learning_rate": 3.633833477686805e-05, |
| "loss": 0.326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1116013303399086, |
| "step": 1365, |
| "valid_targets_mean": 2720.7, |
| "valid_targets_min": 1100 |
| }, |
| { |
| "epoch": 1.3868354430379748, |
| "grad_norm": 0.3167283899854193, |
| "learning_rate": 3.629747870205438e-05, |
| "loss": 0.3375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15123698115348816, |
| "step": 1370, |
| "valid_targets_mean": 4809.0, |
| "valid_targets_min": 1288 |
| }, |
| { |
| "epoch": 1.3918987341772153, |
| "grad_norm": 0.3176638421764831, |
| "learning_rate": 3.625641919451982e-05, |
| "loss": 0.3251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.116270050406456, |
| "step": 1375, |
| "valid_targets_mean": 3099.4, |
| "valid_targets_min": 1302 |
| }, |
| { |
| "epoch": 1.3969620253164556, |
| "grad_norm": 0.3567607135105218, |
| "learning_rate": 3.621515676678829e-05, |
| "loss": 0.3403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18901550769805908, |
| "step": 1380, |
| "valid_targets_mean": 4234.6, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 1.4020253164556962, |
| "grad_norm": 0.33150001426521647, |
| "learning_rate": 3.617369193391663e-05, |
| "loss": 0.3257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14285731315612793, |
| "step": 1385, |
| "valid_targets_mean": 3883.8, |
| "valid_targets_min": 1292 |
| }, |
| { |
| "epoch": 1.4070886075949367, |
| "grad_norm": 0.32040861152447253, |
| "learning_rate": 3.61320252134882e-05, |
| "loss": 0.3202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15014925599098206, |
| "step": 1390, |
| "valid_targets_mean": 4633.4, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 1.4121518987341772, |
| "grad_norm": 0.3364407178912512, |
| "learning_rate": 3.6090157125606405e-05, |
| "loss": 0.3308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19701796770095825, |
| "step": 1395, |
| "valid_targets_mean": 4298.4, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 1.4172151898734178, |
| "grad_norm": 0.2998592984370577, |
| "learning_rate": 3.604808819288823e-05, |
| "loss": 0.3213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21334891021251678, |
| "step": 1400, |
| "valid_targets_mean": 6774.6, |
| "valid_targets_min": 1471 |
| }, |
| { |
| "epoch": 1.4222784810126583, |
| "grad_norm": 0.32266679078127786, |
| "learning_rate": 3.600581894045768e-05, |
| "loss": 0.3162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10229863971471786, |
| "step": 1405, |
| "valid_targets_mean": 2818.3, |
| "valid_targets_min": 1002 |
| }, |
| { |
| "epoch": 1.4273417721518986, |
| "grad_norm": 0.2989355644726402, |
| "learning_rate": 3.596334989593927e-05, |
| "loss": 0.3324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16216593980789185, |
| "step": 1410, |
| "valid_targets_mean": 4271.4, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 1.4324050632911391, |
| "grad_norm": 0.33686789223908364, |
| "learning_rate": 3.5920681589451385e-05, |
| "loss": 0.3177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16129520535469055, |
| "step": 1415, |
| "valid_targets_mean": 3987.1, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 1.4374683544303797, |
| "grad_norm": 0.2948991655130385, |
| "learning_rate": 3.58778145535997e-05, |
| "loss": 0.3152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14479148387908936, |
| "step": 1420, |
| "valid_targets_mean": 4191.2, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 1.4425316455696202, |
| "grad_norm": 0.278153706236472, |
| "learning_rate": 3.583474932347054e-05, |
| "loss": 0.3194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15073184669017792, |
| "step": 1425, |
| "valid_targets_mean": 5600.0, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 1.4475949367088607, |
| "grad_norm": 0.2989703152632012, |
| "learning_rate": 3.5791486436624145e-05, |
| "loss": 0.322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1581433117389679, |
| "step": 1430, |
| "valid_targets_mean": 4557.4, |
| "valid_targets_min": 1311 |
| }, |
| { |
| "epoch": 1.4526582278481013, |
| "grad_norm": 0.3156763543957603, |
| "learning_rate": 3.5748026433088036e-05, |
| "loss": 0.3234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1554793417453766, |
| "step": 1435, |
| "valid_targets_mean": 5105.0, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 1.4577215189873418, |
| "grad_norm": 0.30549649598454104, |
| "learning_rate": 3.5704369855350226e-05, |
| "loss": 0.3285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10838840901851654, |
| "step": 1440, |
| "valid_targets_mean": 2855.1, |
| "valid_targets_min": 1382 |
| }, |
| { |
| "epoch": 1.4627848101265823, |
| "grad_norm": 0.37394597619150627, |
| "learning_rate": 3.566051724835245e-05, |
| "loss": 0.3409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13602185249328613, |
| "step": 1445, |
| "valid_targets_mean": 3419.4, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 1.4678481012658229, |
| "grad_norm": 0.3156375413907948, |
| "learning_rate": 3.5616469159483363e-05, |
| "loss": 0.3224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14657479524612427, |
| "step": 1450, |
| "valid_targets_mean": 4287.6, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 1.4729113924050634, |
| "grad_norm": 0.32282455141307365, |
| "learning_rate": 3.5572226138571753e-05, |
| "loss": 0.3428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21434099972248077, |
| "step": 1455, |
| "valid_targets_mean": 6099.5, |
| "valid_targets_min": 1650 |
| }, |
| { |
| "epoch": 1.4779746835443037, |
| "grad_norm": 0.3934165636040704, |
| "learning_rate": 3.5527788737879595e-05, |
| "loss": 0.3293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13554619252681732, |
| "step": 1460, |
| "valid_targets_mean": 3898.6, |
| "valid_targets_min": 749 |
| }, |
| { |
| "epoch": 1.4830379746835443, |
| "grad_norm": 0.3532333332147838, |
| "learning_rate": 3.548315751209524e-05, |
| "loss": 0.3211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1423749029636383, |
| "step": 1465, |
| "valid_targets_mean": 3396.2, |
| "valid_targets_min": 1245 |
| }, |
| { |
| "epoch": 1.4881012658227848, |
| "grad_norm": 0.3046035862379382, |
| "learning_rate": 3.543833301832642e-05, |
| "loss": 0.3092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11005077511072159, |
| "step": 1470, |
| "valid_targets_mean": 3165.8, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 1.4931645569620253, |
| "grad_norm": 0.2934515113132098, |
| "learning_rate": 3.539331581609337e-05, |
| "loss": 0.3228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16373209655284882, |
| "step": 1475, |
| "valid_targets_mean": 5422.3, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 1.4982278481012659, |
| "grad_norm": 0.29330851366159866, |
| "learning_rate": 3.5348106467321756e-05, |
| "loss": 0.3204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1334601640701294, |
| "step": 1480, |
| "valid_targets_mean": 4623.2, |
| "valid_targets_min": 1060 |
| }, |
| { |
| "epoch": 1.5032911392405062, |
| "grad_norm": 0.3494149115756711, |
| "learning_rate": 3.530270553633574e-05, |
| "loss": 0.3347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14463084936141968, |
| "step": 1485, |
| "valid_targets_mean": 3681.4, |
| "valid_targets_min": 1175 |
| }, |
| { |
| "epoch": 1.5083544303797467, |
| "grad_norm": 0.34094476372572885, |
| "learning_rate": 3.5257113589850895e-05, |
| "loss": 0.3283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13542452454566956, |
| "step": 1490, |
| "valid_targets_mean": 3142.8, |
| "valid_targets_min": 1338 |
| }, |
| { |
| "epoch": 1.5134177215189872, |
| "grad_norm": 0.33689606267312805, |
| "learning_rate": 3.521133119696712e-05, |
| "loss": 0.3264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16328886151313782, |
| "step": 1495, |
| "valid_targets_mean": 4708.0, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 1.5184810126582278, |
| "grad_norm": 0.8587040130178458, |
| "learning_rate": 3.516535892916159e-05, |
| "loss": 0.3199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.166406512260437, |
| "step": 1500, |
| "valid_targets_mean": 4267.1, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 1.5235443037974683, |
| "grad_norm": 0.31747165527732263, |
| "learning_rate": 3.5119197360281553e-05, |
| "loss": 0.332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1378452181816101, |
| "step": 1505, |
| "valid_targets_mean": 3656.2, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 1.5286075949367088, |
| "grad_norm": 0.3521429432867297, |
| "learning_rate": 3.507284706653722e-05, |
| "loss": 0.3369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22082693874835968, |
| "step": 1510, |
| "valid_targets_mean": 4618.8, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 1.5336708860759494, |
| "grad_norm": 0.3319407091362445, |
| "learning_rate": 3.5026308626494545e-05, |
| "loss": 0.3134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18031668663024902, |
| "step": 1515, |
| "valid_targets_mean": 3750.2, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 1.53873417721519, |
| "grad_norm": 0.33498834727615584, |
| "learning_rate": 3.497958262106801e-05, |
| "loss": 0.3205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1643165647983551, |
| "step": 1520, |
| "valid_targets_mean": 3328.2, |
| "valid_targets_min": 1474 |
| }, |
| { |
| "epoch": 1.5437974683544304, |
| "grad_norm": 0.3537186281988192, |
| "learning_rate": 3.493266963351339e-05, |
| "loss": 0.3115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1584773063659668, |
| "step": 1525, |
| "valid_targets_mean": 3274.9, |
| "valid_targets_min": 1245 |
| }, |
| { |
| "epoch": 1.548860759493671, |
| "grad_norm": 0.30657928098680826, |
| "learning_rate": 3.4885570249420454e-05, |
| "loss": 0.3272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1703530102968216, |
| "step": 1530, |
| "valid_targets_mean": 5461.6, |
| "valid_targets_min": 1154 |
| }, |
| { |
| "epoch": 1.5539240506329115, |
| "grad_norm": 0.338680368171272, |
| "learning_rate": 3.483828505670563e-05, |
| "loss": 0.3255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15479744970798492, |
| "step": 1535, |
| "valid_targets_mean": 4522.8, |
| "valid_targets_min": 1326 |
| }, |
| { |
| "epoch": 1.558987341772152, |
| "grad_norm": 0.369309200288726, |
| "learning_rate": 3.479081464560475e-05, |
| "loss": 0.3191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12721368670463562, |
| "step": 1540, |
| "valid_targets_mean": 2568.1, |
| "valid_targets_min": 1187 |
| }, |
| { |
| "epoch": 1.5640506329113926, |
| "grad_norm": 0.3519884099657949, |
| "learning_rate": 3.474315960866558e-05, |
| "loss": 0.326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21022453904151917, |
| "step": 1545, |
| "valid_targets_mean": 5003.4, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 1.5691139240506329, |
| "grad_norm": 0.33365501094495986, |
| "learning_rate": 3.469532054074049e-05, |
| "loss": 0.3275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11454639583826065, |
| "step": 1550, |
| "valid_targets_mean": 3473.1, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 1.5741772151898734, |
| "grad_norm": 0.3487036569312814, |
| "learning_rate": 3.464729803897902e-05, |
| "loss": 0.3207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0789409726858139, |
| "step": 1555, |
| "valid_targets_mean": 2519.6, |
| "valid_targets_min": 1102 |
| }, |
| { |
| "epoch": 1.579240506329114, |
| "grad_norm": 0.33603816281790033, |
| "learning_rate": 3.4599092702820394e-05, |
| "loss": 0.3031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11025889217853546, |
| "step": 1560, |
| "valid_targets_mean": 2999.4, |
| "valid_targets_min": 1318 |
| }, |
| { |
| "epoch": 1.5843037974683545, |
| "grad_norm": 0.33746214929234886, |
| "learning_rate": 3.4550705133986085e-05, |
| "loss": 0.3297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1540479212999344, |
| "step": 1565, |
| "valid_targets_mean": 3550.0, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 1.5893670886075948, |
| "grad_norm": 0.3700007824527567, |
| "learning_rate": 3.450213593647226e-05, |
| "loss": 0.3235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.179176926612854, |
| "step": 1570, |
| "valid_targets_mean": 3797.9, |
| "valid_targets_min": 1468 |
| }, |
| { |
| "epoch": 1.5944303797468353, |
| "grad_norm": 0.43557784622964635, |
| "learning_rate": 3.445338571654227e-05, |
| "loss": 0.3245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12111867964267731, |
| "step": 1575, |
| "valid_targets_mean": 3459.7, |
| "valid_targets_min": 1321 |
| }, |
| { |
| "epoch": 1.5994936708860759, |
| "grad_norm": 0.3234005911683535, |
| "learning_rate": 3.440445508271907e-05, |
| "loss": 0.3303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11545059829950333, |
| "step": 1580, |
| "valid_targets_mean": 3151.1, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 1.6045569620253164, |
| "grad_norm": 0.31481487050082757, |
| "learning_rate": 3.435534464577762e-05, |
| "loss": 0.3185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14349615573883057, |
| "step": 1585, |
| "valid_targets_mean": 4098.8, |
| "valid_targets_min": 1553 |
| }, |
| { |
| "epoch": 1.609620253164557, |
| "grad_norm": 0.3263020753319533, |
| "learning_rate": 3.4306055018737274e-05, |
| "loss": 0.3262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1886909306049347, |
| "step": 1590, |
| "valid_targets_mean": 5531.9, |
| "valid_targets_min": 1290 |
| }, |
| { |
| "epoch": 1.6146835443037975, |
| "grad_norm": 0.3440773642804762, |
| "learning_rate": 3.425658681685412e-05, |
| "loss": 0.3247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17707081139087677, |
| "step": 1595, |
| "valid_targets_mean": 3534.2, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 1.619746835443038, |
| "grad_norm": 0.32440177535383535, |
| "learning_rate": 3.420694065761328e-05, |
| "loss": 0.3282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16896334290504456, |
| "step": 1600, |
| "valid_targets_mean": 4122.1, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 1.6248101265822785, |
| "grad_norm": 0.2928837040048521, |
| "learning_rate": 3.415711716072126e-05, |
| "loss": 0.3318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17395883798599243, |
| "step": 1605, |
| "valid_targets_mean": 5510.7, |
| "valid_targets_min": 1836 |
| }, |
| { |
| "epoch": 1.629873417721519, |
| "grad_norm": 0.29996111358110616, |
| "learning_rate": 3.4107116948098155e-05, |
| "loss": 0.3208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16087687015533447, |
| "step": 1610, |
| "valid_targets_mean": 5291.1, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 1.6349367088607596, |
| "grad_norm": 0.3391636106718898, |
| "learning_rate": 3.4056940643869905e-05, |
| "loss": 0.328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12102165073156357, |
| "step": 1615, |
| "valid_targets_mean": 2991.2, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 1.6400000000000001, |
| "grad_norm": 0.30250385799846535, |
| "learning_rate": 3.400658887436051e-05, |
| "loss": 0.3274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15453828871250153, |
| "step": 1620, |
| "valid_targets_mean": 4200.3, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 1.6450632911392407, |
| "grad_norm": 0.31602413877978186, |
| "learning_rate": 3.3956062268084215e-05, |
| "loss": 0.3167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1669228971004486, |
| "step": 1625, |
| "valid_targets_mean": 4059.0, |
| "valid_targets_min": 1494 |
| }, |
| { |
| "epoch": 1.650126582278481, |
| "grad_norm": 0.3430073741627476, |
| "learning_rate": 3.390536145573766e-05, |
| "loss": 0.3311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15472730994224548, |
| "step": 1630, |
| "valid_targets_mean": 4020.9, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 1.6551898734177215, |
| "grad_norm": 0.30844530157775457, |
| "learning_rate": 3.385448707019199e-05, |
| "loss": 0.3353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13865000009536743, |
| "step": 1635, |
| "valid_targets_mean": 3493.1, |
| "valid_targets_min": 1516 |
| }, |
| { |
| "epoch": 1.660253164556962, |
| "grad_norm": 0.29309820401088355, |
| "learning_rate": 3.3803439746484996e-05, |
| "loss": 0.3371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18344934284687042, |
| "step": 1640, |
| "valid_targets_mean": 5938.8, |
| "valid_targets_min": 1370 |
| }, |
| { |
| "epoch": 1.6653164556962026, |
| "grad_norm": 0.2917099753276015, |
| "learning_rate": 3.375222012181315e-05, |
| "loss": 0.3324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15374572575092316, |
| "step": 1645, |
| "valid_targets_mean": 4424.8, |
| "valid_targets_min": 1247 |
| }, |
| { |
| "epoch": 1.6703797468354429, |
| "grad_norm": 0.31174326634371047, |
| "learning_rate": 3.370082883552366e-05, |
| "loss": 0.3248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18676675856113434, |
| "step": 1650, |
| "valid_targets_mean": 4577.7, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 1.6754430379746834, |
| "grad_norm": 0.2937468748877549, |
| "learning_rate": 3.364926652910651e-05, |
| "loss": 0.328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14714813232421875, |
| "step": 1655, |
| "valid_targets_mean": 4791.8, |
| "valid_targets_min": 1213 |
| }, |
| { |
| "epoch": 1.680506329113924, |
| "grad_norm": 0.2879601888076102, |
| "learning_rate": 3.359753384618641e-05, |
| "loss": 0.3339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19825273752212524, |
| "step": 1660, |
| "valid_targets_mean": 6597.8, |
| "valid_targets_min": 1694 |
| }, |
| { |
| "epoch": 1.6855696202531645, |
| "grad_norm": 0.28734174588103684, |
| "learning_rate": 3.354563143251483e-05, |
| "loss": 0.3251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13350191712379456, |
| "step": 1665, |
| "valid_targets_mean": 4193.6, |
| "valid_targets_min": 1311 |
| }, |
| { |
| "epoch": 1.690632911392405, |
| "grad_norm": 0.3163624678749021, |
| "learning_rate": 3.3493559935961854e-05, |
| "loss": 0.3332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19836895167827606, |
| "step": 1670, |
| "valid_targets_mean": 4911.9, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 1.6956962025316455, |
| "grad_norm": 0.26723388677186943, |
| "learning_rate": 3.344132000650817e-05, |
| "loss": 0.3229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14954085648059845, |
| "step": 1675, |
| "valid_targets_mean": 5300.8, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 1.700759493670886, |
| "grad_norm": 0.3367011427653921, |
| "learning_rate": 3.3388912296236906e-05, |
| "loss": 0.3369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15727460384368896, |
| "step": 1680, |
| "valid_targets_mean": 3988.7, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 1.7058227848101266, |
| "grad_norm": 0.46226016366837236, |
| "learning_rate": 3.3336337459325526e-05, |
| "loss": 0.3267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18564224243164062, |
| "step": 1685, |
| "valid_targets_mean": 6143.1, |
| "valid_targets_min": 1246 |
| }, |
| { |
| "epoch": 1.7108860759493671, |
| "grad_norm": 0.3175894026472926, |
| "learning_rate": 3.328359615203762e-05, |
| "loss": 0.3183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19139517843723297, |
| "step": 1690, |
| "valid_targets_mean": 5133.2, |
| "valid_targets_min": 1080 |
| }, |
| { |
| "epoch": 1.7159493670886077, |
| "grad_norm": 0.27972490266827565, |
| "learning_rate": 3.323068903271476e-05, |
| "loss": 0.3344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11912492662668228, |
| "step": 1695, |
| "valid_targets_mean": 4236.9, |
| "valid_targets_min": 1213 |
| }, |
| { |
| "epoch": 1.7210126582278482, |
| "grad_norm": 0.28905133463909916, |
| "learning_rate": 3.317761676176825e-05, |
| "loss": 0.326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1582462191581726, |
| "step": 1700, |
| "valid_targets_mean": 5365.8, |
| "valid_targets_min": 1347 |
| }, |
| { |
| "epoch": 1.7260759493670887, |
| "grad_norm": 0.2928951231194897, |
| "learning_rate": 3.31243800016709e-05, |
| "loss": 0.3223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16399666666984558, |
| "step": 1705, |
| "valid_targets_mean": 4478.1, |
| "valid_targets_min": 913 |
| }, |
| { |
| "epoch": 1.7311392405063293, |
| "grad_norm": 0.3067909993527847, |
| "learning_rate": 3.307097941694876e-05, |
| "loss": 0.3203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1793975532054901, |
| "step": 1710, |
| "valid_targets_mean": 4923.8, |
| "valid_targets_min": 1793 |
| }, |
| { |
| "epoch": 1.7362025316455696, |
| "grad_norm": 0.29679310025747774, |
| "learning_rate": 3.3017415674172795e-05, |
| "loss": 0.3205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1398848444223404, |
| "step": 1715, |
| "valid_targets_mean": 3729.8, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 1.7412658227848101, |
| "grad_norm": 0.33157110353633035, |
| "learning_rate": 3.296368944195059e-05, |
| "loss": 0.3258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16532516479492188, |
| "step": 1720, |
| "valid_targets_mean": 4614.5, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 1.7463291139240507, |
| "grad_norm": 0.3237383031466305, |
| "learning_rate": 3.2909801390918e-05, |
| "loss": 0.3165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16484834253787994, |
| "step": 1725, |
| "valid_targets_mean": 4277.1, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 1.7513924050632912, |
| "grad_norm": 0.30303998742275196, |
| "learning_rate": 3.285575219373079e-05, |
| "loss": 0.3068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1231764703989029, |
| "step": 1730, |
| "valid_targets_mean": 3492.9, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 1.7564556962025315, |
| "grad_norm": 0.3131204074959935, |
| "learning_rate": 3.2801542525056204e-05, |
| "loss": 0.3236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16018734872341156, |
| "step": 1735, |
| "valid_targets_mean": 4216.1, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 1.761518987341772, |
| "grad_norm": 0.5226006047690179, |
| "learning_rate": 3.27471730615646e-05, |
| "loss": 0.3168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13336879014968872, |
| "step": 1740, |
| "valid_targets_mean": 3926.2, |
| "valid_targets_min": 1825 |
| }, |
| { |
| "epoch": 1.7665822784810126, |
| "grad_norm": 0.288468699839479, |
| "learning_rate": 3.2692644481920926e-05, |
| "loss": 0.3091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1637478768825531, |
| "step": 1745, |
| "valid_targets_mean": 5375.8, |
| "valid_targets_min": 1193 |
| }, |
| { |
| "epoch": 1.771645569620253, |
| "grad_norm": 0.3345448593431147, |
| "learning_rate": 3.263795746677633e-05, |
| "loss": 0.3169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1924804151058197, |
| "step": 1750, |
| "valid_targets_mean": 4262.6, |
| "valid_targets_min": 1246 |
| }, |
| { |
| "epoch": 1.7767088607594936, |
| "grad_norm": 0.31362215927542564, |
| "learning_rate": 3.258311269875959e-05, |
| "loss": 0.3295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17079243063926697, |
| "step": 1755, |
| "valid_targets_mean": 4860.1, |
| "valid_targets_min": 1270 |
| }, |
| { |
| "epoch": 1.7817721518987342, |
| "grad_norm": 0.2881402537381144, |
| "learning_rate": 3.2528110862468664e-05, |
| "loss": 0.3212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1843501329421997, |
| "step": 1760, |
| "valid_targets_mean": 5736.6, |
| "valid_targets_min": 1442 |
| }, |
| { |
| "epoch": 1.7868354430379747, |
| "grad_norm": 0.33940507923082636, |
| "learning_rate": 3.247295264446209e-05, |
| "loss": 0.332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14896419644355774, |
| "step": 1765, |
| "valid_targets_mean": 4003.1, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 1.7918987341772152, |
| "grad_norm": 0.305481958944062, |
| "learning_rate": 3.241763873325044e-05, |
| "loss": 0.3321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1464659869670868, |
| "step": 1770, |
| "valid_targets_mean": 4571.4, |
| "valid_targets_min": 1342 |
| }, |
| { |
| "epoch": 1.7969620253164558, |
| "grad_norm": 0.3372959294620817, |
| "learning_rate": 3.2362169819287714e-05, |
| "loss": 0.3198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17976534366607666, |
| "step": 1775, |
| "valid_targets_mean": 4028.4, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 1.8020253164556963, |
| "grad_norm": 0.3104430678347615, |
| "learning_rate": 3.2306546594962744e-05, |
| "loss": 0.3274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16419640183448792, |
| "step": 1780, |
| "valid_targets_mean": 4230.2, |
| "valid_targets_min": 1132 |
| }, |
| { |
| "epoch": 1.8070886075949368, |
| "grad_norm": 0.3241781257834898, |
| "learning_rate": 3.225076975459051e-05, |
| "loss": 0.3243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21455496549606323, |
| "step": 1785, |
| "valid_targets_mean": 7327.5, |
| "valid_targets_min": 1343 |
| }, |
| { |
| "epoch": 1.8121518987341774, |
| "grad_norm": 0.3169044936479542, |
| "learning_rate": 3.219483999440354e-05, |
| "loss": 0.3169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12079709023237228, |
| "step": 1790, |
| "valid_targets_mean": 3173.1, |
| "valid_targets_min": 1329 |
| }, |
| { |
| "epoch": 1.8172151898734177, |
| "grad_norm": 0.331980276874436, |
| "learning_rate": 3.213875801254314e-05, |
| "loss": 0.3276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14299997687339783, |
| "step": 1795, |
| "valid_targets_mean": 3476.8, |
| "valid_targets_min": 942 |
| }, |
| { |
| "epoch": 1.8222784810126582, |
| "grad_norm": 0.25978521097127444, |
| "learning_rate": 3.2082524509050723e-05, |
| "loss": 0.3194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14637430012226105, |
| "step": 1800, |
| "valid_targets_mean": 5356.4, |
| "valid_targets_min": 1492 |
| }, |
| { |
| "epoch": 1.8273417721518987, |
| "grad_norm": 0.4563427674089283, |
| "learning_rate": 3.20261401858591e-05, |
| "loss": 0.3246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16923454403877258, |
| "step": 1805, |
| "valid_targets_mean": 4621.6, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 1.8324050632911393, |
| "grad_norm": 0.28306126650762187, |
| "learning_rate": 3.196960574678363e-05, |
| "loss": 0.3335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11796549707651138, |
| "step": 1810, |
| "valid_targets_mean": 4214.6, |
| "valid_targets_min": 1296 |
| }, |
| { |
| "epoch": 1.8374683544303796, |
| "grad_norm": 0.32499866336342004, |
| "learning_rate": 3.191292189751353e-05, |
| "loss": 0.3441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1776324212551117, |
| "step": 1815, |
| "valid_targets_mean": 5706.0, |
| "valid_targets_min": 1377 |
| }, |
| { |
| "epoch": 1.8425316455696201, |
| "grad_norm": 0.29118017187843964, |
| "learning_rate": 3.185608934560301e-05, |
| "loss": 0.3105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12048833072185516, |
| "step": 1820, |
| "valid_targets_mean": 3490.6, |
| "valid_targets_min": 1465 |
| }, |
| { |
| "epoch": 1.8475949367088607, |
| "grad_norm": 0.3114271880772345, |
| "learning_rate": 3.1799108800462466e-05, |
| "loss": 0.3377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14511121809482574, |
| "step": 1825, |
| "valid_targets_mean": 3770.2, |
| "valid_targets_min": 1165 |
| }, |
| { |
| "epoch": 1.8526582278481012, |
| "grad_norm": 0.28385385385120393, |
| "learning_rate": 3.174198097334959e-05, |
| "loss": 0.3248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16951501369476318, |
| "step": 1830, |
| "valid_targets_mean": 4812.1, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 1.8577215189873417, |
| "grad_norm": 0.33205815359378843, |
| "learning_rate": 3.168470657736053e-05, |
| "loss": 0.3306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1585332751274109, |
| "step": 1835, |
| "valid_targets_mean": 5364.6, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 1.8627848101265823, |
| "grad_norm": 0.31689534847164214, |
| "learning_rate": 3.162728632742098e-05, |
| "loss": 0.3115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16908031702041626, |
| "step": 1840, |
| "valid_targets_mean": 4225.1, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 1.8678481012658228, |
| "grad_norm": 0.3087921045352938, |
| "learning_rate": 3.1569720940277267e-05, |
| "loss": 0.3178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17665991187095642, |
| "step": 1845, |
| "valid_targets_mean": 4580.1, |
| "valid_targets_min": 1284 |
| }, |
| { |
| "epoch": 1.8729113924050633, |
| "grad_norm": 0.28162350739466746, |
| "learning_rate": 3.151201113448735e-05, |
| "loss": 0.3198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16834816336631775, |
| "step": 1850, |
| "valid_targets_mean": 5581.1, |
| "valid_targets_min": 1362 |
| }, |
| { |
| "epoch": 1.8779746835443039, |
| "grad_norm": 0.33622728572725646, |
| "learning_rate": 3.1454157630411905e-05, |
| "loss": 0.3297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13378959894180298, |
| "step": 1855, |
| "valid_targets_mean": 3264.8, |
| "valid_targets_min": 1178 |
| }, |
| { |
| "epoch": 1.8830379746835444, |
| "grad_norm": 0.2888883767197038, |
| "learning_rate": 3.1396161150205324e-05, |
| "loss": 0.3243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15173028409481049, |
| "step": 1860, |
| "valid_targets_mean": 5245.6, |
| "valid_targets_min": 1061 |
| }, |
| { |
| "epoch": 1.888101265822785, |
| "grad_norm": 0.3008873149690533, |
| "learning_rate": 3.133802241780669e-05, |
| "loss": 0.3417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.168132483959198, |
| "step": 1865, |
| "valid_targets_mean": 5342.9, |
| "valid_targets_min": 1360 |
| }, |
| { |
| "epoch": 1.8931645569620255, |
| "grad_norm": 0.30961408751335806, |
| "learning_rate": 3.127974215893075e-05, |
| "loss": 0.3319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15519672632217407, |
| "step": 1870, |
| "valid_targets_mean": 4829.4, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 1.8982278481012658, |
| "grad_norm": 0.3375894079078535, |
| "learning_rate": 3.1221321101058826e-05, |
| "loss": 0.3233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2031598687171936, |
| "step": 1875, |
| "valid_targets_mean": 4846.2, |
| "valid_targets_min": 1616 |
| }, |
| { |
| "epoch": 1.9032911392405063, |
| "grad_norm": 0.30102939403192525, |
| "learning_rate": 3.116275997342979e-05, |
| "loss": 0.3328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1768466830253601, |
| "step": 1880, |
| "valid_targets_mean": 5417.4, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 1.9083544303797468, |
| "grad_norm": 0.31204461528240096, |
| "learning_rate": 3.110405950703091e-05, |
| "loss": 0.3286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15786431729793549, |
| "step": 1885, |
| "valid_targets_mean": 4424.1, |
| "valid_targets_min": 1590 |
| }, |
| { |
| "epoch": 1.9134177215189874, |
| "grad_norm": 0.3212411559315451, |
| "learning_rate": 3.104522043458875e-05, |
| "loss": 0.3326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15173178911209106, |
| "step": 1890, |
| "valid_targets_mean": 3546.5, |
| "valid_targets_min": 1048 |
| }, |
| { |
| "epoch": 1.918481012658228, |
| "grad_norm": 0.3477054279687247, |
| "learning_rate": 3.098624349056003e-05, |
| "loss": 0.3131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09834770858287811, |
| "step": 1895, |
| "valid_targets_mean": 3314.4, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 1.9235443037974682, |
| "grad_norm": 0.3224350947488976, |
| "learning_rate": 3.0927129411122433e-05, |
| "loss": 0.3307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1967785656452179, |
| "step": 1900, |
| "valid_targets_mean": 5401.0, |
| "valid_targets_min": 1631 |
| }, |
| { |
| "epoch": 1.9286075949367087, |
| "grad_norm": 0.3407210065894635, |
| "learning_rate": 3.086787893416543e-05, |
| "loss": 0.3344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15977072715759277, |
| "step": 1905, |
| "valid_targets_mean": 3843.9, |
| "valid_targets_min": 1465 |
| }, |
| { |
| "epoch": 1.9336708860759493, |
| "grad_norm": 0.3048824087454436, |
| "learning_rate": 3.080849279928108e-05, |
| "loss": 0.3186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21388033032417297, |
| "step": 1910, |
| "valid_targets_mean": 5811.2, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 1.9387341772151898, |
| "grad_norm": 0.3220507717171466, |
| "learning_rate": 3.074897174775478e-05, |
| "loss": 0.3231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17468535900115967, |
| "step": 1915, |
| "valid_targets_mean": 4189.4, |
| "valid_targets_min": 1442 |
| }, |
| { |
| "epoch": 1.9437974683544303, |
| "grad_norm": 0.33220201972445723, |
| "learning_rate": 3.0689316522556026e-05, |
| "loss": 0.3242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1948956400156021, |
| "step": 1920, |
| "valid_targets_mean": 4742.3, |
| "valid_targets_min": 1598 |
| }, |
| { |
| "epoch": 1.9488607594936709, |
| "grad_norm": 0.32448507249493624, |
| "learning_rate": 3.062952786832912e-05, |
| "loss": 0.3189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1440562605857849, |
| "step": 1925, |
| "valid_targets_mean": 4186.6, |
| "valid_targets_min": 1640 |
| }, |
| { |
| "epoch": 1.9539240506329114, |
| "grad_norm": 0.29766519811078285, |
| "learning_rate": 3.05696065313839e-05, |
| "loss": 0.3306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18304754793643951, |
| "step": 1930, |
| "valid_targets_mean": 6132.7, |
| "valid_targets_min": 1516 |
| }, |
| { |
| "epoch": 1.958987341772152, |
| "grad_norm": 0.2949900786324887, |
| "learning_rate": 3.050955325968641e-05, |
| "loss": 0.3211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15778782963752747, |
| "step": 1935, |
| "valid_targets_mean": 5078.4, |
| "valid_targets_min": 1196 |
| }, |
| { |
| "epoch": 1.9640506329113925, |
| "grad_norm": 0.3263199970381054, |
| "learning_rate": 3.0449368802849553e-05, |
| "loss": 0.3181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14029563963413239, |
| "step": 1940, |
| "valid_targets_mean": 4289.6, |
| "valid_targets_min": 1207 |
| }, |
| { |
| "epoch": 1.969113924050633, |
| "grad_norm": 0.3116697424009326, |
| "learning_rate": 3.0389053912123755e-05, |
| "loss": 0.3215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1622355878353119, |
| "step": 1945, |
| "valid_targets_mean": 4043.3, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 1.9741772151898735, |
| "grad_norm": 0.33957146598689614, |
| "learning_rate": 3.0328609340387584e-05, |
| "loss": 0.319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1829889565706253, |
| "step": 1950, |
| "valid_targets_mean": 3790.2, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 1.979240506329114, |
| "grad_norm": 0.31004887940586384, |
| "learning_rate": 3.026803584213834e-05, |
| "loss": 0.3196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1571284979581833, |
| "step": 1955, |
| "valid_targets_mean": 4538.4, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 1.9843037974683544, |
| "grad_norm": 0.2945095160712328, |
| "learning_rate": 3.0207334173482635e-05, |
| "loss": 0.3223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14519169926643372, |
| "step": 1960, |
| "valid_targets_mean": 3616.2, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 1.989367088607595, |
| "grad_norm": 0.29690655635239654, |
| "learning_rate": 3.0146505092126987e-05, |
| "loss": 0.3159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14115923643112183, |
| "step": 1965, |
| "valid_targets_mean": 4046.1, |
| "valid_targets_min": 1832 |
| }, |
| { |
| "epoch": 1.9944303797468355, |
| "grad_norm": 0.3836659337432429, |
| "learning_rate": 3.0085549357368316e-05, |
| "loss": 0.3245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16044825315475464, |
| "step": 1970, |
| "valid_targets_mean": 4667.9, |
| "valid_targets_min": 1443 |
| }, |
| { |
| "epoch": 1.999493670886076, |
| "grad_norm": 0.3322124150108135, |
| "learning_rate": 3.0024467730084508e-05, |
| "loss": 0.3169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12640810012817383, |
| "step": 1975, |
| "valid_targets_mean": 3170.9, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 2.0040506329113925, |
| "grad_norm": 0.3291075554103832, |
| "learning_rate": 2.996326097272487e-05, |
| "loss": 0.2897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16433456540107727, |
| "step": 1980, |
| "valid_targets_mean": 4258.9, |
| "valid_targets_min": 1370 |
| }, |
| { |
| "epoch": 2.009113924050633, |
| "grad_norm": 0.28624539538450133, |
| "learning_rate": 2.9901929849300676e-05, |
| "loss": 0.3121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.156062513589859, |
| "step": 1985, |
| "valid_targets_mean": 5479.2, |
| "valid_targets_min": 1383 |
| }, |
| { |
| "epoch": 2.0141772151898736, |
| "grad_norm": 0.31864237413570884, |
| "learning_rate": 2.984047512537557e-05, |
| "loss": 0.3086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17700161039829254, |
| "step": 1990, |
| "valid_targets_mean": 4326.2, |
| "valid_targets_min": 1491 |
| }, |
| { |
| "epoch": 2.019240506329114, |
| "grad_norm": 0.29138155253699194, |
| "learning_rate": 2.977889756805604e-05, |
| "loss": 0.2973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19598735868930817, |
| "step": 1995, |
| "valid_targets_mean": 5823.9, |
| "valid_targets_min": 1470 |
| }, |
| { |
| "epoch": 2.0243037974683546, |
| "grad_norm": 0.32618376749689376, |
| "learning_rate": 2.9717197945981844e-05, |
| "loss": 0.3078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14639677107334137, |
| "step": 2000, |
| "valid_targets_mean": 3956.3, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 2.0293670886075947, |
| "grad_norm": 0.3231822134904899, |
| "learning_rate": 2.9655377029316415e-05, |
| "loss": 0.3038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1973341703414917, |
| "step": 2005, |
| "valid_targets_mean": 6070.5, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 2.0344303797468353, |
| "grad_norm": 0.4445885950556669, |
| "learning_rate": 2.9593435589737212e-05, |
| "loss": 0.3081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1424170434474945, |
| "step": 2010, |
| "valid_targets_mean": 3355.1, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 2.039493670886076, |
| "grad_norm": 0.31012702805843667, |
| "learning_rate": 2.9531374400426158e-05, |
| "loss": 0.3029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17267721891403198, |
| "step": 2015, |
| "valid_targets_mean": 5018.6, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 2.0445569620253163, |
| "grad_norm": 0.27456099255552485, |
| "learning_rate": 2.9469194236059916e-05, |
| "loss": 0.3109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18913531303405762, |
| "step": 2020, |
| "valid_targets_mean": 6316.9, |
| "valid_targets_min": 1565 |
| }, |
| { |
| "epoch": 2.049620253164557, |
| "grad_norm": 0.30759866121772944, |
| "learning_rate": 2.940689587280027e-05, |
| "loss": 0.3056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17620842158794403, |
| "step": 2025, |
| "valid_targets_mean": 5025.1, |
| "valid_targets_min": 1103 |
| }, |
| { |
| "epoch": 2.0546835443037974, |
| "grad_norm": 0.3107498769401775, |
| "learning_rate": 2.9344480088284403e-05, |
| "loss": 0.3108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14356273412704468, |
| "step": 2030, |
| "valid_targets_mean": 3878.3, |
| "valid_targets_min": 1435 |
| }, |
| { |
| "epoch": 2.059746835443038, |
| "grad_norm": 0.3272342894958522, |
| "learning_rate": 2.9281947661615206e-05, |
| "loss": 0.3141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11045265197753906, |
| "step": 2035, |
| "valid_targets_mean": 2769.6, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 2.0648101265822785, |
| "grad_norm": 0.28376297804532025, |
| "learning_rate": 2.921929937335157e-05, |
| "loss": 0.3134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18254786729812622, |
| "step": 2040, |
| "valid_targets_mean": 6384.8, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 2.069873417721519, |
| "grad_norm": 0.3494712370742931, |
| "learning_rate": 2.9156536005498616e-05, |
| "loss": 0.3226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15539231896400452, |
| "step": 2045, |
| "valid_targets_mean": 3678.8, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 2.0749367088607595, |
| "grad_norm": 0.36306320132408093, |
| "learning_rate": 2.909365834149792e-05, |
| "loss": 0.3188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16074064373970032, |
| "step": 2050, |
| "valid_targets_mean": 3803.6, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 2.08, |
| "grad_norm": 0.28771743850152404, |
| "learning_rate": 2.903066716621779e-05, |
| "loss": 0.3257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17194947600364685, |
| "step": 2055, |
| "valid_targets_mean": 6007.1, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 2.0850632911392406, |
| "grad_norm": 0.3176958806269076, |
| "learning_rate": 2.896756326594341e-05, |
| "loss": 0.3174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15832051634788513, |
| "step": 2060, |
| "valid_targets_mean": 4807.6, |
| "valid_targets_min": 1533 |
| }, |
| { |
| "epoch": 2.090126582278481, |
| "grad_norm": 0.30643347389492315, |
| "learning_rate": 2.890434742836706e-05, |
| "loss": 0.3061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17868554592132568, |
| "step": 2065, |
| "valid_targets_mean": 5870.9, |
| "valid_targets_min": 1477 |
| }, |
| { |
| "epoch": 2.0951898734177217, |
| "grad_norm": 0.328300503212321, |
| "learning_rate": 2.8841020442578274e-05, |
| "loss": 0.3219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15090826153755188, |
| "step": 2070, |
| "valid_targets_mean": 4159.4, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 2.100253164556962, |
| "grad_norm": 0.3116451598810816, |
| "learning_rate": 2.8777583099053985e-05, |
| "loss": 0.3096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15223953127861023, |
| "step": 2075, |
| "valid_targets_mean": 4922.9, |
| "valid_targets_min": 1236 |
| }, |
| { |
| "epoch": 2.1053164556962027, |
| "grad_norm": 0.32927381366700853, |
| "learning_rate": 2.871403618964867e-05, |
| "loss": 0.3177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18153706192970276, |
| "step": 2080, |
| "valid_targets_mean": 4833.8, |
| "valid_targets_min": 1513 |
| }, |
| { |
| "epoch": 2.110379746835443, |
| "grad_norm": 0.30099077420276216, |
| "learning_rate": 2.8650380507584444e-05, |
| "loss": 0.3185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11155495047569275, |
| "step": 2085, |
| "valid_targets_mean": 3890.5, |
| "valid_targets_min": 1469 |
| }, |
| { |
| "epoch": 2.1154430379746834, |
| "grad_norm": 0.304896658143913, |
| "learning_rate": 2.8586616847441192e-05, |
| "loss": 0.3203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.143421471118927, |
| "step": 2090, |
| "valid_targets_mean": 4747.4, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 2.120506329113924, |
| "grad_norm": 0.33627609235395134, |
| "learning_rate": 2.852274600514662e-05, |
| "loss": 0.3236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17665691673755646, |
| "step": 2095, |
| "valid_targets_mean": 4558.9, |
| "valid_targets_min": 1540 |
| }, |
| { |
| "epoch": 2.1255696202531644, |
| "grad_norm": 0.3025889533254811, |
| "learning_rate": 2.8458768777966333e-05, |
| "loss": 0.3151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16682836413383484, |
| "step": 2100, |
| "valid_targets_mean": 5740.6, |
| "valid_targets_min": 1809 |
| }, |
| { |
| "epoch": 2.130632911392405, |
| "grad_norm": 0.3039388867958498, |
| "learning_rate": 2.8394685964493886e-05, |
| "loss": 0.3029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0811905711889267, |
| "step": 2105, |
| "valid_targets_mean": 3185.6, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 2.1356962025316455, |
| "grad_norm": 0.34645798201468236, |
| "learning_rate": 2.8330498364640803e-05, |
| "loss": 0.3169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20455661416053772, |
| "step": 2110, |
| "valid_targets_mean": 5101.9, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 2.140759493670886, |
| "grad_norm": 0.2965620255799478, |
| "learning_rate": 2.8266206779626604e-05, |
| "loss": 0.2991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15685412287712097, |
| "step": 2115, |
| "valid_targets_mean": 5286.0, |
| "valid_targets_min": 1289 |
| }, |
| { |
| "epoch": 2.1458227848101266, |
| "grad_norm": 0.3555931137634147, |
| "learning_rate": 2.8201812011968807e-05, |
| "loss": 0.3027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16602477431297302, |
| "step": 2120, |
| "valid_targets_mean": 4031.6, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 2.150886075949367, |
| "grad_norm": 0.31549642905504277, |
| "learning_rate": 2.8137314865472896e-05, |
| "loss": 0.3115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2147747278213501, |
| "step": 2125, |
| "valid_targets_mean": 5917.6, |
| "valid_targets_min": 1516 |
| }, |
| { |
| "epoch": 2.1559493670886076, |
| "grad_norm": 0.3817360788487001, |
| "learning_rate": 2.8072716145222295e-05, |
| "loss": 0.3204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1429363489151001, |
| "step": 2130, |
| "valid_targets_mean": 4846.5, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 2.161012658227848, |
| "grad_norm": 0.29099253723913165, |
| "learning_rate": 2.800801665756833e-05, |
| "loss": 0.3076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1667858213186264, |
| "step": 2135, |
| "valid_targets_mean": 5250.2, |
| "valid_targets_min": 1352 |
| }, |
| { |
| "epoch": 2.1660759493670887, |
| "grad_norm": 0.31033307443976493, |
| "learning_rate": 2.794321721012013e-05, |
| "loss": 0.3174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15342216193675995, |
| "step": 2140, |
| "valid_targets_mean": 4172.6, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 2.1711392405063292, |
| "grad_norm": 0.32002549909894445, |
| "learning_rate": 2.78783186117346e-05, |
| "loss": 0.3136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1935744285583496, |
| "step": 2145, |
| "valid_targets_mean": 5775.0, |
| "valid_targets_min": 1696 |
| }, |
| { |
| "epoch": 2.1762025316455698, |
| "grad_norm": 0.3337487659466844, |
| "learning_rate": 2.7813321672506268e-05, |
| "loss": 0.3176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19408701360225677, |
| "step": 2150, |
| "valid_targets_mean": 5285.5, |
| "valid_targets_min": 1837 |
| }, |
| { |
| "epoch": 2.1812658227848103, |
| "grad_norm": 0.30999599957531293, |
| "learning_rate": 2.77482272037572e-05, |
| "loss": 0.3085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16555137932300568, |
| "step": 2155, |
| "valid_targets_mean": 4545.2, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 2.186329113924051, |
| "grad_norm": 0.32893298945558314, |
| "learning_rate": 2.768303601802689e-05, |
| "loss": 0.3059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15684665739536285, |
| "step": 2160, |
| "valid_targets_mean": 3914.8, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 2.191392405063291, |
| "grad_norm": 0.32177861173163685, |
| "learning_rate": 2.7617748929062084e-05, |
| "loss": 0.3113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13835042715072632, |
| "step": 2165, |
| "valid_targets_mean": 4624.2, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 2.1964556962025314, |
| "grad_norm": 0.2604316010544582, |
| "learning_rate": 2.7552366751806624e-05, |
| "loss": 0.296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14997389912605286, |
| "step": 2170, |
| "valid_targets_mean": 6796.2, |
| "valid_targets_min": 1292 |
| }, |
| { |
| "epoch": 2.201518987341772, |
| "grad_norm": 0.30476092949327993, |
| "learning_rate": 2.7486890302391316e-05, |
| "loss": 0.3064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1621738076210022, |
| "step": 2175, |
| "valid_targets_mean": 5079.0, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 2.2065822784810125, |
| "grad_norm": 0.3322580301103298, |
| "learning_rate": 2.7421320398123702e-05, |
| "loss": 0.3199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1476869136095047, |
| "step": 2180, |
| "valid_targets_mean": 3784.2, |
| "valid_targets_min": 1640 |
| }, |
| { |
| "epoch": 2.211645569620253, |
| "grad_norm": 0.2990722276821268, |
| "learning_rate": 2.735565785747787e-05, |
| "loss": 0.3077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13568082451820374, |
| "step": 2185, |
| "valid_targets_mean": 4330.4, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 2.2167088607594936, |
| "grad_norm": 0.30616718547526817, |
| "learning_rate": 2.728990350008423e-05, |
| "loss": 0.3215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17533037066459656, |
| "step": 2190, |
| "valid_targets_mean": 5132.6, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 2.221772151898734, |
| "grad_norm": 0.28127500881615763, |
| "learning_rate": 2.722405814671931e-05, |
| "loss": 0.2974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.134933739900589, |
| "step": 2195, |
| "valid_targets_mean": 5636.6, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 2.2268354430379746, |
| "grad_norm": 0.27748602615715384, |
| "learning_rate": 2.715812261929548e-05, |
| "loss": 0.3208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1636897474527359, |
| "step": 2200, |
| "valid_targets_mean": 5998.6, |
| "valid_targets_min": 1351 |
| }, |
| { |
| "epoch": 2.231898734177215, |
| "grad_norm": 0.3255757575300295, |
| "learning_rate": 2.7092097740850712e-05, |
| "loss": 0.3094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1682029664516449, |
| "step": 2205, |
| "valid_targets_mean": 4255.6, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 2.2369620253164557, |
| "grad_norm": 0.30015032841488015, |
| "learning_rate": 2.7025984335538297e-05, |
| "loss": 0.3163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1712615191936493, |
| "step": 2210, |
| "valid_targets_mean": 5242.7, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 2.2420253164556962, |
| "grad_norm": 0.35257346632541897, |
| "learning_rate": 2.6959783228616543e-05, |
| "loss": 0.3258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14988690614700317, |
| "step": 2215, |
| "valid_targets_mean": 3744.8, |
| "valid_targets_min": 1368 |
| }, |
| { |
| "epoch": 2.247088607594937, |
| "grad_norm": 0.34270763531215714, |
| "learning_rate": 2.6893495246438512e-05, |
| "loss": 0.3099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13658785820007324, |
| "step": 2220, |
| "valid_targets_mean": 3438.7, |
| "valid_targets_min": 1173 |
| }, |
| { |
| "epoch": 2.2521518987341773, |
| "grad_norm": 0.3370660380071177, |
| "learning_rate": 2.682712121644168e-05, |
| "loss": 0.3137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1949615478515625, |
| "step": 2225, |
| "valid_targets_mean": 4599.9, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 2.257215189873418, |
| "grad_norm": 0.348355336462014, |
| "learning_rate": 2.6760661967137597e-05, |
| "loss": 0.3047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16294927895069122, |
| "step": 2230, |
| "valid_targets_mean": 4107.5, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 2.2622784810126584, |
| "grad_norm": 0.3249186301351007, |
| "learning_rate": 2.6694118328101592e-05, |
| "loss": 0.3144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09672749042510986, |
| "step": 2235, |
| "valid_targets_mean": 2920.3, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 2.267341772151899, |
| "grad_norm": 0.30303571071751967, |
| "learning_rate": 2.6627491129962343e-05, |
| "loss": 0.2928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1442355215549469, |
| "step": 2240, |
| "valid_targets_mean": 4454.2, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 2.2724050632911394, |
| "grad_norm": 0.31715305103924707, |
| "learning_rate": 2.6560781204391584e-05, |
| "loss": 0.3084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10361987352371216, |
| "step": 2245, |
| "valid_targets_mean": 3143.1, |
| "valid_targets_min": 1447 |
| }, |
| { |
| "epoch": 2.27746835443038, |
| "grad_norm": 0.28484792889639327, |
| "learning_rate": 2.6493989384093674e-05, |
| "loss": 0.3142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14160794019699097, |
| "step": 2250, |
| "valid_targets_mean": 4650.6, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 2.28253164556962, |
| "grad_norm": 0.2878082890562957, |
| "learning_rate": 2.642711650279523e-05, |
| "loss": 0.3094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1957184076309204, |
| "step": 2255, |
| "valid_targets_mean": 5700.1, |
| "valid_targets_min": 1450 |
| }, |
| { |
| "epoch": 2.2875949367088606, |
| "grad_norm": 0.28921634890872305, |
| "learning_rate": 2.636016339523472e-05, |
| "loss": 0.3086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1497688591480255, |
| "step": 2260, |
| "valid_targets_mean": 5892.9, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 2.292658227848101, |
| "grad_norm": 0.374304372121314, |
| "learning_rate": 2.6293130897152005e-05, |
| "loss": 0.3046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10483106970787048, |
| "step": 2265, |
| "valid_targets_mean": 2732.1, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 2.2977215189873417, |
| "grad_norm": 0.360265224368032, |
| "learning_rate": 2.6226019845277954e-05, |
| "loss": 0.3026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15251410007476807, |
| "step": 2270, |
| "valid_targets_mean": 3089.3, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 2.302784810126582, |
| "grad_norm": 0.3076018448534471, |
| "learning_rate": 2.615883107732398e-05, |
| "loss": 0.2996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10678346455097198, |
| "step": 2275, |
| "valid_targets_mean": 3471.9, |
| "valid_targets_min": 1050 |
| }, |
| { |
| "epoch": 2.3078481012658227, |
| "grad_norm": 0.30671877576562406, |
| "learning_rate": 2.609156543197158e-05, |
| "loss": 0.3101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18611571192741394, |
| "step": 2280, |
| "valid_targets_mean": 5213.1, |
| "valid_targets_min": 1379 |
| }, |
| { |
| "epoch": 2.3129113924050633, |
| "grad_norm": 0.42457395280342314, |
| "learning_rate": 2.6024223748861883e-05, |
| "loss": 0.3039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17773228883743286, |
| "step": 2285, |
| "valid_targets_mean": 5313.4, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 2.317974683544304, |
| "grad_norm": 0.343397113662205, |
| "learning_rate": 2.5956806868585136e-05, |
| "loss": 0.305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1606595367193222, |
| "step": 2290, |
| "valid_targets_mean": 3827.6, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 2.3230379746835443, |
| "grad_norm": 0.2808278753890521, |
| "learning_rate": 2.5889315632670247e-05, |
| "loss": 0.3132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11440195143222809, |
| "step": 2295, |
| "valid_targets_mean": 3889.9, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 2.328101265822785, |
| "grad_norm": 0.3112053561319972, |
| "learning_rate": 2.582175088357426e-05, |
| "loss": 0.3108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14229443669319153, |
| "step": 2300, |
| "valid_targets_mean": 3906.9, |
| "valid_targets_min": 1129 |
| }, |
| { |
| "epoch": 2.3331645569620254, |
| "grad_norm": 0.29738973838136984, |
| "learning_rate": 2.575411346467185e-05, |
| "loss": 0.304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12370048463344574, |
| "step": 2305, |
| "valid_targets_mean": 4034.3, |
| "valid_targets_min": 1620 |
| }, |
| { |
| "epoch": 2.338227848101266, |
| "grad_norm": 0.3012147807699108, |
| "learning_rate": 2.568640422024478e-05, |
| "loss": 0.3076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2278967797756195, |
| "step": 2310, |
| "valid_targets_mean": 5961.9, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 2.3432911392405065, |
| "grad_norm": 0.2922942701946769, |
| "learning_rate": 2.5618623995471394e-05, |
| "loss": 0.3133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16622743010520935, |
| "step": 2315, |
| "valid_targets_mean": 5404.4, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 2.348354430379747, |
| "grad_norm": 0.36432427585365534, |
| "learning_rate": 2.5550773636416008e-05, |
| "loss": 0.3196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1854952722787857, |
| "step": 2320, |
| "valid_targets_mean": 3965.4, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 2.353417721518987, |
| "grad_norm": 0.33468505049542446, |
| "learning_rate": 2.548285399001843e-05, |
| "loss": 0.3099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15984870493412018, |
| "step": 2325, |
| "valid_targets_mean": 3767.3, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 2.3584810126582276, |
| "grad_norm": 0.30206170793614096, |
| "learning_rate": 2.5414865904083314e-05, |
| "loss": 0.3161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18496757745742798, |
| "step": 2330, |
| "valid_targets_mean": 5605.0, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 2.363544303797468, |
| "grad_norm": 0.3069574368019458, |
| "learning_rate": 2.534681022726962e-05, |
| "loss": 0.3143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20892611145973206, |
| "step": 2335, |
| "valid_targets_mean": 5443.6, |
| "valid_targets_min": 1904 |
| }, |
| { |
| "epoch": 2.3686075949367087, |
| "grad_norm": 0.324406187683953, |
| "learning_rate": 2.5278687809080017e-05, |
| "loss": 0.3157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13418112695217133, |
| "step": 2340, |
| "valid_targets_mean": 3362.5, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 2.3736708860759492, |
| "grad_norm": 0.32283224636579144, |
| "learning_rate": 2.5210499499850252e-05, |
| "loss": 0.3236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14372019469738007, |
| "step": 2345, |
| "valid_targets_mean": 3757.2, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 2.3787341772151898, |
| "grad_norm": 0.2954201993306155, |
| "learning_rate": 2.5142246150738566e-05, |
| "loss": 0.3132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16226419806480408, |
| "step": 2350, |
| "valid_targets_mean": 5083.2, |
| "valid_targets_min": 1909 |
| }, |
| { |
| "epoch": 2.3837974683544303, |
| "grad_norm": 0.278033728430402, |
| "learning_rate": 2.5073928613715053e-05, |
| "loss": 0.3122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13732075691223145, |
| "step": 2355, |
| "valid_targets_mean": 5177.6, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 2.388860759493671, |
| "grad_norm": 0.3406821151852307, |
| "learning_rate": 2.5005547741551045e-05, |
| "loss": 0.3207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1702435463666916, |
| "step": 2360, |
| "valid_targets_mean": 3885.0, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 2.3939240506329114, |
| "grad_norm": 0.2924901782943758, |
| "learning_rate": 2.4937104387808434e-05, |
| "loss": 0.3117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17096886038780212, |
| "step": 2365, |
| "valid_targets_mean": 5283.7, |
| "valid_targets_min": 1374 |
| }, |
| { |
| "epoch": 2.398987341772152, |
| "grad_norm": 0.30986779863862535, |
| "learning_rate": 2.4868599406829045e-05, |
| "loss": 0.308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17868509888648987, |
| "step": 2370, |
| "valid_targets_mean": 4610.5, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 2.4040506329113924, |
| "grad_norm": 0.2951664773380052, |
| "learning_rate": 2.4800033653723962e-05, |
| "loss": 0.3137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14138385653495789, |
| "step": 2375, |
| "valid_targets_mean": 4383.0, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 2.409113924050633, |
| "grad_norm": 0.3206066119244924, |
| "learning_rate": 2.473140798436285e-05, |
| "loss": 0.3221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.150266632437706, |
| "step": 2380, |
| "valid_targets_mean": 3835.7, |
| "valid_targets_min": 1476 |
| }, |
| { |
| "epoch": 2.4141772151898735, |
| "grad_norm": 0.30473370037176944, |
| "learning_rate": 2.466272325536329e-05, |
| "loss": 0.3015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19058401882648468, |
| "step": 2385, |
| "valid_targets_mean": 6384.8, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 2.419240506329114, |
| "grad_norm": 0.31479938811797176, |
| "learning_rate": 2.4593980324080054e-05, |
| "loss": 0.3267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11872898042201996, |
| "step": 2390, |
| "valid_targets_mean": 3557.1, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 2.4243037974683546, |
| "grad_norm": 0.3392666541666469, |
| "learning_rate": 2.4525180048594452e-05, |
| "loss": 0.3163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15524475276470184, |
| "step": 2395, |
| "valid_targets_mean": 4042.5, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 2.429367088607595, |
| "grad_norm": 0.3116160865837986, |
| "learning_rate": 2.445632328770354e-05, |
| "loss": 0.3079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14736303687095642, |
| "step": 2400, |
| "valid_targets_mean": 4778.8, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 2.4344303797468356, |
| "grad_norm": 0.3248761370284341, |
| "learning_rate": 2.438741090090951e-05, |
| "loss": 0.3148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1985064595937729, |
| "step": 2405, |
| "valid_targets_mean": 6140.9, |
| "valid_targets_min": 1429 |
| }, |
| { |
| "epoch": 2.439493670886076, |
| "grad_norm": 0.2819598660386808, |
| "learning_rate": 2.431844374840886e-05, |
| "loss": 0.3066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13578057289123535, |
| "step": 2410, |
| "valid_targets_mean": 4853.0, |
| "valid_targets_min": 1602 |
| }, |
| { |
| "epoch": 2.4445569620253167, |
| "grad_norm": 0.31885986982040326, |
| "learning_rate": 2.4249422691081722e-05, |
| "loss": 0.3057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15936186909675598, |
| "step": 2415, |
| "valid_targets_mean": 4181.2, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 2.449620253164557, |
| "grad_norm": 0.30296726343845826, |
| "learning_rate": 2.4180348590481075e-05, |
| "loss": 0.3026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12165558338165283, |
| "step": 2420, |
| "valid_targets_mean": 3419.1, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 2.4546835443037973, |
| "grad_norm": 0.309483869681844, |
| "learning_rate": 2.411122230882203e-05, |
| "loss": 0.3102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1562597155570984, |
| "step": 2425, |
| "valid_targets_mean": 4920.2, |
| "valid_targets_min": 983 |
| }, |
| { |
| "epoch": 2.459746835443038, |
| "grad_norm": 1.2885193054997446, |
| "learning_rate": 2.4042044708971027e-05, |
| "loss": 0.3045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1394486129283905, |
| "step": 2430, |
| "valid_targets_mean": 4328.4, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 2.4648101265822784, |
| "grad_norm": 0.27206002510649857, |
| "learning_rate": 2.3972816654435103e-05, |
| "loss": 0.3161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16065040230751038, |
| "step": 2435, |
| "valid_targets_mean": 6525.3, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 2.469873417721519, |
| "grad_norm": 0.3427940884240252, |
| "learning_rate": 2.390353900935107e-05, |
| "loss": 0.3198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19091764092445374, |
| "step": 2440, |
| "valid_targets_mean": 4360.0, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 2.4749367088607594, |
| "grad_norm": 0.42327373841330385, |
| "learning_rate": 2.3834212638474773e-05, |
| "loss": 0.306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12319037318229675, |
| "step": 2445, |
| "valid_targets_mean": 3837.3, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 2.48, |
| "grad_norm": 0.49287136211086113, |
| "learning_rate": 2.376483840717026e-05, |
| "loss": 0.3236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15457025170326233, |
| "step": 2450, |
| "valid_targets_mean": 3929.6, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 2.4850632911392405, |
| "grad_norm": 0.32265608836896076, |
| "learning_rate": 2.3695417181399004e-05, |
| "loss": 0.3138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13117042183876038, |
| "step": 2455, |
| "valid_targets_mean": 3683.8, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 2.490126582278481, |
| "grad_norm": 0.28497626230687617, |
| "learning_rate": 2.362594982770909e-05, |
| "loss": 0.3071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13846123218536377, |
| "step": 2460, |
| "valid_targets_mean": 4725.8, |
| "valid_targets_min": 1651 |
| }, |
| { |
| "epoch": 2.4951898734177216, |
| "grad_norm": 0.30556606202877784, |
| "learning_rate": 2.3556437213224378e-05, |
| "loss": 0.3149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1903924196958542, |
| "step": 2465, |
| "valid_targets_mean": 5195.9, |
| "valid_targets_min": 1317 |
| }, |
| { |
| "epoch": 2.500253164556962, |
| "grad_norm": 0.2957801020557521, |
| "learning_rate": 2.348688020563371e-05, |
| "loss": 0.3202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15225407481193542, |
| "step": 2470, |
| "valid_targets_mean": 4614.5, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 2.5053164556962026, |
| "grad_norm": 0.29068264222113155, |
| "learning_rate": 2.3417279673180048e-05, |
| "loss": 0.312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15005727112293243, |
| "step": 2475, |
| "valid_targets_mean": 5253.2, |
| "valid_targets_min": 1364 |
| }, |
| { |
| "epoch": 2.510379746835443, |
| "grad_norm": 0.34824655792906656, |
| "learning_rate": 2.3347636484649662e-05, |
| "loss": 0.3107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11774547398090363, |
| "step": 2480, |
| "valid_targets_mean": 3077.8, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 2.5154430379746833, |
| "grad_norm": 0.3255931573908884, |
| "learning_rate": 2.3277951509361273e-05, |
| "loss": 0.3317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20479710400104523, |
| "step": 2485, |
| "valid_targets_mean": 5133.7, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 2.520506329113924, |
| "grad_norm": 0.30263280385351665, |
| "learning_rate": 2.3208225617155206e-05, |
| "loss": 0.3121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14676184952259064, |
| "step": 2490, |
| "valid_targets_mean": 4788.9, |
| "valid_targets_min": 1004 |
| }, |
| { |
| "epoch": 2.5255696202531643, |
| "grad_norm": 0.34344447055299104, |
| "learning_rate": 2.3138459678382524e-05, |
| "loss": 0.3156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18363483250141144, |
| "step": 2495, |
| "valid_targets_mean": 4170.4, |
| "valid_targets_min": 1007 |
| }, |
| { |
| "epoch": 2.530632911392405, |
| "grad_norm": 0.2844384480121892, |
| "learning_rate": 2.3068654563894183e-05, |
| "loss": 0.3172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12592104077339172, |
| "step": 2500, |
| "valid_targets_mean": 4493.2, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 2.5356962025316454, |
| "grad_norm": 0.32631729959150463, |
| "learning_rate": 2.2998811145030117e-05, |
| "loss": 0.3101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15357106924057007, |
| "step": 2505, |
| "valid_targets_mean": 4361.8, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 2.540759493670886, |
| "grad_norm": 0.2650853449197667, |
| "learning_rate": 2.2928930293608435e-05, |
| "loss": 0.307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13759788870811462, |
| "step": 2510, |
| "valid_targets_mean": 5130.8, |
| "valid_targets_min": 1080 |
| }, |
| { |
| "epoch": 2.5458227848101265, |
| "grad_norm": 0.3267807848788021, |
| "learning_rate": 2.2859012881914464e-05, |
| "loss": 0.3037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16794613003730774, |
| "step": 2515, |
| "valid_targets_mean": 4673.6, |
| "valid_targets_min": 1083 |
| }, |
| { |
| "epoch": 2.550886075949367, |
| "grad_norm": 0.278879282582265, |
| "learning_rate": 2.278905978268992e-05, |
| "loss": 0.2928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11442182958126068, |
| "step": 2520, |
| "valid_targets_mean": 4874.6, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 2.5559493670886075, |
| "grad_norm": 0.32085560175743244, |
| "learning_rate": 2.271907186912196e-05, |
| "loss": 0.3119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12187394499778748, |
| "step": 2525, |
| "valid_targets_mean": 3503.1, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 2.561012658227848, |
| "grad_norm": 0.3284259732307929, |
| "learning_rate": 2.2649050014832326e-05, |
| "loss": 0.3112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16201844811439514, |
| "step": 2530, |
| "valid_targets_mean": 4727.4, |
| "valid_targets_min": 1505 |
| }, |
| { |
| "epoch": 2.5660759493670886, |
| "grad_norm": 0.2991569094124765, |
| "learning_rate": 2.2578995093866424e-05, |
| "loss": 0.3126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1367436945438385, |
| "step": 2535, |
| "valid_targets_mean": 5286.4, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 2.571139240506329, |
| "grad_norm": 0.2923839601296598, |
| "learning_rate": 2.2508907980682406e-05, |
| "loss": 0.3066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15937817096710205, |
| "step": 2540, |
| "valid_targets_mean": 5033.3, |
| "valid_targets_min": 1409 |
| }, |
| { |
| "epoch": 2.5762025316455697, |
| "grad_norm": 0.29834149017437644, |
| "learning_rate": 2.2438789550140272e-05, |
| "loss": 0.3208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1662355363368988, |
| "step": 2545, |
| "valid_targets_mean": 4474.9, |
| "valid_targets_min": 1458 |
| }, |
| { |
| "epoch": 2.58126582278481, |
| "grad_norm": 0.31248285204558157, |
| "learning_rate": 2.2368640677490935e-05, |
| "loss": 0.3111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12987586855888367, |
| "step": 2550, |
| "valid_targets_mean": 4253.7, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 2.5863291139240507, |
| "grad_norm": 0.2913592791130016, |
| "learning_rate": 2.2298462238365293e-05, |
| "loss": 0.3037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20642492175102234, |
| "step": 2555, |
| "valid_targets_mean": 6304.3, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 2.5913924050632913, |
| "grad_norm": 0.35349413261981677, |
| "learning_rate": 2.222825510876332e-05, |
| "loss": 0.3202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17145583033561707, |
| "step": 2560, |
| "valid_targets_mean": 4713.6, |
| "valid_targets_min": 1409 |
| }, |
| { |
| "epoch": 2.596455696202532, |
| "grad_norm": 0.3451688511848506, |
| "learning_rate": 2.2158020165043114e-05, |
| "loss": 0.3105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16764461994171143, |
| "step": 2565, |
| "valid_targets_mean": 3924.4, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 2.6015189873417723, |
| "grad_norm": 0.2797909726976478, |
| "learning_rate": 2.2087758283909954e-05, |
| "loss": 0.3196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1547449380159378, |
| "step": 2570, |
| "valid_targets_mean": 5481.8, |
| "valid_targets_min": 1376 |
| }, |
| { |
| "epoch": 2.606582278481013, |
| "grad_norm": 0.3101010476898593, |
| "learning_rate": 2.201747034240537e-05, |
| "loss": 0.3135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1627534031867981, |
| "step": 2575, |
| "valid_targets_mean": 4466.9, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 2.6116455696202534, |
| "grad_norm": 1.1618173704395123, |
| "learning_rate": 2.1947157217896188e-05, |
| "loss": 0.3095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.165956050157547, |
| "step": 2580, |
| "valid_targets_mean": 4300.5, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 2.616708860759494, |
| "grad_norm": 0.31858634458407287, |
| "learning_rate": 2.1876819788063586e-05, |
| "loss": 0.3115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15230509638786316, |
| "step": 2585, |
| "valid_targets_mean": 3920.5, |
| "valid_targets_min": 1479 |
| }, |
| { |
| "epoch": 2.621772151898734, |
| "grad_norm": 0.30557996470586596, |
| "learning_rate": 2.1806458930892127e-05, |
| "loss": 0.3005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18883772194385529, |
| "step": 2590, |
| "valid_targets_mean": 6008.9, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 2.6268354430379746, |
| "grad_norm": 0.2883450262202285, |
| "learning_rate": 2.173607552465881e-05, |
| "loss": 0.3166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17338699102401733, |
| "step": 2595, |
| "valid_targets_mean": 5570.2, |
| "valid_targets_min": 1526 |
| }, |
| { |
| "epoch": 2.631898734177215, |
| "grad_norm": 0.33234113394369846, |
| "learning_rate": 2.1665670447922084e-05, |
| "loss": 0.3129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12816452980041504, |
| "step": 2600, |
| "valid_targets_mean": 4282.2, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 2.6369620253164556, |
| "grad_norm": 0.31643919888427663, |
| "learning_rate": 2.1595244579510933e-05, |
| "loss": 0.3073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17621192336082458, |
| "step": 2605, |
| "valid_targets_mean": 5060.8, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 2.642025316455696, |
| "grad_norm": 0.30039427757871706, |
| "learning_rate": 2.1524798798513835e-05, |
| "loss": 0.3023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16294711828231812, |
| "step": 2610, |
| "valid_targets_mean": 4472.4, |
| "valid_targets_min": 1304 |
| }, |
| { |
| "epoch": 2.6470886075949367, |
| "grad_norm": 0.3231328181820057, |
| "learning_rate": 2.1454333984267852e-05, |
| "loss": 0.322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16857695579528809, |
| "step": 2615, |
| "valid_targets_mean": 5128.5, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 2.6521518987341772, |
| "grad_norm": 0.331376941255876, |
| "learning_rate": 2.1383851016347614e-05, |
| "loss": 0.3105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1293996274471283, |
| "step": 2620, |
| "valid_targets_mean": 3696.2, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 2.6572151898734178, |
| "grad_norm": 0.2898986778677013, |
| "learning_rate": 2.1313350774554366e-05, |
| "loss": 0.308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14066889882087708, |
| "step": 2625, |
| "valid_targets_mean": 4409.5, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 2.6622784810126583, |
| "grad_norm": 0.3792545064079998, |
| "learning_rate": 2.1242834138904962e-05, |
| "loss": 0.3034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14408881962299347, |
| "step": 2630, |
| "valid_targets_mean": 3892.1, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 2.667341772151899, |
| "grad_norm": 0.34582044479522395, |
| "learning_rate": 2.1172301989620898e-05, |
| "loss": 0.3087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15445685386657715, |
| "step": 2635, |
| "valid_targets_mean": 4015.2, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 2.6724050632911394, |
| "grad_norm": 0.31734348855671907, |
| "learning_rate": 2.110175520711731e-05, |
| "loss": 0.3182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14247769117355347, |
| "step": 2640, |
| "valid_targets_mean": 4152.1, |
| "valid_targets_min": 1532 |
| }, |
| { |
| "epoch": 2.67746835443038, |
| "grad_norm": 0.3108375470698165, |
| "learning_rate": 2.1031194671992013e-05, |
| "loss": 0.3145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13973818719387054, |
| "step": 2645, |
| "valid_targets_mean": 4321.8, |
| "valid_targets_min": 1096 |
| }, |
| { |
| "epoch": 2.68253164556962, |
| "grad_norm": 0.3378134291776038, |
| "learning_rate": 2.0960621265014462e-05, |
| "loss": 0.3105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17127710580825806, |
| "step": 2650, |
| "valid_targets_mean": 4009.1, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 2.6875949367088605, |
| "grad_norm": 0.29939660412855834, |
| "learning_rate": 2.0890035867114808e-05, |
| "loss": 0.3131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15695559978485107, |
| "step": 2655, |
| "valid_targets_mean": 5238.8, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 2.692658227848101, |
| "grad_norm": 0.3230482978021318, |
| "learning_rate": 2.081943935937286e-05, |
| "loss": 0.3075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1587713658809662, |
| "step": 2660, |
| "valid_targets_mean": 4748.3, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 2.6977215189873416, |
| "grad_norm": 0.29402248645547446, |
| "learning_rate": 2.0748832623007117e-05, |
| "loss": 0.3217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10896088182926178, |
| "step": 2665, |
| "valid_targets_mean": 3750.2, |
| "valid_targets_min": 1426 |
| }, |
| { |
| "epoch": 2.702784810126582, |
| "grad_norm": 0.27936531158953143, |
| "learning_rate": 2.067821653936375e-05, |
| "loss": 0.3005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1711559295654297, |
| "step": 2670, |
| "valid_targets_mean": 6852.6, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 2.7078481012658226, |
| "grad_norm": 0.28924656402783777, |
| "learning_rate": 2.060759198990561e-05, |
| "loss": 0.3086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14176371693611145, |
| "step": 2675, |
| "valid_targets_mean": 5084.8, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 2.712911392405063, |
| "grad_norm": 0.3123266627731589, |
| "learning_rate": 2.053695985620123e-05, |
| "loss": 0.3074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15624725818634033, |
| "step": 2680, |
| "valid_targets_mean": 4276.9, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 2.7179746835443037, |
| "grad_norm": 0.30428837341523135, |
| "learning_rate": 2.0466321019913787e-05, |
| "loss": 0.3083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12444409728050232, |
| "step": 2685, |
| "valid_targets_mean": 5104.2, |
| "valid_targets_min": 1036 |
| }, |
| { |
| "epoch": 2.7230379746835442, |
| "grad_norm": 0.2899541063761625, |
| "learning_rate": 2.0395676362790157e-05, |
| "loss": 0.3139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18925632536411285, |
| "step": 2690, |
| "valid_targets_mean": 6929.8, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 2.728101265822785, |
| "grad_norm": 0.3000387772557557, |
| "learning_rate": 2.032502676664985e-05, |
| "loss": 0.3256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15346036851406097, |
| "step": 2695, |
| "valid_targets_mean": 4285.7, |
| "valid_targets_min": 1379 |
| }, |
| { |
| "epoch": 2.7331645569620253, |
| "grad_norm": 0.3021057118413619, |
| "learning_rate": 2.025437311337404e-05, |
| "loss": 0.3162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14610332250595093, |
| "step": 2700, |
| "valid_targets_mean": 4591.1, |
| "valid_targets_min": 1675 |
| }, |
| { |
| "epoch": 2.738227848101266, |
| "grad_norm": 0.32691877516784146, |
| "learning_rate": 2.0183716284894533e-05, |
| "loss": 0.3225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14551448822021484, |
| "step": 2705, |
| "valid_targets_mean": 3989.2, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 2.7432911392405064, |
| "grad_norm": 0.3657473594680315, |
| "learning_rate": 2.011305716318278e-05, |
| "loss": 0.3074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22241473197937012, |
| "step": 2710, |
| "valid_targets_mean": 6030.1, |
| "valid_targets_min": 1316 |
| }, |
| { |
| "epoch": 2.748354430379747, |
| "grad_norm": 0.3038961961226564, |
| "learning_rate": 2.004239663023885e-05, |
| "loss": 0.3028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16947516798973083, |
| "step": 2715, |
| "valid_targets_mean": 5248.6, |
| "valid_targets_min": 1555 |
| }, |
| { |
| "epoch": 2.7534177215189874, |
| "grad_norm": 0.3050248442776484, |
| "learning_rate": 1.997173556808043e-05, |
| "loss": 0.294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1630948781967163, |
| "step": 2720, |
| "valid_targets_mean": 5884.7, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 2.758481012658228, |
| "grad_norm": 0.35402206211471576, |
| "learning_rate": 1.9901074858731825e-05, |
| "loss": 0.2996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1823733150959015, |
| "step": 2725, |
| "valid_targets_mean": 4029.6, |
| "valid_targets_min": 1404 |
| }, |
| { |
| "epoch": 2.7635443037974685, |
| "grad_norm": 0.2902629337004639, |
| "learning_rate": 1.98304153842129e-05, |
| "loss": 0.313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1647607535123825, |
| "step": 2730, |
| "valid_targets_mean": 5231.3, |
| "valid_targets_min": 1100 |
| }, |
| { |
| "epoch": 2.768607594936709, |
| "grad_norm": 0.2844550099011252, |
| "learning_rate": 1.9759758026528162e-05, |
| "loss": 0.3181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20809857547283173, |
| "step": 2735, |
| "valid_targets_mean": 6735.6, |
| "valid_targets_min": 1644 |
| }, |
| { |
| "epoch": 2.7736708860759496, |
| "grad_norm": 0.3348579330081765, |
| "learning_rate": 1.9689103667655634e-05, |
| "loss": 0.3088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1527232825756073, |
| "step": 2740, |
| "valid_targets_mean": 3877.4, |
| "valid_targets_min": 1491 |
| }, |
| { |
| "epoch": 2.77873417721519, |
| "grad_norm": 0.33857120124730805, |
| "learning_rate": 1.9618453189535958e-05, |
| "loss": 0.3168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20601877570152283, |
| "step": 2745, |
| "valid_targets_mean": 4548.2, |
| "valid_targets_min": 1232 |
| }, |
| { |
| "epoch": 2.7837974683544306, |
| "grad_norm": 0.3346701582946249, |
| "learning_rate": 1.9547807474061303e-05, |
| "loss": 0.2983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13511428236961365, |
| "step": 2750, |
| "valid_targets_mean": 3345.6, |
| "valid_targets_min": 1298 |
| }, |
| { |
| "epoch": 2.7888607594936707, |
| "grad_norm": 0.3375591584241796, |
| "learning_rate": 1.947716740306439e-05, |
| "loss": 0.3089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16758695244789124, |
| "step": 2755, |
| "valid_targets_mean": 3964.9, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 2.7939240506329113, |
| "grad_norm": 0.340384343325027, |
| "learning_rate": 1.9406533858307503e-05, |
| "loss": 0.3178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1304406374692917, |
| "step": 2760, |
| "valid_targets_mean": 3351.9, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 2.798987341772152, |
| "grad_norm": 0.29188887212643894, |
| "learning_rate": 1.9335907721471438e-05, |
| "loss": 0.3042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15948455035686493, |
| "step": 2765, |
| "valid_targets_mean": 4508.9, |
| "valid_targets_min": 970 |
| }, |
| { |
| "epoch": 2.8040506329113923, |
| "grad_norm": 0.2914363526376243, |
| "learning_rate": 1.9265289874144554e-05, |
| "loss": 0.3112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18582302331924438, |
| "step": 2770, |
| "valid_targets_mean": 6648.4, |
| "valid_targets_min": 2048 |
| }, |
| { |
| "epoch": 2.809113924050633, |
| "grad_norm": 0.3447263204953251, |
| "learning_rate": 1.9194681197811703e-05, |
| "loss": 0.3154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11537902057170868, |
| "step": 2775, |
| "valid_targets_mean": 3061.1, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 2.8141772151898734, |
| "grad_norm": 0.28824906654455074, |
| "learning_rate": 1.912408257384327e-05, |
| "loss": 0.3173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18753370642662048, |
| "step": 2780, |
| "valid_targets_mean": 6277.4, |
| "valid_targets_min": 1561 |
| }, |
| { |
| "epoch": 2.819240506329114, |
| "grad_norm": 0.31551057795248955, |
| "learning_rate": 1.9053494883484177e-05, |
| "loss": 0.3012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1113462746143341, |
| "step": 2785, |
| "valid_targets_mean": 3603.0, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 2.8243037974683545, |
| "grad_norm": 0.3130169957194376, |
| "learning_rate": 1.898291900784284e-05, |
| "loss": 0.3045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17591753602027893, |
| "step": 2790, |
| "valid_targets_mean": 4849.0, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 2.829367088607595, |
| "grad_norm": 0.36153291519489483, |
| "learning_rate": 1.8912355827880237e-05, |
| "loss": 0.3166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13046428561210632, |
| "step": 2795, |
| "valid_targets_mean": 3138.6, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 2.8344303797468355, |
| "grad_norm": 0.35818567026601295, |
| "learning_rate": 1.884180622439884e-05, |
| "loss": 0.3105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15154902637004852, |
| "step": 2800, |
| "valid_targets_mean": 3774.6, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 2.839493670886076, |
| "grad_norm": 0.33153674409005546, |
| "learning_rate": 1.8771271078031648e-05, |
| "loss": 0.3064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17227354645729065, |
| "step": 2805, |
| "valid_targets_mean": 5559.2, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 2.8445569620253166, |
| "grad_norm": 0.30646195273462673, |
| "learning_rate": 1.8700751269231243e-05, |
| "loss": 0.3028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17971369624137878, |
| "step": 2810, |
| "valid_targets_mean": 5315.5, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 2.8496202531645567, |
| "grad_norm": 0.3147470597121468, |
| "learning_rate": 1.86302476782587e-05, |
| "loss": 0.3005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1408463716506958, |
| "step": 2815, |
| "valid_targets_mean": 3962.4, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 2.8546835443037972, |
| "grad_norm": 0.35549269402291417, |
| "learning_rate": 1.855976118517271e-05, |
| "loss": 0.3075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19130544364452362, |
| "step": 2820, |
| "valid_targets_mean": 4855.5, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 2.8597468354430378, |
| "grad_norm": 0.2823602428424915, |
| "learning_rate": 1.8489292669818494e-05, |
| "loss": 0.3066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1796441674232483, |
| "step": 2825, |
| "valid_targets_mean": 5933.9, |
| "valid_targets_min": 1652 |
| }, |
| { |
| "epoch": 2.8648101265822783, |
| "grad_norm": 0.3086469012489834, |
| "learning_rate": 1.8418843011816894e-05, |
| "loss": 0.3113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14876966178417206, |
| "step": 2830, |
| "valid_targets_mean": 4459.1, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 2.869873417721519, |
| "grad_norm": 0.33219619271405165, |
| "learning_rate": 1.8348413090553356e-05, |
| "loss": 0.3147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1837439239025116, |
| "step": 2835, |
| "valid_targets_mean": 5042.5, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 2.8749367088607594, |
| "grad_norm": 0.28160060670414677, |
| "learning_rate": 1.8278003785166967e-05, |
| "loss": 0.2942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13023114204406738, |
| "step": 2840, |
| "valid_targets_mean": 4408.2, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 2.88, |
| "grad_norm": 0.2701611603230975, |
| "learning_rate": 1.8207615974539476e-05, |
| "loss": 0.3064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12874723970890045, |
| "step": 2845, |
| "valid_targets_mean": 4858.8, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 2.8850632911392404, |
| "grad_norm": 0.33079935847646824, |
| "learning_rate": 1.8137250537284325e-05, |
| "loss": 0.3093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17800703644752502, |
| "step": 2850, |
| "valid_targets_mean": 4857.1, |
| "valid_targets_min": 1713 |
| }, |
| { |
| "epoch": 2.890126582278481, |
| "grad_norm": 0.23595757958591787, |
| "learning_rate": 1.8066908351735666e-05, |
| "loss": 0.3019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1269092708826065, |
| "step": 2855, |
| "valid_targets_mean": 5766.2, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 2.8951898734177215, |
| "grad_norm": 0.33538165041242207, |
| "learning_rate": 1.7996590295937448e-05, |
| "loss": 0.3038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1899298131465912, |
| "step": 2860, |
| "valid_targets_mean": 5260.9, |
| "valid_targets_min": 1500 |
| }, |
| { |
| "epoch": 2.900253164556962, |
| "grad_norm": 0.3124645131733068, |
| "learning_rate": 1.7926297247632383e-05, |
| "loss": 0.3207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1435328722000122, |
| "step": 2865, |
| "valid_targets_mean": 3785.1, |
| "valid_targets_min": 1048 |
| }, |
| { |
| "epoch": 2.9053164556962026, |
| "grad_norm": 0.3305614452127962, |
| "learning_rate": 1.7856030084251045e-05, |
| "loss": 0.3098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1552894562482834, |
| "step": 2870, |
| "valid_targets_mean": 4255.3, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 2.910379746835443, |
| "grad_norm": 0.34874837954634086, |
| "learning_rate": 1.7785789682900908e-05, |
| "loss": 0.3082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14497388899326324, |
| "step": 2875, |
| "valid_targets_mean": 3286.0, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 2.9154430379746836, |
| "grad_norm": 0.3321474887097409, |
| "learning_rate": 1.771557692035537e-05, |
| "loss": 0.3062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14671984314918518, |
| "step": 2880, |
| "valid_targets_mean": 4362.1, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 2.920506329113924, |
| "grad_norm": 0.36664765144869893, |
| "learning_rate": 1.7645392673042853e-05, |
| "loss": 0.3298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20450638234615326, |
| "step": 2885, |
| "valid_targets_mean": 3744.9, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 2.9255696202531647, |
| "grad_norm": 0.30800064070091415, |
| "learning_rate": 1.757523781703581e-05, |
| "loss": 0.3135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13620543479919434, |
| "step": 2890, |
| "valid_targets_mean": 4010.2, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 2.9306329113924052, |
| "grad_norm": 0.39874064817665694, |
| "learning_rate": 1.7505113228039848e-05, |
| "loss": 0.3146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17097340524196625, |
| "step": 2895, |
| "valid_targets_mean": 4104.1, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 2.9356962025316458, |
| "grad_norm": 0.30804629166037306, |
| "learning_rate": 1.7435019781382737e-05, |
| "loss": 0.297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14079098403453827, |
| "step": 2900, |
| "valid_targets_mean": 4534.0, |
| "valid_targets_min": 887 |
| }, |
| { |
| "epoch": 2.9407594936708863, |
| "grad_norm": 0.306220364172818, |
| "learning_rate": 1.7364958352003548e-05, |
| "loss": 0.3174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17645467817783356, |
| "step": 2905, |
| "valid_targets_mean": 4994.2, |
| "valid_targets_min": 1148 |
| }, |
| { |
| "epoch": 2.945822784810127, |
| "grad_norm": 0.3179633647838338, |
| "learning_rate": 1.7294929814441666e-05, |
| "loss": 0.3231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16111071407794952, |
| "step": 2910, |
| "valid_targets_mean": 4938.6, |
| "valid_targets_min": 1387 |
| }, |
| { |
| "epoch": 2.9508860759493674, |
| "grad_norm": 0.31641771807614866, |
| "learning_rate": 1.7224935042825912e-05, |
| "loss": 0.3152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16131725907325745, |
| "step": 2915, |
| "valid_targets_mean": 4423.9, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 2.9559493670886074, |
| "grad_norm": 0.2900729323232742, |
| "learning_rate": 1.7154974910863646e-05, |
| "loss": 0.3077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10794432461261749, |
| "step": 2920, |
| "valid_targets_mean": 3454.4, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 2.961012658227848, |
| "grad_norm": 0.3432477720018123, |
| "learning_rate": 1.7085050291829813e-05, |
| "loss": 0.3036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15215110778808594, |
| "step": 2925, |
| "valid_targets_mean": 4236.8, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 2.9660759493670885, |
| "grad_norm": 0.31507659068073507, |
| "learning_rate": 1.7015162058556088e-05, |
| "loss": 0.3208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16133321821689606, |
| "step": 2930, |
| "valid_targets_mean": 4263.9, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 2.971139240506329, |
| "grad_norm": 0.29285158348676216, |
| "learning_rate": 1.6945311083419947e-05, |
| "loss": 0.2976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1742202341556549, |
| "step": 2935, |
| "valid_targets_mean": 5417.0, |
| "valid_targets_min": 1360 |
| }, |
| { |
| "epoch": 2.9762025316455696, |
| "grad_norm": 0.2918602342182722, |
| "learning_rate": 1.68754982383338e-05, |
| "loss": 0.3007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1684986650943756, |
| "step": 2940, |
| "valid_targets_mean": 5456.4, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 2.98126582278481, |
| "grad_norm": 0.30561630865463585, |
| "learning_rate": 1.6805724394734107e-05, |
| "loss": 0.3008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10106837749481201, |
| "step": 2945, |
| "valid_targets_mean": 3017.5, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 2.9863291139240506, |
| "grad_norm": 0.29442534234659645, |
| "learning_rate": 1.6735990423570477e-05, |
| "loss": 0.3234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13497650623321533, |
| "step": 2950, |
| "valid_targets_mean": 3993.2, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 2.991392405063291, |
| "grad_norm": 0.2700507094407274, |
| "learning_rate": 1.666629719529483e-05, |
| "loss": 0.3185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15681613981723785, |
| "step": 2955, |
| "valid_targets_mean": 4630.2, |
| "valid_targets_min": 1176 |
| }, |
| { |
| "epoch": 2.9964556962025317, |
| "grad_norm": 0.3447693878105072, |
| "learning_rate": 1.6596645579850505e-05, |
| "loss": 0.3107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1600763201713562, |
| "step": 2960, |
| "valid_targets_mean": 3677.3, |
| "valid_targets_min": 1107 |
| }, |
| { |
| "epoch": 3.001012658227848, |
| "grad_norm": 0.29622484390463744, |
| "learning_rate": 1.6527036446661396e-05, |
| "loss": 0.3123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14927029609680176, |
| "step": 2965, |
| "valid_targets_mean": 4862.4, |
| "valid_targets_min": 1322 |
| }, |
| { |
| "epoch": 3.0060759493670886, |
| "grad_norm": 0.29785828676100873, |
| "learning_rate": 1.645747066462115e-05, |
| "loss": 0.3021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19526249170303345, |
| "step": 2970, |
| "valid_targets_mean": 5885.6, |
| "valid_targets_min": 1447 |
| }, |
| { |
| "epoch": 3.011139240506329, |
| "grad_norm": 0.35112230405979555, |
| "learning_rate": 1.638794910208225e-05, |
| "loss": 0.2898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10469535738229752, |
| "step": 2975, |
| "valid_targets_mean": 2940.2, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 3.0162025316455696, |
| "grad_norm": 0.3772315133305102, |
| "learning_rate": 1.631847262684523e-05, |
| "loss": 0.3108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16602087020874023, |
| "step": 2980, |
| "valid_targets_mean": 4357.8, |
| "valid_targets_min": 1389 |
| }, |
| { |
| "epoch": 3.02126582278481, |
| "grad_norm": 0.30911220110322923, |
| "learning_rate": 1.624904210614782e-05, |
| "loss": 0.3033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1612570881843567, |
| "step": 2985, |
| "valid_targets_mean": 4494.7, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 3.0263291139240507, |
| "grad_norm": 0.3517033326754291, |
| "learning_rate": 1.6179658406654113e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17958399653434753, |
| "step": 2990, |
| "valid_targets_mean": 4044.6, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 3.031392405063291, |
| "grad_norm": 0.28226563989162823, |
| "learning_rate": 1.6110322394443773e-05, |
| "loss": 0.2853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11023816466331482, |
| "step": 2995, |
| "valid_targets_mean": 4105.8, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 3.0364556962025318, |
| "grad_norm": 0.3395674314450887, |
| "learning_rate": 1.60410349350012e-05, |
| "loss": 0.3034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17015889286994934, |
| "step": 3000, |
| "valid_targets_mean": 5613.8, |
| "valid_targets_min": 1423 |
| }, |
| { |
| "epoch": 3.0415189873417723, |
| "grad_norm": 0.3328019254619737, |
| "learning_rate": 1.597179689320474e-05, |
| "loss": 0.3068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16885250806808472, |
| "step": 3005, |
| "valid_targets_mean": 4626.2, |
| "valid_targets_min": 1034 |
| }, |
| { |
| "epoch": 3.046582278481013, |
| "grad_norm": 0.30137258092800007, |
| "learning_rate": 1.5902609133315888e-05, |
| "loss": 0.3026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14555740356445312, |
| "step": 3010, |
| "valid_targets_mean": 5118.1, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 3.0516455696202534, |
| "grad_norm": 0.32251822208809916, |
| "learning_rate": 1.5833472518968478e-05, |
| "loss": 0.3049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13226641714572906, |
| "step": 3015, |
| "valid_targets_mean": 4081.9, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 3.056708860759494, |
| "grad_norm": 0.3211101552341726, |
| "learning_rate": 1.5764387913157952e-05, |
| "loss": 0.3185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0971713736653328, |
| "step": 3020, |
| "valid_targets_mean": 3146.8, |
| "valid_targets_min": 1380 |
| }, |
| { |
| "epoch": 3.061772151898734, |
| "grad_norm": 0.3360390373855527, |
| "learning_rate": 1.5695356178230527e-05, |
| "loss": 0.3062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12469463050365448, |
| "step": 3025, |
| "valid_targets_mean": 3152.8, |
| "valid_targets_min": 1004 |
| }, |
| { |
| "epoch": 3.0668354430379745, |
| "grad_norm": 0.29385960506365055, |
| "learning_rate": 1.5626378175872486e-05, |
| "loss": 0.2921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16584698855876923, |
| "step": 3030, |
| "valid_targets_mean": 5578.9, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 3.071898734177215, |
| "grad_norm": 0.32789137808560437, |
| "learning_rate": 1.5557454767099382e-05, |
| "loss": 0.2935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17390216886997223, |
| "step": 3035, |
| "valid_targets_mean": 4741.9, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 3.0769620253164556, |
| "grad_norm": 0.3234941533877886, |
| "learning_rate": 1.5488586812245302e-05, |
| "loss": 0.3027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17046749591827393, |
| "step": 3040, |
| "valid_targets_mean": 4481.4, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 3.082025316455696, |
| "grad_norm": 0.28075430375987626, |
| "learning_rate": 1.541977517095215e-05, |
| "loss": 0.3003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14547553658485413, |
| "step": 3045, |
| "valid_targets_mean": 5410.0, |
| "valid_targets_min": 1228 |
| }, |
| { |
| "epoch": 3.0870886075949366, |
| "grad_norm": 0.28635813947594835, |
| "learning_rate": 1.5351020702158875e-05, |
| "loss": 0.3099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13441359996795654, |
| "step": 3050, |
| "valid_targets_mean": 5051.8, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 3.092151898734177, |
| "grad_norm": 0.34800039286889395, |
| "learning_rate": 1.52823242640908e-05, |
| "loss": 0.3096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15158754587173462, |
| "step": 3055, |
| "valid_targets_mean": 3697.4, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 3.0972151898734177, |
| "grad_norm": 0.32310977392742785, |
| "learning_rate": 1.5213686714248852e-05, |
| "loss": 0.3082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16765525937080383, |
| "step": 3060, |
| "valid_targets_mean": 4845.2, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 3.1022784810126582, |
| "grad_norm": 0.296724917732042, |
| "learning_rate": 1.5145108909398896e-05, |
| "loss": 0.3042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14354108273983002, |
| "step": 3065, |
| "valid_targets_mean": 4783.9, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 3.1073417721518988, |
| "grad_norm": 0.42288485229336514, |
| "learning_rate": 1.5076591705561056e-05, |
| "loss": 0.3054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16323769092559814, |
| "step": 3070, |
| "valid_targets_mean": 3961.5, |
| "valid_targets_min": 1451 |
| }, |
| { |
| "epoch": 3.1124050632911393, |
| "grad_norm": 0.29888536735808585, |
| "learning_rate": 1.5008135957998968e-05, |
| "loss": 0.3097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16281160712242126, |
| "step": 3075, |
| "valid_targets_mean": 5095.7, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 3.11746835443038, |
| "grad_norm": 0.32246738234879885, |
| "learning_rate": 1.4939742521209178e-05, |
| "loss": 0.3136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.142366424202919, |
| "step": 3080, |
| "valid_targets_mean": 3786.1, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 3.1225316455696204, |
| "grad_norm": 0.2885458143447489, |
| "learning_rate": 1.4871412248910416e-05, |
| "loss": 0.3112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1399984061717987, |
| "step": 3085, |
| "valid_targets_mean": 5652.7, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 3.127594936708861, |
| "grad_norm": 0.3436698843544968, |
| "learning_rate": 1.480314599403296e-05, |
| "loss": 0.3051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12947720289230347, |
| "step": 3090, |
| "valid_targets_mean": 3113.7, |
| "valid_targets_min": 1129 |
| }, |
| { |
| "epoch": 3.1326582278481014, |
| "grad_norm": 0.3034361762747695, |
| "learning_rate": 1.4734944608708022e-05, |
| "loss": 0.2819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1270906925201416, |
| "step": 3095, |
| "valid_targets_mean": 4283.6, |
| "valid_targets_min": 1371 |
| }, |
| { |
| "epoch": 3.137721518987342, |
| "grad_norm": 0.2910061490791564, |
| "learning_rate": 1.4666808944257044e-05, |
| "loss": 0.3011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1065504252910614, |
| "step": 3100, |
| "valid_targets_mean": 4013.8, |
| "valid_targets_min": 1748 |
| }, |
| { |
| "epoch": 3.1427848101265825, |
| "grad_norm": 0.29375562777524983, |
| "learning_rate": 1.459873985118115e-05, |
| "loss": 0.2913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20948265492916107, |
| "step": 3105, |
| "valid_targets_mean": 6254.6, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 3.1478481012658226, |
| "grad_norm": 0.32610939195307226, |
| "learning_rate": 1.4530738179150445e-05, |
| "loss": 0.3091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16477391123771667, |
| "step": 3110, |
| "valid_targets_mean": 4672.6, |
| "valid_targets_min": 1423 |
| }, |
| { |
| "epoch": 3.152911392405063, |
| "grad_norm": 0.34376610077811187, |
| "learning_rate": 1.44628047769935e-05, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12125621736049652, |
| "step": 3115, |
| "valid_targets_mean": 3024.9, |
| "valid_targets_min": 1154 |
| }, |
| { |
| "epoch": 3.1579746835443037, |
| "grad_norm": 0.24961470242170858, |
| "learning_rate": 1.4394940492686666e-05, |
| "loss": 0.3028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18956081569194794, |
| "step": 3120, |
| "valid_targets_mean": 8850.2, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 3.163037974683544, |
| "grad_norm": 0.3213177133533683, |
| "learning_rate": 1.4327146173343561e-05, |
| "loss": 0.3098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16393819451332092, |
| "step": 3125, |
| "valid_targets_mean": 4351.1, |
| "valid_targets_min": 1322 |
| }, |
| { |
| "epoch": 3.1681012658227847, |
| "grad_norm": 0.3207864682050949, |
| "learning_rate": 1.4259422665204458e-05, |
| "loss": 0.3097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19772255420684814, |
| "step": 3130, |
| "valid_targets_mean": 5234.6, |
| "valid_targets_min": 1247 |
| }, |
| { |
| "epoch": 3.1731645569620253, |
| "grad_norm": 0.3306680712851493, |
| "learning_rate": 1.4191770813625732e-05, |
| "loss": 0.3019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1288958340883255, |
| "step": 3135, |
| "valid_targets_mean": 3816.3, |
| "valid_targets_min": 1339 |
| }, |
| { |
| "epoch": 3.178227848101266, |
| "grad_norm": 0.33226796696180216, |
| "learning_rate": 1.4124191463069305e-05, |
| "loss": 0.2918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1820456087589264, |
| "step": 3140, |
| "valid_targets_mean": 4462.9, |
| "valid_targets_min": 1300 |
| }, |
| { |
| "epoch": 3.1832911392405063, |
| "grad_norm": 0.25066525871506057, |
| "learning_rate": 1.4056685457092122e-05, |
| "loss": 0.2981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.108408123254776, |
| "step": 3145, |
| "valid_targets_mean": 4348.1, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 3.188354430379747, |
| "grad_norm": 0.2799683914898738, |
| "learning_rate": 1.3989253638335577e-05, |
| "loss": 0.3048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.140926331281662, |
| "step": 3150, |
| "valid_targets_mean": 5334.3, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 3.1934177215189874, |
| "grad_norm": 0.364904271269176, |
| "learning_rate": 1.3921896848515064e-05, |
| "loss": 0.3009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1611071527004242, |
| "step": 3155, |
| "valid_targets_mean": 3846.9, |
| "valid_targets_min": 1050 |
| }, |
| { |
| "epoch": 3.198481012658228, |
| "grad_norm": 0.31469570152651777, |
| "learning_rate": 1.385461592840939e-05, |
| "loss": 0.2914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16711470484733582, |
| "step": 3160, |
| "valid_targets_mean": 4945.6, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 3.2035443037974685, |
| "grad_norm": 0.40871004437684494, |
| "learning_rate": 1.3787411717850358e-05, |
| "loss": 0.2874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14797160029411316, |
| "step": 3165, |
| "valid_targets_mean": 3367.9, |
| "valid_targets_min": 1380 |
| }, |
| { |
| "epoch": 3.208607594936709, |
| "grad_norm": 0.3063676754341602, |
| "learning_rate": 1.3720285055712222e-05, |
| "loss": 0.3, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12202514708042145, |
| "step": 3170, |
| "valid_targets_mean": 3846.6, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 3.2136708860759495, |
| "grad_norm": 0.33920699542879207, |
| "learning_rate": 1.3653236779901236e-05, |
| "loss": 0.3022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08881708979606628, |
| "step": 3175, |
| "valid_targets_mean": 2589.6, |
| "valid_targets_min": 1310 |
| }, |
| { |
| "epoch": 3.21873417721519, |
| "grad_norm": 0.3118478710909973, |
| "learning_rate": 1.3586267727345232e-05, |
| "loss": 0.3031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13673335313796997, |
| "step": 3180, |
| "valid_targets_mean": 4171.1, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 3.22379746835443, |
| "grad_norm": 0.3657648017370462, |
| "learning_rate": 1.35193787339831e-05, |
| "loss": 0.2944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13656803965568542, |
| "step": 3185, |
| "valid_targets_mean": 4186.0, |
| "valid_targets_min": 1616 |
| }, |
| { |
| "epoch": 3.2288607594936707, |
| "grad_norm": 0.29575714520451474, |
| "learning_rate": 1.3452570634754434e-05, |
| "loss": 0.2919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14770013093948364, |
| "step": 3190, |
| "valid_targets_mean": 5272.9, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 3.233924050632911, |
| "grad_norm": 0.29496009702650783, |
| "learning_rate": 1.3385844263589033e-05, |
| "loss": 0.2984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17479810118675232, |
| "step": 3195, |
| "valid_targets_mean": 5597.1, |
| "valid_targets_min": 1196 |
| }, |
| { |
| "epoch": 3.2389873417721518, |
| "grad_norm": 0.35581177858551544, |
| "learning_rate": 1.3319200453396548e-05, |
| "loss": 0.294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15500982105731964, |
| "step": 3200, |
| "valid_targets_mean": 4076.4, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 3.2440506329113923, |
| "grad_norm": 0.292951167708079, |
| "learning_rate": 1.3252640036056068e-05, |
| "loss": 0.3027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1567637026309967, |
| "step": 3205, |
| "valid_targets_mean": 5367.4, |
| "valid_targets_min": 1424 |
| }, |
| { |
| "epoch": 3.249113924050633, |
| "grad_norm": 0.3182836504556952, |
| "learning_rate": 1.318616384240572e-05, |
| "loss": 0.3043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1862029880285263, |
| "step": 3210, |
| "valid_targets_mean": 5235.2, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 3.2541772151898734, |
| "grad_norm": 0.5962356962936214, |
| "learning_rate": 1.3119772702232325e-05, |
| "loss": 0.3019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15173543989658356, |
| "step": 3215, |
| "valid_targets_mean": 3896.9, |
| "valid_targets_min": 1293 |
| }, |
| { |
| "epoch": 3.259240506329114, |
| "grad_norm": 0.30446119131111943, |
| "learning_rate": 1.3053467444261021e-05, |
| "loss": 0.3035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16218072175979614, |
| "step": 3220, |
| "valid_targets_mean": 5058.7, |
| "valid_targets_min": 1443 |
| }, |
| { |
| "epoch": 3.2643037974683544, |
| "grad_norm": 0.30100968288795926, |
| "learning_rate": 1.2987248896144915e-05, |
| "loss": 0.3025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1766858994960785, |
| "step": 3225, |
| "valid_targets_mean": 5638.7, |
| "valid_targets_min": 1494 |
| }, |
| { |
| "epoch": 3.269367088607595, |
| "grad_norm": 0.3043172862585619, |
| "learning_rate": 1.2921117884454784e-05, |
| "loss": 0.3111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13346105813980103, |
| "step": 3230, |
| "valid_targets_mean": 4191.2, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 3.2744303797468355, |
| "grad_norm": 0.30601688850305675, |
| "learning_rate": 1.2855075234668708e-05, |
| "loss": 0.2969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17442500591278076, |
| "step": 3235, |
| "valid_targets_mean": 5185.5, |
| "valid_targets_min": 1463 |
| }, |
| { |
| "epoch": 3.279493670886076, |
| "grad_norm": 0.32710194023512384, |
| "learning_rate": 1.278912177116182e-05, |
| "loss": 0.2987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18517401814460754, |
| "step": 3240, |
| "valid_targets_mean": 4748.3, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 3.2845569620253166, |
| "grad_norm": 0.2832311914633299, |
| "learning_rate": 1.2723258317195965e-05, |
| "loss": 0.3118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1336306631565094, |
| "step": 3245, |
| "valid_targets_mean": 4846.2, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 3.289620253164557, |
| "grad_norm": 0.2859981419544709, |
| "learning_rate": 1.2657485694909451e-05, |
| "loss": 0.3031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12190467119216919, |
| "step": 3250, |
| "valid_targets_mean": 4372.2, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 3.2946835443037976, |
| "grad_norm": 0.3133461443068576, |
| "learning_rate": 1.2591804725306802e-05, |
| "loss": 0.3056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09984530508518219, |
| "step": 3255, |
| "valid_targets_mean": 3387.1, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 3.299746835443038, |
| "grad_norm": 0.3066068642940143, |
| "learning_rate": 1.252621622824846e-05, |
| "loss": 0.3049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10505147278308868, |
| "step": 3260, |
| "valid_targets_mean": 3119.9, |
| "valid_targets_min": 1415 |
| }, |
| { |
| "epoch": 3.3048101265822787, |
| "grad_norm": 0.30638690017522713, |
| "learning_rate": 1.2460721022440617e-05, |
| "loss": 0.3023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1329905241727829, |
| "step": 3265, |
| "valid_targets_mean": 3749.8, |
| "valid_targets_min": 1247 |
| }, |
| { |
| "epoch": 3.309873417721519, |
| "grad_norm": 0.3893581538313894, |
| "learning_rate": 1.2395319925424922e-05, |
| "loss": 0.301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12106384336948395, |
| "step": 3270, |
| "valid_targets_mean": 3750.2, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 3.3149367088607593, |
| "grad_norm": 0.2915580190067732, |
| "learning_rate": 1.2330013753568345e-05, |
| "loss": 0.3046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15587478876113892, |
| "step": 3275, |
| "valid_targets_mean": 5153.9, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 3.32, |
| "grad_norm": 0.32454051814127005, |
| "learning_rate": 1.2264803322052938e-05, |
| "loss": 0.2902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14347532391548157, |
| "step": 3280, |
| "valid_targets_mean": 3715.8, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 3.3250632911392404, |
| "grad_norm": 0.3014718100183408, |
| "learning_rate": 1.2199689444865688e-05, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11024832725524902, |
| "step": 3285, |
| "valid_targets_mean": 3356.6, |
| "valid_targets_min": 1346 |
| }, |
| { |
| "epoch": 3.330126582278481, |
| "grad_norm": 0.3180605843827969, |
| "learning_rate": 1.2134672934788338e-05, |
| "loss": 0.2996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1348501592874527, |
| "step": 3290, |
| "valid_targets_mean": 4180.2, |
| "valid_targets_min": 1405 |
| }, |
| { |
| "epoch": 3.3351898734177214, |
| "grad_norm": 0.31070898369108957, |
| "learning_rate": 1.206975460338726e-05, |
| "loss": 0.2962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14836883544921875, |
| "step": 3295, |
| "valid_targets_mean": 4112.2, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 3.340253164556962, |
| "grad_norm": 0.28528395978629406, |
| "learning_rate": 1.2004935261003292e-05, |
| "loss": 0.3012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11711958050727844, |
| "step": 3300, |
| "valid_targets_mean": 5100.1, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 3.3453164556962025, |
| "grad_norm": 0.3708665183674031, |
| "learning_rate": 1.194021571674168e-05, |
| "loss": 0.2891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13884302973747253, |
| "step": 3305, |
| "valid_targets_mean": 4049.6, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 3.350379746835443, |
| "grad_norm": 0.3298858637588618, |
| "learning_rate": 1.1875596778461903e-05, |
| "loss": 0.2893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1451665610074997, |
| "step": 3310, |
| "valid_targets_mean": 4987.6, |
| "valid_targets_min": 1624 |
| }, |
| { |
| "epoch": 3.3554430379746836, |
| "grad_norm": 0.30292570807469854, |
| "learning_rate": 1.1811079252767663e-05, |
| "loss": 0.2858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12376505136489868, |
| "step": 3315, |
| "valid_targets_mean": 3583.1, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 3.360506329113924, |
| "grad_norm": 0.32294869729997133, |
| "learning_rate": 1.174666394499677e-05, |
| "loss": 0.2914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11844268441200256, |
| "step": 3320, |
| "valid_targets_mean": 3262.4, |
| "valid_targets_min": 1554 |
| }, |
| { |
| "epoch": 3.3655696202531646, |
| "grad_norm": 0.3438389100269291, |
| "learning_rate": 1.1682351659211088e-05, |
| "loss": 0.2965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1457480937242508, |
| "step": 3325, |
| "valid_targets_mean": 3745.7, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 3.370632911392405, |
| "grad_norm": 0.33249792748827744, |
| "learning_rate": 1.1618143198186544e-05, |
| "loss": 0.2956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15856462717056274, |
| "step": 3330, |
| "valid_targets_mean": 4305.5, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 3.3756962025316457, |
| "grad_norm": 0.3173034049275177, |
| "learning_rate": 1.155403936340304e-05, |
| "loss": 0.2947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18826264142990112, |
| "step": 3335, |
| "valid_targets_mean": 5404.1, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 3.3807594936708862, |
| "grad_norm": 0.3178276101310362, |
| "learning_rate": 1.149004095503452e-05, |
| "loss": 0.297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15395784378051758, |
| "step": 3340, |
| "valid_targets_mean": 5008.1, |
| "valid_targets_min": 1032 |
| }, |
| { |
| "epoch": 3.3858227848101268, |
| "grad_norm": 0.3025604254884791, |
| "learning_rate": 1.1426148771938915e-05, |
| "loss": 0.3065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1488351970911026, |
| "step": 3345, |
| "valid_targets_mean": 4703.1, |
| "valid_targets_min": 1506 |
| }, |
| { |
| "epoch": 3.390886075949367, |
| "grad_norm": 0.3037731465395097, |
| "learning_rate": 1.1362363611648228e-05, |
| "loss": 0.3069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11465154588222504, |
| "step": 3350, |
| "valid_targets_mean": 3727.4, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 3.3959493670886074, |
| "grad_norm": 0.3441348411116797, |
| "learning_rate": 1.1298686270358542e-05, |
| "loss": 0.301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17264041304588318, |
| "step": 3355, |
| "valid_targets_mean": 3737.4, |
| "valid_targets_min": 1599 |
| }, |
| { |
| "epoch": 3.401012658227848, |
| "grad_norm": 0.2922925569041438, |
| "learning_rate": 1.1235117542920077e-05, |
| "loss": 0.2984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11297699809074402, |
| "step": 3360, |
| "valid_targets_mean": 4023.7, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 3.4060759493670885, |
| "grad_norm": 0.3304527382358981, |
| "learning_rate": 1.1171658222827321e-05, |
| "loss": 0.308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21652498841285706, |
| "step": 3365, |
| "valid_targets_mean": 5499.5, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 3.411139240506329, |
| "grad_norm": 0.34098724945316766, |
| "learning_rate": 1.110830910220905e-05, |
| "loss": 0.3065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17756357789039612, |
| "step": 3370, |
| "valid_targets_mean": 3859.3, |
| "valid_targets_min": 961 |
| }, |
| { |
| "epoch": 3.4162025316455695, |
| "grad_norm": 0.29556792434414897, |
| "learning_rate": 1.1045070971818515e-05, |
| "loss": 0.2959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.130351722240448, |
| "step": 3375, |
| "valid_targets_mean": 3860.4, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 3.42126582278481, |
| "grad_norm": 0.2817393837564735, |
| "learning_rate": 1.0981944621023508e-05, |
| "loss": 0.2989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.172260582447052, |
| "step": 3380, |
| "valid_targets_mean": 6195.1, |
| "valid_targets_min": 1065 |
| }, |
| { |
| "epoch": 3.4263291139240506, |
| "grad_norm": 0.3019678707113778, |
| "learning_rate": 1.0918930837796538e-05, |
| "loss": 0.2909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14187800884246826, |
| "step": 3385, |
| "valid_targets_mean": 4729.5, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 3.431392405063291, |
| "grad_norm": 0.32014190449807, |
| "learning_rate": 1.0856030408705016e-05, |
| "loss": 0.3174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15517304837703705, |
| "step": 3390, |
| "valid_targets_mean": 4351.6, |
| "valid_targets_min": 1381 |
| }, |
| { |
| "epoch": 3.4364556962025317, |
| "grad_norm": 0.28577315150998106, |
| "learning_rate": 1.0793244118901383e-05, |
| "loss": 0.3001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16560965776443481, |
| "step": 3395, |
| "valid_targets_mean": 5708.4, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 3.441518987341772, |
| "grad_norm": 0.2895330117490245, |
| "learning_rate": 1.0730572752113368e-05, |
| "loss": 0.3004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16116517782211304, |
| "step": 3400, |
| "valid_targets_mean": 6122.2, |
| "valid_targets_min": 1191 |
| }, |
| { |
| "epoch": 3.4465822784810127, |
| "grad_norm": 0.3276147158732667, |
| "learning_rate": 1.0668017090634164e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1463163197040558, |
| "step": 3405, |
| "valid_targets_mean": 3868.4, |
| "valid_targets_min": 1560 |
| }, |
| { |
| "epoch": 3.4516455696202533, |
| "grad_norm": 0.27522935687650096, |
| "learning_rate": 1.0605577915312662e-05, |
| "loss": 0.2973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14057275652885437, |
| "step": 3410, |
| "valid_targets_mean": 5501.4, |
| "valid_targets_min": 1198 |
| }, |
| { |
| "epoch": 3.456708860759494, |
| "grad_norm": 0.2546793488548092, |
| "learning_rate": 1.0543256005543752e-05, |
| "loss": 0.2931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17178791761398315, |
| "step": 3415, |
| "valid_targets_mean": 6257.9, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 3.4617721518987343, |
| "grad_norm": 0.2887049078859965, |
| "learning_rate": 1.048105213925853e-05, |
| "loss": 0.3008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15336082875728607, |
| "step": 3420, |
| "valid_targets_mean": 5676.3, |
| "valid_targets_min": 1581 |
| }, |
| { |
| "epoch": 3.466835443037975, |
| "grad_norm": 0.3248981947583244, |
| "learning_rate": 1.0418967092914643e-05, |
| "loss": 0.296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12593376636505127, |
| "step": 3425, |
| "valid_targets_mean": 3572.3, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 3.4718987341772154, |
| "grad_norm": 0.33097897236242024, |
| "learning_rate": 1.0357001641486556e-05, |
| "loss": 0.2969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16061154007911682, |
| "step": 3430, |
| "valid_targets_mean": 6276.2, |
| "valid_targets_min": 1499 |
| }, |
| { |
| "epoch": 3.476962025316456, |
| "grad_norm": 0.29614677485829893, |
| "learning_rate": 1.0295156558455885e-05, |
| "loss": 0.3058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1872052550315857, |
| "step": 3435, |
| "valid_targets_mean": 6640.8, |
| "valid_targets_min": 1160 |
| }, |
| { |
| "epoch": 3.482025316455696, |
| "grad_norm": 0.27705637796463173, |
| "learning_rate": 1.0233432615801786e-05, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14229699969291687, |
| "step": 3440, |
| "valid_targets_mean": 5945.9, |
| "valid_targets_min": 1284 |
| }, |
| { |
| "epoch": 3.4870886075949366, |
| "grad_norm": 0.26237225876364956, |
| "learning_rate": 1.0171830583991245e-05, |
| "loss": 0.3011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17002148926258087, |
| "step": 3445, |
| "valid_targets_mean": 6348.2, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 3.492151898734177, |
| "grad_norm": 0.33818695188520737, |
| "learning_rate": 1.0110351231969532e-05, |
| "loss": 0.2999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19817857444286346, |
| "step": 3450, |
| "valid_targets_mean": 4845.8, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 3.4972151898734176, |
| "grad_norm": 0.27766136414994197, |
| "learning_rate": 1.0048995327150556e-05, |
| "loss": 0.2994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17715927958488464, |
| "step": 3455, |
| "valid_targets_mean": 6080.2, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 3.502278481012658, |
| "grad_norm": 0.3385690737736752, |
| "learning_rate": 9.987763635407293e-06, |
| "loss": 0.2976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18266132473945618, |
| "step": 3460, |
| "valid_targets_mean": 4562.4, |
| "valid_targets_min": 1570 |
| }, |
| { |
| "epoch": 3.5073417721518987, |
| "grad_norm": 0.35240157099060987, |
| "learning_rate": 9.926656921062254e-06, |
| "loss": 0.3082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18275323510169983, |
| "step": 3465, |
| "valid_targets_mean": 4161.0, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 3.512405063291139, |
| "grad_norm": 0.37082127798975295, |
| "learning_rate": 9.865675946877897e-06, |
| "loss": 0.2964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.137416809797287, |
| "step": 3470, |
| "valid_targets_mean": 3108.2, |
| "valid_targets_min": 1222 |
| }, |
| { |
| "epoch": 3.5174683544303798, |
| "grad_norm": 0.32990352870182205, |
| "learning_rate": 9.804821474047166e-06, |
| "loss": 0.3071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13373905420303345, |
| "step": 3475, |
| "valid_targets_mean": 3385.4, |
| "valid_targets_min": 1094 |
| }, |
| { |
| "epoch": 3.5225316455696203, |
| "grad_norm": 0.3159470821550788, |
| "learning_rate": 9.744094262183922e-06, |
| "loss": 0.2957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1414027214050293, |
| "step": 3480, |
| "valid_targets_mean": 3928.0, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 3.527594936708861, |
| "grad_norm": 0.2903957000330617, |
| "learning_rate": 9.683495069313527e-06, |
| "loss": 0.3091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1404920518398285, |
| "step": 3485, |
| "valid_targets_mean": 4963.7, |
| "valid_targets_min": 1699 |
| }, |
| { |
| "epoch": 3.5326582278481014, |
| "grad_norm": 0.28971614608089746, |
| "learning_rate": 9.623024651863317e-06, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12896308302879333, |
| "step": 3490, |
| "valid_targets_mean": 4057.2, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 3.537721518987342, |
| "grad_norm": 0.32570265544900434, |
| "learning_rate": 9.56268376465323e-06, |
| "loss": 0.2962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14747750759124756, |
| "step": 3495, |
| "valid_targets_mean": 3836.9, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 3.5427848101265824, |
| "grad_norm": 0.3186509490983858, |
| "learning_rate": 9.502473160886309e-06, |
| "loss": 0.3055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13043725490570068, |
| "step": 3500, |
| "valid_targets_mean": 3738.1, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 3.547848101265823, |
| "grad_norm": 0.2738590358023834, |
| "learning_rate": 9.442393592139378e-06, |
| "loss": 0.31, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14587613940238953, |
| "step": 3505, |
| "valid_targets_mean": 4865.2, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 3.552911392405063, |
| "grad_norm": 0.3247037129452682, |
| "learning_rate": 9.382445808353582e-06, |
| "loss": 0.2935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1686377227306366, |
| "step": 3510, |
| "valid_targets_mean": 4436.3, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 3.5579746835443036, |
| "grad_norm": 0.3180620836755935, |
| "learning_rate": 9.322630557825099e-06, |
| "loss": 0.2905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.181858628988266, |
| "step": 3515, |
| "valid_targets_mean": 5233.6, |
| "valid_targets_min": 1452 |
| }, |
| { |
| "epoch": 3.563037974683544, |
| "grad_norm": 0.389889167724953, |
| "learning_rate": 9.262948587195733e-06, |
| "loss": 0.3152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15717878937721252, |
| "step": 3520, |
| "valid_targets_mean": 3013.9, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 3.5681012658227846, |
| "grad_norm": 0.29747778586225904, |
| "learning_rate": 9.203400641443659e-06, |
| "loss": 0.2996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1657101958990097, |
| "step": 3525, |
| "valid_targets_mean": 5011.9, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 3.573164556962025, |
| "grad_norm": 0.32589494828857773, |
| "learning_rate": 9.143987463874067e-06, |
| "loss": 0.3156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1313675493001938, |
| "step": 3530, |
| "valid_targets_mean": 3697.8, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 3.5782278481012657, |
| "grad_norm": 0.3014059728019354, |
| "learning_rate": 9.084709796109907e-06, |
| "loss": 0.2868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1120418906211853, |
| "step": 3535, |
| "valid_targets_mean": 3755.7, |
| "valid_targets_min": 1198 |
| }, |
| { |
| "epoch": 3.5832911392405062, |
| "grad_norm": 0.2948674668221632, |
| "learning_rate": 9.025568378082656e-06, |
| "loss": 0.3131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2535429894924164, |
| "step": 3540, |
| "valid_targets_mean": 5356.3, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 3.5883544303797468, |
| "grad_norm": 0.33956864916271323, |
| "learning_rate": 8.96656394802303e-06, |
| "loss": 0.3003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18608632683753967, |
| "step": 3545, |
| "valid_targets_mean": 4867.1, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 3.5934177215189873, |
| "grad_norm": 0.2894977962731721, |
| "learning_rate": 8.907697242451825e-06, |
| "loss": 0.3074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1488334834575653, |
| "step": 3550, |
| "valid_targets_mean": 4891.0, |
| "valid_targets_min": 1716 |
| }, |
| { |
| "epoch": 3.598481012658228, |
| "grad_norm": 0.3343791939565901, |
| "learning_rate": 8.84896899617067e-06, |
| "loss": 0.2944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.141134113073349, |
| "step": 3555, |
| "valid_targets_mean": 3341.7, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 3.6035443037974684, |
| "grad_norm": 0.33452158631970796, |
| "learning_rate": 8.790379942252888e-06, |
| "loss": 0.3019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10691896080970764, |
| "step": 3560, |
| "valid_targets_mean": 2877.1, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 3.608607594936709, |
| "grad_norm": 0.36142037308609365, |
| "learning_rate": 8.73193081203436e-06, |
| "loss": 0.2975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11998053640127182, |
| "step": 3565, |
| "valid_targets_mean": 2745.8, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 3.6136708860759494, |
| "grad_norm": 0.29136587900708333, |
| "learning_rate": 8.673622335104335e-06, |
| "loss": 0.3143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1345549076795578, |
| "step": 3570, |
| "valid_targets_mean": 4353.7, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 3.61873417721519, |
| "grad_norm": 0.3065976409246481, |
| "learning_rate": 8.6154552392964e-06, |
| "loss": 0.3027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10774962604045868, |
| "step": 3575, |
| "valid_targets_mean": 3904.3, |
| "valid_targets_min": 1176 |
| }, |
| { |
| "epoch": 3.6237974683544305, |
| "grad_norm": 0.31612983755964325, |
| "learning_rate": 8.557430250679329e-06, |
| "loss": 0.302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13469217717647552, |
| "step": 3580, |
| "valid_targets_mean": 3963.2, |
| "valid_targets_min": 1302 |
| }, |
| { |
| "epoch": 3.628860759493671, |
| "grad_norm": 0.355565500659515, |
| "learning_rate": 8.499548093548069e-06, |
| "loss": 0.2915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1492483913898468, |
| "step": 3585, |
| "valid_targets_mean": 3815.0, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 3.6339240506329116, |
| "grad_norm": 0.3209640823808966, |
| "learning_rate": 8.441809490414664e-06, |
| "loss": 0.2943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10731847584247589, |
| "step": 3590, |
| "valid_targets_mean": 3390.2, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 3.638987341772152, |
| "grad_norm": 0.3111850353285487, |
| "learning_rate": 8.384215161999245e-06, |
| "loss": 0.2928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12559540569782257, |
| "step": 3595, |
| "valid_targets_mean": 3864.8, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 3.6440506329113926, |
| "grad_norm": 0.3021980554963678, |
| "learning_rate": 8.326765827221066e-06, |
| "loss": 0.3006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16643747687339783, |
| "step": 3600, |
| "valid_targets_mean": 4737.3, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 3.649113924050633, |
| "grad_norm": 0.3299126612802994, |
| "learning_rate": 8.269462203189467e-06, |
| "loss": 0.3031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1495143473148346, |
| "step": 3605, |
| "valid_targets_mean": 4373.2, |
| "valid_targets_min": 1652 |
| }, |
| { |
| "epoch": 3.6541772151898733, |
| "grad_norm": 0.3046029741964782, |
| "learning_rate": 8.212305005194992e-06, |
| "loss": 0.2926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12610015273094177, |
| "step": 3610, |
| "valid_targets_mean": 4068.0, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 3.659240506329114, |
| "grad_norm": 0.2889811661916004, |
| "learning_rate": 8.155294946700402e-06, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14253506064414978, |
| "step": 3615, |
| "valid_targets_mean": 4970.4, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 3.6643037974683543, |
| "grad_norm": 0.3058585932521842, |
| "learning_rate": 8.098432739331803e-06, |
| "loss": 0.2822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14140847325325012, |
| "step": 3620, |
| "valid_targets_mean": 4990.8, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 3.669367088607595, |
| "grad_norm": 0.3078512961350209, |
| "learning_rate": 8.041719092869761e-06, |
| "loss": 0.3031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13041014969348907, |
| "step": 3625, |
| "valid_targets_mean": 4127.6, |
| "valid_targets_min": 1226 |
| }, |
| { |
| "epoch": 3.6744303797468354, |
| "grad_norm": 0.2557971332829355, |
| "learning_rate": 7.98515471524042e-06, |
| "loss": 0.3067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13294486701488495, |
| "step": 3630, |
| "valid_targets_mean": 5826.9, |
| "valid_targets_min": 1621 |
| }, |
| { |
| "epoch": 3.679493670886076, |
| "grad_norm": 0.3421960754823531, |
| "learning_rate": 7.928740312506704e-06, |
| "loss": 0.3055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11804340779781342, |
| "step": 3635, |
| "valid_targets_mean": 3220.9, |
| "valid_targets_min": 1529 |
| }, |
| { |
| "epoch": 3.6845569620253165, |
| "grad_norm": 0.30370702242210657, |
| "learning_rate": 7.87247658885946e-06, |
| "loss": 0.2923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1813192367553711, |
| "step": 3640, |
| "valid_targets_mean": 5260.7, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 3.689620253164557, |
| "grad_norm": 0.3275936364034654, |
| "learning_rate": 7.816364246608688e-06, |
| "loss": 0.303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16349400579929352, |
| "step": 3645, |
| "valid_targets_mean": 4485.0, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 3.6946835443037975, |
| "grad_norm": 0.36264702848645247, |
| "learning_rate": 7.760403986174796e-06, |
| "loss": 0.3064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13801871240139008, |
| "step": 3650, |
| "valid_targets_mean": 3051.1, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 3.699746835443038, |
| "grad_norm": 0.2776099144093922, |
| "learning_rate": 7.70459650607981e-06, |
| "loss": 0.3086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1680225133895874, |
| "step": 3655, |
| "valid_targets_mean": 6631.8, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 3.7048101265822786, |
| "grad_norm": 0.34172337758905963, |
| "learning_rate": 7.648942502938705e-06, |
| "loss": 0.3048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16763363778591156, |
| "step": 3660, |
| "valid_targets_mean": 4061.8, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 3.709873417721519, |
| "grad_norm": 0.31939393718066644, |
| "learning_rate": 7.593442671450666e-06, |
| "loss": 0.2965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17321282625198364, |
| "step": 3665, |
| "valid_targets_mean": 4894.1, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 3.714936708860759, |
| "grad_norm": 0.32132553979600637, |
| "learning_rate": 7.5380977043904365e-06, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16710880398750305, |
| "step": 3670, |
| "valid_targets_mean": 4925.1, |
| "valid_targets_min": 1393 |
| }, |
| { |
| "epoch": 3.7199999999999998, |
| "grad_norm": 0.32445408393836617, |
| "learning_rate": 7.482908292599689e-06, |
| "loss": 0.3039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12341426312923431, |
| "step": 3675, |
| "valid_targets_mean": 3606.6, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 3.7250632911392403, |
| "grad_norm": 0.3064797642539383, |
| "learning_rate": 7.427875124978359e-06, |
| "loss": 0.2968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1298845112323761, |
| "step": 3680, |
| "valid_targets_mean": 4494.2, |
| "valid_targets_min": 1211 |
| }, |
| { |
| "epoch": 3.730126582278481, |
| "grad_norm": 0.2891043975748266, |
| "learning_rate": 7.372998888476091e-06, |
| "loss": 0.307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14520198106765747, |
| "step": 3685, |
| "valid_targets_mean": 4642.1, |
| "valid_targets_min": 1350 |
| }, |
| { |
| "epoch": 3.7351898734177214, |
| "grad_norm": 0.2986519000501888, |
| "learning_rate": 7.318280268083624e-06, |
| "loss": 0.3026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19568581879138947, |
| "step": 3690, |
| "valid_targets_mean": 5491.8, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 3.740253164556962, |
| "grad_norm": 0.32054148131031535, |
| "learning_rate": 7.263719946824264e-06, |
| "loss": 0.3001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12194908410310745, |
| "step": 3695, |
| "valid_targets_mean": 3993.2, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 3.7453164556962024, |
| "grad_norm": 0.29536657640379355, |
| "learning_rate": 7.209318605745368e-06, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14819620549678802, |
| "step": 3700, |
| "valid_targets_mean": 4433.9, |
| "valid_targets_min": 1426 |
| }, |
| { |
| "epoch": 3.750379746835443, |
| "grad_norm": 0.28146869288224746, |
| "learning_rate": 7.1550769239098e-06, |
| "loss": 0.2973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18099471926689148, |
| "step": 3705, |
| "valid_targets_mean": 7152.2, |
| "valid_targets_min": 1449 |
| }, |
| { |
| "epoch": 3.7554430379746835, |
| "grad_norm": 0.31596675118829165, |
| "learning_rate": 7.100995578387519e-06, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13141889870166779, |
| "step": 3710, |
| "valid_targets_mean": 3884.0, |
| "valid_targets_min": 1459 |
| }, |
| { |
| "epoch": 3.760506329113924, |
| "grad_norm": 0.31422332389376245, |
| "learning_rate": 7.047075244247061e-06, |
| "loss": 0.3058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1718595027923584, |
| "step": 3715, |
| "valid_targets_mean": 4909.5, |
| "valid_targets_min": 1774 |
| }, |
| { |
| "epoch": 3.7655696202531646, |
| "grad_norm": 0.3058451914869696, |
| "learning_rate": 6.993316594547148e-06, |
| "loss": 0.3043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12041142582893372, |
| "step": 3720, |
| "valid_targets_mean": 3857.4, |
| "valid_targets_min": 1341 |
| }, |
| { |
| "epoch": 3.770632911392405, |
| "grad_norm": 0.3285101705687896, |
| "learning_rate": 6.939720300328303e-06, |
| "loss": 0.3109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15424466133117676, |
| "step": 3725, |
| "valid_targets_mean": 4029.8, |
| "valid_targets_min": 1388 |
| }, |
| { |
| "epoch": 3.7756962025316456, |
| "grad_norm": 0.2852711508998474, |
| "learning_rate": 6.886287030604422e-06, |
| "loss": 0.2974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15062718093395233, |
| "step": 3730, |
| "valid_targets_mean": 5311.7, |
| "valid_targets_min": 1383 |
| }, |
| { |
| "epoch": 3.780759493670886, |
| "grad_norm": 0.32830150851392953, |
| "learning_rate": 6.83301745235448e-06, |
| "loss": 0.3073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1865895390510559, |
| "step": 3735, |
| "valid_targets_mean": 4781.8, |
| "valid_targets_min": 1034 |
| }, |
| { |
| "epoch": 3.7858227848101267, |
| "grad_norm": 0.33756549066729197, |
| "learning_rate": 6.779912230514161e-06, |
| "loss": 0.2807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12055318802595139, |
| "step": 3740, |
| "valid_targets_mean": 3463.3, |
| "valid_targets_min": 1599 |
| }, |
| { |
| "epoch": 3.790886075949367, |
| "grad_norm": 0.3152172059583756, |
| "learning_rate": 6.7269720279675755e-06, |
| "loss": 0.3027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17137764394283295, |
| "step": 3745, |
| "valid_targets_mean": 4888.2, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 3.7959493670886078, |
| "grad_norm": 0.3239318373383687, |
| "learning_rate": 6.674197505539006e-06, |
| "loss": 0.3045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14893168210983276, |
| "step": 3750, |
| "valid_targets_mean": 4158.4, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 3.8010126582278483, |
| "grad_norm": 0.2919220688770005, |
| "learning_rate": 6.621589321984611e-06, |
| "loss": 0.2953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14690950512886047, |
| "step": 3755, |
| "valid_targets_mean": 4748.6, |
| "valid_targets_min": 1607 |
| }, |
| { |
| "epoch": 3.806075949367089, |
| "grad_norm": 0.3025582373018823, |
| "learning_rate": 6.569148133984258e-06, |
| "loss": 0.2936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17515698075294495, |
| "step": 3760, |
| "valid_targets_mean": 5047.3, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 3.8111392405063294, |
| "grad_norm": 0.2952019372668243, |
| "learning_rate": 6.516874596133269e-06, |
| "loss": 0.2869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15086880326271057, |
| "step": 3765, |
| "valid_targets_mean": 5131.5, |
| "valid_targets_min": 1253 |
| }, |
| { |
| "epoch": 3.81620253164557, |
| "grad_norm": 0.29724809214492576, |
| "learning_rate": 6.464769360934306e-06, |
| "loss": 0.2927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19773977994918823, |
| "step": 3770, |
| "valid_targets_mean": 6146.5, |
| "valid_targets_min": 1366 |
| }, |
| { |
| "epoch": 3.82126582278481, |
| "grad_norm": 0.33270725662814826, |
| "learning_rate": 6.412833078789178e-06, |
| "loss": 0.3024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15699324011802673, |
| "step": 3775, |
| "valid_targets_mean": 4472.4, |
| "valid_targets_min": 1350 |
| }, |
| { |
| "epoch": 3.8263291139240505, |
| "grad_norm": 0.2963372278675901, |
| "learning_rate": 6.361066397990758e-06, |
| "loss": 0.2956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1388930231332779, |
| "step": 3780, |
| "valid_targets_mean": 4676.4, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 3.831392405063291, |
| "grad_norm": 0.2786191474125972, |
| "learning_rate": 6.309469964714863e-06, |
| "loss": 0.298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14243824779987335, |
| "step": 3785, |
| "valid_targets_mean": 4964.9, |
| "valid_targets_min": 1391 |
| }, |
| { |
| "epoch": 3.8364556962025316, |
| "grad_norm": 0.3057769621782611, |
| "learning_rate": 6.2580444230122175e-06, |
| "loss": 0.2824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1198386549949646, |
| "step": 3790, |
| "valid_targets_mean": 3840.2, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 3.841518987341772, |
| "grad_norm": 0.31205008704708975, |
| "learning_rate": 6.2067904148003764e-06, |
| "loss": 0.3096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17915937304496765, |
| "step": 3795, |
| "valid_targets_mean": 5550.8, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 3.8465822784810126, |
| "grad_norm": 0.3072712018089592, |
| "learning_rate": 6.155708579855759e-06, |
| "loss": 0.3163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15422801673412323, |
| "step": 3800, |
| "valid_targets_mean": 4714.1, |
| "valid_targets_min": 970 |
| }, |
| { |
| "epoch": 3.851645569620253, |
| "grad_norm": 0.3056625890719376, |
| "learning_rate": 6.104799555805607e-06, |
| "loss": 0.2963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10852354019880295, |
| "step": 3805, |
| "valid_targets_mean": 3481.8, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 3.8567088607594937, |
| "grad_norm": 0.33415927615785906, |
| "learning_rate": 6.054063978120093e-06, |
| "loss": 0.3035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16793662309646606, |
| "step": 3810, |
| "valid_targets_mean": 3962.6, |
| "valid_targets_min": 1458 |
| }, |
| { |
| "epoch": 3.8617721518987342, |
| "grad_norm": 0.2859437483451691, |
| "learning_rate": 6.00350248010431e-06, |
| "loss": 0.2964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11396883428096771, |
| "step": 3815, |
| "valid_targets_mean": 4421.5, |
| "valid_targets_min": 1527 |
| }, |
| { |
| "epoch": 3.8668354430379748, |
| "grad_norm": 0.32446773366076725, |
| "learning_rate": 5.95311569289045e-06, |
| "loss": 0.2976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14191418886184692, |
| "step": 3820, |
| "valid_targets_mean": 3904.6, |
| "valid_targets_min": 1346 |
| }, |
| { |
| "epoch": 3.8718987341772153, |
| "grad_norm": 0.33241644171629736, |
| "learning_rate": 5.902904245429852e-06, |
| "loss": 0.3066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15994411706924438, |
| "step": 3825, |
| "valid_targets_mean": 4205.2, |
| "valid_targets_min": 1211 |
| }, |
| { |
| "epoch": 3.876962025316456, |
| "grad_norm": 0.33295558620330956, |
| "learning_rate": 5.852868764485185e-06, |
| "loss": 0.2951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11764267832040787, |
| "step": 3830, |
| "valid_targets_mean": 3148.9, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 3.882025316455696, |
| "grad_norm": 0.3094377142586556, |
| "learning_rate": 5.803009874622645e-06, |
| "loss": 0.3014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13288931548595428, |
| "step": 3835, |
| "valid_targets_mean": 3723.9, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 3.8870886075949365, |
| "grad_norm": 0.28966742570043214, |
| "learning_rate": 5.753328198204107e-06, |
| "loss": 0.2827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14470314979553223, |
| "step": 3840, |
| "valid_targets_mean": 5011.6, |
| "valid_targets_min": 1536 |
| }, |
| { |
| "epoch": 3.892151898734177, |
| "grad_norm": 0.3556764011843303, |
| "learning_rate": 5.7038243553794105e-06, |
| "loss": 0.3098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15663528442382812, |
| "step": 3845, |
| "valid_targets_mean": 3704.3, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 3.8972151898734175, |
| "grad_norm": 0.4434641609697601, |
| "learning_rate": 5.654498964078578e-06, |
| "loss": 0.3071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15775218605995178, |
| "step": 3850, |
| "valid_targets_mean": 5224.2, |
| "valid_targets_min": 1008 |
| }, |
| { |
| "epoch": 3.902278481012658, |
| "grad_norm": 0.28354591909624743, |
| "learning_rate": 5.605352640004111e-06, |
| "loss": 0.2998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20830413699150085, |
| "step": 3855, |
| "valid_targets_mean": 6659.2, |
| "valid_targets_min": 1634 |
| }, |
| { |
| "epoch": 3.9073417721518986, |
| "grad_norm": 0.31278015955485905, |
| "learning_rate": 5.556385996623334e-06, |
| "loss": 0.3024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1927700638771057, |
| "step": 3860, |
| "valid_targets_mean": 6460.9, |
| "valid_targets_min": 1493 |
| }, |
| { |
| "epoch": 3.912405063291139, |
| "grad_norm": 0.3183546633710576, |
| "learning_rate": 5.507599645160688e-06, |
| "loss": 0.2956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14958074688911438, |
| "step": 3865, |
| "valid_targets_mean": 4336.2, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 3.9174683544303797, |
| "grad_norm": 0.2926146837393363, |
| "learning_rate": 5.45899419459015e-06, |
| "loss": 0.317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11325857788324356, |
| "step": 3870, |
| "valid_targets_mean": 3313.8, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 3.92253164556962, |
| "grad_norm": 0.2947057963950262, |
| "learning_rate": 5.410570251627587e-06, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1467699259519577, |
| "step": 3875, |
| "valid_targets_mean": 5764.1, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 3.9275949367088607, |
| "grad_norm": 0.29570913844534924, |
| "learning_rate": 5.362328420723208e-06, |
| "loss": 0.2956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14309361577033997, |
| "step": 3880, |
| "valid_targets_mean": 4847.8, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 3.9326582278481013, |
| "grad_norm": 0.3026281684204848, |
| "learning_rate": 5.314269304054029e-06, |
| "loss": 0.29, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19492954015731812, |
| "step": 3885, |
| "valid_targets_mean": 5634.2, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 3.937721518987342, |
| "grad_norm": 0.30964406158183067, |
| "learning_rate": 5.26639350151632e-06, |
| "loss": 0.3055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13411834836006165, |
| "step": 3890, |
| "valid_targets_mean": 4035.8, |
| "valid_targets_min": 1199 |
| }, |
| { |
| "epoch": 3.9427848101265823, |
| "grad_norm": 0.3111439221332038, |
| "learning_rate": 5.218701610718162e-06, |
| "loss": 0.3044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1787598729133606, |
| "step": 3895, |
| "valid_targets_mean": 5102.0, |
| "valid_targets_min": 1779 |
| }, |
| { |
| "epoch": 3.947848101265823, |
| "grad_norm": 0.256548917813654, |
| "learning_rate": 5.171194226971947e-06, |
| "loss": 0.3164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15520493686199188, |
| "step": 3900, |
| "valid_targets_mean": 5819.2, |
| "valid_targets_min": 913 |
| }, |
| { |
| "epoch": 3.9529113924050634, |
| "grad_norm": 0.35240271321787325, |
| "learning_rate": 5.12387194328696e-06, |
| "loss": 0.2864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.100287064909935, |
| "step": 3905, |
| "valid_targets_mean": 2803.6, |
| "valid_targets_min": 1229 |
| }, |
| { |
| "epoch": 3.957974683544304, |
| "grad_norm": 0.28051305016909855, |
| "learning_rate": 5.0767353503620055e-06, |
| "loss": 0.3012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11824625730514526, |
| "step": 3910, |
| "valid_targets_mean": 4403.1, |
| "valid_targets_min": 1454 |
| }, |
| { |
| "epoch": 3.9630379746835445, |
| "grad_norm": 0.33648253442313436, |
| "learning_rate": 5.029785036577976e-06, |
| "loss": 0.3047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12415116280317307, |
| "step": 3915, |
| "valid_targets_mean": 3484.4, |
| "valid_targets_min": 1290 |
| }, |
| { |
| "epoch": 3.968101265822785, |
| "grad_norm": 0.3051655834868841, |
| "learning_rate": 4.983021587990577e-06, |
| "loss": 0.2999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16038689017295837, |
| "step": 3920, |
| "valid_targets_mean": 4039.8, |
| "valid_targets_min": 1423 |
| }, |
| { |
| "epoch": 3.9731645569620255, |
| "grad_norm": 0.3149366075705648, |
| "learning_rate": 4.936445588322947e-06, |
| "loss": 0.2836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17041844129562378, |
| "step": 3925, |
| "valid_targets_mean": 4645.1, |
| "valid_targets_min": 1388 |
| }, |
| { |
| "epoch": 3.978227848101266, |
| "grad_norm": 0.3104948744129676, |
| "learning_rate": 4.890057618958406e-06, |
| "loss": 0.3008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13706716895103455, |
| "step": 3930, |
| "valid_targets_mean": 4148.2, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 3.9832911392405066, |
| "grad_norm": 0.4596385567964535, |
| "learning_rate": 4.843858258933207e-06, |
| "loss": 0.306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12977036833763123, |
| "step": 3935, |
| "valid_targets_mean": 4589.1, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 3.9883544303797467, |
| "grad_norm": 0.35205194291692793, |
| "learning_rate": 4.797848084929271e-06, |
| "loss": 0.2963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16180771589279175, |
| "step": 3940, |
| "valid_targets_mean": 4005.4, |
| "valid_targets_min": 1682 |
| }, |
| { |
| "epoch": 3.993417721518987, |
| "grad_norm": 0.3115344869207087, |
| "learning_rate": 4.7520276712670344e-06, |
| "loss": 0.3138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1245289221405983, |
| "step": 3945, |
| "valid_targets_mean": 3869.5, |
| "valid_targets_min": 1814 |
| }, |
| { |
| "epoch": 3.9984810126582278, |
| "grad_norm": 0.3447482808883552, |
| "learning_rate": 4.706397589898237e-06, |
| "loss": 0.2992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21260038018226624, |
| "step": 3950, |
| "valid_targets_mean": 4663.9, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 4.0030379746835445, |
| "grad_norm": 0.31704002367241657, |
| "learning_rate": 4.660958410398808e-06, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11520913243293762, |
| "step": 3955, |
| "valid_targets_mean": 3230.5, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 4.008101265822785, |
| "grad_norm": 0.3107759512067684, |
| "learning_rate": 4.61571069996176e-06, |
| "loss": 0.3067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15815721452236176, |
| "step": 3960, |
| "valid_targets_mean": 4538.7, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 4.013164556962026, |
| "grad_norm": 0.3240449542122713, |
| "learning_rate": 4.5706550233900825e-06, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1527724266052246, |
| "step": 3965, |
| "valid_targets_mean": 4152.1, |
| "valid_targets_min": 1278 |
| }, |
| { |
| "epoch": 4.018227848101266, |
| "grad_norm": 0.3371371879535488, |
| "learning_rate": 4.5257919430897305e-06, |
| "loss": 0.2919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14754730463027954, |
| "step": 3970, |
| "valid_targets_mean": 3785.3, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 4.023291139240507, |
| "grad_norm": 0.28767581366652223, |
| "learning_rate": 4.481122019062562e-06, |
| "loss": 0.2976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14282898604869843, |
| "step": 3975, |
| "valid_targets_mean": 4653.0, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 4.028354430379747, |
| "grad_norm": 0.29732809453534903, |
| "learning_rate": 4.436645808899374e-06, |
| "loss": 0.3062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18286307156085968, |
| "step": 3980, |
| "valid_targets_mean": 5864.7, |
| "valid_targets_min": 1531 |
| }, |
| { |
| "epoch": 4.033417721518988, |
| "grad_norm": 0.29104777332578374, |
| "learning_rate": 4.3923638677729506e-06, |
| "loss": 0.292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15134663879871368, |
| "step": 3985, |
| "valid_targets_mean": 5712.8, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 4.038481012658228, |
| "grad_norm": 0.34370328700294156, |
| "learning_rate": 4.348276748431095e-06, |
| "loss": 0.2889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16227614879608154, |
| "step": 3990, |
| "valid_targets_mean": 4682.2, |
| "valid_targets_min": 1365 |
| }, |
| { |
| "epoch": 4.043544303797469, |
| "grad_norm": 0.2853726249793705, |
| "learning_rate": 4.304385001189781e-06, |
| "loss": 0.292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15851733088493347, |
| "step": 3995, |
| "valid_targets_mean": 5396.8, |
| "valid_targets_min": 1278 |
| }, |
| { |
| "epoch": 4.048607594936709, |
| "grad_norm": 0.2664334385740433, |
| "learning_rate": 4.260689173926238e-06, |
| "loss": 0.3008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1690644472837448, |
| "step": 4000, |
| "valid_targets_mean": 6774.5, |
| "valid_targets_min": 1292 |
| }, |
| { |
| "epoch": 4.053670886075949, |
| "grad_norm": 0.27904233780454435, |
| "learning_rate": 4.217189812072131e-06, |
| "loss": 0.2918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13511596620082855, |
| "step": 4005, |
| "valid_targets_mean": 4486.5, |
| "valid_targets_min": 1562 |
| }, |
| { |
| "epoch": 4.0587341772151895, |
| "grad_norm": 0.3231775999779525, |
| "learning_rate": 4.173887458606767e-06, |
| "loss": 0.3074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11682070791721344, |
| "step": 4010, |
| "valid_targets_mean": 3668.7, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 4.06379746835443, |
| "grad_norm": 0.2770166025598625, |
| "learning_rate": 4.130782654050283e-06, |
| "loss": 0.3007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15404465794563293, |
| "step": 4015, |
| "valid_targets_mean": 5586.6, |
| "valid_targets_min": 1272 |
| }, |
| { |
| "epoch": 4.0688607594936705, |
| "grad_norm": 0.27479033637998745, |
| "learning_rate": 4.087875936456937e-06, |
| "loss": 0.2758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12938356399536133, |
| "step": 4020, |
| "valid_targets_mean": 5243.8, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 4.073924050632911, |
| "grad_norm": 0.31378983164450186, |
| "learning_rate": 4.045167841408359e-06, |
| "loss": 0.3017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15723198652267456, |
| "step": 4025, |
| "valid_targets_mean": 4392.6, |
| "valid_targets_min": 1232 |
| }, |
| { |
| "epoch": 4.078987341772152, |
| "grad_norm": 0.29002739575691505, |
| "learning_rate": 4.002658902006893e-06, |
| "loss": 0.2859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15544429421424866, |
| "step": 4030, |
| "valid_targets_mean": 5350.4, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 4.084050632911392, |
| "grad_norm": 0.3087847959185058, |
| "learning_rate": 3.9603496488689174e-06, |
| "loss": 0.2968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16527938842773438, |
| "step": 4035, |
| "valid_targets_mean": 5526.1, |
| "valid_targets_min": 1129 |
| }, |
| { |
| "epoch": 4.089113924050633, |
| "grad_norm": 0.3085791674780826, |
| "learning_rate": 3.918240610118234e-06, |
| "loss": 0.2936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1917693018913269, |
| "step": 4040, |
| "valid_targets_mean": 6275.9, |
| "valid_targets_min": 1748 |
| }, |
| { |
| "epoch": 4.094177215189873, |
| "grad_norm": 0.286080067957159, |
| "learning_rate": 3.876332311379489e-06, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1519317775964737, |
| "step": 4045, |
| "valid_targets_mean": 5526.4, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 4.099240506329114, |
| "grad_norm": 0.2837484355272842, |
| "learning_rate": 3.834625275771582e-06, |
| "loss": 0.2926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.123206228017807, |
| "step": 4050, |
| "valid_targets_mean": 4113.7, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 4.104303797468354, |
| "grad_norm": 0.2999251731420047, |
| "learning_rate": 3.7931200239011643e-06, |
| "loss": 0.2945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13318127393722534, |
| "step": 4055, |
| "valid_targets_mean": 4568.8, |
| "valid_targets_min": 1236 |
| }, |
| { |
| "epoch": 4.109367088607595, |
| "grad_norm": 0.2816382941308749, |
| "learning_rate": 3.7518170738561168e-06, |
| "loss": 0.2923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14610666036605835, |
| "step": 4060, |
| "valid_targets_mean": 4928.9, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 4.114430379746835, |
| "grad_norm": 0.32554297974189644, |
| "learning_rate": 3.7107169411991127e-06, |
| "loss": 0.3074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12090884894132614, |
| "step": 4065, |
| "valid_targets_mean": 3398.6, |
| "valid_targets_min": 1385 |
| }, |
| { |
| "epoch": 4.119493670886076, |
| "grad_norm": 0.3170024428197897, |
| "learning_rate": 3.6698201389611423e-06, |
| "loss": 0.2839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13328410685062408, |
| "step": 4070, |
| "valid_targets_mean": 4025.0, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 4.124556962025316, |
| "grad_norm": 0.3205485924763668, |
| "learning_rate": 3.62912717763515e-06, |
| "loss": 0.3124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21576707065105438, |
| "step": 4075, |
| "valid_targets_mean": 6120.9, |
| "valid_targets_min": 1421 |
| }, |
| { |
| "epoch": 4.129620253164557, |
| "grad_norm": 0.38654381765739637, |
| "learning_rate": 3.5886385651696267e-06, |
| "loss": 0.287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14297889173030853, |
| "step": 4080, |
| "valid_targets_mean": 4917.6, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 4.1346835443037975, |
| "grad_norm": 0.3524477589713149, |
| "learning_rate": 3.5483548069623043e-06, |
| "loss": 0.3032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14278902113437653, |
| "step": 4085, |
| "valid_targets_mean": 3844.8, |
| "valid_targets_min": 1260 |
| }, |
| { |
| "epoch": 4.139746835443038, |
| "grad_norm": 0.3197809913122213, |
| "learning_rate": 3.5082764058538056e-06, |
| "loss": 0.2891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12523522973060608, |
| "step": 4090, |
| "valid_targets_mean": 3690.5, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 4.1448101265822785, |
| "grad_norm": 0.30886469526940097, |
| "learning_rate": 3.4684038621214124e-06, |
| "loss": 0.2829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16583015024662018, |
| "step": 4095, |
| "valid_targets_mean": 5001.4, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 4.149873417721519, |
| "grad_norm": 0.28226754473975985, |
| "learning_rate": 3.4287376734727817e-06, |
| "loss": 0.2931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16582466661930084, |
| "step": 4100, |
| "valid_targets_mean": 5544.1, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 4.15493670886076, |
| "grad_norm": 0.3051843817153008, |
| "learning_rate": 3.3892783350397675e-06, |
| "loss": 0.2876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11235642433166504, |
| "step": 4105, |
| "valid_targets_mean": 3728.7, |
| "valid_targets_min": 1019 |
| }, |
| { |
| "epoch": 4.16, |
| "grad_norm": 0.28561421446674784, |
| "learning_rate": 3.3500263393722033e-06, |
| "loss": 0.2821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14730824530124664, |
| "step": 4110, |
| "valid_targets_mean": 5325.3, |
| "valid_targets_min": 1247 |
| }, |
| { |
| "epoch": 4.165063291139241, |
| "grad_norm": 0.3396963845435047, |
| "learning_rate": 3.310982176431785e-06, |
| "loss": 0.285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1362554281949997, |
| "step": 4115, |
| "valid_targets_mean": 4046.4, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 4.170126582278481, |
| "grad_norm": 0.3604026125994517, |
| "learning_rate": 3.2721463335859484e-06, |
| "loss": 0.2991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12034134566783905, |
| "step": 4120, |
| "valid_targets_mean": 2845.9, |
| "valid_targets_min": 1453 |
| }, |
| { |
| "epoch": 4.175189873417722, |
| "grad_norm": 0.3047812123169994, |
| "learning_rate": 3.2335192956017634e-06, |
| "loss": 0.2972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1503809243440628, |
| "step": 4125, |
| "valid_targets_mean": 4877.8, |
| "valid_targets_min": 1783 |
| }, |
| { |
| "epoch": 4.180253164556962, |
| "grad_norm": 0.36835014889244666, |
| "learning_rate": 3.1951015446399247e-06, |
| "loss": 0.2942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11517144739627838, |
| "step": 4130, |
| "valid_targets_mean": 2904.6, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 4.185316455696203, |
| "grad_norm": 0.32918669737266704, |
| "learning_rate": 3.156893560248688e-06, |
| "loss": 0.3031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.140342578291893, |
| "step": 4135, |
| "valid_targets_mean": 4083.8, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 4.190379746835443, |
| "grad_norm": 0.33957836205604514, |
| "learning_rate": 3.118895819357908e-06, |
| "loss": 0.2808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1507326364517212, |
| "step": 4140, |
| "valid_targets_mean": 4652.1, |
| "valid_targets_min": 1298 |
| }, |
| { |
| "epoch": 4.195443037974684, |
| "grad_norm": 0.285494983139607, |
| "learning_rate": 3.081108796273098e-06, |
| "loss": 0.301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12487950921058655, |
| "step": 4145, |
| "valid_targets_mean": 4737.4, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 4.200506329113924, |
| "grad_norm": 0.32355832904009185, |
| "learning_rate": 3.0435329626694733e-06, |
| "loss": 0.3044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18284101784229279, |
| "step": 4150, |
| "valid_targets_mean": 4946.2, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 4.205569620253165, |
| "grad_norm": 0.2901811873935047, |
| "learning_rate": 3.006168787586097e-06, |
| "loss": 0.2793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13859279453754425, |
| "step": 4155, |
| "valid_targets_mean": 5316.1, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 4.2106329113924055, |
| "grad_norm": 0.5190123284320625, |
| "learning_rate": 2.9690167374200075e-06, |
| "loss": 0.2972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1444871723651886, |
| "step": 4160, |
| "valid_targets_mean": 4388.6, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 4.215696202531646, |
| "grad_norm": 0.31722642981901594, |
| "learning_rate": 2.9320772759203975e-06, |
| "loss": 0.2988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13206876814365387, |
| "step": 4165, |
| "valid_targets_mean": 4130.3, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 4.220759493670886, |
| "grad_norm": 0.30916942149206356, |
| "learning_rate": 2.8953508641828375e-06, |
| "loss": 0.3024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1427369862794876, |
| "step": 4170, |
| "valid_targets_mean": 4538.5, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 4.225822784810126, |
| "grad_norm": 0.3075492109138346, |
| "learning_rate": 2.858837960643499e-06, |
| "loss": 0.3005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17169958353042603, |
| "step": 4175, |
| "valid_targets_mean": 4840.8, |
| "valid_targets_min": 1296 |
| }, |
| { |
| "epoch": 4.230886075949367, |
| "grad_norm": 0.29933826061321767, |
| "learning_rate": 2.822539021073463e-06, |
| "loss": 0.3067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16137537360191345, |
| "step": 4180, |
| "valid_targets_mean": 5634.3, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 4.235949367088607, |
| "grad_norm": 0.29690888264127147, |
| "learning_rate": 2.786454498572997e-06, |
| "loss": 0.2857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.135961651802063, |
| "step": 4185, |
| "valid_targets_mean": 4399.6, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 4.241012658227848, |
| "grad_norm": 0.3246955608047686, |
| "learning_rate": 2.7505848435659156e-06, |
| "loss": 0.3044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1551479548215866, |
| "step": 4190, |
| "valid_targets_mean": 4534.1, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 4.246075949367088, |
| "grad_norm": 0.29829478040788515, |
| "learning_rate": 2.7149305037939687e-06, |
| "loss": 0.2932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18227550387382507, |
| "step": 4195, |
| "valid_targets_mean": 5650.3, |
| "valid_targets_min": 1359 |
| }, |
| { |
| "epoch": 4.251139240506329, |
| "grad_norm": 0.3491396172417171, |
| "learning_rate": 2.679491924311226e-06, |
| "loss": 0.2841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13989317417144775, |
| "step": 4200, |
| "valid_targets_mean": 3527.8, |
| "valid_targets_min": 1094 |
| }, |
| { |
| "epoch": 4.256202531645569, |
| "grad_norm": 0.3062465471975927, |
| "learning_rate": 2.644269547478555e-06, |
| "loss": 0.304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16212749481201172, |
| "step": 4205, |
| "valid_targets_mean": 4856.2, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 4.26126582278481, |
| "grad_norm": 0.31154484975672075, |
| "learning_rate": 2.609263812958065e-06, |
| "loss": 0.2934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10032152384519577, |
| "step": 4210, |
| "valid_targets_mean": 3391.6, |
| "valid_targets_min": 1245 |
| }, |
| { |
| "epoch": 4.2663291139240505, |
| "grad_norm": 0.3276187265653155, |
| "learning_rate": 2.5744751577076343e-06, |
| "loss": 0.2924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16798563301563263, |
| "step": 4215, |
| "valid_targets_mean": 4301.5, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 4.271392405063291, |
| "grad_norm": 0.31771678562930245, |
| "learning_rate": 2.539904015975476e-06, |
| "loss": 0.2932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14239826798439026, |
| "step": 4220, |
| "valid_targets_mean": 4702.1, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 4.2764556962025315, |
| "grad_norm": 0.2979983224769533, |
| "learning_rate": 2.5055508192946732e-06, |
| "loss": 0.3026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15499252080917358, |
| "step": 4225, |
| "valid_targets_mean": 4931.4, |
| "valid_targets_min": 1420 |
| }, |
| { |
| "epoch": 4.281518987341772, |
| "grad_norm": 0.3378145372579719, |
| "learning_rate": 2.4714159964778394e-06, |
| "loss": 0.2766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15219071507453918, |
| "step": 4230, |
| "valid_targets_mean": 4131.9, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 4.286582278481013, |
| "grad_norm": 0.3132928788106069, |
| "learning_rate": 2.437499973611728e-06, |
| "loss": 0.2861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17868193984031677, |
| "step": 4235, |
| "valid_targets_mean": 5772.8, |
| "valid_targets_min": 1773 |
| }, |
| { |
| "epoch": 4.291645569620253, |
| "grad_norm": 0.3049108704834252, |
| "learning_rate": 2.403803174051933e-06, |
| "loss": 0.2997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17676058411598206, |
| "step": 4240, |
| "valid_targets_mean": 5360.8, |
| "valid_targets_min": 1400 |
| }, |
| { |
| "epoch": 4.296708860759494, |
| "grad_norm": 0.2674881690807918, |
| "learning_rate": 2.3703260184176103e-06, |
| "loss": 0.2849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11438636481761932, |
| "step": 4245, |
| "valid_targets_mean": 4663.1, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 4.301772151898734, |
| "grad_norm": 0.3381875004506121, |
| "learning_rate": 2.337068924586203e-06, |
| "loss": 0.3034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14016669988632202, |
| "step": 4250, |
| "valid_targets_mean": 3257.6, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 4.306835443037975, |
| "grad_norm": 0.33566799216440724, |
| "learning_rate": 2.3040323076882578e-06, |
| "loss": 0.2852, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1721951961517334, |
| "step": 4255, |
| "valid_targets_mean": 4602.8, |
| "valid_targets_min": 1312 |
| }, |
| { |
| "epoch": 4.311898734177215, |
| "grad_norm": 0.39194447138918637, |
| "learning_rate": 2.2712165801022046e-06, |
| "loss": 0.2997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1366182416677475, |
| "step": 4260, |
| "valid_targets_mean": 2721.6, |
| "valid_targets_min": 913 |
| }, |
| { |
| "epoch": 4.316962025316456, |
| "grad_norm": 0.3637100172839474, |
| "learning_rate": 2.2386221514492502e-06, |
| "loss": 0.2911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11843443661928177, |
| "step": 4265, |
| "valid_targets_mean": 3167.0, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 4.322025316455696, |
| "grad_norm": 0.32727869850436964, |
| "learning_rate": 2.2062494285882363e-06, |
| "loss": 0.3013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1746322512626648, |
| "step": 4270, |
| "valid_targets_mean": 4557.8, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 4.327088607594937, |
| "grad_norm": 0.35219909889872136, |
| "learning_rate": 2.1740988156105593e-06, |
| "loss": 0.2937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08915197849273682, |
| "step": 4275, |
| "valid_targets_mean": 2497.8, |
| "valid_targets_min": 1172 |
| }, |
| { |
| "epoch": 4.332151898734177, |
| "grad_norm": 0.3312024847124787, |
| "learning_rate": 2.142170713835161e-06, |
| "loss": 0.2925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16628465056419373, |
| "step": 4280, |
| "valid_targets_mean": 4481.7, |
| "valid_targets_min": 1417 |
| }, |
| { |
| "epoch": 4.337215189873418, |
| "grad_norm": 0.26123810507474954, |
| "learning_rate": 2.1104655218034685e-06, |
| "loss": 0.2875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.136556938290596, |
| "step": 4285, |
| "valid_targets_mean": 5086.1, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 4.3422784810126585, |
| "grad_norm": 0.28913080019288895, |
| "learning_rate": 2.0789836352744653e-06, |
| "loss": 0.3025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1929275244474411, |
| "step": 4290, |
| "valid_targets_mean": 6718.0, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 4.347341772151899, |
| "grad_norm": 0.2856092567973034, |
| "learning_rate": 2.0477254472197237e-06, |
| "loss": 0.2857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12290873378515244, |
| "step": 4295, |
| "valid_targets_mean": 4296.3, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 4.3524050632911395, |
| "grad_norm": 0.376756316497093, |
| "learning_rate": 2.0166913478185004e-06, |
| "loss": 0.2969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1333305984735489, |
| "step": 4300, |
| "valid_targets_mean": 4643.4, |
| "valid_targets_min": 1007 |
| }, |
| { |
| "epoch": 4.35746835443038, |
| "grad_norm": 0.37269967571373286, |
| "learning_rate": 1.9858817244528896e-06, |
| "loss": 0.2771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16167780756950378, |
| "step": 4305, |
| "valid_targets_mean": 3327.0, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 4.362531645569621, |
| "grad_norm": 0.36507367284654024, |
| "learning_rate": 1.955296961702955e-06, |
| "loss": 0.2891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1149420514702797, |
| "step": 4310, |
| "valid_targets_mean": 3484.9, |
| "valid_targets_min": 1218 |
| }, |
| { |
| "epoch": 4.367594936708861, |
| "grad_norm": 0.3549138995526032, |
| "learning_rate": 1.9249374413419584e-06, |
| "loss": 0.3209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16552500426769257, |
| "step": 4315, |
| "valid_targets_mean": 4319.2, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 4.372658227848102, |
| "grad_norm": 0.30961509363434114, |
| "learning_rate": 1.894803542331567e-06, |
| "loss": 0.2936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12911680340766907, |
| "step": 4320, |
| "valid_targets_mean": 3623.0, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 4.377721518987342, |
| "grad_norm": 0.30219606387390835, |
| "learning_rate": 1.8648956408171547e-06, |
| "loss": 0.2973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1574065387248993, |
| "step": 4325, |
| "valid_targets_mean": 4955.6, |
| "valid_targets_min": 1679 |
| }, |
| { |
| "epoch": 4.382784810126582, |
| "grad_norm": 0.3279169523694041, |
| "learning_rate": 1.8352141101230758e-06, |
| "loss": 0.2983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1483180820941925, |
| "step": 4330, |
| "valid_targets_mean": 3969.1, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 4.387848101265822, |
| "grad_norm": 0.3105228186529775, |
| "learning_rate": 1.8057593207480194e-06, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11923258006572723, |
| "step": 4335, |
| "valid_targets_mean": 3387.1, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 4.392911392405063, |
| "grad_norm": 0.33881080054396395, |
| "learning_rate": 1.7765316403603927e-06, |
| "loss": 0.2916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13051745295524597, |
| "step": 4340, |
| "valid_targets_mean": 3938.3, |
| "valid_targets_min": 1204 |
| }, |
| { |
| "epoch": 4.397974683544303, |
| "grad_norm": 0.2859920210081916, |
| "learning_rate": 1.7475314337937099e-06, |
| "loss": 0.2971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14054298400878906, |
| "step": 4345, |
| "valid_targets_mean": 4863.8, |
| "valid_targets_min": 1288 |
| }, |
| { |
| "epoch": 4.403037974683544, |
| "grad_norm": 0.3222088763676915, |
| "learning_rate": 1.7187590630420681e-06, |
| "loss": 0.2911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15554268658161163, |
| "step": 4350, |
| "valid_targets_mean": 3944.6, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 4.4081012658227845, |
| "grad_norm": 0.32147293328088156, |
| "learning_rate": 1.6902148872555924e-06, |
| "loss": 0.2983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13429546356201172, |
| "step": 4355, |
| "valid_targets_mean": 3537.0, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 4.413164556962025, |
| "grad_norm": 0.2873112295172894, |
| "learning_rate": 1.661899262735991e-06, |
| "loss": 0.2809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11225029826164246, |
| "step": 4360, |
| "valid_targets_mean": 3726.2, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 4.418227848101266, |
| "grad_norm": 0.3137420905534193, |
| "learning_rate": 1.6338125429320694e-06, |
| "loss": 0.3025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1628667116165161, |
| "step": 4365, |
| "valid_targets_mean": 4489.4, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 4.423291139240506, |
| "grad_norm": 0.2980697010922971, |
| "learning_rate": 1.605955078435355e-06, |
| "loss": 0.2861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1740245670080185, |
| "step": 4370, |
| "valid_targets_mean": 5941.4, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 4.428354430379747, |
| "grad_norm": 0.29655956780164205, |
| "learning_rate": 1.5783272169756903e-06, |
| "loss": 0.2888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12947620451450348, |
| "step": 4375, |
| "valid_targets_mean": 4607.8, |
| "valid_targets_min": 1670 |
| }, |
| { |
| "epoch": 4.433417721518987, |
| "grad_norm": 0.28159919536576594, |
| "learning_rate": 1.550929303416917e-06, |
| "loss": 0.2891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11871195584535599, |
| "step": 4380, |
| "valid_targets_mean": 4622.2, |
| "valid_targets_min": 1319 |
| }, |
| { |
| "epoch": 4.438481012658228, |
| "grad_norm": 0.3159849176088272, |
| "learning_rate": 1.5237616797525512e-06, |
| "loss": 0.2964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13893471658229828, |
| "step": 4385, |
| "valid_targets_mean": 4139.4, |
| "valid_targets_min": 1377 |
| }, |
| { |
| "epoch": 4.443544303797468, |
| "grad_norm": 0.3103371076544768, |
| "learning_rate": 1.49682468510153e-06, |
| "loss": 0.292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17314529418945312, |
| "step": 4390, |
| "valid_targets_mean": 5825.6, |
| "valid_targets_min": 1000 |
| }, |
| { |
| "epoch": 4.448607594936709, |
| "grad_norm": 0.28729653443614084, |
| "learning_rate": 1.4701186557039648e-06, |
| "loss": 0.2844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13900840282440186, |
| "step": 4395, |
| "valid_targets_mean": 4918.3, |
| "valid_targets_min": 1337 |
| }, |
| { |
| "epoch": 4.453670886075949, |
| "grad_norm": 0.3411738428471954, |
| "learning_rate": 1.4436439249169554e-06, |
| "loss": 0.3038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13948732614517212, |
| "step": 4400, |
| "valid_targets_mean": 5576.6, |
| "valid_targets_min": 1142 |
| }, |
| { |
| "epoch": 4.45873417721519, |
| "grad_norm": 0.3118105881962252, |
| "learning_rate": 1.4174008232104285e-06, |
| "loss": 0.2997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13870777189731598, |
| "step": 4405, |
| "valid_targets_mean": 4355.1, |
| "valid_targets_min": 1522 |
| }, |
| { |
| "epoch": 4.46379746835443, |
| "grad_norm": 0.32978343142383926, |
| "learning_rate": 1.3913896781629954e-06, |
| "loss": 0.2975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13087686896324158, |
| "step": 4410, |
| "valid_targets_mean": 3731.3, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 4.468860759493671, |
| "grad_norm": 0.2618923931315447, |
| "learning_rate": 1.3656108144578962e-06, |
| "loss": 0.2879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13182973861694336, |
| "step": 4415, |
| "valid_targets_mean": 4776.1, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 4.473924050632911, |
| "grad_norm": 0.27864898068700833, |
| "learning_rate": 1.340064553878908e-06, |
| "loss": 0.2865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14037862420082092, |
| "step": 4420, |
| "valid_targets_mean": 5322.2, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 4.478987341772152, |
| "grad_norm": 0.2935646123466447, |
| "learning_rate": 1.3147512153063558e-06, |
| "loss": 0.2848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18074341118335724, |
| "step": 4425, |
| "valid_targets_mean": 6079.2, |
| "valid_targets_min": 1329 |
| }, |
| { |
| "epoch": 4.4840506329113925, |
| "grad_norm": 0.34486016144946086, |
| "learning_rate": 1.289671114713129e-06, |
| "loss": 0.2996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1330321580171585, |
| "step": 4430, |
| "valid_targets_mean": 3942.1, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 4.489113924050633, |
| "grad_norm": 0.3344555372523651, |
| "learning_rate": 1.264824565160716e-06, |
| "loss": 0.2802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1601177453994751, |
| "step": 4435, |
| "valid_targets_mean": 5832.6, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 4.494177215189874, |
| "grad_norm": 0.31338693723543865, |
| "learning_rate": 1.2402118767953342e-06, |
| "loss": 0.2851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11089809238910675, |
| "step": 4440, |
| "valid_targets_mean": 3433.5, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 4.499240506329114, |
| "grad_norm": 0.32257737557743127, |
| "learning_rate": 1.2158333568440183e-06, |
| "loss": 0.2943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19272515177726746, |
| "step": 4445, |
| "valid_targets_mean": 5173.0, |
| "valid_targets_min": 1505 |
| }, |
| { |
| "epoch": 4.504303797468355, |
| "grad_norm": 0.31362483355013254, |
| "learning_rate": 1.1916893096108063e-06, |
| "loss": 0.2946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1500798463821411, |
| "step": 4450, |
| "valid_targets_mean": 4663.4, |
| "valid_targets_min": 1370 |
| }, |
| { |
| "epoch": 4.509367088607595, |
| "grad_norm": 0.3261715632472016, |
| "learning_rate": 1.167780036472952e-06, |
| "loss": 0.2959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13341718912124634, |
| "step": 4455, |
| "valid_targets_mean": 3426.2, |
| "valid_targets_min": 1364 |
| }, |
| { |
| "epoch": 4.514430379746836, |
| "grad_norm": 0.30597584635072983, |
| "learning_rate": 1.1441058358771317e-06, |
| "loss": 0.2888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16293524205684662, |
| "step": 4460, |
| "valid_targets_mean": 4787.8, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 4.519493670886076, |
| "grad_norm": 0.2817037355554941, |
| "learning_rate": 1.1206670033357537e-06, |
| "loss": 0.2906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15130957961082458, |
| "step": 4465, |
| "valid_targets_mean": 5285.4, |
| "valid_targets_min": 1543 |
| }, |
| { |
| "epoch": 4.524556962025317, |
| "grad_norm": 0.31694092622996994, |
| "learning_rate": 1.0974638314232355e-06, |
| "loss": 0.2894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15193693339824677, |
| "step": 4470, |
| "valid_targets_mean": 4457.0, |
| "valid_targets_min": 1065 |
| }, |
| { |
| "epoch": 4.529620253164557, |
| "grad_norm": 0.3521199068866329, |
| "learning_rate": 1.074496609772384e-06, |
| "loss": 0.2957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12703898549079895, |
| "step": 4475, |
| "valid_targets_mean": 3699.0, |
| "valid_targets_min": 1328 |
| }, |
| { |
| "epoch": 4.534683544303798, |
| "grad_norm": 0.33021283919153493, |
| "learning_rate": 1.0517656250707575e-06, |
| "loss": 0.2989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17758193612098694, |
| "step": 4480, |
| "valid_targets_mean": 5269.1, |
| "valid_targets_min": 1336 |
| }, |
| { |
| "epoch": 4.539746835443038, |
| "grad_norm": 0.29305233423571464, |
| "learning_rate": 1.0292711610570904e-06, |
| "loss": 0.2799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17428819835186005, |
| "step": 4485, |
| "valid_targets_mean": 6173.5, |
| "valid_targets_min": 1377 |
| }, |
| { |
| "epoch": 4.544810126582279, |
| "grad_norm": 0.28819969743794543, |
| "learning_rate": 1.007013498517766e-06, |
| "loss": 0.2909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11772993206977844, |
| "step": 4490, |
| "valid_targets_mean": 4622.6, |
| "valid_targets_min": 1404 |
| }, |
| { |
| "epoch": 4.549873417721519, |
| "grad_norm": 0.28436809731542273, |
| "learning_rate": 9.849929152832937e-07, |
| "loss": 0.2917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1377575397491455, |
| "step": 4495, |
| "valid_targets_mean": 4425.2, |
| "valid_targets_min": 1292 |
| }, |
| { |
| "epoch": 4.55493670886076, |
| "grad_norm": 0.3150381879092353, |
| "learning_rate": 9.63209686224853e-07, |
| "loss": 0.293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13312697410583496, |
| "step": 4500, |
| "valid_targets_mean": 3467.1, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 4.5600000000000005, |
| "grad_norm": 0.2911980506543601, |
| "learning_rate": 9.416640832508572e-07, |
| "loss": 0.2899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16458618640899658, |
| "step": 4505, |
| "valid_targets_mean": 5330.3, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 4.56506329113924, |
| "grad_norm": 0.32761330476726724, |
| "learning_rate": 9.203563753035527e-07, |
| "loss": 0.3005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15134479105472565, |
| "step": 4510, |
| "valid_targets_mean": 4789.5, |
| "valid_targets_min": 1240 |
| }, |
| { |
| "epoch": 4.570126582278481, |
| "grad_norm": 0.27610230646497064, |
| "learning_rate": 8.992868283556833e-07, |
| "loss": 0.3023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14713215827941895, |
| "step": 4515, |
| "valid_targets_mean": 5446.5, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 4.575189873417721, |
| "grad_norm": 0.33737396503280603, |
| "learning_rate": 8.78455705407144e-07, |
| "loss": 0.2892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15195101499557495, |
| "step": 4520, |
| "valid_targets_mean": 4126.9, |
| "valid_targets_min": 866 |
| }, |
| { |
| "epoch": 4.580253164556962, |
| "grad_norm": 0.421939799277528, |
| "learning_rate": 8.578632664817177e-07, |
| "loss": 0.2998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15855969488620758, |
| "step": 4525, |
| "valid_targets_mean": 4059.2, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 4.585316455696202, |
| "grad_norm": 0.30679616072425525, |
| "learning_rate": 8.375097686238187e-07, |
| "loss": 0.3003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15983693301677704, |
| "step": 4530, |
| "valid_targets_mean": 4688.2, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 4.590379746835443, |
| "grad_norm": 0.33783626379593873, |
| "learning_rate": 8.173954658952854e-07, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13029304146766663, |
| "step": 4535, |
| "valid_targets_mean": 3584.9, |
| "valid_targets_min": 1132 |
| }, |
| { |
| "epoch": 4.595443037974683, |
| "grad_norm": 0.409725960177412, |
| "learning_rate": 7.975206093722176e-07, |
| "loss": 0.3019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1639317274093628, |
| "step": 4540, |
| "valid_targets_mean": 4393.8, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 4.600506329113924, |
| "grad_norm": 0.34883872064169896, |
| "learning_rate": 7.778854471418306e-07, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1438419073820114, |
| "step": 4545, |
| "valid_targets_mean": 3598.3, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 4.605569620253164, |
| "grad_norm": 0.3163445155831429, |
| "learning_rate": 7.584902242993708e-07, |
| "loss": 0.2991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19004172086715698, |
| "step": 4550, |
| "valid_targets_mean": 5218.9, |
| "valid_targets_min": 1337 |
| }, |
| { |
| "epoch": 4.610632911392405, |
| "grad_norm": 0.28908020066387696, |
| "learning_rate": 7.393351829450379e-07, |
| "loss": 0.3023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12715786695480347, |
| "step": 4555, |
| "valid_targets_mean": 4291.9, |
| "valid_targets_min": 1068 |
| }, |
| { |
| "epoch": 4.6156962025316455, |
| "grad_norm": 0.3390758182489428, |
| "learning_rate": 7.204205621809813e-07, |
| "loss": 0.3018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16513592004776, |
| "step": 4560, |
| "valid_targets_mean": 4141.6, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 4.620759493670886, |
| "grad_norm": 0.3707332505274512, |
| "learning_rate": 7.017465981083127e-07, |
| "loss": 0.3019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18795087933540344, |
| "step": 4565, |
| "valid_targets_mean": 6154.2, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 4.6258227848101265, |
| "grad_norm": 0.3431279755640469, |
| "learning_rate": 6.833135238241473e-07, |
| "loss": 0.2955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1402522623538971, |
| "step": 4570, |
| "valid_targets_mean": 3705.2, |
| "valid_targets_min": 1346 |
| }, |
| { |
| "epoch": 4.630886075949367, |
| "grad_norm": 0.3201150073208208, |
| "learning_rate": 6.651215694187074e-07, |
| "loss": 0.2956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13963478803634644, |
| "step": 4575, |
| "valid_targets_mean": 4570.6, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 4.635949367088608, |
| "grad_norm": 0.32083737479519586, |
| "learning_rate": 6.471709619724386e-07, |
| "loss": 0.2811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1721346378326416, |
| "step": 4580, |
| "valid_targets_mean": 4410.9, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 4.641012658227848, |
| "grad_norm": 0.3413968428656355, |
| "learning_rate": 6.294619255531853e-07, |
| "loss": 0.2984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1746809184551239, |
| "step": 4585, |
| "valid_targets_mean": 4543.4, |
| "valid_targets_min": 1503 |
| }, |
| { |
| "epoch": 4.646075949367089, |
| "grad_norm": 0.2984905883347286, |
| "learning_rate": 6.119946812133926e-07, |
| "loss": 0.2957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2020062506198883, |
| "step": 4590, |
| "valid_targets_mean": 7061.8, |
| "valid_targets_min": 1615 |
| }, |
| { |
| "epoch": 4.651139240506329, |
| "grad_norm": 0.2957015403668056, |
| "learning_rate": 5.947694469873377e-07, |
| "loss": 0.3024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1912672221660614, |
| "step": 4595, |
| "valid_targets_mean": 6352.6, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 4.65620253164557, |
| "grad_norm": 0.3177142897029759, |
| "learning_rate": 5.777864378884212e-07, |
| "loss": 0.2905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1385997235774994, |
| "step": 4600, |
| "valid_targets_mean": 4380.5, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 4.66126582278481, |
| "grad_norm": 0.30671392692985, |
| "learning_rate": 5.610458659064688e-07, |
| "loss": 0.3067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17495407164096832, |
| "step": 4605, |
| "valid_targets_mean": 5155.4, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 4.666329113924051, |
| "grad_norm": 0.32460623503028924, |
| "learning_rate": 5.445479400051046e-07, |
| "loss": 0.2997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1435496062040329, |
| "step": 4610, |
| "valid_targets_mean": 4002.2, |
| "valid_targets_min": 1103 |
| }, |
| { |
| "epoch": 4.671392405063291, |
| "grad_norm": 0.3077758754022733, |
| "learning_rate": 5.282928661191178e-07, |
| "loss": 0.283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11725576967000961, |
| "step": 4615, |
| "valid_targets_mean": 3599.3, |
| "valid_targets_min": 1270 |
| }, |
| { |
| "epoch": 4.676455696202532, |
| "grad_norm": 0.2920943225927082, |
| "learning_rate": 5.12280847151918e-07, |
| "loss": 0.2933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15268352627754211, |
| "step": 4620, |
| "valid_targets_mean": 4974.8, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 4.681518987341772, |
| "grad_norm": 0.3310902814879114, |
| "learning_rate": 4.965120829729819e-07, |
| "loss": 0.2944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1577180027961731, |
| "step": 4625, |
| "valid_targets_mean": 4892.1, |
| "valid_targets_min": 1480 |
| }, |
| { |
| "epoch": 4.686582278481013, |
| "grad_norm": 0.3364738036743787, |
| "learning_rate": 4.809867704153726e-07, |
| "loss": 0.2962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11956533789634705, |
| "step": 4630, |
| "valid_targets_mean": 3546.2, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 4.6916455696202535, |
| "grad_norm": 0.34774374236202665, |
| "learning_rate": 4.657051032732707e-07, |
| "loss": 0.3098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14325565099716187, |
| "step": 4635, |
| "valid_targets_mean": 3353.1, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 4.696708860759494, |
| "grad_norm": 0.32445866672285933, |
| "learning_rate": 4.506672722995609e-07, |
| "loss": 0.2953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1779376119375229, |
| "step": 4640, |
| "valid_targets_mean": 5084.9, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 4.7017721518987345, |
| "grad_norm": 0.3370837185705519, |
| "learning_rate": 4.358734652034624e-07, |
| "loss": 0.3029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12637917697429657, |
| "step": 4645, |
| "valid_targets_mean": 3544.5, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 4.706835443037974, |
| "grad_norm": 0.3141292209016846, |
| "learning_rate": 4.2132386664815783e-07, |
| "loss": 0.3063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13325795531272888, |
| "step": 4650, |
| "valid_targets_mean": 4623.6, |
| "valid_targets_min": 1232 |
| }, |
| { |
| "epoch": 4.711898734177215, |
| "grad_norm": 0.3052040124075767, |
| "learning_rate": 4.070186582485214e-07, |
| "loss": 0.2944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14848539233207703, |
| "step": 4655, |
| "valid_targets_mean": 3974.2, |
| "valid_targets_min": 1752 |
| }, |
| { |
| "epoch": 4.716962025316455, |
| "grad_norm": 0.3485398015143201, |
| "learning_rate": 3.9295801856882307e-07, |
| "loss": 0.3033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15560302138328552, |
| "step": 4660, |
| "valid_targets_mean": 3853.7, |
| "valid_targets_min": 1331 |
| }, |
| { |
| "epoch": 4.722025316455696, |
| "grad_norm": 0.30603263342163534, |
| "learning_rate": 3.791421231205217e-07, |
| "loss": 0.2941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1302764117717743, |
| "step": 4665, |
| "valid_targets_mean": 4759.7, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 4.727088607594936, |
| "grad_norm": 0.36206047089808735, |
| "learning_rate": 3.6557114436005516e-07, |
| "loss": 0.2953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11317434906959534, |
| "step": 4670, |
| "valid_targets_mean": 2750.8, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 4.732151898734177, |
| "grad_norm": 0.31924377751088473, |
| "learning_rate": 3.522452516867048e-07, |
| "loss": 0.3074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19149929285049438, |
| "step": 4675, |
| "valid_targets_mean": 5680.5, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 4.737215189873417, |
| "grad_norm": 0.40142669703450146, |
| "learning_rate": 3.391646114404701e-07, |
| "loss": 0.3025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1676904857158661, |
| "step": 4680, |
| "valid_targets_mean": 5601.9, |
| "valid_targets_min": 1777 |
| }, |
| { |
| "epoch": 4.742278481012658, |
| "grad_norm": 0.33298593772917773, |
| "learning_rate": 3.263293868999928e-07, |
| "loss": 0.2974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1185358390212059, |
| "step": 4685, |
| "valid_targets_mean": 2993.5, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 4.7473417721518985, |
| "grad_norm": 0.28590139808721005, |
| "learning_rate": 3.1373973828052964e-07, |
| "loss": 0.2946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1383609175682068, |
| "step": 4690, |
| "valid_targets_mean": 4685.9, |
| "valid_targets_min": 1897 |
| }, |
| { |
| "epoch": 4.752405063291139, |
| "grad_norm": 0.33045699934667616, |
| "learning_rate": 3.013958227319358e-07, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.128380686044693, |
| "step": 4695, |
| "valid_targets_mean": 3661.8, |
| "valid_targets_min": 1102 |
| }, |
| { |
| "epoch": 4.7574683544303795, |
| "grad_norm": 0.3175505591380564, |
| "learning_rate": 2.892977943367159e-07, |
| "loss": 0.2774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19775532186031342, |
| "step": 4700, |
| "valid_targets_mean": 5166.0, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 4.76253164556962, |
| "grad_norm": 0.2773796894575858, |
| "learning_rate": 2.774458041080963e-07, |
| "loss": 0.2875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12263042479753494, |
| "step": 4705, |
| "valid_targets_mean": 4538.4, |
| "valid_targets_min": 1559 |
| }, |
| { |
| "epoch": 4.767594936708861, |
| "grad_norm": 0.3292357564608315, |
| "learning_rate": 2.6583999998814e-07, |
| "loss": 0.2953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14571279287338257, |
| "step": 4710, |
| "valid_targets_mean": 3984.7, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 4.772658227848101, |
| "grad_norm": 0.3368831623026044, |
| "learning_rate": 2.544805268459016e-07, |
| "loss": 0.2867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21459759771823883, |
| "step": 4715, |
| "valid_targets_mean": 4702.3, |
| "valid_targets_min": 1266 |
| }, |
| { |
| "epoch": 4.777721518987342, |
| "grad_norm": 0.335601220973268, |
| "learning_rate": 2.4336752647561304e-07, |
| "loss": 0.2845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14298905432224274, |
| "step": 4720, |
| "valid_targets_mean": 3874.7, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 4.782784810126582, |
| "grad_norm": 0.28413880966924987, |
| "learning_rate": 2.3250113759492266e-07, |
| "loss": 0.2862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1618804931640625, |
| "step": 4725, |
| "valid_targets_mean": 5582.7, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 4.787848101265823, |
| "grad_norm": 0.3021482607745952, |
| "learning_rate": 2.2188149584315922e-07, |
| "loss": 0.3055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15998998284339905, |
| "step": 4730, |
| "valid_targets_mean": 4565.1, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 4.792911392405063, |
| "grad_norm": 0.3011882542828061, |
| "learning_rate": 2.1150873377963954e-07, |
| "loss": 0.3021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1401754915714264, |
| "step": 4735, |
| "valid_targets_mean": 5010.8, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 4.797974683544304, |
| "grad_norm": 0.3507567997328214, |
| "learning_rate": 2.0138298088201004e-07, |
| "loss": 0.2854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0675700232386589, |
| "step": 4740, |
| "valid_targets_mean": 2630.8, |
| "valid_targets_min": 1155 |
| }, |
| { |
| "epoch": 4.803037974683544, |
| "grad_norm": 0.3187910514753291, |
| "learning_rate": 1.915043635446323e-07, |
| "loss": 0.2916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12245633453130722, |
| "step": 4745, |
| "valid_targets_mean": 3394.0, |
| "valid_targets_min": 1403 |
| }, |
| { |
| "epoch": 4.808101265822785, |
| "grad_norm": 0.2967133708531598, |
| "learning_rate": 1.8187300507701345e-07, |
| "loss": 0.3035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1302807629108429, |
| "step": 4750, |
| "valid_targets_mean": 3881.6, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 4.813164556962025, |
| "grad_norm": 0.30044714660435673, |
| "learning_rate": 1.7248902570225378e-07, |
| "loss": 0.2941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13116371631622314, |
| "step": 4755, |
| "valid_targets_mean": 4054.7, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 4.818227848101266, |
| "grad_norm": 0.3161774057323668, |
| "learning_rate": 1.6335254255555933e-07, |
| "loss": 0.2925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14581556618213654, |
| "step": 4760, |
| "valid_targets_mean": 4080.4, |
| "valid_targets_min": 1368 |
| }, |
| { |
| "epoch": 4.8232911392405065, |
| "grad_norm": 0.30034489171760914, |
| "learning_rate": 1.5446366968276283e-07, |
| "loss": 0.2973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1464047133922577, |
| "step": 4765, |
| "valid_targets_mean": 4359.5, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 4.828354430379747, |
| "grad_norm": 0.30396263421785596, |
| "learning_rate": 1.4582251803892055e-07, |
| "loss": 0.2898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14488472044467926, |
| "step": 4770, |
| "valid_targets_mean": 4854.4, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 4.8334177215189875, |
| "grad_norm": 0.25886849889886787, |
| "learning_rate": 1.3742919548691114e-07, |
| "loss": 0.2973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13551469147205353, |
| "step": 4775, |
| "valid_targets_mean": 5292.5, |
| "valid_targets_min": 1085 |
| }, |
| { |
| "epoch": 4.838481012658228, |
| "grad_norm": 0.3369536866060149, |
| "learning_rate": 1.2928380679609442e-07, |
| "loss": 0.2957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20701755583286285, |
| "step": 4780, |
| "valid_targets_mean": 5313.5, |
| "valid_targets_min": 1444 |
| }, |
| { |
| "epoch": 4.843544303797469, |
| "grad_norm": 0.2981209270612857, |
| "learning_rate": 1.2138645364101032e-07, |
| "loss": 0.2933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11797007918357849, |
| "step": 4785, |
| "valid_targets_mean": 4077.7, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 4.848607594936709, |
| "grad_norm": 0.2923056085103413, |
| "learning_rate": 1.1373723460009756e-07, |
| "loss": 0.2866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18645049631595612, |
| "step": 4790, |
| "valid_targets_mean": 6275.9, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 4.85367088607595, |
| "grad_norm": 0.31520564975094073, |
| "learning_rate": 1.0633624515447027e-07, |
| "loss": 0.3001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1347823590040207, |
| "step": 4795, |
| "valid_targets_mean": 3709.9, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 4.85873417721519, |
| "grad_norm": 0.330282900217264, |
| "learning_rate": 9.918357768673004e-08, |
| "loss": 0.3003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10554465651512146, |
| "step": 4800, |
| "valid_targets_mean": 3067.8, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 4.863797468354431, |
| "grad_norm": 0.34394007944621313, |
| "learning_rate": 9.22793214797979e-08, |
| "loss": 0.3043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1265249103307724, |
| "step": 4805, |
| "valid_targets_mean": 3206.9, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 4.868860759493671, |
| "grad_norm": 0.3066301892656282, |
| "learning_rate": 8.562356271582194e-08, |
| "loss": 0.3032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11144056916236877, |
| "step": 4810, |
| "valid_targets_mean": 3448.4, |
| "valid_targets_min": 1079 |
| }, |
| { |
| "epoch": 4.873924050632912, |
| "grad_norm": 0.31898550298505707, |
| "learning_rate": 7.92163844750804e-08, |
| "loss": 0.2921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17169725894927979, |
| "step": 4815, |
| "valid_targets_mean": 4453.8, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 4.878987341772152, |
| "grad_norm": 0.35072783756221276, |
| "learning_rate": 7.305786673495796e-08, |
| "loss": 0.298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1834912747144699, |
| "step": 4820, |
| "valid_targets_mean": 4796.1, |
| "valid_targets_min": 1290 |
| }, |
| { |
| "epoch": 4.884050632911393, |
| "grad_norm": 0.30086828019346806, |
| "learning_rate": 6.714808636893999e-08, |
| "loss": 0.2984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19445079565048218, |
| "step": 4825, |
| "valid_targets_mean": 5488.9, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 4.889113924050633, |
| "grad_norm": 0.29066248451169346, |
| "learning_rate": 6.148711714565992e-08, |
| "loss": 0.2906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14921297132968903, |
| "step": 4830, |
| "valid_targets_mean": 5289.1, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 4.894177215189873, |
| "grad_norm": 0.3206808977051651, |
| "learning_rate": 5.6075029727971075e-08, |
| "loss": 0.294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15516558289527893, |
| "step": 4835, |
| "valid_targets_mean": 4284.6, |
| "valid_targets_min": 1465 |
| }, |
| { |
| "epoch": 4.899240506329114, |
| "grad_norm": 0.34136663563954944, |
| "learning_rate": 5.091189167207189e-08, |
| "loss": 0.3011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16188789904117584, |
| "step": 4840, |
| "valid_targets_mean": 4162.2, |
| "valid_targets_min": 1536 |
| }, |
| { |
| "epoch": 4.904303797468354, |
| "grad_norm": 0.2892291641651244, |
| "learning_rate": 4.5997767426653183e-08, |
| "loss": 0.2969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11494030058383942, |
| "step": 4845, |
| "valid_targets_mean": 3805.9, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 4.909367088607595, |
| "grad_norm": 0.3310728562870818, |
| "learning_rate": 4.133271833210772e-08, |
| "loss": 0.3063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15285596251487732, |
| "step": 4850, |
| "valid_targets_mean": 4150.3, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 4.914430379746835, |
| "grad_norm": 0.29329622685622975, |
| "learning_rate": 3.6916802619746395e-08, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16643556952476501, |
| "step": 4855, |
| "valid_targets_mean": 5756.4, |
| "valid_targets_min": 1791 |
| }, |
| { |
| "epoch": 4.919493670886076, |
| "grad_norm": 0.3795378130128926, |
| "learning_rate": 3.2750075411087654e-08, |
| "loss": 0.2983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20965784788131714, |
| "step": 4860, |
| "valid_targets_mean": 5036.8, |
| "valid_targets_min": 1359 |
| }, |
| { |
| "epoch": 4.924556962025316, |
| "grad_norm": 0.3227285897594828, |
| "learning_rate": 2.8832588717164766e-08, |
| "loss": 0.2875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13055765628814697, |
| "step": 4865, |
| "valid_targets_mean": 3481.6, |
| "valid_targets_min": 1608 |
| }, |
| { |
| "epoch": 4.929620253164557, |
| "grad_norm": 0.30074655411206147, |
| "learning_rate": 2.516439143786631e-08, |
| "loss": 0.3002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17739662528038025, |
| "step": 4870, |
| "valid_targets_mean": 5336.9, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 4.934683544303797, |
| "grad_norm": 0.37988249749008485, |
| "learning_rate": 2.1745529361343333e-08, |
| "loss": 0.2951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18349409103393555, |
| "step": 4875, |
| "valid_targets_mean": 5208.7, |
| "valid_targets_min": 1284 |
| }, |
| { |
| "epoch": 4.939746835443038, |
| "grad_norm": 0.3022387792298933, |
| "learning_rate": 1.857604516342315e-08, |
| "loss": 0.2971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1349787563085556, |
| "step": 4880, |
| "valid_targets_mean": 4001.4, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 4.944810126582278, |
| "grad_norm": 0.3239022765036362, |
| "learning_rate": 1.5655978407085326e-08, |
| "loss": 0.3022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15572325885295868, |
| "step": 4885, |
| "valid_targets_mean": 4256.0, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 4.949873417721519, |
| "grad_norm": 0.3484022919664308, |
| "learning_rate": 1.2985365541959838e-08, |
| "loss": 0.2871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1123068630695343, |
| "step": 4890, |
| "valid_targets_mean": 3383.1, |
| "valid_targets_min": 1353 |
| }, |
| { |
| "epoch": 4.954936708860759, |
| "grad_norm": 0.2766076122909068, |
| "learning_rate": 1.0564239903885221e-08, |
| "loss": 0.298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13588979840278625, |
| "step": 4895, |
| "valid_targets_mean": 5022.2, |
| "valid_targets_min": 1687 |
| }, |
| { |
| "epoch": 4.96, |
| "grad_norm": 0.3637031857594984, |
| "learning_rate": 8.392631714477794e-09, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22151219844818115, |
| "step": 4900, |
| "valid_targets_mean": 4548.4, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 4.9650632911392405, |
| "grad_norm": 0.3070617643850501, |
| "learning_rate": 6.470568080760853e-09, |
| "loss": 0.2957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1599656343460083, |
| "step": 4905, |
| "valid_targets_mean": 5380.0, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 4.970126582278481, |
| "grad_norm": 0.2982099706698035, |
| "learning_rate": 4.798072994827152e-09, |
| "loss": 0.2819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13907426595687866, |
| "step": 4910, |
| "valid_targets_mean": 4511.9, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 4.975189873417722, |
| "grad_norm": 0.34819560371210506, |
| "learning_rate": 3.3751673335458147e-09, |
| "loss": 0.2899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14076785743236542, |
| "step": 4915, |
| "valid_targets_mean": 3422.9, |
| "valid_targets_min": 1383 |
| }, |
| { |
| "epoch": 4.980253164556962, |
| "grad_norm": 0.3120620502259134, |
| "learning_rate": 2.2018688582803315e-09, |
| "loss": 0.2976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17987266182899475, |
| "step": 4920, |
| "valid_targets_mean": 5285.9, |
| "valid_targets_min": 1137 |
| }, |
| { |
| "epoch": 4.985316455696203, |
| "grad_norm": 0.28626460706538365, |
| "learning_rate": 1.2781922146931635e-09, |
| "loss": 0.3007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15345998108386993, |
| "step": 4925, |
| "valid_targets_mean": 5331.3, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 4.990379746835443, |
| "grad_norm": 0.30214318111472815, |
| "learning_rate": 6.041489325459004e-10, |
| "loss": 0.2843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14609292149543762, |
| "step": 4930, |
| "valid_targets_mean": 4398.6, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 4.995443037974684, |
| "grad_norm": 0.36710406768986703, |
| "learning_rate": 1.7974742556159386e-10, |
| "loss": 0.2945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17454470694065094, |
| "step": 4935, |
| "valid_targets_mean": 4667.4, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.42711913533675244, |
| "learning_rate": 4.992991313734763e-12, |
| "loss": 0.2954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29739144444465637, |
| "step": 4940, |
| "valid_targets_mean": 4348.2, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 5.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29739144444465637, |
| "step": 4940, |
| "total_flos": 1.3775029894633226e+18, |
| "train_loss": 0.31707094306887884, |
| "train_runtime": 34760.1149, |
| "train_samples_per_second": 4.545, |
| "train_steps_per_second": 0.142, |
| "valid_targets_mean": 4348.2, |
| "valid_targets_min": 876 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4940, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 5, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": false, |
| "should_training_stop": false |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1.3775029894633226e+18, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|