| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4319, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.010351966873706004, |
| "grad_norm": 15.605315613103867, |
| "learning_rate": 4.71976401179941e-07, |
| "loss": 0.6774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7991642951965332, |
| "step": 5, |
| "valid_targets_mean": 2069.4, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 0.020703933747412008, |
| "grad_norm": 8.863140569141265, |
| "learning_rate": 1.0619469026548673e-06, |
| "loss": 0.7208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6838527917861938, |
| "step": 10, |
| "valid_targets_mean": 3883.4, |
| "valid_targets_min": 313 |
| }, |
| { |
| "epoch": 0.031055900621118012, |
| "grad_norm": 12.629168153366845, |
| "learning_rate": 1.6519174041297937e-06, |
| "loss": 0.685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7600278854370117, |
| "step": 15, |
| "valid_targets_mean": 2096.7, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 0.041407867494824016, |
| "grad_norm": 6.799624906702634, |
| "learning_rate": 2.24188790560472e-06, |
| "loss": 0.6675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6246192455291748, |
| "step": 20, |
| "valid_targets_mean": 3201.5, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 0.051759834368530024, |
| "grad_norm": 4.637130666016448, |
| "learning_rate": 2.831858407079646e-06, |
| "loss": 0.6722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7706674337387085, |
| "step": 25, |
| "valid_targets_mean": 3519.5, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 0.062111801242236024, |
| "grad_norm": 3.1183737090108545, |
| "learning_rate": 3.4218289085545726e-06, |
| "loss": 0.6021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6737767457962036, |
| "step": 30, |
| "valid_targets_mean": 3171.9, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 0.07246376811594203, |
| "grad_norm": 2.298602022892457, |
| "learning_rate": 4.011799410029498e-06, |
| "loss": 0.5708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5966386795043945, |
| "step": 35, |
| "valid_targets_mean": 2413.9, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 0.08281573498964803, |
| "grad_norm": 1.9166901302469286, |
| "learning_rate": 4.6017699115044254e-06, |
| "loss": 0.4853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5276696681976318, |
| "step": 40, |
| "valid_targets_mean": 1972.9, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 0.09316770186335403, |
| "grad_norm": 2.287553544660079, |
| "learning_rate": 5.191740412979352e-06, |
| "loss": 0.4365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.441994309425354, |
| "step": 45, |
| "valid_targets_mean": 3530.9, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 0.10351966873706005, |
| "grad_norm": 1.2570057018709198, |
| "learning_rate": 5.781710914454279e-06, |
| "loss": 0.4807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5429658889770508, |
| "step": 50, |
| "valid_targets_mean": 2901.6, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 0.11387163561076605, |
| "grad_norm": 0.930016752086229, |
| "learning_rate": 6.371681415929204e-06, |
| "loss": 0.5788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44122475385665894, |
| "step": 55, |
| "valid_targets_mean": 3173.3, |
| "valid_targets_min": 515 |
| }, |
| { |
| "epoch": 0.12422360248447205, |
| "grad_norm": 0.8587397931841486, |
| "learning_rate": 6.961651917404131e-06, |
| "loss": 0.4867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46632158756256104, |
| "step": 60, |
| "valid_targets_mean": 2709.9, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 0.13457556935817805, |
| "grad_norm": 0.9248959615543452, |
| "learning_rate": 7.551622418879056e-06, |
| "loss": 0.5078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49240103363990784, |
| "step": 65, |
| "valid_targets_mean": 2006.4, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 0.14492753623188406, |
| "grad_norm": 0.7279615677685586, |
| "learning_rate": 8.141592920353984e-06, |
| "loss": 0.425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39918971061706543, |
| "step": 70, |
| "valid_targets_mean": 3112.9, |
| "valid_targets_min": 431 |
| }, |
| { |
| "epoch": 0.15527950310559005, |
| "grad_norm": 0.7659577874600716, |
| "learning_rate": 8.73156342182891e-06, |
| "loss": 0.4238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40704938769340515, |
| "step": 75, |
| "valid_targets_mean": 2240.1, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 0.16563146997929606, |
| "grad_norm": 0.7216997725030858, |
| "learning_rate": 9.321533923303837e-06, |
| "loss": 0.4238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43496978282928467, |
| "step": 80, |
| "valid_targets_mean": 3710.6, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 0.17598343685300208, |
| "grad_norm": 0.8774588952929467, |
| "learning_rate": 9.911504424778762e-06, |
| "loss": 0.4171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43825411796569824, |
| "step": 85, |
| "valid_targets_mean": 1872.3, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 0.18633540372670807, |
| "grad_norm": 0.8451380882184308, |
| "learning_rate": 1.0501474926253687e-05, |
| "loss": 0.4484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44401633739471436, |
| "step": 90, |
| "valid_targets_mean": 2137.0, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 0.19668737060041408, |
| "grad_norm": 0.6084483563484301, |
| "learning_rate": 1.1091445427728616e-05, |
| "loss": 0.4483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3756181001663208, |
| "step": 95, |
| "valid_targets_mean": 3593.1, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 0.2070393374741201, |
| "grad_norm": 0.6213761233419673, |
| "learning_rate": 1.1681415929203541e-05, |
| "loss": 0.4075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4502703547477722, |
| "step": 100, |
| "valid_targets_mean": 3648.6, |
| "valid_targets_min": 1054 |
| }, |
| { |
| "epoch": 0.21739130434782608, |
| "grad_norm": 0.9269246228823874, |
| "learning_rate": 1.2271386430678467e-05, |
| "loss": 0.4266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4538400173187256, |
| "step": 105, |
| "valid_targets_mean": 1649.7, |
| "valid_targets_min": 1060 |
| }, |
| { |
| "epoch": 0.2277432712215321, |
| "grad_norm": 0.6575358320968785, |
| "learning_rate": 1.2861356932153392e-05, |
| "loss": 0.4556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4259205162525177, |
| "step": 110, |
| "valid_targets_mean": 2929.3, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 0.23809523809523808, |
| "grad_norm": 0.7520773860181491, |
| "learning_rate": 1.345132743362832e-05, |
| "loss": 0.4091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.51981520652771, |
| "step": 115, |
| "valid_targets_mean": 2942.2, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 0.2484472049689441, |
| "grad_norm": 0.6260406424910655, |
| "learning_rate": 1.4041297935103246e-05, |
| "loss": 0.4403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.463638037443161, |
| "step": 120, |
| "valid_targets_mean": 3665.9, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 0.2587991718426501, |
| "grad_norm": 0.7666598846619594, |
| "learning_rate": 1.4631268436578171e-05, |
| "loss": 0.4347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49128270149230957, |
| "step": 125, |
| "valid_targets_mean": 2527.6, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 0.2691511387163561, |
| "grad_norm": 0.863409285542385, |
| "learning_rate": 1.5221238938053098e-05, |
| "loss": 0.3948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5175631046295166, |
| "step": 130, |
| "valid_targets_mean": 2604.3, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 0.2795031055900621, |
| "grad_norm": 0.6514406268066054, |
| "learning_rate": 1.5811209439528025e-05, |
| "loss": 0.3959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3603256940841675, |
| "step": 135, |
| "valid_targets_mean": 2682.6, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 0.2898550724637681, |
| "grad_norm": 0.7385382622379217, |
| "learning_rate": 1.6401179941002953e-05, |
| "loss": 0.3854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3818318247795105, |
| "step": 140, |
| "valid_targets_mean": 2239.2, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 0.3002070393374741, |
| "grad_norm": 0.7388257073327376, |
| "learning_rate": 1.6991150442477876e-05, |
| "loss": 0.429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5566807985305786, |
| "step": 145, |
| "valid_targets_mean": 3091.8, |
| "valid_targets_min": 386 |
| }, |
| { |
| "epoch": 0.3105590062111801, |
| "grad_norm": 0.842626090176198, |
| "learning_rate": 1.7581120943952803e-05, |
| "loss": 0.4001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3940976560115814, |
| "step": 150, |
| "valid_targets_mean": 1999.4, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 0.32091097308488614, |
| "grad_norm": 0.6925465806852213, |
| "learning_rate": 1.817109144542773e-05, |
| "loss": 0.4275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44604888558387756, |
| "step": 155, |
| "valid_targets_mean": 2645.6, |
| "valid_targets_min": 915 |
| }, |
| { |
| "epoch": 0.33126293995859213, |
| "grad_norm": 0.6871016903538135, |
| "learning_rate": 1.8761061946902657e-05, |
| "loss": 0.3953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4031655192375183, |
| "step": 160, |
| "valid_targets_mean": 2989.4, |
| "valid_targets_min": 577 |
| }, |
| { |
| "epoch": 0.3416149068322981, |
| "grad_norm": 0.7772347914126068, |
| "learning_rate": 1.935103244837758e-05, |
| "loss": 0.3942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4824008345603943, |
| "step": 165, |
| "valid_targets_mean": 2767.8, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 0.35196687370600416, |
| "grad_norm": 0.7369249527882769, |
| "learning_rate": 1.9941002949852508e-05, |
| "loss": 0.3649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3546352982521057, |
| "step": 170, |
| "valid_targets_mean": 2191.2, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 0.36231884057971014, |
| "grad_norm": 0.7534283311389234, |
| "learning_rate": 2.0530973451327435e-05, |
| "loss": 0.3829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3965192437171936, |
| "step": 175, |
| "valid_targets_mean": 2274.2, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 0.37267080745341613, |
| "grad_norm": 0.5744145884839316, |
| "learning_rate": 2.1120943952802362e-05, |
| "loss": 0.3689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27616333961486816, |
| "step": 180, |
| "valid_targets_mean": 3288.3, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 0.3830227743271222, |
| "grad_norm": 0.7399447267515546, |
| "learning_rate": 2.171091445427729e-05, |
| "loss": 0.4155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5079173445701599, |
| "step": 185, |
| "valid_targets_mean": 3585.9, |
| "valid_targets_min": 305 |
| }, |
| { |
| "epoch": 0.39337474120082816, |
| "grad_norm": 0.787595577330117, |
| "learning_rate": 2.2300884955752213e-05, |
| "loss": 0.3672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40638184547424316, |
| "step": 190, |
| "valid_targets_mean": 2532.8, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 0.40372670807453415, |
| "grad_norm": 0.8366148088688402, |
| "learning_rate": 2.289085545722714e-05, |
| "loss": 0.3903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.344083696603775, |
| "step": 195, |
| "valid_targets_mean": 1931.6, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 0.4140786749482402, |
| "grad_norm": 0.7049038068177579, |
| "learning_rate": 2.3480825958702063e-05, |
| "loss": 0.366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3272162675857544, |
| "step": 200, |
| "valid_targets_mean": 2669.5, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 0.4244306418219462, |
| "grad_norm": 0.722982409943531, |
| "learning_rate": 2.4070796460176994e-05, |
| "loss": 0.4846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4433075487613678, |
| "step": 205, |
| "valid_targets_mean": 2856.4, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 0.43478260869565216, |
| "grad_norm": 0.6216316854835306, |
| "learning_rate": 2.466076696165192e-05, |
| "loss": 0.3702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3501080870628357, |
| "step": 210, |
| "valid_targets_mean": 2924.4, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 0.4451345755693582, |
| "grad_norm": 0.8036432318505198, |
| "learning_rate": 2.5250737463126848e-05, |
| "loss": 0.3722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3556331992149353, |
| "step": 215, |
| "valid_targets_mean": 2358.1, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 0.4554865424430642, |
| "grad_norm": 0.9026688718475531, |
| "learning_rate": 2.584070796460177e-05, |
| "loss": 0.4376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.362284779548645, |
| "step": 220, |
| "valid_targets_mean": 1682.8, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 0.4658385093167702, |
| "grad_norm": 0.8474657010085218, |
| "learning_rate": 2.64306784660767e-05, |
| "loss": 0.3687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41895484924316406, |
| "step": 225, |
| "valid_targets_mean": 1957.7, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 0.47619047619047616, |
| "grad_norm": 0.5989684265924352, |
| "learning_rate": 2.7020648967551622e-05, |
| "loss": 0.3956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.270280659198761, |
| "step": 230, |
| "valid_targets_mean": 3520.2, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 0.4865424430641822, |
| "grad_norm": 0.7407035731133066, |
| "learning_rate": 2.761061946902655e-05, |
| "loss": 0.3462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33700358867645264, |
| "step": 235, |
| "valid_targets_mean": 3075.6, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 0.4968944099378882, |
| "grad_norm": 0.6514761903429114, |
| "learning_rate": 2.8200589970501476e-05, |
| "loss": 0.3657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40764114260673523, |
| "step": 240, |
| "valid_targets_mean": 3008.0, |
| "valid_targets_min": 524 |
| }, |
| { |
| "epoch": 0.5072463768115942, |
| "grad_norm": 0.9486281355398519, |
| "learning_rate": 2.8790560471976407e-05, |
| "loss": 0.2909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3389992117881775, |
| "step": 245, |
| "valid_targets_mean": 2530.0, |
| "valid_targets_min": 292 |
| }, |
| { |
| "epoch": 0.5175983436853002, |
| "grad_norm": 0.8255724854520955, |
| "learning_rate": 2.938053097345133e-05, |
| "loss": 0.387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5169772505760193, |
| "step": 250, |
| "valid_targets_mean": 2672.6, |
| "valid_targets_min": 633 |
| }, |
| { |
| "epoch": 0.5279503105590062, |
| "grad_norm": 0.744452870979198, |
| "learning_rate": 2.9970501474926257e-05, |
| "loss": 0.4064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38283827900886536, |
| "step": 255, |
| "valid_targets_mean": 2401.8, |
| "valid_targets_min": 1422 |
| }, |
| { |
| "epoch": 0.5383022774327122, |
| "grad_norm": 0.5635474379382327, |
| "learning_rate": 3.0560471976401184e-05, |
| "loss": 0.3819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4241616725921631, |
| "step": 260, |
| "valid_targets_mean": 5410.8, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 0.5486542443064182, |
| "grad_norm": 0.676856787568286, |
| "learning_rate": 3.115044247787611e-05, |
| "loss": 0.3813, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.534885823726654, |
| "step": 265, |
| "valid_targets_mean": 4032.4, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 0.5590062111801242, |
| "grad_norm": 0.685650100513104, |
| "learning_rate": 3.174041297935103e-05, |
| "loss": 0.3515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34689125418663025, |
| "step": 270, |
| "valid_targets_mean": 2478.0, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 0.5693581780538303, |
| "grad_norm": 0.92365940319728, |
| "learning_rate": 3.233038348082596e-05, |
| "loss": 0.3328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3527258038520813, |
| "step": 275, |
| "valid_targets_mean": 1704.9, |
| "valid_targets_min": 211 |
| }, |
| { |
| "epoch": 0.5797101449275363, |
| "grad_norm": 0.7943251607272555, |
| "learning_rate": 3.2920353982300886e-05, |
| "loss": 0.3735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31049463152885437, |
| "step": 280, |
| "valid_targets_mean": 1748.0, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 0.5900621118012422, |
| "grad_norm": 0.7707949131715036, |
| "learning_rate": 3.3510324483775816e-05, |
| "loss": 0.3549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3978985548019409, |
| "step": 285, |
| "valid_targets_mean": 2196.7, |
| "valid_targets_min": 345 |
| }, |
| { |
| "epoch": 0.6004140786749482, |
| "grad_norm": 0.9067101706634203, |
| "learning_rate": 3.410029498525074e-05, |
| "loss": 0.3773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3796255588531494, |
| "step": 290, |
| "valid_targets_mean": 1666.6, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 0.6107660455486542, |
| "grad_norm": 0.49575725135513243, |
| "learning_rate": 3.469026548672567e-05, |
| "loss": 0.3283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3226116895675659, |
| "step": 295, |
| "valid_targets_mean": 4260.1, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 0.6211180124223602, |
| "grad_norm": 0.7176031931898035, |
| "learning_rate": 3.5280235988200594e-05, |
| "loss": 0.3223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32411545515060425, |
| "step": 300, |
| "valid_targets_mean": 2275.6, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 0.6314699792960663, |
| "grad_norm": 0.7663570928663194, |
| "learning_rate": 3.587020648967552e-05, |
| "loss": 0.3817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3520033359527588, |
| "step": 305, |
| "valid_targets_mean": 2414.7, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 0.6418219461697723, |
| "grad_norm": 0.46213987326297384, |
| "learning_rate": 3.646017699115044e-05, |
| "loss": 0.323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29329046607017517, |
| "step": 310, |
| "valid_targets_mean": 4565.9, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 0.6521739130434783, |
| "grad_norm": 0.6297790214422954, |
| "learning_rate": 3.705014749262537e-05, |
| "loss": 0.3365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27002575993537903, |
| "step": 315, |
| "valid_targets_mean": 2892.7, |
| "valid_targets_min": 784 |
| }, |
| { |
| "epoch": 0.6625258799171843, |
| "grad_norm": 0.6803152264658195, |
| "learning_rate": 3.7640117994100295e-05, |
| "loss": 0.3263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35963690280914307, |
| "step": 320, |
| "valid_targets_mean": 2670.9, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 0.6728778467908902, |
| "grad_norm": 0.660475255702629, |
| "learning_rate": 3.8230088495575226e-05, |
| "loss": 0.3664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3141520619392395, |
| "step": 325, |
| "valid_targets_mean": 2466.3, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 0.6832298136645962, |
| "grad_norm": 0.5714885591458042, |
| "learning_rate": 3.882005899705015e-05, |
| "loss": 0.3123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2787840962409973, |
| "step": 330, |
| "valid_targets_mean": 2959.7, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 0.6935817805383023, |
| "grad_norm": 0.7840125701270887, |
| "learning_rate": 3.941002949852508e-05, |
| "loss": 0.3609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3164142966270447, |
| "step": 335, |
| "valid_targets_mean": 3174.2, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 0.7039337474120083, |
| "grad_norm": 0.6419066522152682, |
| "learning_rate": 4e-05, |
| "loss": 0.3102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30930954217910767, |
| "step": 340, |
| "valid_targets_mean": 3136.9, |
| "valid_targets_min": 440 |
| }, |
| { |
| "epoch": 0.7142857142857143, |
| "grad_norm": 0.5059032670699602, |
| "learning_rate": 3.999973336302744e-05, |
| "loss": 0.3525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25785183906555176, |
| "step": 345, |
| "valid_targets_mean": 3533.2, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 0.7246376811594203, |
| "grad_norm": 0.791626821129135, |
| "learning_rate": 3.999893345921928e-05, |
| "loss": 0.3358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3422420918941498, |
| "step": 350, |
| "valid_targets_mean": 2178.9, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 0.7349896480331263, |
| "grad_norm": 0.5850437706333231, |
| "learning_rate": 3.999760030990392e-05, |
| "loss": 0.3754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3285501003265381, |
| "step": 355, |
| "valid_targets_mean": 3447.8, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 0.7453416149068323, |
| "grad_norm": 1.4793972289409643, |
| "learning_rate": 3.999573395062805e-05, |
| "loss": 0.3541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4052942991256714, |
| "step": 360, |
| "valid_targets_mean": 2194.2, |
| "valid_targets_min": 217 |
| }, |
| { |
| "epoch": 0.7556935817805382, |
| "grad_norm": 0.8161182629951351, |
| "learning_rate": 3.9993334431155696e-05, |
| "loss": 0.3496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3312402367591858, |
| "step": 365, |
| "valid_targets_mean": 1771.2, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 0.7660455486542443, |
| "grad_norm": 0.7778042883063869, |
| "learning_rate": 3.9990401815466935e-05, |
| "loss": 0.3156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39662399888038635, |
| "step": 370, |
| "valid_targets_mean": 2807.4, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 0.7763975155279503, |
| "grad_norm": 0.9868164908098449, |
| "learning_rate": 3.9986936181756133e-05, |
| "loss": 0.3484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3773801326751709, |
| "step": 375, |
| "valid_targets_mean": 2612.4, |
| "valid_targets_min": 1034 |
| }, |
| { |
| "epoch": 0.7867494824016563, |
| "grad_norm": 0.7554054875779739, |
| "learning_rate": 3.9982937622429904e-05, |
| "loss": 0.3218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.378534197807312, |
| "step": 380, |
| "valid_targets_mean": 2050.9, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 0.7971014492753623, |
| "grad_norm": 0.6391636850831167, |
| "learning_rate": 3.997840624410462e-05, |
| "loss": 0.3325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30764123797416687, |
| "step": 385, |
| "valid_targets_mean": 3234.5, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 0.8074534161490683, |
| "grad_norm": 0.659669602172271, |
| "learning_rate": 3.997334216760358e-05, |
| "loss": 0.3556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2978909909725189, |
| "step": 390, |
| "valid_targets_mean": 4481.5, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 0.8178053830227743, |
| "grad_norm": 0.6718264239579972, |
| "learning_rate": 3.996774552795379e-05, |
| "loss": 0.3685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3460586667060852, |
| "step": 395, |
| "valid_targets_mean": 2349.4, |
| "valid_targets_min": 887 |
| }, |
| { |
| "epoch": 0.8281573498964804, |
| "grad_norm": 0.7476248873647089, |
| "learning_rate": 3.996161647438236e-05, |
| "loss": 0.3653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3052156865596771, |
| "step": 400, |
| "valid_targets_mean": 2157.8, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 0.8385093167701864, |
| "grad_norm": 0.8223378901356958, |
| "learning_rate": 3.9954955170312504e-05, |
| "loss": 0.416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4880888760089874, |
| "step": 405, |
| "valid_targets_mean": 3147.2, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 0.8488612836438924, |
| "grad_norm": 0.6823448035407557, |
| "learning_rate": 3.994776179335923e-05, |
| "loss": 0.3239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3424914479255676, |
| "step": 410, |
| "valid_targets_mean": 2431.7, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 0.8592132505175983, |
| "grad_norm": 0.7312590665354671, |
| "learning_rate": 3.9940036535324564e-05, |
| "loss": 0.3355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3406717777252197, |
| "step": 415, |
| "valid_targets_mean": 2271.6, |
| "valid_targets_min": 400 |
| }, |
| { |
| "epoch": 0.8695652173913043, |
| "grad_norm": 0.6805623092937332, |
| "learning_rate": 3.9931779602192435e-05, |
| "loss": 0.3095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35298052430152893, |
| "step": 420, |
| "valid_targets_mean": 2380.3, |
| "valid_targets_min": 331 |
| }, |
| { |
| "epoch": 0.8799171842650103, |
| "grad_norm": 0.47734066638902245, |
| "learning_rate": 3.9922991214123226e-05, |
| "loss": 0.2681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27308475971221924, |
| "step": 425, |
| "valid_targets_mean": 3988.6, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 0.8902691511387164, |
| "grad_norm": 0.5978371647266324, |
| "learning_rate": 3.991367160544783e-05, |
| "loss": 0.3574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22311019897460938, |
| "step": 430, |
| "valid_targets_mean": 2887.8, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 0.9006211180124224, |
| "grad_norm": 0.5853594710092753, |
| "learning_rate": 3.99038210246615e-05, |
| "loss": 0.3862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33275023102760315, |
| "step": 435, |
| "valid_targets_mean": 3190.8, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 0.9109730848861284, |
| "grad_norm": 0.6824932837618515, |
| "learning_rate": 3.9893439734417125e-05, |
| "loss": 0.3382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2892998158931732, |
| "step": 440, |
| "valid_targets_mean": 2007.6, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 0.9213250517598344, |
| "grad_norm": 0.7388214988568738, |
| "learning_rate": 3.9882528011518286e-05, |
| "loss": 0.3598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4132966697216034, |
| "step": 445, |
| "valid_targets_mean": 2261.5, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 0.9316770186335404, |
| "grad_norm": 0.6447680427593593, |
| "learning_rate": 3.987108614691186e-05, |
| "loss": 0.3628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3517792522907257, |
| "step": 450, |
| "valid_targets_mean": 2310.1, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 0.9420289855072463, |
| "grad_norm": 0.679191901913392, |
| "learning_rate": 3.985911444568026e-05, |
| "loss": 0.3478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2909126877784729, |
| "step": 455, |
| "valid_targets_mean": 2311.9, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 0.9523809523809523, |
| "grad_norm": 0.793829538406422, |
| "learning_rate": 3.9846613227033305e-05, |
| "loss": 0.3663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34115058183670044, |
| "step": 460, |
| "valid_targets_mean": 2087.2, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 0.9627329192546584, |
| "grad_norm": 0.5926367081080217, |
| "learning_rate": 3.98335828242997e-05, |
| "loss": 0.3408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2802141606807709, |
| "step": 465, |
| "valid_targets_mean": 2543.6, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 0.9730848861283644, |
| "grad_norm": 0.5823847098766494, |
| "learning_rate": 3.982002358491817e-05, |
| "loss": 0.3349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.293674111366272, |
| "step": 470, |
| "valid_targets_mean": 2787.9, |
| "valid_targets_min": 404 |
| }, |
| { |
| "epoch": 0.9834368530020704, |
| "grad_norm": 0.7514989296192166, |
| "learning_rate": 3.980593587042816e-05, |
| "loss": 0.359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3089297413825989, |
| "step": 475, |
| "valid_targets_mean": 2357.3, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 0.9937888198757764, |
| "grad_norm": 0.7508286456561156, |
| "learning_rate": 3.979132005646022e-05, |
| "loss": 0.3045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2705974578857422, |
| "step": 480, |
| "valid_targets_mean": 2060.9, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 1.0041407867494825, |
| "grad_norm": 0.578303130786325, |
| "learning_rate": 3.9776176532726005e-05, |
| "loss": 0.3067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23351214826107025, |
| "step": 485, |
| "valid_targets_mean": 2921.1, |
| "valid_targets_min": 862 |
| }, |
| { |
| "epoch": 1.0144927536231885, |
| "grad_norm": 0.8565681891585248, |
| "learning_rate": 3.976050570300783e-05, |
| "loss": 0.3846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4955739974975586, |
| "step": 490, |
| "valid_targets_mean": 2399.9, |
| "valid_targets_min": 397 |
| }, |
| { |
| "epoch": 1.0248447204968945, |
| "grad_norm": 0.8525085460239903, |
| "learning_rate": 3.974430798514796e-05, |
| "loss": 0.2587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34586983919143677, |
| "step": 495, |
| "valid_targets_mean": 3405.7, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 1.0351966873706004, |
| "grad_norm": 0.6107145043153749, |
| "learning_rate": 3.972758381103744e-05, |
| "loss": 0.3328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25020384788513184, |
| "step": 500, |
| "valid_targets_mean": 2676.7, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 1.0455486542443064, |
| "grad_norm": 0.3712861445621319, |
| "learning_rate": 3.9710333626604585e-05, |
| "loss": 0.2865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2056269347667694, |
| "step": 505, |
| "valid_targets_mean": 5489.6, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 1.0559006211180124, |
| "grad_norm": 0.5445195023826013, |
| "learning_rate": 3.969255789180309e-05, |
| "loss": 0.3549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3427426815032959, |
| "step": 510, |
| "valid_targets_mean": 4128.8, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 1.0662525879917184, |
| "grad_norm": 1.5522590817967603, |
| "learning_rate": 3.9674257080599775e-05, |
| "loss": 0.3005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3245624303817749, |
| "step": 515, |
| "valid_targets_mean": 2571.8, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 1.0766045548654244, |
| "grad_norm": 0.7670802874384615, |
| "learning_rate": 3.9655431680961924e-05, |
| "loss": 0.3012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3730795085430145, |
| "step": 520, |
| "valid_targets_mean": 2089.7, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 1.0869565217391304, |
| "grad_norm": 0.8808573279945764, |
| "learning_rate": 3.9636082194844285e-05, |
| "loss": 0.3202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31017860770225525, |
| "step": 525, |
| "valid_targets_mean": 2748.6, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 1.0973084886128364, |
| "grad_norm": 0.5678915273276016, |
| "learning_rate": 3.9616209138175705e-05, |
| "loss": 0.3206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3231387436389923, |
| "step": 530, |
| "valid_targets_mean": 3620.4, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 1.1076604554865424, |
| "grad_norm": 0.6715392961412922, |
| "learning_rate": 3.959581304084536e-05, |
| "loss": 0.3538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42259538173675537, |
| "step": 535, |
| "valid_targets_mean": 4127.1, |
| "valid_targets_min": 406 |
| }, |
| { |
| "epoch": 1.1180124223602483, |
| "grad_norm": 0.6122700992261885, |
| "learning_rate": 3.9574894446688594e-05, |
| "loss": 0.3044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.323467493057251, |
| "step": 540, |
| "valid_targets_mean": 3492.6, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 1.1283643892339545, |
| "grad_norm": 0.8429230339257078, |
| "learning_rate": 3.955345391347249e-05, |
| "loss": 0.3377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45265573263168335, |
| "step": 545, |
| "valid_targets_mean": 2018.4, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 1.1387163561076605, |
| "grad_norm": 0.5177578813671116, |
| "learning_rate": 3.9531492012880915e-05, |
| "loss": 0.272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24492105841636658, |
| "step": 550, |
| "valid_targets_mean": 3538.9, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 1.1490683229813665, |
| "grad_norm": 0.9358791063800329, |
| "learning_rate": 3.9509009330499356e-05, |
| "loss": 0.3029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3208366632461548, |
| "step": 555, |
| "valid_targets_mean": 2221.3, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 1.1594202898550725, |
| "grad_norm": 1.492654485940082, |
| "learning_rate": 3.948600646579923e-05, |
| "loss": 0.3741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30150753259658813, |
| "step": 560, |
| "valid_targets_mean": 1951.8, |
| "valid_targets_min": 508 |
| }, |
| { |
| "epoch": 1.1697722567287785, |
| "grad_norm": 0.5458431310144255, |
| "learning_rate": 3.946248403212197e-05, |
| "loss": 0.325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34849831461906433, |
| "step": 565, |
| "valid_targets_mean": 4525.2, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 1.1801242236024845, |
| "grad_norm": 1.3216443391427874, |
| "learning_rate": 3.943844265666263e-05, |
| "loss": 0.3464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2811647057533264, |
| "step": 570, |
| "valid_targets_mean": 2566.6, |
| "valid_targets_min": 931 |
| }, |
| { |
| "epoch": 1.1904761904761905, |
| "grad_norm": 0.5379526619584627, |
| "learning_rate": 3.9413882980453155e-05, |
| "loss": 0.3001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2871326506137848, |
| "step": 575, |
| "valid_targets_mean": 3341.6, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 1.2008281573498965, |
| "grad_norm": 0.5970973416160769, |
| "learning_rate": 3.9388805658345325e-05, |
| "loss": 0.3592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32768434286117554, |
| "step": 580, |
| "valid_targets_mean": 4324.7, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 1.2111801242236024, |
| "grad_norm": 0.7650985133734655, |
| "learning_rate": 3.9363211358993264e-05, |
| "loss": 0.3126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35999956727027893, |
| "step": 585, |
| "valid_targets_mean": 2116.5, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 1.2215320910973084, |
| "grad_norm": 0.6626315464935324, |
| "learning_rate": 3.9337100764835616e-05, |
| "loss": 0.2653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17115123569965363, |
| "step": 590, |
| "valid_targets_mean": 4721.6, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 1.2318840579710144, |
| "grad_norm": 0.608747167208178, |
| "learning_rate": 3.931047457207736e-05, |
| "loss": 0.3522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3361900746822357, |
| "step": 595, |
| "valid_targets_mean": 3093.6, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 1.2422360248447206, |
| "grad_norm": 0.7141578114058345, |
| "learning_rate": 3.928333349067125e-05, |
| "loss": 0.2756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3286536931991577, |
| "step": 600, |
| "valid_targets_mean": 2283.4, |
| "valid_targets_min": 402 |
| }, |
| { |
| "epoch": 1.2525879917184266, |
| "grad_norm": 0.5678041106872164, |
| "learning_rate": 3.925567824429885e-05, |
| "loss": 0.2724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29660943150520325, |
| "step": 605, |
| "valid_targets_mean": 3684.8, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 1.2629399585921326, |
| "grad_norm": 0.722727884026502, |
| "learning_rate": 3.922750957035128e-05, |
| "loss": 0.3036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2989663779735565, |
| "step": 610, |
| "valid_targets_mean": 2112.3, |
| "valid_targets_min": 371 |
| }, |
| { |
| "epoch": 1.2732919254658386, |
| "grad_norm": 0.5666973822209642, |
| "learning_rate": 3.919882821990953e-05, |
| "loss": 0.3165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28699982166290283, |
| "step": 615, |
| "valid_targets_mean": 3570.9, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 1.2836438923395446, |
| "grad_norm": 0.6949218726412446, |
| "learning_rate": 3.9169634957724465e-05, |
| "loss": 0.2894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2630559206008911, |
| "step": 620, |
| "valid_targets_mean": 1976.1, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 1.2939958592132506, |
| "grad_norm": 0.7553316125934354, |
| "learning_rate": 3.913993056219636e-05, |
| "loss": 0.3238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3031398057937622, |
| "step": 625, |
| "valid_targets_mean": 2566.6, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 1.3043478260869565, |
| "grad_norm": 0.6012551894727312, |
| "learning_rate": 3.9109715825354254e-05, |
| "loss": 0.2841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30872005224227905, |
| "step": 630, |
| "valid_targets_mean": 2901.4, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 1.3146997929606625, |
| "grad_norm": 0.6499249693828386, |
| "learning_rate": 3.907899155283472e-05, |
| "loss": 0.3054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2922044098377228, |
| "step": 635, |
| "valid_targets_mean": 2478.1, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 1.3250517598343685, |
| "grad_norm": 0.6607109178219058, |
| "learning_rate": 3.904775856386047e-05, |
| "loss": 0.3008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32309627532958984, |
| "step": 640, |
| "valid_targets_mean": 2581.8, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 1.3354037267080745, |
| "grad_norm": 0.99359277719902, |
| "learning_rate": 3.9016017691218465e-05, |
| "loss": 0.3148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3399587869644165, |
| "step": 645, |
| "valid_targets_mean": 2634.0, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 1.3457556935817805, |
| "grad_norm": 0.6998735259668638, |
| "learning_rate": 3.8983769781237725e-05, |
| "loss": 0.3, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35572707653045654, |
| "step": 650, |
| "valid_targets_mean": 2802.4, |
| "valid_targets_min": 288 |
| }, |
| { |
| "epoch": 1.3561076604554865, |
| "grad_norm": 0.6543925730470436, |
| "learning_rate": 3.8951015693766755e-05, |
| "loss": 0.2875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3457895815372467, |
| "step": 655, |
| "valid_targets_mean": 2723.4, |
| "valid_targets_min": 1094 |
| }, |
| { |
| "epoch": 1.3664596273291925, |
| "grad_norm": 0.867046377934047, |
| "learning_rate": 3.8917756302150627e-05, |
| "loss": 0.283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34926313161849976, |
| "step": 660, |
| "valid_targets_mean": 2280.2, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 1.3768115942028984, |
| "grad_norm": 0.8720982266233283, |
| "learning_rate": 3.8883992493207696e-05, |
| "loss": 0.3581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3935870826244354, |
| "step": 665, |
| "valid_targets_mean": 2969.8, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 1.3871635610766044, |
| "grad_norm": 0.7607813486400433, |
| "learning_rate": 3.8849725167205934e-05, |
| "loss": 0.376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35601186752319336, |
| "step": 670, |
| "valid_targets_mean": 2010.1, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 1.3975155279503104, |
| "grad_norm": 0.6244741241809822, |
| "learning_rate": 3.8814955237838954e-05, |
| "loss": 0.3097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33208197355270386, |
| "step": 675, |
| "valid_targets_mean": 2881.0, |
| "valid_targets_min": 633 |
| }, |
| { |
| "epoch": 1.4078674948240166, |
| "grad_norm": 0.701432966146093, |
| "learning_rate": 3.8779683632201625e-05, |
| "loss": 0.3234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2493334263563156, |
| "step": 680, |
| "valid_targets_mean": 2480.6, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 1.4182194616977226, |
| "grad_norm": 0.6386263618060875, |
| "learning_rate": 3.8743911290765354e-05, |
| "loss": 0.3563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33178985118865967, |
| "step": 685, |
| "valid_targets_mean": 2496.4, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 1.4285714285714286, |
| "grad_norm": 0.7163290212539811, |
| "learning_rate": 3.870763916735303e-05, |
| "loss": 0.3221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42771202325820923, |
| "step": 690, |
| "valid_targets_mean": 2670.1, |
| "valid_targets_min": 305 |
| }, |
| { |
| "epoch": 1.4389233954451346, |
| "grad_norm": 0.6173973599046334, |
| "learning_rate": 3.867086822911358e-05, |
| "loss": 0.3036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3355981111526489, |
| "step": 695, |
| "valid_targets_mean": 4034.1, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 1.4492753623188406, |
| "grad_norm": 0.593581318712642, |
| "learning_rate": 3.863359945649615e-05, |
| "loss": 0.2928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3260822296142578, |
| "step": 700, |
| "valid_targets_mean": 3011.0, |
| "valid_targets_min": 566 |
| }, |
| { |
| "epoch": 1.4596273291925466, |
| "grad_norm": 0.7037825237005169, |
| "learning_rate": 3.859583384322402e-05, |
| "loss": 0.3314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2873789072036743, |
| "step": 705, |
| "valid_targets_mean": 2114.8, |
| "valid_targets_min": 281 |
| }, |
| { |
| "epoch": 1.4699792960662525, |
| "grad_norm": 0.4809742053953339, |
| "learning_rate": 3.855757239626807e-05, |
| "loss": 0.2784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3173772394657135, |
| "step": 710, |
| "valid_targets_mean": 5494.3, |
| "valid_targets_min": 313 |
| }, |
| { |
| "epoch": 1.4803312629399585, |
| "grad_norm": 0.7992784007276763, |
| "learning_rate": 3.851881613581993e-05, |
| "loss": 0.3428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37110865116119385, |
| "step": 715, |
| "valid_targets_mean": 1696.1, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 1.4906832298136645, |
| "grad_norm": 0.7460466376190822, |
| "learning_rate": 3.847956609526481e-05, |
| "loss": 0.2999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36755889654159546, |
| "step": 720, |
| "valid_targets_mean": 2678.8, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 1.5010351966873707, |
| "grad_norm": 0.8015485930507722, |
| "learning_rate": 3.843982332115389e-05, |
| "loss": 0.3648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5440657734870911, |
| "step": 725, |
| "valid_targets_mean": 3186.0, |
| "valid_targets_min": 435 |
| }, |
| { |
| "epoch": 1.5113871635610767, |
| "grad_norm": 0.6245802617185957, |
| "learning_rate": 3.839958887317649e-05, |
| "loss": 0.2775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27157890796661377, |
| "step": 730, |
| "valid_targets_mean": 2370.6, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 1.5217391304347827, |
| "grad_norm": 0.8406585786723727, |
| "learning_rate": 3.8358863824131726e-05, |
| "loss": 0.3012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3849491477012634, |
| "step": 735, |
| "valid_targets_mean": 2885.7, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 1.5320910973084887, |
| "grad_norm": 0.6705418668893592, |
| "learning_rate": 3.831764925989999e-05, |
| "loss": 0.3017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2597661018371582, |
| "step": 740, |
| "valid_targets_mean": 2369.4, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 1.5424430641821947, |
| "grad_norm": 0.7570661925654296, |
| "learning_rate": 3.8275946279413946e-05, |
| "loss": 0.3126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4379417598247528, |
| "step": 745, |
| "valid_targets_mean": 3104.5, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 1.5527950310559007, |
| "grad_norm": 0.7568141088774238, |
| "learning_rate": 3.823375599462924e-05, |
| "loss": 0.315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3063448667526245, |
| "step": 750, |
| "valid_targets_mean": 1793.1, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 1.5631469979296067, |
| "grad_norm": 0.5008197907800821, |
| "learning_rate": 3.819107953049485e-05, |
| "loss": 0.2838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23246562480926514, |
| "step": 755, |
| "valid_targets_mean": 3298.4, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 1.5734989648033126, |
| "grad_norm": 0.6451644332169639, |
| "learning_rate": 3.814791802492309e-05, |
| "loss": 0.3332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4341411888599396, |
| "step": 760, |
| "valid_targets_mean": 3766.1, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 1.5838509316770186, |
| "grad_norm": 0.6316711474608361, |
| "learning_rate": 3.810427262875928e-05, |
| "loss": 0.3632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40523141622543335, |
| "step": 765, |
| "valid_targets_mean": 2900.8, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 1.5942028985507246, |
| "grad_norm": 0.6559079761601386, |
| "learning_rate": 3.8060144505751066e-05, |
| "loss": 0.3555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3753317594528198, |
| "step": 770, |
| "valid_targets_mean": 2754.6, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 1.6045548654244306, |
| "grad_norm": 0.8409357657293262, |
| "learning_rate": 3.8015534832517346e-05, |
| "loss": 0.2647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31297141313552856, |
| "step": 775, |
| "valid_targets_mean": 1537.7, |
| "valid_targets_min": 400 |
| }, |
| { |
| "epoch": 1.6149068322981366, |
| "grad_norm": 0.5230610037042105, |
| "learning_rate": 3.797044479851693e-05, |
| "loss": 0.3394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34146177768707275, |
| "step": 780, |
| "valid_targets_mean": 4368.2, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 1.6252587991718426, |
| "grad_norm": 0.8017960578186035, |
| "learning_rate": 3.7924875606016856e-05, |
| "loss": 0.3011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31278154253959656, |
| "step": 785, |
| "valid_targets_mean": 2435.0, |
| "valid_targets_min": 309 |
| }, |
| { |
| "epoch": 1.6356107660455486, |
| "grad_norm": 0.7307900776630412, |
| "learning_rate": 3.7878828470060274e-05, |
| "loss": 0.2563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24949385225772858, |
| "step": 790, |
| "valid_targets_mean": 1969.8, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 1.6459627329192545, |
| "grad_norm": 0.6089402692068703, |
| "learning_rate": 3.783230461843406e-05, |
| "loss": 0.3037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2793858051300049, |
| "step": 795, |
| "valid_targets_mean": 2419.0, |
| "valid_targets_min": 303 |
| }, |
| { |
| "epoch": 1.6563146997929605, |
| "grad_norm": 0.604875615097612, |
| "learning_rate": 3.7785305291636126e-05, |
| "loss": 0.3101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35383036732673645, |
| "step": 800, |
| "valid_targets_mean": 2854.2, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.7840139460025201, |
| "learning_rate": 3.773783174284228e-05, |
| "loss": 0.293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.270771324634552, |
| "step": 805, |
| "valid_targets_mean": 1783.1, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 1.6770186335403725, |
| "grad_norm": 0.5439330951892583, |
| "learning_rate": 3.768988523787287e-05, |
| "loss": 0.3221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2746136784553528, |
| "step": 810, |
| "valid_targets_mean": 3407.2, |
| "valid_targets_min": 459 |
| }, |
| { |
| "epoch": 1.6873706004140787, |
| "grad_norm": 0.707062238751807, |
| "learning_rate": 3.764146705515898e-05, |
| "loss": 0.2841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30619674921035767, |
| "step": 815, |
| "valid_targets_mean": 2142.9, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 1.6977225672877847, |
| "grad_norm": 0.6851395668736608, |
| "learning_rate": 3.759257848570838e-05, |
| "loss": 0.3534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5384789705276489, |
| "step": 820, |
| "valid_targets_mean": 3692.9, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 1.7080745341614907, |
| "grad_norm": 0.6969892105656047, |
| "learning_rate": 3.754322083307107e-05, |
| "loss": 0.3032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34344714879989624, |
| "step": 825, |
| "valid_targets_mean": 2168.1, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 1.7184265010351967, |
| "grad_norm": 0.6350233312646498, |
| "learning_rate": 3.749339541330457e-05, |
| "loss": 0.3013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21109239757061005, |
| "step": 830, |
| "valid_targets_mean": 2116.4, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 1.7287784679089027, |
| "grad_norm": 0.6242925285847643, |
| "learning_rate": 3.7443103554938794e-05, |
| "loss": 0.3074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35286158323287964, |
| "step": 835, |
| "valid_targets_mean": 2796.6, |
| "valid_targets_min": 347 |
| }, |
| { |
| "epoch": 1.7391304347826086, |
| "grad_norm": 0.7068835221058171, |
| "learning_rate": 3.739234659894062e-05, |
| "loss": 0.2794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27447009086608887, |
| "step": 840, |
| "valid_targets_mean": 1944.8, |
| "valid_targets_min": 488 |
| }, |
| { |
| "epoch": 1.7494824016563149, |
| "grad_norm": 0.7775094105121269, |
| "learning_rate": 3.7341125898678154e-05, |
| "loss": 0.3409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3335605561733246, |
| "step": 845, |
| "valid_targets_mean": 2268.7, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 1.7598343685300208, |
| "grad_norm": 0.7026899191258092, |
| "learning_rate": 3.7289442819884644e-05, |
| "loss": 0.3313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3098892867565155, |
| "step": 850, |
| "valid_targets_mean": 2165.6, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 1.7701863354037268, |
| "grad_norm": 0.7785694411643936, |
| "learning_rate": 3.723729874062206e-05, |
| "loss": 0.3383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5063181519508362, |
| "step": 855, |
| "valid_targets_mean": 3067.9, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 1.7805383022774328, |
| "grad_norm": 0.6864346250242391, |
| "learning_rate": 3.718469505124434e-05, |
| "loss": 0.3438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30108267068862915, |
| "step": 860, |
| "valid_targets_mean": 2758.5, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 1.7908902691511388, |
| "grad_norm": 0.6688063851094667, |
| "learning_rate": 3.7131633154360336e-05, |
| "loss": 0.2891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3029250204563141, |
| "step": 865, |
| "valid_targets_mean": 2407.8, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 1.8012422360248448, |
| "grad_norm": 0.6814618177356577, |
| "learning_rate": 3.707811446479639e-05, |
| "loss": 0.2774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3125041127204895, |
| "step": 870, |
| "valid_targets_mean": 2367.2, |
| "valid_targets_min": 1157 |
| }, |
| { |
| "epoch": 1.8115942028985508, |
| "grad_norm": 0.6124859430419072, |
| "learning_rate": 3.702414040955866e-05, |
| "loss": 0.3282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33444851636886597, |
| "step": 875, |
| "valid_targets_mean": 2857.4, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 1.8219461697722568, |
| "grad_norm": 0.5332243076283965, |
| "learning_rate": 3.696971242779499e-05, |
| "loss": 0.2784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30144771933555603, |
| "step": 880, |
| "valid_targets_mean": 3346.8, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 1.8322981366459627, |
| "grad_norm": 0.6418575705848031, |
| "learning_rate": 3.691483197075664e-05, |
| "loss": 0.314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2444503903388977, |
| "step": 885, |
| "valid_targets_mean": 2092.2, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 1.8426501035196687, |
| "grad_norm": 0.6840565309784318, |
| "learning_rate": 3.685950050175946e-05, |
| "loss": 0.2981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3534913659095764, |
| "step": 890, |
| "valid_targets_mean": 2626.1, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 1.8530020703933747, |
| "grad_norm": 0.6411961833023883, |
| "learning_rate": 3.680371949614503e-05, |
| "loss": 0.3, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3057364523410797, |
| "step": 895, |
| "valid_targets_mean": 2653.8, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 1.8633540372670807, |
| "grad_norm": 0.734143938781199, |
| "learning_rate": 3.6747490441241166e-05, |
| "loss": 0.3165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2625513970851898, |
| "step": 900, |
| "valid_targets_mean": 1966.4, |
| "valid_targets_min": 342 |
| }, |
| { |
| "epoch": 1.8737060041407867, |
| "grad_norm": 0.6002740004630833, |
| "learning_rate": 3.669081483632238e-05, |
| "loss": 0.2464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24936066567897797, |
| "step": 905, |
| "valid_targets_mean": 2350.6, |
| "valid_targets_min": 581 |
| }, |
| { |
| "epoch": 1.8840579710144927, |
| "grad_norm": 0.6634082462286021, |
| "learning_rate": 3.6633694192569835e-05, |
| "loss": 0.2822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2440337836742401, |
| "step": 910, |
| "valid_targets_mean": 2182.1, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 1.8944099378881987, |
| "grad_norm": 0.6598417402185687, |
| "learning_rate": 3.657613003303109e-05, |
| "loss": 0.3533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3100677728652954, |
| "step": 915, |
| "valid_targets_mean": 2527.1, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 1.9047619047619047, |
| "grad_norm": 0.7136251407724076, |
| "learning_rate": 3.651812389257947e-05, |
| "loss": 0.3177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40685153007507324, |
| "step": 920, |
| "valid_targets_mean": 2883.4, |
| "valid_targets_min": 438 |
| }, |
| { |
| "epoch": 1.9151138716356106, |
| "grad_norm": 0.8221505552013975, |
| "learning_rate": 3.645967731787313e-05, |
| "loss": 0.2988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.348793625831604, |
| "step": 925, |
| "valid_targets_mean": 1815.2, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 1.9254658385093166, |
| "grad_norm": 0.6714962697810101, |
| "learning_rate": 3.640079186731385e-05, |
| "loss": 0.2772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3066626787185669, |
| "step": 930, |
| "valid_targets_mean": 2163.9, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 1.9358178053830226, |
| "grad_norm": 0.8603452197126946, |
| "learning_rate": 3.634146911100547e-05, |
| "loss": 0.3325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3235263228416443, |
| "step": 935, |
| "valid_targets_mean": 2000.6, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 1.9461697722567288, |
| "grad_norm": 0.8181375628740634, |
| "learning_rate": 3.6281710630711984e-05, |
| "loss": 0.3459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33535006642341614, |
| "step": 940, |
| "valid_targets_mean": 2283.9, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 1.9565217391304348, |
| "grad_norm": 0.7661975352385241, |
| "learning_rate": 3.6221518019815436e-05, |
| "loss": 0.3142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32310929894447327, |
| "step": 945, |
| "valid_targets_mean": 2044.9, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 1.9668737060041408, |
| "grad_norm": 0.7546886437201982, |
| "learning_rate": 3.616089288327336e-05, |
| "loss": 0.2886, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3442019522190094, |
| "step": 950, |
| "valid_targets_mean": 2058.4, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 1.9772256728778468, |
| "grad_norm": 0.6284194122874336, |
| "learning_rate": 3.609983683757606e-05, |
| "loss": 0.3189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41605764627456665, |
| "step": 955, |
| "valid_targets_mean": 4267.4, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 1.9875776397515528, |
| "grad_norm": 0.565257067101154, |
| "learning_rate": 3.603835151070345e-05, |
| "loss": 0.2715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27033889293670654, |
| "step": 960, |
| "valid_targets_mean": 3668.6, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 1.9979296066252588, |
| "grad_norm": 0.6360153374329626, |
| "learning_rate": 3.5976438542081666e-05, |
| "loss": 0.2872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2408621609210968, |
| "step": 965, |
| "valid_targets_mean": 2069.4, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 2.008281573498965, |
| "grad_norm": 0.6357166576139243, |
| "learning_rate": 3.591409958253937e-05, |
| "loss": 0.2626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2636573612689972, |
| "step": 970, |
| "valid_targets_mean": 2536.4, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 2.018633540372671, |
| "grad_norm": 0.6716098344095058, |
| "learning_rate": 3.5851336294263696e-05, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25086358189582825, |
| "step": 975, |
| "valid_targets_mean": 2756.8, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 2.028985507246377, |
| "grad_norm": 0.4956351374220249, |
| "learning_rate": 3.578815035075597e-05, |
| "loss": 0.2524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2566456198692322, |
| "step": 980, |
| "valid_targets_mean": 5390.4, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 2.039337474120083, |
| "grad_norm": 0.7064220242643727, |
| "learning_rate": 3.572454343678705e-05, |
| "loss": 0.2702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2861258387565613, |
| "step": 985, |
| "valid_targets_mean": 2059.2, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 2.049689440993789, |
| "grad_norm": 0.8729780469833862, |
| "learning_rate": 3.566051724835245e-05, |
| "loss": 0.2594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32387927174568176, |
| "step": 990, |
| "valid_targets_mean": 1951.7, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 2.060041407867495, |
| "grad_norm": 0.6569866235371754, |
| "learning_rate": 3.559607349262705e-05, |
| "loss": 0.2351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23175671696662903, |
| "step": 995, |
| "valid_targets_mean": 2289.1, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 2.070393374741201, |
| "grad_norm": 0.9247889042046914, |
| "learning_rate": 3.5531213887919667e-05, |
| "loss": 0.2548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2623339295387268, |
| "step": 1000, |
| "valid_targets_mean": 2524.4, |
| "valid_targets_min": 232 |
| }, |
| { |
| "epoch": 2.080745341614907, |
| "grad_norm": 0.6363817576343097, |
| "learning_rate": 3.546594016362716e-05, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28919100761413574, |
| "step": 1005, |
| "valid_targets_mean": 2776.9, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 2.091097308488613, |
| "grad_norm": 0.7881930796673811, |
| "learning_rate": 3.540025406018834e-05, |
| "loss": 0.2697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2384035289287567, |
| "step": 1010, |
| "valid_targets_mean": 1624.8, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 2.101449275362319, |
| "grad_norm": 0.4465477565347781, |
| "learning_rate": 3.533415732903759e-05, |
| "loss": 0.2818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2667323648929596, |
| "step": 1015, |
| "valid_targets_mean": 5425.1, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 2.111801242236025, |
| "grad_norm": 0.7631555157748504, |
| "learning_rate": 3.5267651732558146e-05, |
| "loss": 0.2935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3835008442401886, |
| "step": 1020, |
| "valid_targets_mean": 2624.8, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 2.122153209109731, |
| "grad_norm": 0.55664148104698, |
| "learning_rate": 3.520073904403509e-05, |
| "loss": 0.2668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25191134214401245, |
| "step": 1025, |
| "valid_targets_mean": 3272.8, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 2.132505175983437, |
| "grad_norm": 0.8149036515302649, |
| "learning_rate": 3.513342104760809e-05, |
| "loss": 0.2167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22442390024662018, |
| "step": 1030, |
| "valid_targets_mean": 1833.1, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 2.142857142857143, |
| "grad_norm": 0.5802425971474474, |
| "learning_rate": 3.506569953822383e-05, |
| "loss": 0.2449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2896159291267395, |
| "step": 1035, |
| "valid_targets_mean": 3547.2, |
| "valid_targets_min": 342 |
| }, |
| { |
| "epoch": 2.153209109730849, |
| "grad_norm": 0.6221670768855667, |
| "learning_rate": 3.4997576321588126e-05, |
| "loss": 0.2757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22672376036643982, |
| "step": 1040, |
| "valid_targets_mean": 2443.9, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 2.1635610766045548, |
| "grad_norm": 0.8278897691479519, |
| "learning_rate": 3.492905321411781e-05, |
| "loss": 0.3221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2788503170013428, |
| "step": 1045, |
| "valid_targets_mean": 2161.9, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 2.1739130434782608, |
| "grad_norm": 0.6727746895274888, |
| "learning_rate": 3.486013204289227e-05, |
| "loss": 0.2404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21209818124771118, |
| "step": 1050, |
| "valid_targets_mean": 2909.8, |
| "valid_targets_min": 1008 |
| }, |
| { |
| "epoch": 2.1842650103519667, |
| "grad_norm": 0.6334119835007679, |
| "learning_rate": 3.479081464560475e-05, |
| "loss": 0.2621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29021257162094116, |
| "step": 1055, |
| "valid_targets_mean": 3242.4, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 2.1946169772256727, |
| "grad_norm": 1.1830366048428838, |
| "learning_rate": 3.4721102870513345e-05, |
| "loss": 0.253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36102619767189026, |
| "step": 1060, |
| "valid_targets_mean": 2006.9, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 2.2049689440993787, |
| "grad_norm": 0.8106585345203733, |
| "learning_rate": 3.465099857639173e-05, |
| "loss": 0.3153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27605193853378296, |
| "step": 1065, |
| "valid_targets_mean": 1677.1, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 2.2153209109730847, |
| "grad_norm": 0.5880377494754921, |
| "learning_rate": 3.458050363247957e-05, |
| "loss": 0.2832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24764445424079895, |
| "step": 1070, |
| "valid_targets_mean": 3182.0, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 2.2256728778467907, |
| "grad_norm": 0.5697074711554126, |
| "learning_rate": 3.450961991843271e-05, |
| "loss": 0.2566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24443545937538147, |
| "step": 1075, |
| "valid_targets_mean": 4197.8, |
| "valid_targets_min": 1715 |
| }, |
| { |
| "epoch": 2.2360248447204967, |
| "grad_norm": 0.7599961285605185, |
| "learning_rate": 3.4438349324273044e-05, |
| "loss": 0.2708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3468702733516693, |
| "step": 1080, |
| "valid_targets_mean": 2894.7, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 2.246376811594203, |
| "grad_norm": 0.7320534504878216, |
| "learning_rate": 3.436669375033812e-05, |
| "loss": 0.2941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2806239724159241, |
| "step": 1085, |
| "valid_targets_mean": 2801.9, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 2.256728778467909, |
| "grad_norm": 0.6651232453856196, |
| "learning_rate": 3.429465510723046e-05, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25253286957740784, |
| "step": 1090, |
| "valid_targets_mean": 2427.6, |
| "valid_targets_min": 404 |
| }, |
| { |
| "epoch": 2.267080745341615, |
| "grad_norm": 0.7318417075725385, |
| "learning_rate": 3.4222235315766634e-05, |
| "loss": 0.2887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2881121039390564, |
| "step": 1095, |
| "valid_targets_mean": 2698.2, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 2.277432712215321, |
| "grad_norm": 0.5060721290785742, |
| "learning_rate": 3.414943630692605e-05, |
| "loss": 0.2505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1891990602016449, |
| "step": 1100, |
| "valid_targets_mean": 3982.4, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 2.287784679089027, |
| "grad_norm": 0.6388973076559393, |
| "learning_rate": 3.407626002179943e-05, |
| "loss": 0.2605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2833097577095032, |
| "step": 1105, |
| "valid_targets_mean": 2923.7, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 2.298136645962733, |
| "grad_norm": 0.7050108379240185, |
| "learning_rate": 3.40027084115371e-05, |
| "loss": 0.2694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25936251878738403, |
| "step": 1110, |
| "valid_targets_mean": 2194.5, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 2.308488612836439, |
| "grad_norm": 1.1896188271617125, |
| "learning_rate": 3.3928783437296906e-05, |
| "loss": 0.2785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23933464288711548, |
| "step": 1115, |
| "valid_targets_mean": 2121.6, |
| "valid_targets_min": 435 |
| }, |
| { |
| "epoch": 2.318840579710145, |
| "grad_norm": 0.5651209935539805, |
| "learning_rate": 3.385448707019199e-05, |
| "loss": 0.2806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25165855884552, |
| "step": 1120, |
| "valid_targets_mean": 4061.7, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 2.329192546583851, |
| "grad_norm": 0.7262731183176127, |
| "learning_rate": 3.37798212912382e-05, |
| "loss": 0.2524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2577860951423645, |
| "step": 1125, |
| "valid_targets_mean": 2202.4, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 2.339544513457557, |
| "grad_norm": 0.5618393584824415, |
| "learning_rate": 3.370478809130126e-05, |
| "loss": 0.2452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1696050465106964, |
| "step": 1130, |
| "valid_targets_mean": 2500.9, |
| "valid_targets_min": 347 |
| }, |
| { |
| "epoch": 2.349896480331263, |
| "grad_norm": 0.7126252849015065, |
| "learning_rate": 3.3629389471043686e-05, |
| "loss": 0.2928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3189730942249298, |
| "step": 1135, |
| "valid_targets_mean": 3294.7, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 2.360248447204969, |
| "grad_norm": 0.9604299856824035, |
| "learning_rate": 3.355362744087147e-05, |
| "loss": 0.3133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40159639716148376, |
| "step": 1140, |
| "valid_targets_mean": 3716.9, |
| "valid_targets_min": 314 |
| }, |
| { |
| "epoch": 2.370600414078675, |
| "grad_norm": 0.6100748889704821, |
| "learning_rate": 3.347750402088046e-05, |
| "loss": 0.2548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25193271040916443, |
| "step": 1145, |
| "valid_targets_mean": 3066.1, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 2.380952380952381, |
| "grad_norm": 0.6513131119801923, |
| "learning_rate": 3.3401021240802446e-05, |
| "loss": 0.259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23295412957668304, |
| "step": 1150, |
| "valid_targets_mean": 2498.0, |
| "valid_targets_min": 428 |
| }, |
| { |
| "epoch": 2.391304347826087, |
| "grad_norm": 0.6813554157755068, |
| "learning_rate": 3.332418113995116e-05, |
| "loss": 0.2621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19543245434761047, |
| "step": 1155, |
| "valid_targets_mean": 2158.0, |
| "valid_targets_min": 831 |
| }, |
| { |
| "epoch": 2.401656314699793, |
| "grad_norm": 0.7313840895870419, |
| "learning_rate": 3.3246985767167763e-05, |
| "loss": 0.2842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22841569781303406, |
| "step": 1160, |
| "valid_targets_mean": 2154.1, |
| "valid_targets_min": 400 |
| }, |
| { |
| "epoch": 2.412008281573499, |
| "grad_norm": 0.5935846326263404, |
| "learning_rate": 3.316943718076633e-05, |
| "loss": 0.2533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.333047479391098, |
| "step": 1165, |
| "valid_targets_mean": 4248.6, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 2.422360248447205, |
| "grad_norm": 0.791044272962795, |
| "learning_rate": 3.3091537448478854e-05, |
| "loss": 0.2778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26495736837387085, |
| "step": 1170, |
| "valid_targets_mean": 2369.9, |
| "valid_targets_min": 975 |
| }, |
| { |
| "epoch": 2.432712215320911, |
| "grad_norm": 0.6676783405628622, |
| "learning_rate": 3.301328864740024e-05, |
| "loss": 0.2738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33358559012413025, |
| "step": 1175, |
| "valid_targets_mean": 2824.4, |
| "valid_targets_min": 438 |
| }, |
| { |
| "epoch": 2.443064182194617, |
| "grad_norm": 0.6210999987816006, |
| "learning_rate": 3.2934692863932826e-05, |
| "loss": 0.2883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37713438272476196, |
| "step": 1180, |
| "valid_targets_mean": 4190.8, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 2.453416149068323, |
| "grad_norm": 0.9102484172009931, |
| "learning_rate": 3.285575219373079e-05, |
| "loss": 0.2817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27761310338974, |
| "step": 1185, |
| "valid_targets_mean": 2286.0, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 2.463768115942029, |
| "grad_norm": 0.8264325779605302, |
| "learning_rate": 3.2776468741644254e-05, |
| "loss": 0.2705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35481444001197815, |
| "step": 1190, |
| "valid_targets_mean": 1918.8, |
| "valid_targets_min": 488 |
| }, |
| { |
| "epoch": 2.474120082815735, |
| "grad_norm": 0.7271253546023544, |
| "learning_rate": 3.26968446216632e-05, |
| "loss": 0.2342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26062947511672974, |
| "step": 1195, |
| "valid_targets_mean": 2231.8, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 2.4844720496894412, |
| "grad_norm": 0.8973929287276415, |
| "learning_rate": 3.2616881956861025e-05, |
| "loss": 0.2677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27928027510643005, |
| "step": 1200, |
| "valid_targets_mean": 1896.2, |
| "valid_targets_min": 348 |
| }, |
| { |
| "epoch": 2.494824016563147, |
| "grad_norm": 0.4082069685047567, |
| "learning_rate": 3.2536582879338046e-05, |
| "loss": 0.2536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18940213322639465, |
| "step": 1205, |
| "valid_targets_mean": 4323.4, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 2.505175983436853, |
| "grad_norm": 0.7017656676375894, |
| "learning_rate": 3.245594953016455e-05, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2417268604040146, |
| "step": 1210, |
| "valid_targets_mean": 2325.2, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 2.5155279503105588, |
| "grad_norm": 0.6814415938184818, |
| "learning_rate": 3.237498405932374e-05, |
| "loss": 0.2775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33832401037216187, |
| "step": 1215, |
| "valid_targets_mean": 2867.0, |
| "valid_targets_min": 887 |
| }, |
| { |
| "epoch": 2.525879917184265, |
| "grad_norm": 0.7801644137826693, |
| "learning_rate": 3.2293688625654414e-05, |
| "loss": 0.2863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27744320034980774, |
| "step": 1220, |
| "valid_targets_mean": 1826.2, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 2.536231884057971, |
| "grad_norm": 0.7921338973324987, |
| "learning_rate": 3.221206539679342e-05, |
| "loss": 0.2726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2806174159049988, |
| "step": 1225, |
| "valid_targets_mean": 4052.1, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 2.546583850931677, |
| "grad_norm": 0.7638655535817076, |
| "learning_rate": 3.213011654911781e-05, |
| "loss": 0.2941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22334516048431396, |
| "step": 1230, |
| "valid_targets_mean": 1654.2, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 2.556935817805383, |
| "grad_norm": 0.9533183958110001, |
| "learning_rate": 3.204784426768685e-05, |
| "loss": 0.2639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22882500290870667, |
| "step": 1235, |
| "valid_targets_mean": 3256.3, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 2.567287784679089, |
| "grad_norm": 0.3343640416944216, |
| "learning_rate": 3.1965250746183755e-05, |
| "loss": 0.2482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13794702291488647, |
| "step": 1240, |
| "valid_targets_mean": 5393.2, |
| "valid_targets_min": 363 |
| }, |
| { |
| "epoch": 2.577639751552795, |
| "grad_norm": 0.6369559557128881, |
| "learning_rate": 3.1882338186857164e-05, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2859078645706177, |
| "step": 1245, |
| "valid_targets_mean": 2821.6, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 2.587991718426501, |
| "grad_norm": 0.6063783751731852, |
| "learning_rate": 3.1799108800462466e-05, |
| "loss": 0.3386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31201863288879395, |
| "step": 1250, |
| "valid_targets_mean": 3289.1, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 2.598343685300207, |
| "grad_norm": 0.5142821780449842, |
| "learning_rate": 3.1715564806202815e-05, |
| "loss": 0.3602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2918277978897095, |
| "step": 1255, |
| "valid_targets_mean": 3862.7, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 2.608695652173913, |
| "grad_norm": 0.5889004684696514, |
| "learning_rate": 3.1631708431669985e-05, |
| "loss": 0.2493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2696582078933716, |
| "step": 1260, |
| "valid_targets_mean": 3824.6, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 2.619047619047619, |
| "grad_norm": 0.6639591263396689, |
| "learning_rate": 3.1547541912784965e-05, |
| "loss": 0.2819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25455427169799805, |
| "step": 1265, |
| "valid_targets_mean": 2578.6, |
| "valid_targets_min": 337 |
| }, |
| { |
| "epoch": 2.629399585921325, |
| "grad_norm": 0.6938668640706942, |
| "learning_rate": 3.146306749373833e-05, |
| "loss": 0.27, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.285896360874176, |
| "step": 1270, |
| "valid_targets_mean": 2242.8, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 2.639751552795031, |
| "grad_norm": 0.6635900887759165, |
| "learning_rate": 3.137828742693041e-05, |
| "loss": 0.3081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3423786163330078, |
| "step": 1275, |
| "valid_targets_mean": 3281.0, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 2.650103519668737, |
| "grad_norm": 0.6801128006550414, |
| "learning_rate": 3.129320397291125e-05, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2767699360847473, |
| "step": 1280, |
| "valid_targets_mean": 2735.9, |
| "valid_targets_min": 464 |
| }, |
| { |
| "epoch": 2.660455486542443, |
| "grad_norm": 0.7025184682700185, |
| "learning_rate": 3.12078194003203e-05, |
| "loss": 0.2553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27691537141799927, |
| "step": 1285, |
| "valid_targets_mean": 2134.4, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 2.670807453416149, |
| "grad_norm": 0.5924464858785424, |
| "learning_rate": 3.112213598582596e-05, |
| "loss": 0.2732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15232308208942413, |
| "step": 1290, |
| "valid_targets_mean": 4905.1, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 2.681159420289855, |
| "grad_norm": 0.7877428337019158, |
| "learning_rate": 3.1036156014064846e-05, |
| "loss": 0.2453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24164274334907532, |
| "step": 1295, |
| "valid_targets_mean": 2376.1, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 2.691511387163561, |
| "grad_norm": 0.7142467961580515, |
| "learning_rate": 3.094988177758091e-05, |
| "loss": 0.2558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37197333574295044, |
| "step": 1300, |
| "valid_targets_mean": 3346.9, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 2.701863354037267, |
| "grad_norm": 0.5870935195942067, |
| "learning_rate": 3.086331557676426e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2159366011619568, |
| "step": 1305, |
| "valid_targets_mean": 2964.8, |
| "valid_targets_min": 274 |
| }, |
| { |
| "epoch": 2.712215320910973, |
| "grad_norm": 0.6872956928546283, |
| "learning_rate": 3.0776459719789876e-05, |
| "loss": 0.2727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31350186467170715, |
| "step": 1310, |
| "valid_targets_mean": 2581.4, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 2.722567287784679, |
| "grad_norm": 0.7486101772028452, |
| "learning_rate": 3.0689316522556026e-05, |
| "loss": 0.3293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2855913043022156, |
| "step": 1315, |
| "valid_targets_mean": 2561.9, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 2.732919254658385, |
| "grad_norm": 0.4579078783293101, |
| "learning_rate": 3.060188830862254e-05, |
| "loss": 0.2429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27316346764564514, |
| "step": 1320, |
| "valid_targets_mean": 6253.2, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 2.7432712215320914, |
| "grad_norm": 0.5358219876585554, |
| "learning_rate": 3.0514177409148854e-05, |
| "loss": 0.2497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19187697768211365, |
| "step": 1325, |
| "valid_targets_mean": 2720.8, |
| "valid_targets_min": 386 |
| }, |
| { |
| "epoch": 2.753623188405797, |
| "grad_norm": 0.5552497910549137, |
| "learning_rate": 3.042618616283184e-05, |
| "loss": 0.2521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27454033493995667, |
| "step": 1330, |
| "valid_targets_mean": 3399.2, |
| "valid_targets_min": 397 |
| }, |
| { |
| "epoch": 2.7639751552795033, |
| "grad_norm": 0.6823834665507209, |
| "learning_rate": 3.0337916915843437e-05, |
| "loss": 0.2599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2507593631744385, |
| "step": 1335, |
| "valid_targets_mean": 2280.2, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 2.774327122153209, |
| "grad_norm": 0.7550596937365505, |
| "learning_rate": 3.024937202176813e-05, |
| "loss": 0.3365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2813539505004883, |
| "step": 1340, |
| "valid_targets_mean": 1925.6, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 2.7846790890269153, |
| "grad_norm": 0.620351083586836, |
| "learning_rate": 3.016055384154016e-05, |
| "loss": 0.2645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27360090613365173, |
| "step": 1345, |
| "valid_targets_mean": 2753.7, |
| "valid_targets_min": 1050 |
| }, |
| { |
| "epoch": 2.795031055900621, |
| "grad_norm": 0.5870647895388508, |
| "learning_rate": 3.007146474338061e-05, |
| "loss": 0.2453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25962918996810913, |
| "step": 1350, |
| "valid_targets_mean": 3009.2, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 2.8053830227743273, |
| "grad_norm": 0.7132808075099697, |
| "learning_rate": 2.9982107102734225e-05, |
| "loss": 0.2373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28429892659187317, |
| "step": 1355, |
| "valid_targets_mean": 2095.7, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 2.8157349896480333, |
| "grad_norm": 0.5718661527861477, |
| "learning_rate": 2.9892483302206067e-05, |
| "loss": 0.2013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20819316804409027, |
| "step": 1360, |
| "valid_targets_mean": 2768.9, |
| "valid_targets_min": 258 |
| }, |
| { |
| "epoch": 2.8260869565217392, |
| "grad_norm": 0.3634008953249174, |
| "learning_rate": 2.9802595731498027e-05, |
| "loss": 0.2315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1665099710226059, |
| "step": 1365, |
| "valid_targets_mean": 6357.5, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 2.8364389233954452, |
| "grad_norm": 0.7314349692520135, |
| "learning_rate": 2.9712446787345076e-05, |
| "loss": 0.2482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30443474650382996, |
| "step": 1370, |
| "valid_targets_mean": 2490.6, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 2.846790890269151, |
| "grad_norm": 0.5362978528913575, |
| "learning_rate": 2.962203887345137e-05, |
| "loss": 0.2646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2595052719116211, |
| "step": 1375, |
| "valid_targets_mean": 3539.8, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 2.857142857142857, |
| "grad_norm": 0.6062346483149705, |
| "learning_rate": 2.9531374400426158e-05, |
| "loss": 0.3262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24060280621051788, |
| "step": 1380, |
| "valid_targets_mean": 2836.4, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 2.867494824016563, |
| "grad_norm": 0.7082210941894594, |
| "learning_rate": 2.9440455785719496e-05, |
| "loss": 0.2887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2264600545167923, |
| "step": 1385, |
| "valid_targets_mean": 1664.6, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 2.877846790890269, |
| "grad_norm": 0.6123887449000341, |
| "learning_rate": 2.934928545355781e-05, |
| "loss": 0.2984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3257123827934265, |
| "step": 1390, |
| "valid_targets_mean": 3369.2, |
| "valid_targets_min": 829 |
| }, |
| { |
| "epoch": 2.888198757763975, |
| "grad_norm": 0.6864043917128869, |
| "learning_rate": 2.925786583487922e-05, |
| "loss": 0.2905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31987008452415466, |
| "step": 1395, |
| "valid_targets_mean": 2711.7, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 2.898550724637681, |
| "grad_norm": 0.6080342575365325, |
| "learning_rate": 2.916619936726877e-05, |
| "loss": 0.2845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2373320758342743, |
| "step": 1400, |
| "valid_targets_mean": 3641.7, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 2.908902691511387, |
| "grad_norm": 0.7181192036864602, |
| "learning_rate": 2.9074288494893407e-05, |
| "loss": 0.3389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31169378757476807, |
| "step": 1405, |
| "valid_targets_mean": 2594.9, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 2.919254658385093, |
| "grad_norm": 0.7116785040649848, |
| "learning_rate": 2.8982135668436796e-05, |
| "loss": 0.2504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2377220094203949, |
| "step": 1410, |
| "valid_targets_mean": 2565.6, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 2.929606625258799, |
| "grad_norm": 0.527003497336332, |
| "learning_rate": 2.8889743345034012e-05, |
| "loss": 0.2567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24901200830936432, |
| "step": 1415, |
| "valid_targets_mean": 3355.5, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 2.939958592132505, |
| "grad_norm": 0.7215643198974966, |
| "learning_rate": 2.8797113988205992e-05, |
| "loss": 0.2702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26589393615722656, |
| "step": 1420, |
| "valid_targets_mean": 2117.3, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 2.950310559006211, |
| "grad_norm": 0.7304693761897525, |
| "learning_rate": 2.8704250067793853e-05, |
| "loss": 0.2543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3305160701274872, |
| "step": 1425, |
| "valid_targets_mean": 2289.8, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 2.960662525879917, |
| "grad_norm": 0.5524041278998529, |
| "learning_rate": 2.8611154059893072e-05, |
| "loss": 0.2346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2436435967683792, |
| "step": 1430, |
| "valid_targets_mean": 3544.5, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 2.971014492753623, |
| "grad_norm": 0.6949146976027709, |
| "learning_rate": 2.851782844678741e-05, |
| "loss": 0.2591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24652817845344543, |
| "step": 1435, |
| "valid_targets_mean": 2396.6, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 2.981366459627329, |
| "grad_norm": 0.855845523061833, |
| "learning_rate": 2.8424275716882764e-05, |
| "loss": 0.3187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35203707218170166, |
| "step": 1440, |
| "valid_targets_mean": 2468.2, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 2.991718426501035, |
| "grad_norm": 0.6069280690104846, |
| "learning_rate": 2.8330498364640803e-05, |
| "loss": 0.2729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2389097809791565, |
| "step": 1445, |
| "valid_targets_mean": 2823.1, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 3.002070393374741, |
| "grad_norm": 0.7079484446595876, |
| "learning_rate": 2.823649889051245e-05, |
| "loss": 0.2605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33429914712905884, |
| "step": 1450, |
| "valid_targets_mean": 2347.8, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 3.012422360248447, |
| "grad_norm": 0.5927362264974598, |
| "learning_rate": 2.8142279800871226e-05, |
| "loss": 0.2097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17803658545017242, |
| "step": 1455, |
| "valid_targets_mean": 2970.0, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 3.022774327122153, |
| "grad_norm": 0.6173739269582847, |
| "learning_rate": 2.8047843607946416e-05, |
| "loss": 0.2336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21716290712356567, |
| "step": 1460, |
| "valid_targets_mean": 3280.1, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 3.0331262939958594, |
| "grad_norm": 0.8835749274852875, |
| "learning_rate": 2.7953192829756087e-05, |
| "loss": 0.2605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23659950494766235, |
| "step": 1465, |
| "valid_targets_mean": 1768.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 3.0434782608695654, |
| "grad_norm": 0.6416344650777536, |
| "learning_rate": 2.7858329990039922e-05, |
| "loss": 0.2249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26247477531433105, |
| "step": 1470, |
| "valid_targets_mean": 4569.3, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 3.0538302277432714, |
| "grad_norm": 0.7529415797399801, |
| "learning_rate": 2.7763257618191965e-05, |
| "loss": 0.2372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26717787981033325, |
| "step": 1475, |
| "valid_targets_mean": 2397.6, |
| "valid_targets_min": 277 |
| }, |
| { |
| "epoch": 3.0641821946169774, |
| "grad_norm": 0.7317704953810572, |
| "learning_rate": 2.7667978249193142e-05, |
| "loss": 0.26, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21715983748435974, |
| "step": 1480, |
| "valid_targets_mean": 2296.4, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 3.0745341614906834, |
| "grad_norm": 0.5247604954590532, |
| "learning_rate": 2.757249442354373e-05, |
| "loss": 0.2678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27207493782043457, |
| "step": 1485, |
| "valid_targets_mean": 5021.0, |
| "valid_targets_min": 496 |
| }, |
| { |
| "epoch": 3.0848861283643894, |
| "grad_norm": 1.0520512297726068, |
| "learning_rate": 2.747680868719553e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2122560292482376, |
| "step": 1490, |
| "valid_targets_mean": 2820.4, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 3.0952380952380953, |
| "grad_norm": 0.6767778323794827, |
| "learning_rate": 2.738092359148405e-05, |
| "loss": 0.2312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2775751054286957, |
| "step": 1495, |
| "valid_targets_mean": 2690.2, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 3.1055900621118013, |
| "grad_norm": 0.6576226728100677, |
| "learning_rate": 2.7284841693060462e-05, |
| "loss": 0.2208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20576655864715576, |
| "step": 1500, |
| "valid_targets_mean": 2834.8, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 2.439222042139384, |
| "grad_norm": 0.8205999048363152, |
| "learning_rate": 3.295112400968073e-05, |
| "loss": 0.2474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2548583745956421, |
| "step": 1505, |
| "valid_targets_mean": 1901.8, |
| "valid_targets_min": 292 |
| }, |
| { |
| "epoch": 2.447325769854133, |
| "grad_norm": 0.5315794072702741, |
| "learning_rate": 3.2889429817593494e-05, |
| "loss": 0.2603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1704677790403366, |
| "step": 1510, |
| "valid_targets_mean": 3963.4, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 2.4554294975688817, |
| "grad_norm": 0.7664196020253414, |
| "learning_rate": 3.2827525129535135e-05, |
| "loss": 0.2847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1991099715232849, |
| "step": 1515, |
| "valid_targets_mean": 2012.4, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 2.4635332252836304, |
| "grad_norm": 0.8521592624429181, |
| "learning_rate": 3.276541095646482e-05, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29062721133232117, |
| "step": 1520, |
| "valid_targets_mean": 1823.2, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 2.471636952998379, |
| "grad_norm": 0.5852765718678786, |
| "learning_rate": 3.2703088312762825e-05, |
| "loss": 0.2458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24727652966976166, |
| "step": 1525, |
| "valid_targets_mean": 3405.0, |
| "valid_targets_min": 363 |
| }, |
| { |
| "epoch": 2.479740680713128, |
| "grad_norm": 0.813053837691479, |
| "learning_rate": 3.2640558216213914e-05, |
| "loss": 0.2491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30369141697883606, |
| "step": 1530, |
| "valid_targets_mean": 2343.3, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 2.487844408427877, |
| "grad_norm": 0.8194320234055189, |
| "learning_rate": 3.2577821687990764e-05, |
| "loss": 0.2135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23056931793689728, |
| "step": 1535, |
| "valid_targets_mean": 2043.1, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 2.4959481361426255, |
| "grad_norm": 0.7683424849834839, |
| "learning_rate": 3.2514879752637236e-05, |
| "loss": 0.2137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2309729903936386, |
| "step": 1540, |
| "valid_targets_mean": 2539.1, |
| "valid_targets_min": 331 |
| }, |
| { |
| "epoch": 2.5040518638573745, |
| "grad_norm": 0.776312961878328, |
| "learning_rate": 3.2451733438051705e-05, |
| "loss": 0.2291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18839803338050842, |
| "step": 1545, |
| "valid_targets_mean": 1955.8, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 2.512155591572123, |
| "grad_norm": 0.655759060281187, |
| "learning_rate": 3.238838377547023e-05, |
| "loss": 0.2003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.189316064119339, |
| "step": 1550, |
| "valid_targets_mean": 2929.6, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 2.520259319286872, |
| "grad_norm": 1.6044275923948417, |
| "learning_rate": 3.2324831799449724e-05, |
| "loss": 0.2272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17633099853992462, |
| "step": 1555, |
| "valid_targets_mean": 2779.9, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 2.528363047001621, |
| "grad_norm": 0.6561320237172028, |
| "learning_rate": 3.226107854785106e-05, |
| "loss": 0.2557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1860257238149643, |
| "step": 1560, |
| "valid_targets_mean": 3073.5, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 2.5364667747163696, |
| "grad_norm": 0.6383285185047638, |
| "learning_rate": 3.2197125061822135e-05, |
| "loss": 0.2507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2523868680000305, |
| "step": 1565, |
| "valid_targets_mean": 3199.5, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 2.5445705024311183, |
| "grad_norm": 0.7962930999328149, |
| "learning_rate": 3.213297238578082e-05, |
| "loss": 0.2197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20864513516426086, |
| "step": 1570, |
| "valid_targets_mean": 2732.2, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 2.5526742301458674, |
| "grad_norm": 0.7676276530225514, |
| "learning_rate": 3.206862156739799e-05, |
| "loss": 0.2563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3047863245010376, |
| "step": 1575, |
| "valid_targets_mean": 2614.4, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 2.560777957860616, |
| "grad_norm": 0.8226887644393849, |
| "learning_rate": 3.2004073657580314e-05, |
| "loss": 0.1946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2075314223766327, |
| "step": 1580, |
| "valid_targets_mean": 2038.8, |
| "valid_targets_min": 337 |
| }, |
| { |
| "epoch": 2.5688816855753647, |
| "grad_norm": 0.7831791976947534, |
| "learning_rate": 3.193932971045316e-05, |
| "loss": 0.2325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19461211562156677, |
| "step": 1585, |
| "valid_targets_mean": 2053.1, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 2.5769854132901133, |
| "grad_norm": 0.5644239851430982, |
| "learning_rate": 3.187439078334338e-05, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18497009575366974, |
| "step": 1590, |
| "valid_targets_mean": 4375.7, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 2.585089141004862, |
| "grad_norm": 0.7466943240187409, |
| "learning_rate": 3.180925793676199e-05, |
| "loss": 0.2696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34886205196380615, |
| "step": 1595, |
| "valid_targets_mean": 3252.1, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 2.593192868719611, |
| "grad_norm": 0.654235875346469, |
| "learning_rate": 3.1743932234386905e-05, |
| "loss": 0.2239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23556801676750183, |
| "step": 1600, |
| "valid_targets_mean": 2707.2, |
| "valid_targets_min": 440 |
| }, |
| { |
| "epoch": 2.6012965964343597, |
| "grad_norm": 0.8478531512416733, |
| "learning_rate": 3.167841474304555e-05, |
| "loss": 0.2373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2540985345840454, |
| "step": 1605, |
| "valid_targets_mean": 2202.8, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 2.6094003241491084, |
| "grad_norm": 0.7568048524801189, |
| "learning_rate": 3.161270653269743e-05, |
| "loss": 0.2419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2507561445236206, |
| "step": 1610, |
| "valid_targets_mean": 2478.7, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 2.6175040518638575, |
| "grad_norm": 0.6768880292640026, |
| "learning_rate": 3.154680867641666e-05, |
| "loss": 0.2685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2119147777557373, |
| "step": 1615, |
| "valid_targets_mean": 2845.9, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 2.625607779578606, |
| "grad_norm": 0.6937745038803551, |
| "learning_rate": 3.1480722250374454e-05, |
| "loss": 0.2131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15716394782066345, |
| "step": 1620, |
| "valid_targets_mean": 3715.1, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 2.633711507293355, |
| "grad_norm": 0.687030718167616, |
| "learning_rate": 3.1414448333821526e-05, |
| "loss": 0.2485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26078009605407715, |
| "step": 1625, |
| "valid_targets_mean": 2993.9, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 2.641815235008104, |
| "grad_norm": 0.794998960315971, |
| "learning_rate": 3.1347988009070496e-05, |
| "loss": 0.2525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22042764723300934, |
| "step": 1630, |
| "valid_targets_mean": 2182.0, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 2.6499189627228525, |
| "grad_norm": 0.5288765889583341, |
| "learning_rate": 3.1281342361478184e-05, |
| "loss": 0.2031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18932923674583435, |
| "step": 1635, |
| "valid_targets_mean": 4350.9, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 2.658022690437601, |
| "grad_norm": 0.8061510946147543, |
| "learning_rate": 3.121451247942789e-05, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23893296718597412, |
| "step": 1640, |
| "valid_targets_mean": 2239.7, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 2.6661264181523503, |
| "grad_norm": 0.8897502162805498, |
| "learning_rate": 3.1147499454311654e-05, |
| "loss": 0.2132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24748632311820984, |
| "step": 1645, |
| "valid_targets_mean": 3042.6, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 2.674230145867099, |
| "grad_norm": 0.7411104018017028, |
| "learning_rate": 3.1080304380512386e-05, |
| "loss": 0.2258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3214663565158844, |
| "step": 1650, |
| "valid_targets_mean": 3191.7, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 2.6823338735818476, |
| "grad_norm": 0.6001100044618921, |
| "learning_rate": 3.101292835538602e-05, |
| "loss": 0.2736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21718555688858032, |
| "step": 1655, |
| "valid_targets_mean": 2929.2, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 2.6904376012965967, |
| "grad_norm": 0.5090566874249545, |
| "learning_rate": 3.0945372479243605e-05, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1351870894432068, |
| "step": 1660, |
| "valid_targets_mean": 3636.1, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 2.6985413290113454, |
| "grad_norm": 0.8691139316583438, |
| "learning_rate": 3.087763785533328e-05, |
| "loss": 0.2353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24571505188941956, |
| "step": 1665, |
| "valid_targets_mean": 2121.1, |
| "valid_targets_min": 1000 |
| }, |
| { |
| "epoch": 2.706645056726094, |
| "grad_norm": 0.7213977715140599, |
| "learning_rate": 3.0809725589822325e-05, |
| "loss": 0.2162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22522029280662537, |
| "step": 1670, |
| "valid_targets_mean": 2168.9, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 2.7147487844408427, |
| "grad_norm": 0.6699076338131222, |
| "learning_rate": 3.074163679177907e-05, |
| "loss": 0.2315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24370843172073364, |
| "step": 1675, |
| "valid_targets_mean": 2977.4, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 2.7228525121555913, |
| "grad_norm": 0.6699594167700161, |
| "learning_rate": 3.067337257315477e-05, |
| "loss": 0.2335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19450387358665466, |
| "step": 1680, |
| "valid_targets_mean": 2758.7, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 2.7309562398703404, |
| "grad_norm": 0.7672860021178419, |
| "learning_rate": 3.0604934048765444e-05, |
| "loss": 0.2039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22159236669540405, |
| "step": 1685, |
| "valid_targets_mean": 2533.1, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 2.739059967585089, |
| "grad_norm": 0.7039751582203525, |
| "learning_rate": 3.05363223362737e-05, |
| "loss": 0.1949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2049209177494049, |
| "step": 1690, |
| "valid_targets_mean": 2859.5, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 2.7471636952998377, |
| "grad_norm": 2.679447162042586, |
| "learning_rate": 3.0467538556170463e-05, |
| "loss": 0.1958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1371978223323822, |
| "step": 1695, |
| "valid_targets_mean": 2292.4, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 2.755267423014587, |
| "grad_norm": 0.6779419086781114, |
| "learning_rate": 3.0398583831756655e-05, |
| "loss": 0.2261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20101284980773926, |
| "step": 1700, |
| "valid_targets_mean": 2922.6, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.7633711507293355, |
| "grad_norm": 0.6929703972487979, |
| "learning_rate": 3.03294592891249e-05, |
| "loss": 0.2141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2838400602340698, |
| "step": 1705, |
| "valid_targets_mean": 3094.0, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 2.771474878444084, |
| "grad_norm": 0.4798656780585094, |
| "learning_rate": 3.0260166057141086e-05, |
| "loss": 0.209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18296658992767334, |
| "step": 1710, |
| "valid_targets_mean": 5082.8, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 2.7795786061588332, |
| "grad_norm": 0.7731022915468665, |
| "learning_rate": 3.0190705267425956e-05, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25233393907546997, |
| "step": 1715, |
| "valid_targets_mean": 2334.8, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 2.787682333873582, |
| "grad_norm": 0.833833609952511, |
| "learning_rate": 3.0121078054336633e-05, |
| "loss": 0.2451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27136874198913574, |
| "step": 1720, |
| "valid_targets_mean": 3887.7, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 2.7957860615883305, |
| "grad_norm": 0.572927781409477, |
| "learning_rate": 3.005128555494806e-05, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16209685802459717, |
| "step": 1725, |
| "valid_targets_mean": 3344.1, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 2.8038897893030796, |
| "grad_norm": 0.8175035205190527, |
| "learning_rate": 2.998132890903448e-05, |
| "loss": 0.2499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2571600377559662, |
| "step": 1730, |
| "valid_targets_mean": 2496.4, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 2.8119935170178283, |
| "grad_norm": 0.820561644375052, |
| "learning_rate": 2.9911209259050763e-05, |
| "loss": 0.2355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21497473120689392, |
| "step": 1735, |
| "valid_targets_mean": 2354.7, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 2.820097244732577, |
| "grad_norm": 0.6492150323752979, |
| "learning_rate": 2.984092775011382e-05, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16714109480381012, |
| "step": 1740, |
| "valid_targets_mean": 2458.3, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 2.828200972447326, |
| "grad_norm": 0.7319549857733452, |
| "learning_rate": 2.9770485529983834e-05, |
| "loss": 0.2395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22950349748134613, |
| "step": 1745, |
| "valid_targets_mean": 3142.0, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 2.8363047001620747, |
| "grad_norm": 0.6560080208991743, |
| "learning_rate": 2.9699883749045564e-05, |
| "loss": 0.2336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1986587643623352, |
| "step": 1750, |
| "valid_targets_mean": 3457.0, |
| "valid_targets_min": 477 |
| }, |
| { |
| "epoch": 2.8444084278768234, |
| "grad_norm": 0.6382253092955735, |
| "learning_rate": 2.962912356028953e-05, |
| "loss": 0.216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23129406571388245, |
| "step": 1755, |
| "valid_targets_mean": 2934.9, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 2.852512155591572, |
| "grad_norm": 0.5301256913380961, |
| "learning_rate": 2.95582061192932e-05, |
| "loss": 0.2389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18352752923965454, |
| "step": 1760, |
| "valid_targets_mean": 5318.9, |
| "valid_targets_min": 288 |
| }, |
| { |
| "epoch": 2.8606158833063207, |
| "grad_norm": 0.5551356639022342, |
| "learning_rate": 2.9487132584202115e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15121974050998688, |
| "step": 1765, |
| "valid_targets_mean": 3240.4, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 2.8687196110210698, |
| "grad_norm": 0.6494961371690191, |
| "learning_rate": 2.9415904115710964e-05, |
| "loss": 0.2369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27294760942459106, |
| "step": 1770, |
| "valid_targets_mean": 3565.1, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 2.8768233387358184, |
| "grad_norm": 0.755878858613056, |
| "learning_rate": 2.9344521877044633e-05, |
| "loss": 0.2449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2581571936607361, |
| "step": 1775, |
| "valid_targets_mean": 2870.9, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 2.884927066450567, |
| "grad_norm": 0.6896180082571636, |
| "learning_rate": 2.927298703393924e-05, |
| "loss": 0.2498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3024943768978119, |
| "step": 1780, |
| "valid_targets_mean": 3049.6, |
| "valid_targets_min": 466 |
| }, |
| { |
| "epoch": 2.893030794165316, |
| "grad_norm": 0.5548812442234702, |
| "learning_rate": 2.9201300754623046e-05, |
| "loss": 0.2251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23311251401901245, |
| "step": 1785, |
| "valid_targets_mean": 4044.0, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 2.901134521880065, |
| "grad_norm": 1.438754224110583, |
| "learning_rate": 2.9129464209797404e-05, |
| "loss": 0.2276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24073530733585358, |
| "step": 1790, |
| "valid_targets_mean": 1909.4, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 2.9092382495948135, |
| "grad_norm": 0.7830491458219581, |
| "learning_rate": 2.9057478572617644e-05, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24332499504089355, |
| "step": 1795, |
| "valid_targets_mean": 2556.9, |
| "valid_targets_min": 1002 |
| }, |
| { |
| "epoch": 2.9173419773095626, |
| "grad_norm": 0.6145444178155638, |
| "learning_rate": 2.898534501867391e-05, |
| "loss": 0.2337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25278767943382263, |
| "step": 1800, |
| "valid_targets_mean": 3891.1, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 2.9254457050243112, |
| "grad_norm": 0.3981787416840784, |
| "learning_rate": 2.8913064725971947e-05, |
| "loss": 0.2051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14965100586414337, |
| "step": 1805, |
| "valid_targets_mean": 5392.8, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 2.93354943273906, |
| "grad_norm": 0.5818947273050361, |
| "learning_rate": 2.8840638874913894e-05, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24818670749664307, |
| "step": 1810, |
| "valid_targets_mean": 3600.8, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 2.941653160453809, |
| "grad_norm": 0.7145037253167454, |
| "learning_rate": 2.8768068648278976e-05, |
| "loss": 0.2105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1713862121105194, |
| "step": 1815, |
| "valid_targets_mean": 2208.1, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 2.9497568881685576, |
| "grad_norm": 0.6506752973751263, |
| "learning_rate": 2.8695355231204206e-05, |
| "loss": 0.2021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1586257517337799, |
| "step": 1820, |
| "valid_targets_mean": 2533.8, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 2.9578606158833063, |
| "grad_norm": 0.9308540302999432, |
| "learning_rate": 2.862249981116502e-05, |
| "loss": 0.2175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18500950932502747, |
| "step": 1825, |
| "valid_targets_mean": 1953.1, |
| "valid_targets_min": 386 |
| }, |
| { |
| "epoch": 2.965964343598055, |
| "grad_norm": 0.868527787807027, |
| "learning_rate": 2.854950357795589e-05, |
| "loss": 0.2713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30140724778175354, |
| "step": 1830, |
| "valid_targets_mean": 2394.5, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 2.974068071312804, |
| "grad_norm": 0.7675779936155871, |
| "learning_rate": 2.847636772367091e-05, |
| "loss": 0.2659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38385745882987976, |
| "step": 1835, |
| "valid_targets_mean": 3416.3, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 2.9821717990275527, |
| "grad_norm": 0.5095446691779011, |
| "learning_rate": 2.8403093442684287e-05, |
| "loss": 0.1997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17920516431331635, |
| "step": 1840, |
| "valid_targets_mean": 4411.1, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 2.9902755267423013, |
| "grad_norm": 0.7425898253446929, |
| "learning_rate": 2.8329681931630877e-05, |
| "loss": 0.2287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21636709570884705, |
| "step": 1845, |
| "valid_targets_mean": 2047.3, |
| "valid_targets_min": 332 |
| }, |
| { |
| "epoch": 2.99837925445705, |
| "grad_norm": 0.7698249801134349, |
| "learning_rate": 2.825613438938663e-05, |
| "loss": 0.2574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3017503619194031, |
| "step": 1850, |
| "valid_targets_mean": 2716.4, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 3.006482982171799, |
| "grad_norm": 0.7062953708878924, |
| "learning_rate": 2.8182452017048983e-05, |
| "loss": 0.2273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16801732778549194, |
| "step": 1855, |
| "valid_targets_mean": 2252.6, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 3.0145867098865478, |
| "grad_norm": 0.7009970781236867, |
| "learning_rate": 2.81086360179173e-05, |
| "loss": 0.2254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3520157039165497, |
| "step": 1860, |
| "valid_targets_mean": 3688.4, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 3.0226904376012964, |
| "grad_norm": 1.0084991924004758, |
| "learning_rate": 2.8034687597473164e-05, |
| "loss": 0.2193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21333259344100952, |
| "step": 1865, |
| "valid_targets_mean": 2459.2, |
| "valid_targets_min": 286 |
| }, |
| { |
| "epoch": 3.0307941653160455, |
| "grad_norm": 0.5137156161040282, |
| "learning_rate": 2.796060796336074e-05, |
| "loss": 0.2002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18863826990127563, |
| "step": 1870, |
| "valid_targets_mean": 5101.9, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 3.038897893030794, |
| "grad_norm": 1.8100288546636265, |
| "learning_rate": 2.7886398325367018e-05, |
| "loss": 0.2146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2229488492012024, |
| "step": 1875, |
| "valid_targets_mean": 2298.8, |
| "valid_targets_min": 353 |
| }, |
| { |
| "epoch": 3.047001620745543, |
| "grad_norm": 0.720734898463899, |
| "learning_rate": 2.7812059895402064e-05, |
| "loss": 0.198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20065172016620636, |
| "step": 1880, |
| "valid_targets_mean": 3090.3, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 3.055105348460292, |
| "grad_norm": 0.8640799066873229, |
| "learning_rate": 2.773759388747925e-05, |
| "loss": 0.3024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4552222788333893, |
| "step": 1885, |
| "valid_targets_mean": 3287.7, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 3.0632090761750406, |
| "grad_norm": 0.6353362563989103, |
| "learning_rate": 2.7663001517695386e-05, |
| "loss": 0.231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24317996203899384, |
| "step": 1890, |
| "valid_targets_mean": 3646.6, |
| "valid_targets_min": 630 |
| }, |
| { |
| "epoch": 3.0713128038897892, |
| "grad_norm": 0.7914447945449794, |
| "learning_rate": 2.7588284004210907e-05, |
| "loss": 0.203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20814718306064606, |
| "step": 1895, |
| "valid_targets_mean": 2367.0, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 3.079416531604538, |
| "grad_norm": 0.6958540521779719, |
| "learning_rate": 2.7513442567229936e-05, |
| "loss": 0.1968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20249110460281372, |
| "step": 1900, |
| "valid_targets_mean": 2836.4, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 3.087520259319287, |
| "grad_norm": 0.596529064303546, |
| "learning_rate": 2.7438478428980407e-05, |
| "loss": 0.2174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14787033200263977, |
| "step": 1905, |
| "valid_targets_mean": 3139.7, |
| "valid_targets_min": 475 |
| }, |
| { |
| "epoch": 3.0956239870340356, |
| "grad_norm": 0.7078002600984272, |
| "learning_rate": 2.7363392813694047e-05, |
| "loss": 0.2662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3391125798225403, |
| "step": 1910, |
| "valid_targets_mean": 3532.0, |
| "valid_targets_min": 345 |
| }, |
| { |
| "epoch": 3.1037277147487843, |
| "grad_norm": 0.7778209985657967, |
| "learning_rate": 2.7288186947586426e-05, |
| "loss": 0.2797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18052786588668823, |
| "step": 1915, |
| "valid_targets_mean": 2382.4, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 3.1118314424635334, |
| "grad_norm": 0.6013057667276556, |
| "learning_rate": 2.7212862058836925e-05, |
| "loss": 0.2246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20441167056560516, |
| "step": 1920, |
| "valid_targets_mean": 4624.4, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 3.119935170178282, |
| "grad_norm": 0.8433721924819828, |
| "learning_rate": 2.713741937756865e-05, |
| "loss": 0.2132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21256756782531738, |
| "step": 1925, |
| "valid_targets_mean": 2051.4, |
| "valid_targets_min": 1096 |
| }, |
| { |
| "epoch": 3.1280388978930307, |
| "grad_norm": 0.8267912865776698, |
| "learning_rate": 2.7061860135828384e-05, |
| "loss": 0.2097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23010283708572388, |
| "step": 1930, |
| "valid_targets_mean": 2566.1, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 3.1361426256077793, |
| "grad_norm": 0.9281087995213807, |
| "learning_rate": 2.6986185567566442e-05, |
| "loss": 0.1956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26588061451911926, |
| "step": 1935, |
| "valid_targets_mean": 2648.5, |
| "valid_targets_min": 1102 |
| }, |
| { |
| "epoch": 3.1442463533225284, |
| "grad_norm": 0.7402140669755561, |
| "learning_rate": 2.6910396908616527e-05, |
| "loss": 0.2389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24440577626228333, |
| "step": 1940, |
| "valid_targets_mean": 2880.9, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 3.152350081037277, |
| "grad_norm": 0.9250550622058952, |
| "learning_rate": 2.6834495396675526e-05, |
| "loss": 0.214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18351495265960693, |
| "step": 1945, |
| "valid_targets_mean": 1815.4, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 3.1604538087520258, |
| "grad_norm": 0.7075464086399091, |
| "learning_rate": 2.6758482271283347e-05, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14974619448184967, |
| "step": 1950, |
| "valid_targets_mean": 2622.6, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 3.168557536466775, |
| "grad_norm": 0.9235868375401112, |
| "learning_rate": 2.668235877380263e-05, |
| "loss": 0.2305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24251984059810638, |
| "step": 1955, |
| "valid_targets_mean": 1804.3, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 3.1766612641815235, |
| "grad_norm": 0.6596779615208653, |
| "learning_rate": 2.660612614739849e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14453783631324768, |
| "step": 1960, |
| "valid_targets_mean": 2709.9, |
| "valid_targets_min": 976 |
| }, |
| { |
| "epoch": 3.184764991896272, |
| "grad_norm": 0.766766066884446, |
| "learning_rate": 2.652978563701822e-05, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1874874234199524, |
| "step": 1965, |
| "valid_targets_mean": 2113.1, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 3.1928687196110213, |
| "grad_norm": 0.8124849594835287, |
| "learning_rate": 2.645333848937095e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23300279676914215, |
| "step": 1970, |
| "valid_targets_mean": 2446.9, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 3.20097244732577, |
| "grad_norm": 0.46106063693318805, |
| "learning_rate": 2.6376785952907292e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10534625500440598, |
| "step": 1975, |
| "valid_targets_mean": 4224.2, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 3.2090761750405186, |
| "grad_norm": 0.7587794893394673, |
| "learning_rate": 2.630012927779896e-05, |
| "loss": 0.2402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2638416290283203, |
| "step": 1980, |
| "valid_targets_mean": 2923.1, |
| "valid_targets_min": 460 |
| }, |
| { |
| "epoch": 3.217179902755267, |
| "grad_norm": 0.8879684966937325, |
| "learning_rate": 2.6223369715918338e-05, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22857242822647095, |
| "step": 1985, |
| "valid_targets_mean": 1645.6, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 3.2252836304700163, |
| "grad_norm": 0.7748370854682728, |
| "learning_rate": 2.614650852081805e-05, |
| "loss": 0.2333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24988800287246704, |
| "step": 1990, |
| "valid_targets_mean": 2849.4, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 3.233387358184765, |
| "grad_norm": 0.7495261062213084, |
| "learning_rate": 2.606954694771047e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23291251063346863, |
| "step": 1995, |
| "valid_targets_mean": 2843.9, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 3.2414910858995136, |
| "grad_norm": 0.7547991819930768, |
| "learning_rate": 2.5992486253447258e-05, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21426227688789368, |
| "step": 2000, |
| "valid_targets_mean": 2390.5, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 3.2495948136142627, |
| "grad_norm": 0.8127669361485503, |
| "learning_rate": 2.5915327696498787e-05, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12424997985363007, |
| "step": 2005, |
| "valid_targets_mean": 1779.2, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 3.2576985413290114, |
| "grad_norm": 0.7721290973743158, |
| "learning_rate": 2.583807253693362e-05, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18391962349414825, |
| "step": 2010, |
| "valid_targets_mean": 2541.4, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 3.26580226904376, |
| "grad_norm": 0.7334128634083178, |
| "learning_rate": 2.576072203639794e-05, |
| "loss": 0.2041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19778266549110413, |
| "step": 2015, |
| "valid_targets_mean": 2840.1, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 3.2739059967585087, |
| "grad_norm": 0.9287603147287846, |
| "learning_rate": 2.5683277458094926e-05, |
| "loss": 0.1992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2278834730386734, |
| "step": 2020, |
| "valid_targets_mean": 1949.1, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 3.282009724473258, |
| "grad_norm": 0.8397730144943303, |
| "learning_rate": 2.560574006676413e-05, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2002110779285431, |
| "step": 2025, |
| "valid_targets_mean": 3523.7, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 3.2901134521880064, |
| "grad_norm": 0.4390442212313819, |
| "learning_rate": 2.5528111128660826e-05, |
| "loss": 0.1701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13749784231185913, |
| "step": 2030, |
| "valid_targets_mean": 5424.6, |
| "valid_targets_min": 232 |
| }, |
| { |
| "epoch": 3.298217179902755, |
| "grad_norm": 0.6699615633322983, |
| "learning_rate": 2.545039191153533e-05, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2043614387512207, |
| "step": 2035, |
| "valid_targets_mean": 3574.8, |
| "valid_targets_min": 1054 |
| }, |
| { |
| "epoch": 3.306320907617504, |
| "grad_norm": 0.8633099775212048, |
| "learning_rate": 2.53725836846123e-05, |
| "loss": 0.2352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1649923026561737, |
| "step": 2040, |
| "valid_targets_mean": 1737.0, |
| "valid_targets_min": 456 |
| }, |
| { |
| "epoch": 3.314424635332253, |
| "grad_norm": 0.6256214069648829, |
| "learning_rate": 2.5294687718569994e-05, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14858299493789673, |
| "step": 2045, |
| "valid_targets_mean": 3804.9, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 3.3225283630470015, |
| "grad_norm": 0.9944856313019108, |
| "learning_rate": 2.5216705285519525e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17022621631622314, |
| "step": 2050, |
| "valid_targets_mean": 2688.2, |
| "valid_targets_min": 269 |
| }, |
| { |
| "epoch": 3.3306320907617506, |
| "grad_norm": 0.6389414039882365, |
| "learning_rate": 2.5138637658984116e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12931106984615326, |
| "step": 2055, |
| "valid_targets_mean": 2573.4, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 3.3387358184764993, |
| "grad_norm": 0.6456462614939432, |
| "learning_rate": 2.5060486113878244e-05, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22942790389060974, |
| "step": 2060, |
| "valid_targets_mean": 3076.4, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 3.346839546191248, |
| "grad_norm": 0.4552379058782566, |
| "learning_rate": 2.4982251926486873e-05, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0790659636259079, |
| "step": 2065, |
| "valid_targets_mean": 3547.6, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 3.354943273905997, |
| "grad_norm": 0.5502283454291953, |
| "learning_rate": 2.490393637444458e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16592127084732056, |
| "step": 2070, |
| "valid_targets_mean": 4692.4, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 3.3630470016207457, |
| "grad_norm": 0.8617017867222999, |
| "learning_rate": 2.482554073671471e-05, |
| "loss": 0.2125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24501700699329376, |
| "step": 2075, |
| "valid_targets_mean": 2338.4, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 3.3711507293354943, |
| "grad_norm": 0.7899472946015639, |
| "learning_rate": 2.4747066293568452e-05, |
| "loss": 0.2152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15188781917095184, |
| "step": 2080, |
| "valid_targets_mean": 2104.1, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 3.379254457050243, |
| "grad_norm": 0.8193544565230731, |
| "learning_rate": 2.4668514326564e-05, |
| "loss": 0.2124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17579089105129242, |
| "step": 2085, |
| "valid_targets_mean": 2063.2, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 3.387358184764992, |
| "grad_norm": 0.889128650784621, |
| "learning_rate": 2.4589886118525556e-05, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18815834820270538, |
| "step": 2090, |
| "valid_targets_mean": 1816.8, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 3.3954619124797407, |
| "grad_norm": 0.7550229654302467, |
| "learning_rate": 2.4511182953522405e-05, |
| "loss": 0.1906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26341044902801514, |
| "step": 2095, |
| "valid_targets_mean": 3581.5, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 3.4035656401944894, |
| "grad_norm": 0.8942138699800349, |
| "learning_rate": 2.4432406116847954e-05, |
| "loss": 0.1948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2436755895614624, |
| "step": 2100, |
| "valid_targets_mean": 1985.3, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 3.411669367909238, |
| "grad_norm": 0.5028709815573968, |
| "learning_rate": 2.435355689499874e-05, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11536405980587006, |
| "step": 2105, |
| "valid_targets_mean": 3964.9, |
| "valid_targets_min": 233 |
| }, |
| { |
| "epoch": 3.419773095623987, |
| "grad_norm": 0.714825678842735, |
| "learning_rate": 2.4274636575653398e-05, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15641966462135315, |
| "step": 2110, |
| "valid_targets_mean": 2424.9, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 3.427876823338736, |
| "grad_norm": 0.8122455585254386, |
| "learning_rate": 2.4195646447651663e-05, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2142556607723236, |
| "step": 2115, |
| "valid_targets_mean": 4355.4, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 3.4359805510534844, |
| "grad_norm": 0.783700231697767, |
| "learning_rate": 2.411658780097331e-05, |
| "loss": 0.2259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3505910634994507, |
| "step": 2120, |
| "valid_targets_mean": 4021.6, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 3.4440842787682335, |
| "grad_norm": 0.7313909744848299, |
| "learning_rate": 2.4037461926717075e-05, |
| "loss": 0.1956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17269133031368256, |
| "step": 2125, |
| "valid_targets_mean": 2451.2, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 3.452188006482982, |
| "grad_norm": 0.8088615988871327, |
| "learning_rate": 2.395827011707959e-05, |
| "loss": 0.2503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20847368240356445, |
| "step": 2130, |
| "valid_targets_mean": 2553.2, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 3.460291734197731, |
| "grad_norm": 0.5900039519353123, |
| "learning_rate": 2.3879013665334258e-05, |
| "loss": 0.2124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20145244896411896, |
| "step": 2135, |
| "valid_targets_mean": 4923.4, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 3.46839546191248, |
| "grad_norm": 0.6378206622182675, |
| "learning_rate": 2.3799693865810163e-05, |
| "loss": 0.2032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16754154860973358, |
| "step": 2140, |
| "valid_targets_mean": 3790.3, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.4764991896272286, |
| "grad_norm": 0.7389226745729313, |
| "learning_rate": 2.37203120138709e-05, |
| "loss": 0.2046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2016831338405609, |
| "step": 2145, |
| "valid_targets_mean": 3017.4, |
| "valid_targets_min": 913 |
| }, |
| { |
| "epoch": 3.4846029173419772, |
| "grad_norm": 0.542849963051636, |
| "learning_rate": 2.3640869405893446e-05, |
| "loss": 0.2485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19606372714042664, |
| "step": 2150, |
| "valid_targets_mean": 3942.9, |
| "valid_targets_min": 464 |
| }, |
| { |
| "epoch": 3.492706645056726, |
| "grad_norm": 0.8814880321553831, |
| "learning_rate": 2.3561367339246976e-05, |
| "loss": 0.2054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2154223620891571, |
| "step": 2155, |
| "valid_targets_mean": 1835.9, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 3.500810372771475, |
| "grad_norm": 0.7067348415715224, |
| "learning_rate": 2.3481807112271678e-05, |
| "loss": 0.1828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.166023850440979, |
| "step": 2160, |
| "valid_targets_mean": 3050.1, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 3.5089141004862237, |
| "grad_norm": 0.620735692816103, |
| "learning_rate": 2.3402190024257543e-05, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13485875725746155, |
| "step": 2165, |
| "valid_targets_mean": 3070.6, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 3.5170178282009723, |
| "grad_norm": 0.7429662318750067, |
| "learning_rate": 2.3322517375423165e-05, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16115394234657288, |
| "step": 2170, |
| "valid_targets_mean": 2298.1, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 3.525121555915721, |
| "grad_norm": 0.8477525841685281, |
| "learning_rate": 2.3242790466894494e-05, |
| "loss": 0.2381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19504885375499725, |
| "step": 2175, |
| "valid_targets_mean": 2246.0, |
| "valid_targets_min": 398 |
| }, |
| { |
| "epoch": 3.53322528363047, |
| "grad_norm": 0.7627025545672735, |
| "learning_rate": 2.316301060068359e-05, |
| "loss": 0.2083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21119363605976105, |
| "step": 2180, |
| "valid_targets_mean": 2926.6, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 3.5413290113452187, |
| "grad_norm": 1.100127953832155, |
| "learning_rate": 2.3083179079667347e-05, |
| "loss": 0.2094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20743992924690247, |
| "step": 2185, |
| "valid_targets_mean": 4087.3, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 3.5494327390599674, |
| "grad_norm": 0.5805399953892108, |
| "learning_rate": 2.300329720756625e-05, |
| "loss": 0.1837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15286213159561157, |
| "step": 2190, |
| "valid_targets_mean": 3119.1, |
| "valid_targets_min": 342 |
| }, |
| { |
| "epoch": 3.5575364667747165, |
| "grad_norm": 0.7519460987432748, |
| "learning_rate": 2.2923366288923045e-05, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18701784312725067, |
| "step": 2195, |
| "valid_targets_mean": 2679.4, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 3.565640194489465, |
| "grad_norm": 0.5738422561843207, |
| "learning_rate": 2.2843387629081453e-05, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14277049899101257, |
| "step": 2200, |
| "valid_targets_mean": 4261.6, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 3.5737439222042138, |
| "grad_norm": 0.6995930320107968, |
| "learning_rate": 2.2763362534164854e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1426575481891632, |
| "step": 2205, |
| "valid_targets_mean": 2615.9, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 3.581847649918963, |
| "grad_norm": 0.778790384658622, |
| "learning_rate": 2.268329231105498e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22932958602905273, |
| "step": 2210, |
| "valid_targets_mean": 2972.4, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 3.5899513776337115, |
| "grad_norm": 0.8621285854700218, |
| "learning_rate": 2.2603178267370504e-05, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20100966095924377, |
| "step": 2215, |
| "valid_targets_mean": 2199.8, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 3.59805510534846, |
| "grad_norm": 0.6366888964927337, |
| "learning_rate": 2.2523021711445746e-05, |
| "loss": 0.1847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14098083972930908, |
| "step": 2220, |
| "valid_targets_mean": 3288.6, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 3.6061588330632093, |
| "grad_norm": 1.031030067314881, |
| "learning_rate": 2.2442823952309308e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21637287735939026, |
| "step": 2225, |
| "valid_targets_mean": 1423.6, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 3.614262560777958, |
| "grad_norm": 0.8638929404500169, |
| "learning_rate": 2.2362586299662642e-05, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2800928056240082, |
| "step": 2230, |
| "valid_targets_mean": 2027.9, |
| "valid_targets_min": 386 |
| }, |
| { |
| "epoch": 3.6223662884927066, |
| "grad_norm": 0.7529589056185002, |
| "learning_rate": 2.228231006385873e-05, |
| "loss": 0.1949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3154662251472473, |
| "step": 2235, |
| "valid_targets_mean": 4337.9, |
| "valid_targets_min": 566 |
| }, |
| { |
| "epoch": 3.6304700162074557, |
| "grad_norm": 0.6840352862675642, |
| "learning_rate": 2.2201996555880633e-05, |
| "loss": 0.1879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13636550307273865, |
| "step": 2240, |
| "valid_targets_mean": 2383.8, |
| "valid_targets_min": 477 |
| }, |
| { |
| "epoch": 3.6385737439222043, |
| "grad_norm": 0.7568859162264532, |
| "learning_rate": 2.2121647087320105e-05, |
| "loss": 0.2209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17221365869045258, |
| "step": 2245, |
| "valid_targets_mean": 2137.6, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 3.646677471636953, |
| "grad_norm": 0.8960270729679528, |
| "learning_rate": 2.204126297035617e-05, |
| "loss": 0.2129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23943698406219482, |
| "step": 2250, |
| "valid_targets_mean": 1959.3, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 3.6547811993517016, |
| "grad_norm": 0.7464106224245589, |
| "learning_rate": 2.196084551773368e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18965956568717957, |
| "step": 2255, |
| "valid_targets_mean": 2451.1, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 3.6628849270664503, |
| "grad_norm": 0.9722153370680764, |
| "learning_rate": 2.1880396042741906e-05, |
| "loss": 0.2534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22785764932632446, |
| "step": 2260, |
| "valid_targets_mean": 1551.8, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 3.6709886547811994, |
| "grad_norm": 0.4697676488300176, |
| "learning_rate": 2.179991585919307e-05, |
| "loss": 0.1834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0863395407795906, |
| "step": 2265, |
| "valid_targets_mean": 3504.8, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 3.679092382495948, |
| "grad_norm": 0.7371456685043023, |
| "learning_rate": 2.1719406281400873e-05, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2391626387834549, |
| "step": 2270, |
| "valid_targets_mean": 2812.4, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 3.6871961102106967, |
| "grad_norm": 0.7116149527659587, |
| "learning_rate": 2.163886862415908e-05, |
| "loss": 0.2048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16868996620178223, |
| "step": 2275, |
| "valid_targets_mean": 3199.4, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 3.695299837925446, |
| "grad_norm": 0.6944396008804573, |
| "learning_rate": 2.155830420272e-05, |
| "loss": 0.2347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36398154497146606, |
| "step": 2280, |
| "valid_targets_mean": 4588.9, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 3.7034035656401945, |
| "grad_norm": 0.49891846247542965, |
| "learning_rate": 2.1477714332773022e-05, |
| "loss": 0.1834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12793442606925964, |
| "step": 2285, |
| "valid_targets_mean": 4197.6, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.711507293354943, |
| "grad_norm": 0.7737664275138527, |
| "learning_rate": 2.139710033042314e-05, |
| "loss": 0.2154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21408765017986298, |
| "step": 2290, |
| "valid_targets_mean": 2392.2, |
| "valid_targets_min": 436 |
| }, |
| { |
| "epoch": 3.719611021069692, |
| "grad_norm": 0.6249478567474501, |
| "learning_rate": 2.1316463512169453e-05, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17073558270931244, |
| "step": 2295, |
| "valid_targets_mean": 3448.7, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 3.727714748784441, |
| "grad_norm": 0.6319183901564622, |
| "learning_rate": 2.1235805194883665e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12544557452201843, |
| "step": 2300, |
| "valid_targets_mean": 3194.1, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 3.7358184764991895, |
| "grad_norm": 0.8809027809587772, |
| "learning_rate": 2.115512669578857e-05, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21802709996700287, |
| "step": 2305, |
| "valid_targets_mean": 2093.7, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 3.7439222042139386, |
| "grad_norm": 0.8125759794942795, |
| "learning_rate": 2.107442933243656e-05, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1779268980026245, |
| "step": 2310, |
| "valid_targets_mean": 2595.6, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 3.7520259319286873, |
| "grad_norm": 0.7211723580416524, |
| "learning_rate": 2.099371442268809e-05, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1611754596233368, |
| "step": 2315, |
| "valid_targets_mean": 2815.6, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 3.760129659643436, |
| "grad_norm": 0.7848416454395023, |
| "learning_rate": 2.0912983284690157e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2059643268585205, |
| "step": 2320, |
| "valid_targets_mean": 2567.2, |
| "valid_targets_min": 232 |
| }, |
| { |
| "epoch": 3.768233387358185, |
| "grad_norm": 0.5904887355051087, |
| "learning_rate": 2.0832237236854794e-05, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15662437677383423, |
| "step": 2325, |
| "valid_targets_mean": 3666.7, |
| "valid_targets_min": 1253 |
| }, |
| { |
| "epoch": 3.7763371150729337, |
| "grad_norm": 0.7236461690914054, |
| "learning_rate": 2.0751477597837528e-05, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12969183921813965, |
| "step": 2330, |
| "valid_targets_mean": 2251.1, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 3.7844408427876823, |
| "grad_norm": 0.9505422297729229, |
| "learning_rate": 2.0670705686515822e-05, |
| "loss": 0.1897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23993048071861267, |
| "step": 2335, |
| "valid_targets_mean": 1928.8, |
| "valid_targets_min": 505 |
| }, |
| { |
| "epoch": 3.792544570502431, |
| "grad_norm": 0.6637526217519724, |
| "learning_rate": 2.0589922821967566e-05, |
| "loss": 0.1716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1568320393562317, |
| "step": 2340, |
| "valid_targets_mean": 2895.9, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 3.8006482982171796, |
| "grad_norm": 1.0128117172897237, |
| "learning_rate": 2.0509130323449545e-05, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15534460544586182, |
| "step": 2345, |
| "valid_targets_mean": 1361.9, |
| "valid_targets_min": 488 |
| }, |
| { |
| "epoch": 3.8087520259319287, |
| "grad_norm": 0.6671945777380213, |
| "learning_rate": 2.0428329510375838e-05, |
| "loss": 0.1997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30660581588745117, |
| "step": 2350, |
| "valid_targets_mean": 4413.9, |
| "valid_targets_min": 531 |
| }, |
| { |
| "epoch": 3.8168557536466774, |
| "grad_norm": 0.5544375126811655, |
| "learning_rate": 2.0347521702296333e-05, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17179805040359497, |
| "step": 2355, |
| "valid_targets_mean": 4360.7, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 3.824959481361426, |
| "grad_norm": 0.8902971352705107, |
| "learning_rate": 2.026670821887516e-05, |
| "loss": 0.1696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16486603021621704, |
| "step": 2360, |
| "valid_targets_mean": 1924.4, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 3.833063209076175, |
| "grad_norm": 0.691767954969929, |
| "learning_rate": 2.0185890379869115e-05, |
| "loss": 0.2224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29504096508026123, |
| "step": 2365, |
| "valid_targets_mean": 3782.2, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 3.841166936790924, |
| "grad_norm": 0.7902862954174232, |
| "learning_rate": 2.0105069505106126e-05, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2295757234096527, |
| "step": 2370, |
| "valid_targets_mean": 2529.1, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 3.8492706645056725, |
| "grad_norm": 0.6983178682113452, |
| "learning_rate": 2.00242469144637e-05, |
| "loss": 0.1819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1746961772441864, |
| "step": 2375, |
| "valid_targets_mean": 3053.4, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 3.8573743922204216, |
| "grad_norm": 0.7564438056864309, |
| "learning_rate": 1.994342392784738e-05, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17830297350883484, |
| "step": 2380, |
| "valid_targets_mean": 2944.7, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 3.86547811993517, |
| "grad_norm": 0.755822155072044, |
| "learning_rate": 1.9862601865169154e-05, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19303062558174133, |
| "step": 2385, |
| "valid_targets_mean": 2711.5, |
| "valid_targets_min": 1487 |
| }, |
| { |
| "epoch": 3.873581847649919, |
| "grad_norm": 0.7160490637060567, |
| "learning_rate": 1.9781782046325938e-05, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18017929792404175, |
| "step": 2390, |
| "valid_targets_mean": 2449.2, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 3.881685575364668, |
| "grad_norm": 0.6508016267439924, |
| "learning_rate": 1.9700965791177986e-05, |
| "loss": 0.2162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22605565190315247, |
| "step": 2395, |
| "valid_targets_mean": 3326.8, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 3.8897893030794166, |
| "grad_norm": 0.6852974910747845, |
| "learning_rate": 1.9620154419527372e-05, |
| "loss": 0.2692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24458330869674683, |
| "step": 2400, |
| "valid_targets_mean": 3742.1, |
| "valid_targets_min": 531 |
| }, |
| { |
| "epoch": 3.8978930307941653, |
| "grad_norm": 0.8183442535515982, |
| "learning_rate": 1.953934925109641e-05, |
| "loss": 0.2326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3048601746559143, |
| "step": 2405, |
| "valid_targets_mean": 2523.3, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 3.9059967585089144, |
| "grad_norm": 0.7630671943332308, |
| "learning_rate": 1.945855160550611e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16103631258010864, |
| "step": 2410, |
| "valid_targets_mean": 2636.6, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 3.914100486223663, |
| "grad_norm": 0.8070470089137307, |
| "learning_rate": 1.937776280225463e-05, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20676636695861816, |
| "step": 2415, |
| "valid_targets_mean": 2609.7, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 3.9222042139384117, |
| "grad_norm": 0.9463383844932369, |
| "learning_rate": 1.929698416069571e-05, |
| "loss": 0.2172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.197508305311203, |
| "step": 2420, |
| "valid_targets_mean": 1525.7, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 3.9303079416531603, |
| "grad_norm": 0.6974073097875326, |
| "learning_rate": 1.9216217000017182e-05, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21730129420757294, |
| "step": 2425, |
| "valid_targets_mean": 2918.9, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 3.938411669367909, |
| "grad_norm": 0.6196655766852457, |
| "learning_rate": 1.9135462639219325e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22163273394107819, |
| "step": 2430, |
| "valid_targets_mean": 4302.2, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 3.946515397082658, |
| "grad_norm": 1.0083387028610686, |
| "learning_rate": 1.905472239709343e-05, |
| "loss": 0.1875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27771952748298645, |
| "step": 2435, |
| "valid_targets_mean": 1752.2, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 3.9546191247974067, |
| "grad_norm": 0.6436193457753687, |
| "learning_rate": 1.89739975922002e-05, |
| "loss": 0.2059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24347497522830963, |
| "step": 2440, |
| "valid_targets_mean": 3727.1, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 3.9627228525121554, |
| "grad_norm": 0.7463707250780504, |
| "learning_rate": 1.889328954284823e-05, |
| "loss": 0.1899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21482862532138824, |
| "step": 2445, |
| "valid_targets_mean": 2699.9, |
| "valid_targets_min": 575 |
| }, |
| { |
| "epoch": 3.9708265802269045, |
| "grad_norm": 0.8578748435821815, |
| "learning_rate": 1.8812599567072496e-05, |
| "loss": 0.2208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22225850820541382, |
| "step": 2450, |
| "valid_targets_mean": 2473.5, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 3.978930307941653, |
| "grad_norm": 0.6000598430860175, |
| "learning_rate": 1.873192898261281e-05, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17323483526706696, |
| "step": 2455, |
| "valid_targets_mean": 3969.9, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 3.987034035656402, |
| "grad_norm": 0.6411349311068479, |
| "learning_rate": 1.8651279106892317e-05, |
| "loss": 0.2063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22670185565948486, |
| "step": 2460, |
| "valid_targets_mean": 3840.9, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 3.995137763371151, |
| "grad_norm": 0.8265211359345982, |
| "learning_rate": 1.8570651256995933e-05, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16508886218070984, |
| "step": 2465, |
| "valid_targets_mean": 1857.5, |
| "valid_targets_min": 407 |
| }, |
| { |
| "epoch": 4.003241491085899, |
| "grad_norm": 0.7438519471306131, |
| "learning_rate": 1.849004674964891e-05, |
| "loss": 0.1646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13882270455360413, |
| "step": 2470, |
| "valid_targets_mean": 2407.8, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 4.011345218800648, |
| "grad_norm": 0.666660079984095, |
| "learning_rate": 1.840946690119528e-05, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18586783111095428, |
| "step": 2475, |
| "valid_targets_mean": 3428.2, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 4.019448946515397, |
| "grad_norm": 0.6224308701315978, |
| "learning_rate": 1.8328913027576373e-05, |
| "loss": 0.1512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1357424110174179, |
| "step": 2480, |
| "valid_targets_mean": 2990.6, |
| "valid_targets_min": 297 |
| }, |
| { |
| "epoch": 4.0275526742301455, |
| "grad_norm": 0.9706356061146716, |
| "learning_rate": 1.824838644430934e-05, |
| "loss": 0.156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17957650125026703, |
| "step": 2485, |
| "valid_targets_mean": 2300.4, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 4.035656401944895, |
| "grad_norm": 0.5507038011859006, |
| "learning_rate": 1.8167888466465652e-05, |
| "loss": 0.1543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1574670970439911, |
| "step": 2490, |
| "valid_targets_mean": 6137.8, |
| "valid_targets_min": 269 |
| }, |
| { |
| "epoch": 4.043760129659644, |
| "grad_norm": 0.9201955501879038, |
| "learning_rate": 1.8087420408649596e-05, |
| "loss": 0.1852, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1650194525718689, |
| "step": 2495, |
| "valid_targets_mean": 1996.8, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 4.051863857374392, |
| "grad_norm": 0.7731697108102025, |
| "learning_rate": 1.8006983584976877e-05, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18308573961257935, |
| "step": 2500, |
| "valid_targets_mean": 2703.9, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 4.059967585089141, |
| "grad_norm": 0.7203113706129127, |
| "learning_rate": 1.7926579309053098e-05, |
| "loss": 0.1584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1433395892381668, |
| "step": 2505, |
| "valid_targets_mean": 2686.1, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 4.06807131280389, |
| "grad_norm": 0.857648318619981, |
| "learning_rate": 1.7846208893952346e-05, |
| "loss": 0.1733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17913417518138885, |
| "step": 2510, |
| "valid_targets_mean": 2421.8, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 4.076175040518638, |
| "grad_norm": 0.9249873120711297, |
| "learning_rate": 1.7765873652195713e-05, |
| "loss": 0.1537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19423171877861023, |
| "step": 2515, |
| "valid_targets_mean": 2475.4, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 4.084278768233387, |
| "grad_norm": 2.311467435227256, |
| "learning_rate": 1.7685574895729886e-05, |
| "loss": 0.2207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4830706715583801, |
| "step": 2520, |
| "valid_targets_mean": 3542.9, |
| "valid_targets_min": 305 |
| }, |
| { |
| "epoch": 4.0923824959481365, |
| "grad_norm": 0.654022585178441, |
| "learning_rate": 1.7605313935905722e-05, |
| "loss": 0.1511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1987391710281372, |
| "step": 2525, |
| "valid_targets_mean": 4264.9, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 4.100486223662885, |
| "grad_norm": 0.7899542972251363, |
| "learning_rate": 1.7525092083456795e-05, |
| "loss": 0.1646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15167073905467987, |
| "step": 2530, |
| "valid_targets_mean": 2471.2, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 4.108589951377634, |
| "grad_norm": 0.7446749286045431, |
| "learning_rate": 1.744491064847805e-05, |
| "loss": 0.1731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14512816071510315, |
| "step": 2535, |
| "valid_targets_mean": 3130.6, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 4.116693679092383, |
| "grad_norm": 0.6706352002553055, |
| "learning_rate": 1.7364770940404375e-05, |
| "loss": 0.1749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18727947771549225, |
| "step": 2540, |
| "valid_targets_mean": 3859.0, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 4.124797406807131, |
| "grad_norm": 0.7374471536131514, |
| "learning_rate": 1.7284674267989213e-05, |
| "loss": 0.1898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3415883183479309, |
| "step": 2545, |
| "valid_targets_mean": 3796.5, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 4.13290113452188, |
| "grad_norm": 0.6623719219174707, |
| "learning_rate": 1.72046219392832e-05, |
| "loss": 0.1622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09289093315601349, |
| "step": 2550, |
| "valid_targets_mean": 2261.0, |
| "valid_targets_min": 372 |
| }, |
| { |
| "epoch": 4.1410048622366284, |
| "grad_norm": 0.6819916449930195, |
| "learning_rate": 1.712461526161279e-05, |
| "loss": 0.2122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19168910384178162, |
| "step": 2555, |
| "valid_targets_mean": 3595.6, |
| "valid_targets_min": 431 |
| }, |
| { |
| "epoch": 4.1491085899513775, |
| "grad_norm": 1.006431838006035, |
| "learning_rate": 1.7044655541558934e-05, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19053317606449127, |
| "step": 2560, |
| "valid_targets_mean": 2357.0, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 4.157212317666127, |
| "grad_norm": 0.7533939089362455, |
| "learning_rate": 1.69647440849357e-05, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2373582273721695, |
| "step": 2565, |
| "valid_targets_mean": 2927.2, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 4.165316045380875, |
| "grad_norm": 0.890040140849173, |
| "learning_rate": 1.6884882196768985e-05, |
| "loss": 0.1805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.188620924949646, |
| "step": 2570, |
| "valid_targets_mean": 2630.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.173419773095624, |
| "grad_norm": 0.9465451734827055, |
| "learning_rate": 1.680507118127518e-05, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19093164801597595, |
| "step": 2575, |
| "valid_targets_mean": 1947.6, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 4.181523500810373, |
| "grad_norm": 0.7658272802842436, |
| "learning_rate": 1.6725312341839895e-05, |
| "loss": 0.1391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14707794785499573, |
| "step": 2580, |
| "valid_targets_mean": 2918.4, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 4.189627228525121, |
| "grad_norm": 0.6443361980317487, |
| "learning_rate": 1.664560698099664e-05, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15699368715286255, |
| "step": 2585, |
| "valid_targets_mean": 3664.1, |
| "valid_targets_min": 1065 |
| }, |
| { |
| "epoch": 4.19773095623987, |
| "grad_norm": 0.9445201634571403, |
| "learning_rate": 1.6565956400405586e-05, |
| "loss": 0.161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19105768203735352, |
| "step": 2590, |
| "valid_targets_mean": 1996.1, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 4.2058346839546195, |
| "grad_norm": 1.5563352274482452, |
| "learning_rate": 1.6486361900832284e-05, |
| "loss": 0.142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1398153007030487, |
| "step": 2595, |
| "valid_targets_mean": 1860.5, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 4.213938411669368, |
| "grad_norm": 0.6946128489566771, |
| "learning_rate": 1.6406824782126428e-05, |
| "loss": 0.2203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22305166721343994, |
| "step": 2600, |
| "valid_targets_mean": 3348.3, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 4.222042139384117, |
| "grad_norm": 0.6233066610164918, |
| "learning_rate": 1.632734634320064e-05, |
| "loss": 0.2009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22936005890369415, |
| "step": 2605, |
| "valid_targets_mean": 3911.8, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 4.230145867098866, |
| "grad_norm": 0.6881169895401946, |
| "learning_rate": 1.6247927882009256e-05, |
| "loss": 0.158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13565057516098022, |
| "step": 2610, |
| "valid_targets_mean": 3660.1, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 4.238249594813614, |
| "grad_norm": 0.9276168493947143, |
| "learning_rate": 1.6168570695527096e-05, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2158156931400299, |
| "step": 2615, |
| "valid_targets_mean": 2655.6, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 4.246353322528363, |
| "grad_norm": 1.0419792453131715, |
| "learning_rate": 1.6089276079728334e-05, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12811069190502167, |
| "step": 2620, |
| "valid_targets_mean": 1496.8, |
| "valid_targets_min": 303 |
| }, |
| { |
| "epoch": 4.254457050243111, |
| "grad_norm": 0.5184090018750442, |
| "learning_rate": 1.6010045329565294e-05, |
| "loss": 0.1487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08075259625911713, |
| "step": 2625, |
| "valid_targets_mean": 3308.2, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 4.2625607779578605, |
| "grad_norm": 1.374064211424771, |
| "learning_rate": 1.5930879738947328e-05, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14756430685520172, |
| "step": 2630, |
| "valid_targets_mean": 2306.1, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 4.27066450567261, |
| "grad_norm": 0.7709350033003551, |
| "learning_rate": 1.585178060071966e-05, |
| "loss": 0.1548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16429486870765686, |
| "step": 2635, |
| "valid_targets_mean": 2699.4, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 4.278768233387358, |
| "grad_norm": 0.7949963216390307, |
| "learning_rate": 1.5772749206642296e-05, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11400672793388367, |
| "step": 2640, |
| "valid_targets_mean": 2194.9, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 4.286871961102107, |
| "grad_norm": 1.0554910650197593, |
| "learning_rate": 1.5693786847368918e-05, |
| "loss": 0.1554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1564255654811859, |
| "step": 2645, |
| "valid_targets_mean": 1670.0, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 4.294975688816856, |
| "grad_norm": 0.8555240936332876, |
| "learning_rate": 1.5614894812425806e-05, |
| "loss": 0.1256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1624247133731842, |
| "step": 2650, |
| "valid_targets_mean": 2291.0, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 4.303079416531604, |
| "grad_norm": 0.7761516523216345, |
| "learning_rate": 1.5536074390190786e-05, |
| "loss": 0.1422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12907105684280396, |
| "step": 2655, |
| "valid_targets_mean": 2245.6, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 4.311183144246353, |
| "grad_norm": 1.4090587432444437, |
| "learning_rate": 1.5457326867872177e-05, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17307105660438538, |
| "step": 2660, |
| "valid_targets_mean": 2902.2, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 4.319286871961102, |
| "grad_norm": 0.7599287679035327, |
| "learning_rate": 1.5378653531487784e-05, |
| "loss": 0.1545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1532491147518158, |
| "step": 2665, |
| "valid_targets_mean": 2631.6, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 4.327390599675851, |
| "grad_norm": 0.8485351714572734, |
| "learning_rate": 1.5300055665843875e-05, |
| "loss": 0.1487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14278289675712585, |
| "step": 2670, |
| "valid_targets_mean": 2180.6, |
| "valid_targets_min": 355 |
| }, |
| { |
| "epoch": 4.3354943273906, |
| "grad_norm": 0.7356937932327555, |
| "learning_rate": 1.5221534554514225e-05, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13728389143943787, |
| "step": 2675, |
| "valid_targets_mean": 2713.6, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 4.343598055105349, |
| "grad_norm": 0.8514962373379015, |
| "learning_rate": 1.5143091479819146e-05, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12912364304065704, |
| "step": 2680, |
| "valid_targets_mean": 2137.4, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 4.351701782820097, |
| "grad_norm": 0.8511576532571051, |
| "learning_rate": 1.5064727722804531e-05, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20828333497047424, |
| "step": 2685, |
| "valid_targets_mean": 2588.8, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 4.359805510534846, |
| "grad_norm": 1.0492092151976131, |
| "learning_rate": 1.4986444563220948e-05, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23015139997005463, |
| "step": 2690, |
| "valid_targets_mean": 1931.1, |
| "valid_targets_min": 426 |
| }, |
| { |
| "epoch": 4.367909238249595, |
| "grad_norm": 0.9100981933490145, |
| "learning_rate": 1.4908243279502741e-05, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1979110985994339, |
| "step": 2695, |
| "valid_targets_mean": 2374.7, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 4.376012965964343, |
| "grad_norm": 0.7595733722776951, |
| "learning_rate": 1.4830125148747138e-05, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1817144751548767, |
| "step": 2700, |
| "valid_targets_mean": 2891.0, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 4.3841166936790925, |
| "grad_norm": 0.7794754495340108, |
| "learning_rate": 1.475209144669341e-05, |
| "loss": 0.1891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2341780811548233, |
| "step": 2705, |
| "valid_targets_mean": 3009.4, |
| "valid_targets_min": 915 |
| }, |
| { |
| "epoch": 4.392220421393841, |
| "grad_norm": 0.9584422683500831, |
| "learning_rate": 1.4674143447702036e-05, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13136430084705353, |
| "step": 2710, |
| "valid_targets_mean": 1982.9, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 4.40032414910859, |
| "grad_norm": 0.5758324638844335, |
| "learning_rate": 1.4596282424733877e-05, |
| "loss": 0.162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06660260260105133, |
| "step": 2715, |
| "valid_targets_mean": 3760.6, |
| "valid_targets_min": 805 |
| }, |
| { |
| "epoch": 4.408427876823339, |
| "grad_norm": 0.6558036998170294, |
| "learning_rate": 1.4518509649329406e-05, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.157700315117836, |
| "step": 2720, |
| "valid_targets_mean": 3546.7, |
| "valid_targets_min": 932 |
| }, |
| { |
| "epoch": 4.416531604538087, |
| "grad_norm": 0.8633304546821023, |
| "learning_rate": 1.4440826391587926e-05, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12797395884990692, |
| "step": 2725, |
| "valid_targets_mean": 3217.9, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 4.424635332252836, |
| "grad_norm": 0.6582694588059188, |
| "learning_rate": 1.4363233920146855e-05, |
| "loss": 0.1792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16166099905967712, |
| "step": 2730, |
| "valid_targets_mean": 4224.6, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 4.432739059967585, |
| "grad_norm": 0.7022399878776832, |
| "learning_rate": 1.4285733502160955e-05, |
| "loss": 0.1478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1490454524755478, |
| "step": 2735, |
| "valid_targets_mean": 3313.8, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 4.4408427876823335, |
| "grad_norm": 0.6688054411278289, |
| "learning_rate": 1.4208326403281702e-05, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1919623762369156, |
| "step": 2740, |
| "valid_targets_mean": 3607.4, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 4.448946515397083, |
| "grad_norm": 0.9020567053374119, |
| "learning_rate": 1.4131013887636576e-05, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16687409579753876, |
| "step": 2745, |
| "valid_targets_mean": 2358.4, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 4.457050243111832, |
| "grad_norm": 0.7645681159215328, |
| "learning_rate": 1.4053797217808432e-05, |
| "loss": 0.1755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2162127047777176, |
| "step": 2750, |
| "valid_targets_mean": 3857.8, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 4.46515397082658, |
| "grad_norm": 0.867803300126707, |
| "learning_rate": 1.3976677654814866e-05, |
| "loss": 0.1396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11421076953411102, |
| "step": 2755, |
| "valid_targets_mean": 2012.0, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 4.473257698541329, |
| "grad_norm": 0.8742220073053529, |
| "learning_rate": 1.3899656458087647e-05, |
| "loss": 0.1435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15495306253433228, |
| "step": 2760, |
| "valid_targets_mean": 2445.5, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 4.481361426256078, |
| "grad_norm": 0.7571940426598677, |
| "learning_rate": 1.3822734885452136e-05, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1919158697128296, |
| "step": 2765, |
| "valid_targets_mean": 3757.5, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 4.489465153970826, |
| "grad_norm": 0.8691721790493876, |
| "learning_rate": 1.3745914193106715e-05, |
| "loss": 0.1971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14633077383041382, |
| "step": 2770, |
| "valid_targets_mean": 1987.1, |
| "valid_targets_min": 406 |
| }, |
| { |
| "epoch": 4.4975688816855754, |
| "grad_norm": 1.000044264127931, |
| "learning_rate": 1.366919563560233e-05, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3116513788700104, |
| "step": 2775, |
| "valid_targets_mean": 4190.8, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 4.5056726094003245, |
| "grad_norm": 0.8331745332190477, |
| "learning_rate": 1.3592580465821956e-05, |
| "loss": 0.1926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18027907609939575, |
| "step": 2780, |
| "valid_targets_mean": 2925.8, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 4.513776337115073, |
| "grad_norm": 0.8471157769543586, |
| "learning_rate": 1.3516069934960174e-05, |
| "loss": 0.1475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18600761890411377, |
| "step": 2785, |
| "valid_targets_mean": 2895.5, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 4.521880064829822, |
| "grad_norm": 0.8127559212585381, |
| "learning_rate": 1.3439665292502695e-05, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16321048140525818, |
| "step": 2790, |
| "valid_targets_mean": 2676.2, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 4.52998379254457, |
| "grad_norm": 0.8681867438751043, |
| "learning_rate": 1.3363367786205985e-05, |
| "loss": 0.2175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16139662265777588, |
| "step": 2795, |
| "valid_targets_mean": 2765.1, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 4.538087520259319, |
| "grad_norm": 0.6147735291418077, |
| "learning_rate": 1.3287178662076893e-05, |
| "loss": 0.1871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2413632571697235, |
| "step": 2800, |
| "valid_targets_mean": 4606.2, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 4.546191247974068, |
| "grad_norm": 0.7563381558755065, |
| "learning_rate": 1.3211099164352261e-05, |
| "loss": 0.1899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21764537692070007, |
| "step": 2805, |
| "valid_targets_mean": 2891.3, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 4.5542949756888165, |
| "grad_norm": 0.7369725771049391, |
| "learning_rate": 1.3135130535478655e-05, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15378154814243317, |
| "step": 2810, |
| "valid_targets_mean": 3029.8, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 4.562398703403566, |
| "grad_norm": 0.8372190818629114, |
| "learning_rate": 1.3059274016092057e-05, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17605245113372803, |
| "step": 2815, |
| "valid_targets_mean": 3103.2, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 4.570502431118315, |
| "grad_norm": 0.831632617042843, |
| "learning_rate": 1.2983530844997585e-05, |
| "loss": 0.1639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1470744013786316, |
| "step": 2820, |
| "valid_targets_mean": 2123.9, |
| "valid_targets_min": 524 |
| }, |
| { |
| "epoch": 4.578606158833063, |
| "grad_norm": 0.8005009026500092, |
| "learning_rate": 1.2907902259149287e-05, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17905943095684052, |
| "step": 2825, |
| "valid_targets_mean": 2288.1, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 4.586709886547812, |
| "grad_norm": 0.7146959989523917, |
| "learning_rate": 1.2832389493629928e-05, |
| "loss": 0.1502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18556524813175201, |
| "step": 2830, |
| "valid_targets_mean": 3489.2, |
| "valid_targets_min": 866 |
| }, |
| { |
| "epoch": 4.594813614262561, |
| "grad_norm": 0.982213080774264, |
| "learning_rate": 1.275699378163083e-05, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20789432525634766, |
| "step": 2835, |
| "valid_targets_mean": 2519.7, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 4.602917341977309, |
| "grad_norm": 0.5100944274599919, |
| "learning_rate": 1.2681716354431704e-05, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09983259439468384, |
| "step": 2840, |
| "valid_targets_mean": 5123.9, |
| "valid_targets_min": 505 |
| }, |
| { |
| "epoch": 4.611021069692058, |
| "grad_norm": 0.9532072125518306, |
| "learning_rate": 1.2606558441380587e-05, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2288963943719864, |
| "step": 2845, |
| "valid_targets_mean": 1986.6, |
| "valid_targets_min": 459 |
| }, |
| { |
| "epoch": 4.6191247974068075, |
| "grad_norm": 0.7215937040297506, |
| "learning_rate": 1.2531521269873736e-05, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18275988101959229, |
| "step": 2850, |
| "valid_targets_mean": 3461.2, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 4.627228525121556, |
| "grad_norm": 0.7854523287609847, |
| "learning_rate": 1.245660606533559e-05, |
| "loss": 0.1813, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2999517619609833, |
| "step": 2855, |
| "valid_targets_mean": 3333.9, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 4.635332252836305, |
| "grad_norm": 0.9116092627493867, |
| "learning_rate": 1.2381814051198751e-05, |
| "loss": 0.1384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13685894012451172, |
| "step": 2860, |
| "valid_targets_mean": 1892.0, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 4.643435980551054, |
| "grad_norm": 2.35524174458915, |
| "learning_rate": 1.2307146448884021e-05, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1372871696949005, |
| "step": 2865, |
| "valid_targets_mean": 2473.6, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 4.651539708265802, |
| "grad_norm": 0.7956965758481088, |
| "learning_rate": 1.2232604477780445e-05, |
| "loss": 0.1706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20719727873802185, |
| "step": 2870, |
| "valid_targets_mean": 4660.5, |
| "valid_targets_min": 1343 |
| }, |
| { |
| "epoch": 4.659643435980551, |
| "grad_norm": 0.7578731157658531, |
| "learning_rate": 1.2158189355225382e-05, |
| "loss": 0.1335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16715043783187866, |
| "step": 2875, |
| "valid_targets_mean": 3336.8, |
| "valid_targets_min": 1080 |
| }, |
| { |
| "epoch": 4.667747163695299, |
| "grad_norm": 0.5455735164703488, |
| "learning_rate": 1.2083902296484659e-05, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1390770971775055, |
| "step": 2880, |
| "valid_targets_mean": 5098.4, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 4.6758508914100485, |
| "grad_norm": 0.8754352764073323, |
| "learning_rate": 1.2009744514732698e-05, |
| "loss": 0.1251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1272560954093933, |
| "step": 2885, |
| "valid_targets_mean": 1902.8, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 4.683954619124798, |
| "grad_norm": 0.7125376899744773, |
| "learning_rate": 1.1935717221032707e-05, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12357346713542938, |
| "step": 2890, |
| "valid_targets_mean": 3547.1, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 4.692058346839546, |
| "grad_norm": 0.9406847214639302, |
| "learning_rate": 1.1861821624316916e-05, |
| "loss": 0.1687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1456756889820099, |
| "step": 2895, |
| "valid_targets_mean": 2065.8, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 4.700162074554295, |
| "grad_norm": 0.6883619788971869, |
| "learning_rate": 1.1788058931366822e-05, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2756902575492859, |
| "step": 2900, |
| "valid_targets_mean": 4024.9, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 4.708265802269044, |
| "grad_norm": 0.7882633472589065, |
| "learning_rate": 1.1714430346793479e-05, |
| "loss": 0.1834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13730135560035706, |
| "step": 2905, |
| "valid_targets_mean": 2645.8, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 4.716369529983792, |
| "grad_norm": 0.8885552000120186, |
| "learning_rate": 1.1640937073017837e-05, |
| "loss": 0.1522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11991922557353973, |
| "step": 2910, |
| "valid_targets_mean": 2493.4, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 4.724473257698541, |
| "grad_norm": 0.9089134585480407, |
| "learning_rate": 1.1567580310251097e-05, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16488614678382874, |
| "step": 2915, |
| "valid_targets_mean": 2730.6, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 4.73257698541329, |
| "grad_norm": 0.9805367472588664, |
| "learning_rate": 1.1494361256475105e-05, |
| "loss": 0.1403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1491793394088745, |
| "step": 2920, |
| "valid_targets_mean": 1666.0, |
| "valid_targets_min": 363 |
| }, |
| { |
| "epoch": 4.740680713128039, |
| "grad_norm": 0.9415315025271603, |
| "learning_rate": 1.1421281107422804e-05, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2649831473827362, |
| "step": 2925, |
| "valid_targets_mean": 2495.4, |
| "valid_targets_min": 334 |
| }, |
| { |
| "epoch": 4.748784440842788, |
| "grad_norm": 0.7579993458608958, |
| "learning_rate": 1.1348341056558709e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21222791075706482, |
| "step": 2930, |
| "valid_targets_mean": 3278.5, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 4.756888168557537, |
| "grad_norm": 0.8752970421825866, |
| "learning_rate": 1.1275542295059384e-05, |
| "loss": 0.1518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11920589953660965, |
| "step": 2935, |
| "valid_targets_mean": 2097.3, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 4.764991896272285, |
| "grad_norm": 0.9284513357192202, |
| "learning_rate": 1.1202886011794023e-05, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2457813024520874, |
| "step": 2940, |
| "valid_targets_mean": 2385.9, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 4.773095623987034, |
| "grad_norm": 0.9398075096458122, |
| "learning_rate": 1.1130373393305004e-05, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12277652323246002, |
| "step": 2945, |
| "valid_targets_mean": 2361.6, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 4.781199351701783, |
| "grad_norm": 1.1737385550719055, |
| "learning_rate": 1.1058005623788564e-05, |
| "loss": 0.184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.140442356467247, |
| "step": 2950, |
| "valid_targets_mean": 1775.1, |
| "valid_targets_min": 1008 |
| }, |
| { |
| "epoch": 4.789303079416531, |
| "grad_norm": 0.8063596837128346, |
| "learning_rate": 1.0985783885075407e-05, |
| "loss": 0.189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18340390920639038, |
| "step": 2955, |
| "valid_targets_mean": 2692.0, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 4.7974068071312805, |
| "grad_norm": 0.8609461611073953, |
| "learning_rate": 1.0913709356611411e-05, |
| "loss": 0.1328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14733055233955383, |
| "step": 2960, |
| "valid_targets_mean": 2302.0, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 4.805510534846029, |
| "grad_norm": 0.5940642190543134, |
| "learning_rate": 1.0841783215438406e-05, |
| "loss": 0.1554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19221073389053345, |
| "step": 2965, |
| "valid_targets_mean": 5023.8, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 4.813614262560778, |
| "grad_norm": 1.0256200972517306, |
| "learning_rate": 1.07700066361749e-05, |
| "loss": 0.1923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23758450150489807, |
| "step": 2970, |
| "valid_targets_mean": 2783.9, |
| "valid_targets_min": 633 |
| }, |
| { |
| "epoch": 4.821717990275527, |
| "grad_norm": 0.8057695967861453, |
| "learning_rate": 1.0698380790996921e-05, |
| "loss": 0.1476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15349268913269043, |
| "step": 2975, |
| "valid_targets_mean": 3128.6, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 4.829821717990275, |
| "grad_norm": 0.7274055955361053, |
| "learning_rate": 1.0626906849618903e-05, |
| "loss": 0.1469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16329367458820343, |
| "step": 2980, |
| "valid_targets_mean": 3118.8, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 4.837925445705024, |
| "grad_norm": 0.8346294549363144, |
| "learning_rate": 1.0555585979274513e-05, |
| "loss": 0.2442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2559146285057068, |
| "step": 2985, |
| "valid_targets_mean": 3082.2, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 4.846029173419773, |
| "grad_norm": 1.3240258810633323, |
| "learning_rate": 1.0484419344697667e-05, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13262823224067688, |
| "step": 2990, |
| "valid_targets_mean": 1733.1, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 4.854132901134522, |
| "grad_norm": 0.995006362928102, |
| "learning_rate": 1.0413408108103445e-05, |
| "loss": 0.1576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20635709166526794, |
| "step": 2995, |
| "valid_targets_mean": 3296.1, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 4.862236628849271, |
| "grad_norm": 0.8460865973678914, |
| "learning_rate": 1.0342553429169163e-05, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11528654396533966, |
| "step": 3000, |
| "valid_targets_mean": 1933.8, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 4.87034035656402, |
| "grad_norm": 1.147006877758278, |
| "learning_rate": 1.0271856465015388e-05, |
| "loss": 0.1749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18788880109786987, |
| "step": 3005, |
| "valid_targets_mean": 1968.5, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 4.878444084278768, |
| "grad_norm": 0.8479478722559892, |
| "learning_rate": 1.0201318370187065e-05, |
| "loss": 0.1495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13283419609069824, |
| "step": 3010, |
| "valid_targets_mean": 2158.6, |
| "valid_targets_min": 496 |
| }, |
| { |
| "epoch": 4.886547811993517, |
| "grad_norm": 0.7961067473066475, |
| "learning_rate": 1.0130940296634683e-05, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18867862224578857, |
| "step": 3015, |
| "valid_targets_mean": 2611.9, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 4.894651539708266, |
| "grad_norm": 1.0151300176784335, |
| "learning_rate": 1.0060723393695411e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23992988467216492, |
| "step": 3020, |
| "valid_targets_mean": 2529.1, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 4.902755267423014, |
| "grad_norm": 0.9733399168762327, |
| "learning_rate": 9.990668808074378e-06, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14787709712982178, |
| "step": 3025, |
| "valid_targets_mean": 1709.7, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 4.9108589951377635, |
| "grad_norm": 0.72365986298008, |
| "learning_rate": 9.920777683825906e-06, |
| "loss": 0.1701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19551479816436768, |
| "step": 3030, |
| "valid_targets_mean": 2936.8, |
| "valid_targets_min": 371 |
| }, |
| { |
| "epoch": 4.918962722852513, |
| "grad_norm": 0.8027516059720535, |
| "learning_rate": 9.851051162334871e-06, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1954280436038971, |
| "step": 3035, |
| "valid_targets_mean": 2570.2, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 4.927066450567261, |
| "grad_norm": 0.762963457517037, |
| "learning_rate": 9.781490382298018e-06, |
| "loss": 0.1348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15942156314849854, |
| "step": 3040, |
| "valid_targets_mean": 3299.4, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 4.93517017828201, |
| "grad_norm": 0.8720989205317229, |
| "learning_rate": 9.712096479705382e-06, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11061131954193115, |
| "step": 3045, |
| "valid_targets_mean": 2380.6, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 4.943273905996758, |
| "grad_norm": 0.6183829564964957, |
| "learning_rate": 9.642870587821761e-06, |
| "loss": 0.1486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13789555430412292, |
| "step": 3050, |
| "valid_targets_mean": 3705.7, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 4.951377633711507, |
| "grad_norm": 0.9202251472551713, |
| "learning_rate": 9.573813837168166e-06, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16328653693199158, |
| "step": 3055, |
| "valid_targets_mean": 2631.2, |
| "valid_targets_min": 461 |
| }, |
| { |
| "epoch": 4.959481361426256, |
| "grad_norm": 0.6337283642064705, |
| "learning_rate": 9.504927355503399e-06, |
| "loss": 0.1594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0957586020231247, |
| "step": 3060, |
| "valid_targets_mean": 3474.9, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 4.9675850891410045, |
| "grad_norm": 0.9004406261162295, |
| "learning_rate": 9.436212267805591e-06, |
| "loss": 0.1495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12372364848852158, |
| "step": 3065, |
| "valid_targets_mean": 1903.6, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 4.975688816855754, |
| "grad_norm": 0.5981555247573468, |
| "learning_rate": 9.367669696253885e-06, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10008936375379562, |
| "step": 3070, |
| "valid_targets_mean": 3947.9, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 4.983792544570503, |
| "grad_norm": 0.7429447660340368, |
| "learning_rate": 9.299300760210059e-06, |
| "loss": 0.1805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2495230734348297, |
| "step": 3075, |
| "valid_targets_mean": 3267.3, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 4.991896272285251, |
| "grad_norm": 0.8545859108818904, |
| "learning_rate": 9.231106576200268e-06, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1375666856765747, |
| "step": 3080, |
| "valid_targets_mean": 2512.9, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 1.0000828363963175, |
| "learning_rate": 9.163088257896825e-06, |
| "loss": 0.153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12231343239545822, |
| "step": 3085, |
| "valid_targets_mean": 1496.2, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 5.008103727714749, |
| "grad_norm": 1.283136207413487, |
| "learning_rate": 9.095246916099978e-06, |
| "loss": 0.165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16958777606487274, |
| "step": 3090, |
| "valid_targets_mean": 2647.4, |
| "valid_targets_min": 582 |
| }, |
| { |
| "epoch": 5.016207455429497, |
| "grad_norm": 0.943279239764171, |
| "learning_rate": 9.027583658719812e-06, |
| "loss": 0.1412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12485413998365402, |
| "step": 3095, |
| "valid_targets_mean": 1937.0, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 5.024311183144246, |
| "grad_norm": 0.8436158526907404, |
| "learning_rate": 8.960099590758104e-06, |
| "loss": 0.1453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1455596685409546, |
| "step": 3100, |
| "valid_targets_mean": 2281.4, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 5.0324149108589955, |
| "grad_norm": 0.9944315406392032, |
| "learning_rate": 8.892795814290342e-06, |
| "loss": 0.1553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19890674948692322, |
| "step": 3105, |
| "valid_targets_mean": 2202.4, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 5.040518638573744, |
| "grad_norm": 0.6387733217996346, |
| "learning_rate": 8.825673428447668e-06, |
| "loss": 0.1279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13640737533569336, |
| "step": 3110, |
| "valid_targets_mean": 4190.6, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 5.048622366288493, |
| "grad_norm": 0.7019234673750581, |
| "learning_rate": 8.758733529398945e-06, |
| "loss": 0.1425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09768907725811005, |
| "step": 3115, |
| "valid_targets_mean": 2849.2, |
| "valid_targets_min": 862 |
| }, |
| { |
| "epoch": 5.056726094003242, |
| "grad_norm": 1.384661286889182, |
| "learning_rate": 8.691977210332892e-06, |
| "loss": 0.1274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13747167587280273, |
| "step": 3120, |
| "valid_targets_mean": 2221.4, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 5.06482982171799, |
| "grad_norm": 0.930073668995111, |
| "learning_rate": 8.625405561440172e-06, |
| "loss": 0.1412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11428385972976685, |
| "step": 3125, |
| "valid_targets_mean": 1706.4, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 5.072933549432739, |
| "grad_norm": 0.7331543719322425, |
| "learning_rate": 8.559019669895648e-06, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22601112723350525, |
| "step": 3130, |
| "valid_targets_mean": 3574.3, |
| "valid_targets_min": 398 |
| }, |
| { |
| "epoch": 5.081037277147487, |
| "grad_norm": 0.9113971174023665, |
| "learning_rate": 8.492820619840563e-06, |
| "loss": 0.1639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.287741094827652, |
| "step": 3135, |
| "valid_targets_mean": 2638.6, |
| "valid_targets_min": 341 |
| }, |
| { |
| "epoch": 5.0891410048622365, |
| "grad_norm": 0.8833049318176625, |
| "learning_rate": 8.426809492364907e-06, |
| "loss": 0.1215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11894373595714569, |
| "step": 3140, |
| "valid_targets_mean": 2332.4, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 5.097244732576986, |
| "grad_norm": 0.5946354001150366, |
| "learning_rate": 8.360987365489698e-06, |
| "loss": 0.1223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1098465770483017, |
| "step": 3145, |
| "valid_targets_mean": 3904.6, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 5.105348460291734, |
| "grad_norm": 0.8044122587163143, |
| "learning_rate": 8.295355314149413e-06, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13747110962867737, |
| "step": 3150, |
| "valid_targets_mean": 2310.0, |
| "valid_targets_min": 337 |
| }, |
| { |
| "epoch": 5.113452188006483, |
| "grad_norm": 0.5980128769879898, |
| "learning_rate": 8.229914410174435e-06, |
| "loss": 0.1099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08813309669494629, |
| "step": 3155, |
| "valid_targets_mean": 3792.1, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 5.121555915721232, |
| "grad_norm": 0.622312258802971, |
| "learning_rate": 8.16466572227352e-06, |
| "loss": 0.1068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0873100534081459, |
| "step": 3160, |
| "valid_targets_mean": 3185.2, |
| "valid_targets_min": 554 |
| }, |
| { |
| "epoch": 5.12965964343598, |
| "grad_norm": 0.8954975866967348, |
| "learning_rate": 8.099610316016373e-06, |
| "loss": 0.1456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13367177546024323, |
| "step": 3165, |
| "valid_targets_mean": 2045.3, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 5.137763371150729, |
| "grad_norm": 0.8258936353394385, |
| "learning_rate": 8.03474925381625e-06, |
| "loss": 0.1564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16128379106521606, |
| "step": 3170, |
| "valid_targets_mean": 3819.5, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 5.145867098865478, |
| "grad_norm": 0.9892899982440995, |
| "learning_rate": 7.97008359491257e-06, |
| "loss": 0.1427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1371055245399475, |
| "step": 3175, |
| "valid_targets_mean": 1996.4, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 5.153970826580227, |
| "grad_norm": 0.9178033916752635, |
| "learning_rate": 7.905614395353649e-06, |
| "loss": 0.1424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13662882149219513, |
| "step": 3180, |
| "valid_targets_mean": 2094.7, |
| "valid_targets_min": 269 |
| }, |
| { |
| "epoch": 5.162074554294976, |
| "grad_norm": 0.9445719514300331, |
| "learning_rate": 7.841342707979442e-06, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30393123626708984, |
| "step": 3185, |
| "valid_targets_mean": 3291.1, |
| "valid_targets_min": 862 |
| }, |
| { |
| "epoch": 5.170178282009725, |
| "grad_norm": 0.7306623592816158, |
| "learning_rate": 7.77726958240437e-06, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.100005142390728, |
| "step": 3190, |
| "valid_targets_mean": 2373.6, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 5.178282009724473, |
| "grad_norm": 0.5681715595432818, |
| "learning_rate": 7.713396065000133e-06, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16320055723190308, |
| "step": 3195, |
| "valid_targets_mean": 5024.4, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 5.186385737439222, |
| "grad_norm": 0.9141392131056238, |
| "learning_rate": 7.649723198878676e-06, |
| "loss": 0.13, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17028486728668213, |
| "step": 3200, |
| "valid_targets_mean": 2462.1, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 5.194489465153971, |
| "grad_norm": 1.0211463763575084, |
| "learning_rate": 7.586252023875125e-06, |
| "loss": 0.1577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13707610964775085, |
| "step": 3205, |
| "valid_targets_mean": 1633.6, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 5.2025931928687195, |
| "grad_norm": 0.9857389473887078, |
| "learning_rate": 7.522983576530791e-06, |
| "loss": 0.1549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1323859989643097, |
| "step": 3210, |
| "valid_targets_mean": 1957.2, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 5.210696920583469, |
| "grad_norm": 1.0143771026388138, |
| "learning_rate": 7.459918890076272e-06, |
| "loss": 0.1464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16915765404701233, |
| "step": 3215, |
| "valid_targets_mean": 3357.4, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 5.218800648298217, |
| "grad_norm": 0.8291361309836706, |
| "learning_rate": 7.397058994414563e-06, |
| "loss": 0.1304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18082496523857117, |
| "step": 3220, |
| "valid_targets_mean": 2756.2, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 5.226904376012966, |
| "grad_norm": 0.6737718264710545, |
| "learning_rate": 7.3344049161042495e-06, |
| "loss": 0.1324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14597007632255554, |
| "step": 3225, |
| "valid_targets_mean": 4198.1, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 5.235008103727715, |
| "grad_norm": 0.6961828666596263, |
| "learning_rate": 7.271957678342738e-06, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07819020748138428, |
| "step": 3230, |
| "valid_targets_mean": 2952.6, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 5.243111831442463, |
| "grad_norm": 1.2860828286107657, |
| "learning_rate": 7.209718300949519e-06, |
| "loss": 0.152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11555998027324677, |
| "step": 3235, |
| "valid_targets_mean": 2056.3, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 5.251215559157212, |
| "grad_norm": 0.6896094917138008, |
| "learning_rate": 7.14768780034957e-06, |
| "loss": 0.1518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18422646820545197, |
| "step": 3240, |
| "valid_targets_mean": 3863.6, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 5.259319286871961, |
| "grad_norm": 0.8253153069121804, |
| "learning_rate": 7.085867189556697e-06, |
| "loss": 0.2144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20815926790237427, |
| "step": 3245, |
| "valid_targets_mean": 3034.3, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 5.26742301458671, |
| "grad_norm": 0.7086894492399584, |
| "learning_rate": 7.024257478157015e-06, |
| "loss": 0.1555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10221417248249054, |
| "step": 3250, |
| "valid_targets_mean": 3288.2, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 5.275526742301459, |
| "grad_norm": 0.5798277120600573, |
| "learning_rate": 6.96285967229249e-06, |
| "loss": 0.1591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14061783254146576, |
| "step": 3255, |
| "valid_targets_mean": 5321.4, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 5.283630470016208, |
| "grad_norm": 0.6297473245719093, |
| "learning_rate": 6.901674774644449e-06, |
| "loss": 0.1113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09192270785570145, |
| "step": 3260, |
| "valid_targets_mean": 3162.9, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 5.291734197730956, |
| "grad_norm": 0.655326604774191, |
| "learning_rate": 6.840703784417262e-06, |
| "loss": 0.1477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1667039543390274, |
| "step": 3265, |
| "valid_targets_mean": 3882.1, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 5.299837925445705, |
| "grad_norm": 0.9464717792115727, |
| "learning_rate": 6.779947697321974e-06, |
| "loss": 0.1328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11113858968019485, |
| "step": 3270, |
| "valid_targets_mean": 2199.8, |
| "valid_targets_min": 342 |
| }, |
| { |
| "epoch": 5.307941653160454, |
| "grad_norm": 0.8508764069285351, |
| "learning_rate": 6.719407505560094e-06, |
| "loss": 0.1571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14729882776737213, |
| "step": 3275, |
| "valid_targets_mean": 2665.4, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 5.316045380875202, |
| "grad_norm": 1.03542912623809, |
| "learning_rate": 6.659084197807348e-06, |
| "loss": 0.1997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4161680340766907, |
| "step": 3280, |
| "valid_targets_mean": 4139.7, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 5.3241491085899515, |
| "grad_norm": 0.8555285929048103, |
| "learning_rate": 6.598978759197554e-06, |
| "loss": 0.119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19164308905601501, |
| "step": 3285, |
| "valid_targets_mean": 2472.9, |
| "valid_targets_min": 488 |
| }, |
| { |
| "epoch": 5.332252836304701, |
| "grad_norm": 0.7884153355344533, |
| "learning_rate": 6.539092171306541e-06, |
| "loss": 0.1166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13263387978076935, |
| "step": 3290, |
| "valid_targets_mean": 2924.2, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 5.340356564019449, |
| "grad_norm": 0.7139375465777716, |
| "learning_rate": 6.479425412136093e-06, |
| "loss": 0.1412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08301765471696854, |
| "step": 3295, |
| "valid_targets_mean": 3015.2, |
| "valid_targets_min": 456 |
| }, |
| { |
| "epoch": 5.348460291734198, |
| "grad_norm": 0.8136742499601274, |
| "learning_rate": 6.419979456098016e-06, |
| "loss": 0.1349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0914689153432846, |
| "step": 3300, |
| "valid_targets_mean": 2395.7, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 5.356564019448946, |
| "grad_norm": 0.8426989185718268, |
| "learning_rate": 6.360755273998174e-06, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18558555841445923, |
| "step": 3305, |
| "valid_targets_mean": 3175.8, |
| "valid_targets_min": 426 |
| }, |
| { |
| "epoch": 5.364667747163695, |
| "grad_norm": 0.7043825571960722, |
| "learning_rate": 6.301753833020691e-06, |
| "loss": 0.1404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.185553640127182, |
| "step": 3310, |
| "valid_targets_mean": 3304.7, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 5.372771474878444, |
| "grad_norm": 0.9549981037856647, |
| "learning_rate": 6.242976096712112e-06, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22695674002170563, |
| "step": 3315, |
| "valid_targets_mean": 2425.8, |
| "valid_targets_min": 334 |
| }, |
| { |
| "epoch": 5.3808752025931925, |
| "grad_norm": 0.8195898613602235, |
| "learning_rate": 6.18442302496568e-06, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13929906487464905, |
| "step": 3320, |
| "valid_targets_mean": 2468.8, |
| "valid_targets_min": 524 |
| }, |
| { |
| "epoch": 5.388978930307942, |
| "grad_norm": 1.029682002666224, |
| "learning_rate": 6.1260955740056835e-06, |
| "loss": 0.1347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1550445258617401, |
| "step": 3325, |
| "valid_targets_mean": 2025.9, |
| "valid_targets_min": 1103 |
| }, |
| { |
| "epoch": 5.397082658022691, |
| "grad_norm": 1.1169106309979446, |
| "learning_rate": 6.067994696371797e-06, |
| "loss": 0.1246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15255971252918243, |
| "step": 3330, |
| "valid_targets_mean": 2080.6, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 5.405186385737439, |
| "grad_norm": 0.8850686193118384, |
| "learning_rate": 6.010121340903574e-06, |
| "loss": 0.1224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1398320496082306, |
| "step": 3335, |
| "valid_targets_mean": 2204.1, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 5.413290113452188, |
| "grad_norm": 0.6189940261103392, |
| "learning_rate": 5.952476452724898e-06, |
| "loss": 0.1416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10511147975921631, |
| "step": 3340, |
| "valid_targets_mean": 3397.1, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 5.421393841166937, |
| "grad_norm": 0.7869848129875665, |
| "learning_rate": 5.895060973228606e-06, |
| "loss": 0.1406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17136400938034058, |
| "step": 3345, |
| "valid_targets_mean": 3590.9, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 5.429497568881685, |
| "grad_norm": 0.9786557729553311, |
| "learning_rate": 5.837875840061064e-06, |
| "loss": 0.1352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12982967495918274, |
| "step": 3350, |
| "valid_targets_mean": 1677.5, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 5.437601296596434, |
| "grad_norm": 0.8317312217862712, |
| "learning_rate": 5.780921987106878e-06, |
| "loss": 0.136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12355664372444153, |
| "step": 3355, |
| "valid_targets_mean": 2306.0, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 5.4457050243111835, |
| "grad_norm": 0.7338499031126493, |
| "learning_rate": 5.724200344473651e-06, |
| "loss": 0.1584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19103437662124634, |
| "step": 3360, |
| "valid_targets_mean": 3675.8, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 5.453808752025932, |
| "grad_norm": 0.6656448002153311, |
| "learning_rate": 5.66771183847677e-06, |
| "loss": 0.1301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09611663967370987, |
| "step": 3365, |
| "valid_targets_mean": 2633.0, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 5.461912479740681, |
| "grad_norm": 1.0874356250956578, |
| "learning_rate": 5.611457391624309e-06, |
| "loss": 0.1322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15315888822078705, |
| "step": 3370, |
| "valid_targets_mean": 3031.9, |
| "valid_targets_min": 472 |
| }, |
| { |
| "epoch": 5.47001620745543, |
| "grad_norm": 1.0445039076091298, |
| "learning_rate": 5.555437922601918e-06, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16164973378181458, |
| "step": 3375, |
| "valid_targets_mean": 1917.6, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 5.478119935170178, |
| "grad_norm": 0.8104164724449195, |
| "learning_rate": 5.499654346257879e-06, |
| "loss": 0.1359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12006053328514099, |
| "step": 3380, |
| "valid_targets_mean": 2426.0, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 5.486223662884927, |
| "grad_norm": 0.7493612429318233, |
| "learning_rate": 5.444107573588116e-06, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1710258424282074, |
| "step": 3385, |
| "valid_targets_mean": 3943.8, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 5.4943273905996755, |
| "grad_norm": 0.893693814456575, |
| "learning_rate": 5.388798511721329e-06, |
| "loss": 0.1456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19235970079898834, |
| "step": 3390, |
| "valid_targets_mean": 2304.8, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 5.5024311183144246, |
| "grad_norm": 0.9281024443148513, |
| "learning_rate": 5.333728063904213e-06, |
| "loss": 0.139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13582965731620789, |
| "step": 3395, |
| "valid_targets_mean": 3602.9, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 5.510534846029174, |
| "grad_norm": 0.7276815688419767, |
| "learning_rate": 5.278897129486656e-06, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13215868175029755, |
| "step": 3400, |
| "valid_targets_mean": 3562.9, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 5.518638573743922, |
| "grad_norm": 0.8662128457006715, |
| "learning_rate": 5.224306603907095e-06, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12716642022132874, |
| "step": 3405, |
| "valid_targets_mean": 2820.1, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 5.526742301458671, |
| "grad_norm": 0.7807235589640765, |
| "learning_rate": 5.169957378677859e-06, |
| "loss": 0.1258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1254601776599884, |
| "step": 3410, |
| "valid_targets_mean": 2691.8, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 5.53484602917342, |
| "grad_norm": 0.7560906227588559, |
| "learning_rate": 5.11585034137064e-06, |
| "loss": 0.1318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23728054761886597, |
| "step": 3415, |
| "valid_targets_mean": 3586.0, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 5.542949756888168, |
| "grad_norm": 1.102731743141789, |
| "learning_rate": 5.061986375601977e-06, |
| "loss": 0.1495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13842478394508362, |
| "step": 3420, |
| "valid_targets_mean": 1943.7, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 5.551053484602917, |
| "grad_norm": 0.7825513713620168, |
| "learning_rate": 5.0083663610188215e-06, |
| "loss": 0.1298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11432783305644989, |
| "step": 3425, |
| "valid_targets_mean": 2848.9, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 5.5591572123176665, |
| "grad_norm": 0.9134357132489729, |
| "learning_rate": 4.954991173284207e-06, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16197806596755981, |
| "step": 3430, |
| "valid_targets_mean": 2609.7, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 5.567260940032415, |
| "grad_norm": 0.9586959035897938, |
| "learning_rate": 4.901861684062899e-06, |
| "loss": 0.152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11932115256786346, |
| "step": 3435, |
| "valid_targets_mean": 2300.0, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 5.575364667747164, |
| "grad_norm": 0.9077572994362951, |
| "learning_rate": 4.848978761007206e-06, |
| "loss": 0.1211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15258963406085968, |
| "step": 3440, |
| "valid_targets_mean": 2265.6, |
| "valid_targets_min": 932 |
| }, |
| { |
| "epoch": 5.583468395461912, |
| "grad_norm": 1.1023316942136527, |
| "learning_rate": 4.796343267742782e-06, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14780212938785553, |
| "step": 3445, |
| "valid_targets_mean": 1948.9, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 5.591572123176661, |
| "grad_norm": 0.7251051495316837, |
| "learning_rate": 4.743956063854529e-06, |
| "loss": 0.1311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09377004206180573, |
| "step": 3450, |
| "valid_targets_mean": 2942.9, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 5.59967585089141, |
| "grad_norm": 0.8488916792785556, |
| "learning_rate": 4.691818004872557e-06, |
| "loss": 0.1671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12640199065208435, |
| "step": 3455, |
| "valid_targets_mean": 2410.6, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 5.607779578606159, |
| "grad_norm": 0.8737493446227516, |
| "learning_rate": 4.639929942258217e-06, |
| "loss": 0.1383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11130397021770477, |
| "step": 3460, |
| "valid_targets_mean": 1994.3, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 5.6158833063209075, |
| "grad_norm": 0.8723045293450462, |
| "learning_rate": 4.588292723390204e-06, |
| "loss": 0.1462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18794122338294983, |
| "step": 3465, |
| "valid_targets_mean": 2340.5, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 5.623987034035657, |
| "grad_norm": 0.9131558045501164, |
| "learning_rate": 4.536907191550694e-06, |
| "loss": 0.1385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18654656410217285, |
| "step": 3470, |
| "valid_targets_mean": 3264.6, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 5.632090761750405, |
| "grad_norm": 0.7832447854160407, |
| "learning_rate": 4.4857741859116024e-06, |
| "loss": 0.1428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10856875032186508, |
| "step": 3475, |
| "valid_targets_mean": 4026.0, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 5.640194489465154, |
| "grad_norm": 0.9603685340587842, |
| "learning_rate": 4.434894541520862e-06, |
| "loss": 0.1285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12167471647262573, |
| "step": 3480, |
| "valid_targets_mean": 2858.6, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 5.648298217179903, |
| "grad_norm": 0.8143816562047289, |
| "learning_rate": 4.3842690892887795e-06, |
| "loss": 0.1283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11910448223352432, |
| "step": 3485, |
| "valid_targets_mean": 2518.2, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 5.656401944894651, |
| "grad_norm": 1.0269959031972293, |
| "learning_rate": 4.333898655974484e-06, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13059552013874054, |
| "step": 3490, |
| "valid_targets_mean": 2272.3, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 5.6645056726094, |
| "grad_norm": 0.8493579524196188, |
| "learning_rate": 4.283784064172405e-06, |
| "loss": 0.147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23569592833518982, |
| "step": 3495, |
| "valid_targets_mean": 2847.4, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 5.672609400324149, |
| "grad_norm": 1.0045947500475891, |
| "learning_rate": 4.233926132298867e-06, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12646427750587463, |
| "step": 3500, |
| "valid_targets_mean": 1906.7, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 5.680713128038898, |
| "grad_norm": 1.4216952442247126, |
| "learning_rate": 4.1843256745787e-06, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18572121858596802, |
| "step": 3505, |
| "valid_targets_mean": 1459.9, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 5.688816855753647, |
| "grad_norm": 0.9002937899719397, |
| "learning_rate": 4.134983501031942e-06, |
| "loss": 0.1033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11701390147209167, |
| "step": 3510, |
| "valid_targets_mean": 2314.2, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 5.696920583468396, |
| "grad_norm": 0.8596504160989296, |
| "learning_rate": 4.085900417460633e-06, |
| "loss": 0.1749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15798306465148926, |
| "step": 3515, |
| "valid_targets_mean": 2459.4, |
| "valid_targets_min": 1225 |
| }, |
| { |
| "epoch": 5.705024311183144, |
| "grad_norm": 1.0572710496515947, |
| "learning_rate": 4.037077225435628e-06, |
| "loss": 0.1485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14602217078208923, |
| "step": 3520, |
| "valid_targets_mean": 1989.2, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 5.713128038897893, |
| "grad_norm": 0.5224530736412875, |
| "learning_rate": 3.988514722283523e-06, |
| "loss": 0.1553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0725245401263237, |
| "step": 3525, |
| "valid_targets_mean": 3406.3, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 5.721231766612641, |
| "grad_norm": 0.9644662300746688, |
| "learning_rate": 3.940213701073636e-06, |
| "loss": 0.1119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10431959480047226, |
| "step": 3530, |
| "valid_targets_mean": 1862.7, |
| "valid_targets_min": 1094 |
| }, |
| { |
| "epoch": 5.72933549432739, |
| "grad_norm": 0.6423940525393956, |
| "learning_rate": 3.892174950605039e-06, |
| "loss": 0.1221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0762447863817215, |
| "step": 3535, |
| "valid_targets_mean": 2733.1, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 5.7374392220421395, |
| "grad_norm": 1.0504974617543583, |
| "learning_rate": 3.844399255393705e-06, |
| "loss": 0.1272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12259531021118164, |
| "step": 3540, |
| "valid_targets_mean": 2066.3, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 5.745542949756889, |
| "grad_norm": 1.0177720813084683, |
| "learning_rate": 3.7968873956596563e-06, |
| "loss": 0.1244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18689052760601044, |
| "step": 3545, |
| "valid_targets_mean": 2081.0, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 5.753646677471637, |
| "grad_norm": 1.081526403816516, |
| "learning_rate": 3.749640147314264e-06, |
| "loss": 0.1412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15227672457695007, |
| "step": 3550, |
| "valid_targets_mean": 1617.8, |
| "valid_targets_min": 450 |
| }, |
| { |
| "epoch": 5.761750405186386, |
| "grad_norm": 1.281386145306865, |
| "learning_rate": 3.7026582819475443e-06, |
| "loss": 0.1336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1037423312664032, |
| "step": 3555, |
| "valid_targets_mean": 1829.5, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 5.769854132901134, |
| "grad_norm": 1.166110176855929, |
| "learning_rate": 3.6559425668155733e-06, |
| "loss": 0.1227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11849828064441681, |
| "step": 3560, |
| "valid_targets_mean": 2195.3, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 5.777957860615883, |
| "grad_norm": 0.5899092092985859, |
| "learning_rate": 3.6094937648279647e-06, |
| "loss": 0.162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10452926158905029, |
| "step": 3565, |
| "valid_targets_mean": 3788.1, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 5.786061588330632, |
| "grad_norm": 0.6076238022877796, |
| "learning_rate": 3.563312634535383e-06, |
| "loss": 0.1428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09219780564308167, |
| "step": 3570, |
| "valid_targets_mean": 4160.1, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 5.7941653160453805, |
| "grad_norm": 0.9424647522354361, |
| "learning_rate": 3.517399930117196e-06, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13615809381008148, |
| "step": 3575, |
| "valid_targets_mean": 2198.9, |
| "valid_targets_min": 866 |
| }, |
| { |
| "epoch": 5.80226904376013, |
| "grad_norm": 0.5696560681892507, |
| "learning_rate": 3.4717564013691087e-06, |
| "loss": 0.1521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11359340697526932, |
| "step": 3580, |
| "valid_targets_mean": 5013.9, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 5.810372771474879, |
| "grad_norm": 0.8141064051451715, |
| "learning_rate": 3.4263827936909744e-06, |
| "loss": 0.1713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12475259602069855, |
| "step": 3585, |
| "valid_targets_mean": 2504.2, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 5.818476499189627, |
| "grad_norm": 0.5674431699647517, |
| "learning_rate": 3.38127984807457e-06, |
| "loss": 0.112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09661044925451279, |
| "step": 3590, |
| "valid_targets_mean": 4857.5, |
| "valid_targets_min": 834 |
| }, |
| { |
| "epoch": 5.826580226904376, |
| "grad_norm": 0.7103962514018813, |
| "learning_rate": 3.3364483010915237e-06, |
| "loss": 0.1581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12006492912769318, |
| "step": 3595, |
| "valid_targets_mean": 3394.4, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 5.834683954619125, |
| "grad_norm": 0.9765118903364278, |
| "learning_rate": 3.2918888848812913e-06, |
| "loss": 0.1362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18907558917999268, |
| "step": 3600, |
| "valid_targets_mean": 2537.3, |
| "valid_targets_min": 232 |
| }, |
| { |
| "epoch": 5.842787682333873, |
| "grad_norm": 0.6452405236633486, |
| "learning_rate": 3.2476023271391698e-06, |
| "loss": 0.1265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10429327189922333, |
| "step": 3605, |
| "valid_targets_mean": 3199.5, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 5.8508914100486225, |
| "grad_norm": 0.9704787354907897, |
| "learning_rate": 3.2035893511044524e-06, |
| "loss": 0.1271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12537583708763123, |
| "step": 3610, |
| "valid_targets_mean": 2012.1, |
| "valid_targets_min": 505 |
| }, |
| { |
| "epoch": 5.858995137763371, |
| "grad_norm": 1.0125575644527998, |
| "learning_rate": 3.159850675548577e-06, |
| "loss": 0.1254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13451366126537323, |
| "step": 3615, |
| "valid_targets_mean": 2137.6, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 5.86709886547812, |
| "grad_norm": 0.5958492150298547, |
| "learning_rate": 3.116387014763429e-06, |
| "loss": 0.1595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18298457562923431, |
| "step": 3620, |
| "valid_targets_mean": 4842.6, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 5.875202593192869, |
| "grad_norm": 0.9194613793350569, |
| "learning_rate": 3.073199078549638e-06, |
| "loss": 0.1568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14356893301010132, |
| "step": 3625, |
| "valid_targets_mean": 2403.4, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 5.883306320907618, |
| "grad_norm": 0.7587379022022571, |
| "learning_rate": 3.0302875722050064e-06, |
| "loss": 0.1568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19144773483276367, |
| "step": 3630, |
| "valid_targets_mean": 3720.6, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 5.891410048622366, |
| "grad_norm": 0.757032598883858, |
| "learning_rate": 2.987653196513003e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10905779898166656, |
| "step": 3635, |
| "valid_targets_mean": 2983.9, |
| "valid_targets_min": 404 |
| }, |
| { |
| "epoch": 5.899513776337115, |
| "grad_norm": 0.84410146266729, |
| "learning_rate": 2.9452966477312815e-06, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12055391073226929, |
| "step": 3640, |
| "valid_targets_mean": 2604.8, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 5.9076175040518635, |
| "grad_norm": 0.6912606615140152, |
| "learning_rate": 2.9032186175803545e-06, |
| "loss": 0.147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.231064572930336, |
| "step": 3645, |
| "valid_targets_mean": 4160.1, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 5.915721231766613, |
| "grad_norm": 0.9150252191276331, |
| "learning_rate": 2.8614197932322585e-06, |
| "loss": 0.1531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14955416321754456, |
| "step": 3650, |
| "valid_targets_mean": 2538.5, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 5.923824959481362, |
| "grad_norm": 1.0537159718577105, |
| "learning_rate": 2.819900857299358e-06, |
| "loss": 0.1196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12648676335811615, |
| "step": 3655, |
| "valid_targets_mean": 1749.5, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 5.93192868719611, |
| "grad_norm": 0.9562074384683694, |
| "learning_rate": 2.778662487823187e-06, |
| "loss": 0.1226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11901277303695679, |
| "step": 3660, |
| "valid_targets_mean": 3005.4, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 5.940032414910859, |
| "grad_norm": 0.9786475511741156, |
| "learning_rate": 2.7377053582633652e-06, |
| "loss": 0.1559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1406671404838562, |
| "step": 3665, |
| "valid_targets_mean": 2011.9, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 5.948136142625608, |
| "grad_norm": 0.780480994666007, |
| "learning_rate": 2.6970301374866337e-06, |
| "loss": 0.1531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15554064512252808, |
| "step": 3670, |
| "valid_targets_mean": 2561.8, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 5.956239870340356, |
| "grad_norm": 0.6847569982772912, |
| "learning_rate": 2.656637489755889e-06, |
| "loss": 0.107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08473924547433853, |
| "step": 3675, |
| "valid_targets_mean": 2566.4, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 5.964343598055105, |
| "grad_norm": 1.1663803129546406, |
| "learning_rate": 2.616528074719371e-06, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16240835189819336, |
| "step": 3680, |
| "valid_targets_mean": 1863.8, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 5.9724473257698545, |
| "grad_norm": 1.0505470362211855, |
| "learning_rate": 2.576702547399863e-06, |
| "loss": 0.1137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11963564902544022, |
| "step": 3685, |
| "valid_targets_mean": 2972.6, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 5.980551053484603, |
| "grad_norm": 0.6153132292802707, |
| "learning_rate": 2.53716155818402e-06, |
| "loss": 0.1199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10222367942333221, |
| "step": 3690, |
| "valid_targets_mean": 3769.6, |
| "valid_targets_min": 496 |
| }, |
| { |
| "epoch": 5.988654781199352, |
| "grad_norm": 0.7706022269958611, |
| "learning_rate": 2.49790575281172e-06, |
| "loss": 0.1483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10004860907793045, |
| "step": 3695, |
| "valid_targets_mean": 4118.3, |
| "valid_targets_min": 461 |
| }, |
| { |
| "epoch": 5.9967585089141, |
| "grad_norm": 1.1497778298396315, |
| "learning_rate": 2.4589357723655405e-06, |
| "loss": 0.1159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12909851968288422, |
| "step": 3700, |
| "valid_targets_mean": 1985.4, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 6.004862236628849, |
| "grad_norm": 0.8065263620717076, |
| "learning_rate": 2.4202522532602846e-06, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12583133578300476, |
| "step": 3705, |
| "valid_targets_mean": 2561.8, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 6.012965964343598, |
| "grad_norm": 0.47440335088604885, |
| "learning_rate": 2.381855827232571e-06, |
| "loss": 0.1023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08017963171005249, |
| "step": 3710, |
| "valid_targets_mean": 4353.3, |
| "valid_targets_min": 232 |
| }, |
| { |
| "epoch": 6.021069692058346, |
| "grad_norm": 0.8208816345120449, |
| "learning_rate": 2.343747121330544e-06, |
| "loss": 0.1576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12535922229290009, |
| "step": 3715, |
| "valid_targets_mean": 2856.1, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 6.0291734197730955, |
| "grad_norm": 0.7429830314090826, |
| "learning_rate": 2.3059267579036183e-06, |
| "loss": 0.1217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10140064358711243, |
| "step": 3720, |
| "valid_targets_mean": 3342.2, |
| "valid_targets_min": 1157 |
| }, |
| { |
| "epoch": 6.037277147487845, |
| "grad_norm": 0.5938762525392249, |
| "learning_rate": 2.268395354592312e-06, |
| "loss": 0.1442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11517813801765442, |
| "step": 3725, |
| "valid_targets_mean": 5581.0, |
| "valid_targets_min": 232 |
| }, |
| { |
| "epoch": 6.045380875202593, |
| "grad_norm": 0.8583542985755236, |
| "learning_rate": 2.2311535243181637e-06, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2661886513233185, |
| "step": 3730, |
| "valid_targets_mean": 3863.1, |
| "valid_targets_min": 443 |
| }, |
| { |
| "epoch": 6.053484602917342, |
| "grad_norm": 0.8438682223939366, |
| "learning_rate": 2.1942018752737227e-06, |
| "loss": 0.121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08933848142623901, |
| "step": 3735, |
| "valid_targets_mean": 2379.1, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 6.061588330632091, |
| "grad_norm": 0.4750345988672662, |
| "learning_rate": 2.1575410109126293e-06, |
| "loss": 0.1062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07867272198200226, |
| "step": 3740, |
| "valid_targets_mean": 5703.2, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 6.069692058346839, |
| "grad_norm": 0.7820914107075465, |
| "learning_rate": 2.121171529939734e-06, |
| "loss": 0.1316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15075111389160156, |
| "step": 3745, |
| "valid_targets_mean": 3570.4, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 6.077795786061588, |
| "grad_norm": 0.7594471532290356, |
| "learning_rate": 2.085094026301349e-06, |
| "loss": 0.1173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20603245496749878, |
| "step": 3750, |
| "valid_targets_mean": 3489.7, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 6.085899513776337, |
| "grad_norm": 0.6047064426773207, |
| "learning_rate": 2.0493090891755262e-06, |
| "loss": 0.1361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07911926507949829, |
| "step": 3755, |
| "valid_targets_mean": 3143.4, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 6.094003241491086, |
| "grad_norm": 0.5079708101672858, |
| "learning_rate": 2.013817302962444e-06, |
| "loss": 0.1252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17122353613376617, |
| "step": 3760, |
| "valid_targets_mean": 6064.8, |
| "valid_targets_min": 1526 |
| }, |
| { |
| "epoch": 6.102106969205835, |
| "grad_norm": 0.8625230922660629, |
| "learning_rate": 1.9786192472748643e-06, |
| "loss": 0.1475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10119368880987167, |
| "step": 3765, |
| "valid_targets_mean": 2206.5, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 6.110210696920584, |
| "grad_norm": 1.0935738204994028, |
| "learning_rate": 1.9437154969286577e-06, |
| "loss": 0.1485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12805625796318054, |
| "step": 3770, |
| "valid_targets_mean": 1756.6, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 6.118314424635332, |
| "grad_norm": 0.7094021347408048, |
| "learning_rate": 1.9091066219334365e-06, |
| "loss": 0.1246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09319410473108292, |
| "step": 3775, |
| "valid_targets_mean": 3571.6, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 6.126418152350081, |
| "grad_norm": 0.8810616245799291, |
| "learning_rate": 1.8747931874832325e-06, |
| "loss": 0.13, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06927265226840973, |
| "step": 3780, |
| "valid_targets_mean": 3894.1, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 6.13452188006483, |
| "grad_norm": 0.7966465543664667, |
| "learning_rate": 1.8407757539472548e-06, |
| "loss": 0.1291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1974271982908249, |
| "step": 3785, |
| "valid_targets_mean": 3178.2, |
| "valid_targets_min": 450 |
| }, |
| { |
| "epoch": 6.1426256077795784, |
| "grad_norm": 0.5378695627769883, |
| "learning_rate": 1.8070548768607744e-06, |
| "loss": 0.1343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10642120242118835, |
| "step": 3790, |
| "valid_targets_mean": 4619.8, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 6.1507293354943275, |
| "grad_norm": 1.0147575200870909, |
| "learning_rate": 1.773631106915996e-06, |
| "loss": 0.1432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09471525251865387, |
| "step": 3795, |
| "valid_targets_mean": 2203.6, |
| "valid_targets_min": 1137 |
| }, |
| { |
| "epoch": 6.158833063209076, |
| "grad_norm": 0.7484970018269975, |
| "learning_rate": 1.740504989953129e-06, |
| "loss": 0.1485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11913225054740906, |
| "step": 3800, |
| "valid_targets_mean": 2594.4, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 6.166936790923825, |
| "grad_norm": 0.8241935721612473, |
| "learning_rate": 1.707677066951432e-06, |
| "loss": 0.1437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21923650801181793, |
| "step": 3805, |
| "valid_targets_mean": 3371.1, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 6.175040518638574, |
| "grad_norm": 0.7791725998755106, |
| "learning_rate": 1.6751478740203776e-06, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14890174567699432, |
| "step": 3810, |
| "valid_targets_mean": 3476.3, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 6.183144246353322, |
| "grad_norm": 0.9316060672966924, |
| "learning_rate": 1.6429179423909248e-06, |
| "loss": 0.1066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09502556920051575, |
| "step": 3815, |
| "valid_targets_mean": 1851.6, |
| "valid_targets_min": 319 |
| }, |
| { |
| "epoch": 6.191247974068071, |
| "grad_norm": 0.6681121617992075, |
| "learning_rate": 1.6109877984068089e-06, |
| "loss": 0.1265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10410622507333755, |
| "step": 3820, |
| "valid_targets_mean": 3242.0, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 6.19935170178282, |
| "grad_norm": 0.7966050962281183, |
| "learning_rate": 1.5793579635159883e-06, |
| "loss": 0.1652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12778472900390625, |
| "step": 3825, |
| "valid_targets_mean": 2881.1, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 6.207455429497569, |
| "grad_norm": 1.0811104704970367, |
| "learning_rate": 1.5480289542620686e-06, |
| "loss": 0.1234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14305716753005981, |
| "step": 3830, |
| "valid_targets_mean": 1729.1, |
| "valid_targets_min": 505 |
| }, |
| { |
| "epoch": 6.215559157212318, |
| "grad_norm": 0.8218570136420974, |
| "learning_rate": 1.517001282275936e-06, |
| "loss": 0.1119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19680121541023254, |
| "step": 3835, |
| "valid_targets_mean": 3000.9, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 6.223662884927067, |
| "grad_norm": 1.3444875208456322, |
| "learning_rate": 1.486275454267354e-06, |
| "loss": 0.1256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1285068839788437, |
| "step": 3840, |
| "valid_targets_mean": 2764.1, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 6.231766612641815, |
| "grad_norm": 0.8944598377852021, |
| "learning_rate": 1.4558519720166975e-06, |
| "loss": 0.1422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16025900840759277, |
| "step": 3845, |
| "valid_targets_mean": 2910.8, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 6.239870340356564, |
| "grad_norm": 0.651296867676762, |
| "learning_rate": 1.4257313323667798e-06, |
| "loss": 0.1298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08879795670509338, |
| "step": 3850, |
| "valid_targets_mean": 3112.5, |
| "valid_targets_min": 400 |
| }, |
| { |
| "epoch": 6.247974068071313, |
| "grad_norm": 0.5999610443428787, |
| "learning_rate": 1.3959140272146998e-06, |
| "loss": 0.1602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11679062247276306, |
| "step": 3855, |
| "valid_targets_mean": 3881.8, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 6.256077795786061, |
| "grad_norm": 0.9636049482804864, |
| "learning_rate": 1.366400543503854e-06, |
| "loss": 0.1349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18295209109783173, |
| "step": 3860, |
| "valid_targets_mean": 2168.9, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 6.2641815235008105, |
| "grad_norm": 0.78397490864793, |
| "learning_rate": 1.3371913632159506e-06, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.089485764503479, |
| "step": 3865, |
| "valid_targets_mean": 2398.6, |
| "valid_targets_min": 871 |
| }, |
| { |
| "epoch": 6.272285251215559, |
| "grad_norm": 0.7820564283288564, |
| "learning_rate": 1.3082869633631413e-06, |
| "loss": 0.1407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1150301992893219, |
| "step": 3870, |
| "valid_targets_mean": 2335.1, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 6.280388978930308, |
| "grad_norm": 1.027079175401604, |
| "learning_rate": 1.2796878159802595e-06, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15304911136627197, |
| "step": 3875, |
| "valid_targets_mean": 2105.1, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 6.288492706645057, |
| "grad_norm": 0.6199836306967389, |
| "learning_rate": 1.2513943881170754e-06, |
| "loss": 0.137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13365209102630615, |
| "step": 3880, |
| "valid_targets_mean": 4391.9, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 6.296596434359805, |
| "grad_norm": 0.7727236218240091, |
| "learning_rate": 1.2234071418306903e-06, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10507519543170929, |
| "step": 3885, |
| "valid_targets_mean": 2839.7, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 6.304700162074554, |
| "grad_norm": 0.8259960625219598, |
| "learning_rate": 1.1957265341779855e-06, |
| "loss": 0.1128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06842942535877228, |
| "step": 3890, |
| "valid_targets_mean": 2111.8, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 6.312803889789303, |
| "grad_norm": 1.3006108319686243, |
| "learning_rate": 1.1683530172081592e-06, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16923511028289795, |
| "step": 3895, |
| "valid_targets_mean": 2721.0, |
| "valid_targets_min": 318 |
| }, |
| { |
| "epoch": 6.3209076175040515, |
| "grad_norm": 0.9212042910130562, |
| "learning_rate": 1.1412870379553387e-06, |
| "loss": 0.1455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11085739731788635, |
| "step": 3900, |
| "valid_targets_mean": 2037.5, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 6.329011345218801, |
| "grad_norm": 0.7484624073581349, |
| "learning_rate": 1.1145290384312846e-06, |
| "loss": 0.1312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10903692245483398, |
| "step": 3905, |
| "valid_targets_mean": 2927.1, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 6.33711507293355, |
| "grad_norm": 0.7780860184446243, |
| "learning_rate": 1.0880794556181762e-06, |
| "loss": 0.1465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13929596543312073, |
| "step": 3910, |
| "valid_targets_mean": 3093.2, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 6.345218800648298, |
| "grad_norm": 0.857143392794329, |
| "learning_rate": 1.0619387214614662e-06, |
| "loss": 0.1038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08489274978637695, |
| "step": 3915, |
| "valid_targets_mean": 2249.3, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 6.353322528363047, |
| "grad_norm": 0.7892887000224863, |
| "learning_rate": 1.0361072628628354e-06, |
| "loss": 0.1487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1285485327243805, |
| "step": 3920, |
| "valid_targets_mean": 3397.4, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 6.361426256077796, |
| "grad_norm": 0.8963361991084041, |
| "learning_rate": 1.0105855016732113e-06, |
| "loss": 0.1328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15654143691062927, |
| "step": 3925, |
| "valid_targets_mean": 2594.8, |
| "valid_targets_min": 347 |
| }, |
| { |
| "epoch": 6.369529983792544, |
| "grad_norm": 0.9164724545517589, |
| "learning_rate": 9.853738546858893e-07, |
| "loss": 0.1476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09162580966949463, |
| "step": 3930, |
| "valid_targets_mean": 2038.8, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 6.377633711507293, |
| "grad_norm": 0.6269508433513853, |
| "learning_rate": 9.604727336297203e-07, |
| "loss": 0.1511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10261643677949905, |
| "step": 3935, |
| "valid_targets_mean": 3776.9, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 6.3857374392220425, |
| "grad_norm": 0.7267537967221318, |
| "learning_rate": 9.358825451623832e-07, |
| "loss": 0.1693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16209650039672852, |
| "step": 3940, |
| "valid_targets_mean": 3149.4, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 6.393841166936791, |
| "grad_norm": 0.8819007736794746, |
| "learning_rate": 9.116036908637582e-07, |
| "loss": 0.1257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13063153624534607, |
| "step": 3945, |
| "valid_targets_mean": 2710.8, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 6.40194489465154, |
| "grad_norm": 0.6745885226985678, |
| "learning_rate": 8.876365672293441e-07, |
| "loss": 0.091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08468009531497955, |
| "step": 3950, |
| "valid_targets_mean": 3238.0, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 6.410048622366288, |
| "grad_norm": 0.8819209149898708, |
| "learning_rate": 8.639815656638162e-07, |
| "loss": 0.1247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15380942821502686, |
| "step": 3955, |
| "valid_targets_mean": 2853.2, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 6.418152350081037, |
| "grad_norm": 0.8845074945045972, |
| "learning_rate": 8.406390724745961e-07, |
| "loss": 0.1411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1663370132446289, |
| "step": 3960, |
| "valid_targets_mean": 2657.0, |
| "valid_targets_min": 277 |
| }, |
| { |
| "epoch": 6.426256077795786, |
| "grad_norm": 0.7576749630747052, |
| "learning_rate": 8.176094688655789e-07, |
| "loss": 0.1185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1374589502811432, |
| "step": 3965, |
| "valid_targets_mean": 3111.9, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 6.434359805510534, |
| "grad_norm": 0.8629454796074068, |
| "learning_rate": 7.948931309308872e-07, |
| "loss": 0.1229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13856954872608185, |
| "step": 3970, |
| "valid_targets_mean": 3491.9, |
| "valid_targets_min": 314 |
| }, |
| { |
| "epoch": 6.4424635332252835, |
| "grad_norm": 1.0231777837569396, |
| "learning_rate": 7.724904296487246e-07, |
| "loss": 0.1405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11940930783748627, |
| "step": 3975, |
| "valid_targets_mean": 1845.0, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 6.450567260940033, |
| "grad_norm": 0.8238449493780197, |
| "learning_rate": 7.504017308753386e-07, |
| "loss": 0.1506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18350258469581604, |
| "step": 3980, |
| "valid_targets_mean": 4485.2, |
| "valid_targets_min": 217 |
| }, |
| { |
| "epoch": 6.458670988654781, |
| "grad_norm": 0.8464204623046769, |
| "learning_rate": 7.286273953390278e-07, |
| "loss": 0.2092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.258614182472229, |
| "step": 3985, |
| "valid_targets_mean": 3313.9, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 6.46677471636953, |
| "grad_norm": 0.8918238849564315, |
| "learning_rate": 7.071677786342568e-07, |
| "loss": 0.1237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1031871885061264, |
| "step": 3990, |
| "valid_targets_mean": 2293.3, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 6.474878444084279, |
| "grad_norm": 0.8528535194867968, |
| "learning_rate": 6.860232312158554e-07, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15150435268878937, |
| "step": 3995, |
| "valid_targets_mean": 2968.9, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 6.482982171799027, |
| "grad_norm": 0.7636360851041402, |
| "learning_rate": 6.651940983932737e-07, |
| "loss": 0.1478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19292369484901428, |
| "step": 4000, |
| "valid_targets_mean": 3176.4, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 6.491085899513776, |
| "grad_norm": 1.0126383046774314, |
| "learning_rate": 6.44680720324975e-07, |
| "loss": 0.156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12578508257865906, |
| "step": 4005, |
| "valid_targets_mean": 1690.8, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 6.4991896272285254, |
| "grad_norm": 0.7355254192324758, |
| "learning_rate": 6.244834320128501e-07, |
| "loss": 0.1175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10512825846672058, |
| "step": 4010, |
| "valid_targets_mean": 2727.1, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 6.507293354943274, |
| "grad_norm": 0.8817717410341444, |
| "learning_rate": 6.0460256329677e-07, |
| "loss": 0.1362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0961059033870697, |
| "step": 4015, |
| "valid_targets_mean": 1961.8, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 6.515397082658023, |
| "grad_norm": 0.9530199455424444, |
| "learning_rate": 5.850384388491814e-07, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11027082055807114, |
| "step": 4020, |
| "valid_targets_mean": 2610.9, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 6.523500810372772, |
| "grad_norm": 1.1973587173189302, |
| "learning_rate": 5.657913781698221e-07, |
| "loss": 0.1467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15702632069587708, |
| "step": 4025, |
| "valid_targets_mean": 2178.3, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 6.53160453808752, |
| "grad_norm": 0.9362106839228681, |
| "learning_rate": 5.468616955804873e-07, |
| "loss": 0.1169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1587480902671814, |
| "step": 4030, |
| "valid_targets_mean": 2364.8, |
| "valid_targets_min": 402 |
| }, |
| { |
| "epoch": 6.539708265802269, |
| "grad_norm": 0.8971025729416715, |
| "learning_rate": 5.282497002198983e-07, |
| "loss": 0.1034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10483712702989578, |
| "step": 4035, |
| "valid_targets_mean": 2060.6, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 6.547811993517017, |
| "grad_norm": 2.337830249158839, |
| "learning_rate": 5.099556960386686e-07, |
| "loss": 0.119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.114591583609581, |
| "step": 4040, |
| "valid_targets_mean": 1819.8, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 6.5559157212317665, |
| "grad_norm": 0.9163559690136783, |
| "learning_rate": 4.919799817943238e-07, |
| "loss": 0.1064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1364617496728897, |
| "step": 4045, |
| "valid_targets_mean": 2475.9, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 6.564019448946516, |
| "grad_norm": 1.0530486479633936, |
| "learning_rate": 4.7432285104642703e-07, |
| "loss": 0.1509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1412011682987213, |
| "step": 4050, |
| "valid_targets_mean": 1812.3, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 6.572123176661265, |
| "grad_norm": 1.0490371458755887, |
| "learning_rate": 4.569845921517968e-07, |
| "loss": 0.1427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1328582465648651, |
| "step": 4055, |
| "valid_targets_mean": 2563.8, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 6.580226904376013, |
| "grad_norm": 0.8827517020820953, |
| "learning_rate": 4.399654882597726e-07, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09797355532646179, |
| "step": 4060, |
| "valid_targets_mean": 1908.7, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 6.588330632090762, |
| "grad_norm": 0.5796761962828608, |
| "learning_rate": 4.232658173076232e-07, |
| "loss": 0.1306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08027474582195282, |
| "step": 4065, |
| "valid_targets_mean": 4144.1, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 6.59643435980551, |
| "grad_norm": 1.0909407783873655, |
| "learning_rate": 4.068858520159724e-07, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11777451634407043, |
| "step": 4070, |
| "valid_targets_mean": 2117.9, |
| "valid_targets_min": 292 |
| }, |
| { |
| "epoch": 6.604538087520259, |
| "grad_norm": 0.6833254490640153, |
| "learning_rate": 3.9082585988437617e-07, |
| "loss": 0.1341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1639232188463211, |
| "step": 4075, |
| "valid_targets_mean": 3476.4, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 6.612641815235008, |
| "grad_norm": 0.9742355762056493, |
| "learning_rate": 3.7508610318693684e-07, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1798877716064453, |
| "step": 4080, |
| "valid_targets_mean": 2434.2, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 6.620745542949757, |
| "grad_norm": 0.7781187724054021, |
| "learning_rate": 3.596668389680247e-07, |
| "loss": 0.1188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09959834814071655, |
| "step": 4085, |
| "valid_targets_mean": 2723.8, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 6.628849270664506, |
| "grad_norm": 0.8466343867882937, |
| "learning_rate": 3.445683190380833e-07, |
| "loss": 0.1141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08893650770187378, |
| "step": 4090, |
| "valid_targets_mean": 1926.0, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 6.636952998379255, |
| "grad_norm": 0.7908915562547193, |
| "learning_rate": 3.297907899695019e-07, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09306427836418152, |
| "step": 4095, |
| "valid_targets_mean": 2579.3, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 6.645056726094003, |
| "grad_norm": 0.6540049138105144, |
| "learning_rate": 3.1533449309262056e-07, |
| "loss": 0.1347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12161879241466522, |
| "step": 4100, |
| "valid_targets_mean": 3311.7, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 6.653160453808752, |
| "grad_norm": 0.8462221047782975, |
| "learning_rate": 3.0119966449174474e-07, |
| "loss": 0.1398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0935630202293396, |
| "step": 4105, |
| "valid_targets_mean": 1882.8, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 6.661264181523501, |
| "grad_norm": 0.81490063291204, |
| "learning_rate": 2.8738653500133494e-07, |
| "loss": 0.1271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10476881265640259, |
| "step": 4110, |
| "valid_targets_mean": 2528.9, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 6.669367909238249, |
| "grad_norm": 0.6366928478749754, |
| "learning_rate": 2.738953302022096e-07, |
| "loss": 0.1103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08438228070735931, |
| "step": 4115, |
| "valid_targets_mean": 3672.2, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 6.6774716369529985, |
| "grad_norm": 0.5680139767437395, |
| "learning_rate": 2.6072627041785925e-07, |
| "loss": 0.1178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05923807621002197, |
| "step": 4120, |
| "valid_targets_mean": 3334.2, |
| "valid_targets_min": 913 |
| }, |
| { |
| "epoch": 6.685575364667747, |
| "grad_norm": 3.566418268679015, |
| "learning_rate": 2.478795707108672e-07, |
| "loss": 0.1124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0984240397810936, |
| "step": 4125, |
| "valid_targets_mean": 3397.5, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 6.693679092382496, |
| "grad_norm": 0.8102395858284243, |
| "learning_rate": 2.3535544087938345e-07, |
| "loss": 0.15, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1713753342628479, |
| "step": 4130, |
| "valid_targets_mean": 2797.9, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 6.701782820097245, |
| "grad_norm": 0.9439721686588282, |
| "learning_rate": 2.2315408545370288e-07, |
| "loss": 0.1177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15056179463863373, |
| "step": 4135, |
| "valid_targets_mean": 2218.5, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 6.709886547811994, |
| "grad_norm": 0.9719771412362007, |
| "learning_rate": 2.1127570369292361e-07, |
| "loss": 0.1266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1161581426858902, |
| "step": 4140, |
| "valid_targets_mean": 2372.7, |
| "valid_targets_min": 560 |
| }, |
| { |
| "epoch": 6.717990275526742, |
| "grad_norm": 0.7885505138738974, |
| "learning_rate": 1.9972048958168954e-07, |
| "loss": 0.1297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08716851472854614, |
| "step": 4145, |
| "valid_targets_mean": 2679.0, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 6.726094003241491, |
| "grad_norm": 0.7564261208584763, |
| "learning_rate": 1.8848863182703513e-07, |
| "loss": 0.1293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14512531459331512, |
| "step": 4150, |
| "valid_targets_mean": 3178.8, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 6.7341977309562395, |
| "grad_norm": 0.8230943188429811, |
| "learning_rate": 1.7758031385528784e-07, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19820144772529602, |
| "step": 4155, |
| "valid_targets_mean": 2705.9, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 6.742301458670989, |
| "grad_norm": 0.7304895753350193, |
| "learning_rate": 1.6699571380908385e-07, |
| "loss": 0.1375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1148165911436081, |
| "step": 4160, |
| "valid_targets_mean": 2799.2, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 6.750405186385738, |
| "grad_norm": 0.8783884446179141, |
| "learning_rate": 1.5673500454445046e-07, |
| "loss": 0.1137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1160724088549614, |
| "step": 4165, |
| "valid_targets_mean": 1911.4, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 6.758508914100486, |
| "grad_norm": 0.8452843386698703, |
| "learning_rate": 1.4679835362799266e-07, |
| "loss": 0.1405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17844310402870178, |
| "step": 4170, |
| "valid_targets_mean": 2903.6, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 6.766612641815235, |
| "grad_norm": 0.9641957278215031, |
| "learning_rate": 1.3718592333414881e-07, |
| "loss": 0.1378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1178508773446083, |
| "step": 4175, |
| "valid_targets_mean": 1679.4, |
| "valid_targets_min": 456 |
| }, |
| { |
| "epoch": 6.774716369529984, |
| "grad_norm": 0.6732633682506574, |
| "learning_rate": 1.2789787064253934e-07, |
| "loss": 0.1513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12225890159606934, |
| "step": 4180, |
| "valid_targets_mean": 3461.0, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 6.782820097244732, |
| "grad_norm": 0.9548675664452392, |
| "learning_rate": 1.1893434723541542e-07, |
| "loss": 0.1272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12099964916706085, |
| "step": 4185, |
| "valid_targets_mean": 1765.4, |
| "valid_targets_min": 348 |
| }, |
| { |
| "epoch": 6.790923824959481, |
| "grad_norm": 0.7229822657096528, |
| "learning_rate": 1.1029549949516549e-07, |
| "loss": 0.1312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16705356538295746, |
| "step": 4190, |
| "valid_targets_mean": 4125.2, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 6.7990275526742305, |
| "grad_norm": 1.0053755294682665, |
| "learning_rate": 1.0198146850193935e-07, |
| "loss": 0.1376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10085690766572952, |
| "step": 4195, |
| "valid_targets_mean": 1957.5, |
| "valid_targets_min": 464 |
| }, |
| { |
| "epoch": 6.807131280388979, |
| "grad_norm": 1.335653057078746, |
| "learning_rate": 9.399239003132999e-08, |
| "loss": 0.138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09673996269702911, |
| "step": 4200, |
| "valid_targets_mean": 1523.4, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 6.815235008103728, |
| "grad_norm": 0.8800015171398834, |
| "learning_rate": 8.632839455216869e-08, |
| "loss": 0.1388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11644886434078217, |
| "step": 4205, |
| "valid_targets_mean": 2234.9, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 6.823338735818476, |
| "grad_norm": 0.782216107013055, |
| "learning_rate": 7.89896072243912e-08, |
| "loss": 0.1221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10838295519351959, |
| "step": 4210, |
| "valid_targets_mean": 2606.8, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 6.831442463533225, |
| "grad_norm": 0.7331468581917359, |
| "learning_rate": 7.197614789698604e-08, |
| "loss": 0.1571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27159422636032104, |
| "step": 4215, |
| "valid_targets_mean": 4613.2, |
| "valid_targets_min": 1164 |
| }, |
| { |
| "epoch": 6.839546191247974, |
| "grad_norm": 0.7847565716440916, |
| "learning_rate": 6.528813110604714e-08, |
| "loss": 0.1195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10585910081863403, |
| "step": 4220, |
| "valid_targets_mean": 2765.0, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 6.847649918962723, |
| "grad_norm": 0.8253246012683277, |
| "learning_rate": 5.8925666072899845e-08, |
| "loss": 0.1249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14212317764759064, |
| "step": 4225, |
| "valid_targets_mean": 2604.4, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 6.855753646677472, |
| "grad_norm": 0.798983689706256, |
| "learning_rate": 5.288885670231336e-08, |
| "loss": 0.1315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10902281105518341, |
| "step": 4230, |
| "valid_targets_mean": 2613.6, |
| "valid_targets_min": 461 |
| }, |
| { |
| "epoch": 6.863857374392221, |
| "grad_norm": 0.8467915925619014, |
| "learning_rate": 4.717780158080887e-08, |
| "loss": 0.1119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1464867889881134, |
| "step": 4235, |
| "valid_targets_mean": 2088.5, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 6.871961102106969, |
| "grad_norm": 1.0029490169977413, |
| "learning_rate": 4.1792593975049644e-08, |
| "loss": 0.1264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12026522308588028, |
| "step": 4240, |
| "valid_targets_mean": 1802.7, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 6.880064829821718, |
| "grad_norm": 0.9011238391462046, |
| "learning_rate": 3.6733321830315636e-08, |
| "loss": 0.1337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11811887472867966, |
| "step": 4245, |
| "valid_targets_mean": 2323.1, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 6.888168557536467, |
| "grad_norm": 0.7165823854167281, |
| "learning_rate": 3.200006776906461e-08, |
| "loss": 0.1129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09492816030979156, |
| "step": 4250, |
| "valid_targets_mean": 2960.4, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 6.896272285251215, |
| "grad_norm": 0.9450518017052805, |
| "learning_rate": 2.7592909089593224e-08, |
| "loss": 0.1455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14789974689483643, |
| "step": 4255, |
| "valid_targets_mean": 2218.0, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 6.904376012965964, |
| "grad_norm": 0.7311474778057845, |
| "learning_rate": 2.351191776475581e-08, |
| "loss": 0.1319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1463954895734787, |
| "step": 4260, |
| "valid_targets_mean": 3855.9, |
| "valid_targets_min": 1393 |
| }, |
| { |
| "epoch": 6.9124797406807135, |
| "grad_norm": 0.6301982317715115, |
| "learning_rate": 1.9757160440814217e-08, |
| "loss": 0.1343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10000479966402054, |
| "step": 4265, |
| "valid_targets_mean": 3855.6, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 6.920583468395462, |
| "grad_norm": 0.9798344906644698, |
| "learning_rate": 1.6328698436327562e-08, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16356664896011353, |
| "step": 4270, |
| "valid_targets_mean": 2240.9, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 6.928687196110211, |
| "grad_norm": 0.8892538533790851, |
| "learning_rate": 1.3226587741159702e-08, |
| "loss": 0.1134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13213740289211273, |
| "step": 4275, |
| "valid_targets_mean": 2755.2, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 6.93679092382496, |
| "grad_norm": 0.8637275559260358, |
| "learning_rate": 1.0450879015566629e-08, |
| "loss": 0.1239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10389816761016846, |
| "step": 4280, |
| "valid_targets_mean": 2268.2, |
| "valid_targets_min": 302 |
| }, |
| { |
| "epoch": 6.944894651539708, |
| "grad_norm": 0.7857182787493622, |
| "learning_rate": 8.001617589368238e-09, |
| "loss": 0.1201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09846210479736328, |
| "step": 4285, |
| "valid_targets_mean": 2556.7, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 6.952998379254457, |
| "grad_norm": 0.5942319504605537, |
| "learning_rate": 5.878843461200046e-09, |
| "loss": 0.122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08767960220575333, |
| "step": 4290, |
| "valid_targets_mean": 4519.6, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 6.961102106969205, |
| "grad_norm": 0.8250059679447841, |
| "learning_rate": 4.082591297873695e-09, |
| "loss": 0.155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17609858512878418, |
| "step": 4295, |
| "valid_targets_mean": 3104.8, |
| "valid_targets_min": 398 |
| }, |
| { |
| "epoch": 6.9692058346839545, |
| "grad_norm": 0.7499567331158492, |
| "learning_rate": 2.6128904338018624e-09, |
| "loss": 0.1151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08152391016483307, |
| "step": 4300, |
| "valid_targets_mean": 2886.6, |
| "valid_targets_min": 342 |
| }, |
| { |
| "epoch": 6.977309562398704, |
| "grad_norm": 0.9718691223278781, |
| "learning_rate": 1.4697648705186417e-09, |
| "loss": 0.1302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15906545519828796, |
| "step": 4305, |
| "valid_targets_mean": 2148.2, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 6.985413290113452, |
| "grad_norm": 0.7283394841772546, |
| "learning_rate": 6.532332762931859e-10, |
| "loss": 0.0901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12135720252990723, |
| "step": 4310, |
| "valid_targets_mean": 3223.2, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 6.993517017828201, |
| "grad_norm": 0.7328657780903466, |
| "learning_rate": 1.6330898581884414e-10, |
| "loss": 0.1321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09660885483026505, |
| "step": 4315, |
| "valid_targets_mean": 2950.4, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20906896889209747, |
| "step": 4319, |
| "total_flos": 702151473364992.0, |
| "train_loss": 0.11156423039722288, |
| "train_runtime": 12711.7053, |
| "train_samples_per_second": 5.432, |
| "train_steps_per_second": 0.34, |
| "valid_targets_mean": 3750.0, |
| "valid_targets_min": 750 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4319, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 702151473364992.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|