llm-sort / training_history.json
gatmiry's picture
Upload folder using huggingface_hub
c7f1373 verified
[
{
"iter": 1000,
"lr": 0.02999995260854827,
"loss": 0.005900065414607525,
"test_loss": 0.008110598661005497
},
{
"iter": 2000,
"lr": 0.02999976008128888,
"loss": 0.0037083972711116076,
"test_loss": 0.0017547315219417214
},
{
"iter": 3000,
"lr": 0.029999419458155555,
"loss": 0.0018333976622670889,
"test_loss": 0.0035039177164435387
},
{
"iter": 4000,
"lr": 0.029998930742511455,
"loss": 0.002187943086028099,
"test_loss": 0.003171480493620038
},
{
"iter": 5000,
"lr": 0.029998293939181936,
"loss": 0.000614767603110522,
"test_loss": 0.0010897500906139612
},
{
"iter": 6000,
"lr": 0.029997509054454502,
"loss": 0.0022282572463154793,
"test_loss": 0.000761986942961812
},
{
"iter": 7000,
"lr": 0.029996576096078753,
"loss": 0.0030392277985811234,
"test_loss": 0.005726512987166643
},
{
"iter": 8000,
"lr": 0.029995495073266293,
"loss": 0.0009557040757499635,
"test_loss": 0.0031210174784064293
},
{
"iter": 9000,
"lr": 0.02999426599669065,
"loss": 0.002027565846219659,
"test_loss": 0.0001318393333349377
},
{
"iter": 10000,
"lr": 0.029992888878487164,
"loss": 0.0020335630979388952,
"test_loss": 0.0011286439839750528
},
{
"iter": 11000,
"lr": 0.029991363732252883,
"loss": 0.0002862904220819473,
"test_loss": 0.0025837209541350603
},
{
"iter": 12000,
"lr": 0.029989690573046394,
"loss": 0.005489793140441179,
"test_loss": 0.004253063350915909
},
{
"iter": 13000,
"lr": 0.029987869417387722,
"loss": 0.00044908569543622434,
"test_loss": 0.001501839724369347
},
{
"iter": 14000,
"lr": 0.029985900283258128,
"loss": 0.002667603548616171,
"test_loss": 0.0018379520624876022
},
{
"iter": 15000,
"lr": 0.029983783190099943,
"loss": 0.0006638114573433995,
"test_loss": 0.00048749358393251896
},
{
"iter": 16000,
"lr": 0.02998151815881638,
"loss": 0.0010706594912335277,
"test_loss": 0.0002588446077425033
},
{
"iter": 17000,
"lr": 0.029979105211771336,
"loss": 0.0016598147340118885,
"test_loss": 0.00021189564722590148
},
{
"iter": 18000,
"lr": 0.029976544372789148,
"loss": 0.00015606710803695023,
"test_loss": 0.0004901384236291051
},
{
"iter": 19000,
"lr": 0.029973835667154378,
"loss": 0.0004137195064686239,
"test_loss": 5.3709234634879977e-05
},
{
"iter": 20000,
"lr": 0.029970979121611546,
"loss": 0.00015013388474471867,
"test_loss": 4.361213359516114e-05
},
{
"iter": 21000,
"lr": 0.029967974764364896,
"loss": 0.0019828234799206257,
"test_loss": 0.0006869188509881496
},
{
"iter": 22000,
"lr": 0.02996482262507808,
"loss": 0.0009633651934564114,
"test_loss": 0.002071307972073555
},
{
"iter": 23000,
"lr": 0.029961522734873885,
"loss": 0.0008989389170892537,
"test_loss": 0.001555844908580184
},
{
"iter": 24000,
"lr": 0.02995807512633393,
"loss": 0.0013871460687369108,
"test_loss": 0.0007349022198468447
},
{
"iter": 25000,
"lr": 0.029954479833498335,
"loss": 0.0004608951276168227,
"test_loss": 0.0004932876327075064
},
{
"iter": 26000,
"lr": 0.02995073689186538,
"loss": 0.0007279432029463351,
"test_loss": 0.00011546596942935139
},
{
"iter": 27000,
"lr": 0.02994684633839118,
"loss": 0.0003217199118807912,
"test_loss": 0.0007169806049205363
},
{
"iter": 28000,
"lr": 0.02994280821148928,
"loss": 0.0002881638938561082,
"test_loss": 2.532686630729586e-05
},
{
"iter": 29000,
"lr": 0.029938622551030317,
"loss": 0.00018042103329207748,
"test_loss": 0.0010614339262247086
},
{
"iter": 30000,
"lr": 0.029934289398341588,
"loss": 0.0011770232813432813,
"test_loss": 0.001257568597793579
},
{
"iter": 31000,
"lr": 0.02992980879620669,
"loss": 0.0002549682976678014,
"test_loss": 6.940988532733172e-05
},
{
"iter": 32000,
"lr": 0.029925180788865035,
"loss": 0.00355816213414073,
"test_loss": 0.0006839775014668703
},
{
"iter": 33000,
"lr": 0.02992040542201147,
"loss": 0.0009913304820656776,
"test_loss": 0.0010673595825210214
},
{
"iter": 34000,
"lr": 0.0299154827427958,
"loss": 0.0002624760090839118,
"test_loss": 2.292902354383841e-05
},
{
"iter": 35000,
"lr": 0.02991041279982231,
"loss": 0.00016965818940661848,
"test_loss": 0.0015826878370717168
},
{
"iter": 36000,
"lr": 0.029905195643149318,
"loss": 0.003708045929670334,
"test_loss": 0.003369540674611926
},
{
"iter": 37000,
"lr": 0.02989983132428866,
"loss": 0.006338479928672314,
"test_loss": 0.0018295375630259514
},
{
"iter": 38000,
"lr": 0.029894319896205182,
"loss": 0.0008441746467724442,
"test_loss": 0.001544564263895154
},
{
"iter": 39000,
"lr": 0.02988866141331621,
"loss": 0.0001859079347923398,
"test_loss": 5.146275361767039e-05
},
{
"iter": 40000,
"lr": 0.02988285593149104,
"loss": 0.003105625044554472,
"test_loss": 0.0007138763321563601
},
{
"iter": 41000,
"lr": 0.029876903508050355,
"loss": 3.819684206973761e-05,
"test_loss": 1.5355977666331455e-05
},
{
"iter": 42000,
"lr": 0.029870804201765678,
"loss": 0.0006075446726754308,
"test_loss": 8.39575586724095e-05
},
{
"iter": 43000,
"lr": 0.029864558072858784,
"loss": 0.0001545970735605806,
"test_loss": 0.000391665002098307
},
{
"iter": 44000,
"lr": 0.029858165183001113,
"loss": 0.0005413244944065809,
"test_loss": 1.7497819499112666e-05
},
{
"iter": 45000,
"lr": 0.029851625595313156,
"loss": 0.0013656863011419773,
"test_loss": 0.00021639352780766785
},
{
"iter": 46000,
"lr": 0.029844939374363822,
"loss": 0.0006423690356314182,
"test_loss": 0.0015119562158361077
},
{
"iter": 47000,
"lr": 0.029838106586169817,
"loss": 0.00030507222982123494,
"test_loss": 0.0003638866764958948
},
{
"iter": 48000,
"lr": 0.02983112729819499,
"loss": 0.0001789523521438241,
"test_loss": 4.8229154344880953e-05
},
{
"iter": 49000,
"lr": 0.029824001579349654,
"loss": 0.00026359857292845845,
"test_loss": 0.002731637330725789
},
{
"iter": 50000,
"lr": 0.029816729499989914,
"loss": 4.367465589893982e-05,
"test_loss": 4.644911678042263e-05
},
{
"iter": 51000,
"lr": 0.029809311131916975,
"loss": 0.004326030611991882,
"test_loss": 0.0011909769382327795
},
{
"iter": 52000,
"lr": 0.029801746548376435,
"loss": 0.0014979676343500614,
"test_loss": 0.0027145135682076216
},
{
"iter": 53000,
"lr": 0.029794035824057548,
"loss": 0.0003500604652799666,
"test_loss": 0.000241837406065315
},
{
"iter": 54000,
"lr": 0.029786179035092505,
"loss": 8.903366688173264e-05,
"test_loss": 6.296028732322156e-05
},
{
"iter": 55000,
"lr": 0.029778176259055662,
"loss": 0.0001017519534798339,
"test_loss": 0.001408581854775548
},
{
"iter": 56000,
"lr": 0.029770027574962794,
"loss": 8.221656025853008e-05,
"test_loss": 0.00015615554002579302
},
{
"iter": 57000,
"lr": 0.0297617330632703,
"loss": 0.0019328156486153603,
"test_loss": 0.001631657825782895
},
{
"iter": 58000,
"lr": 0.029753292805874423,
"loss": 0.00024117162683978677,
"test_loss": 2.6498506485950202e-05
},
{
"iter": 59000,
"lr": 0.02974470688611042,
"loss": 0.0005084581789560616,
"test_loss": 0.0016478949692100286
},
{
"iter": 60000,
"lr": 0.02973597538875176,
"loss": 0.0010710344649851322,
"test_loss": 0.000751753686927259
},
{
"iter": 61000,
"lr": 0.029727098400009283,
"loss": 0.0010715620592236519,
"test_loss": 9.92331206361996e-06
},
{
"iter": 62000,
"lr": 0.029718076007530334,
"loss": 8.981147402664647e-05,
"test_loss": 0.0021601326297968626
},
{
"iter": 63000,
"lr": 0.029708908300397914,
"loss": 0.0003549798857420683,
"test_loss": 0.0003031898522749543
},
{
"iter": 64000,
"lr": 0.029699595369129795,
"loss": 0.0012836523819714785,
"test_loss": 0.0011360461357980967
},
{
"iter": 65000,
"lr": 0.02969013730567763,
"loss": 0.00018293611356057227,
"test_loss": 0.00030903745209798217
},
{
"iter": 66000,
"lr": 0.02968053420342603,
"loss": 0.0007299676071852446,
"test_loss": 2.3418193450197577e-05
},
{
"iter": 67000,
"lr": 0.029670786157191674,
"loss": 0.00037448544753715396,
"test_loss": 0.0001091007434297353
},
{
"iter": 68000,
"lr": 0.029660893263222316,
"loss": 0.003656078362837434,
"test_loss": 0.00020010056323371828
},
{
"iter": 69000,
"lr": 0.029650855619195914,
"loss": 0.0010504031088203192,
"test_loss": 0.00024744667462073267
},
{
"iter": 70000,
"lr": 0.029640673324219588,
"loss": 0.001332410261966288,
"test_loss": 0.0008789754938334227
},
{
"iter": 71000,
"lr": 0.02963034647882869,
"loss": 1.1792585610237438e-05,
"test_loss": 2.303485234733671e-05
},
{
"iter": 72000,
"lr": 0.0296198751849858,
"loss": 0.002845509210601449,
"test_loss": 0.0008803476230241358
},
{
"iter": 73000,
"lr": 0.029609259546079715,
"loss": 0.0005771153955720365,
"test_loss": 0.0002461008552927524
},
{
"iter": 74000,
"lr": 0.02959849966692442,
"loss": 0.00034079549368470907,
"test_loss": 0.00013242995191831142
},
{
"iter": 75000,
"lr": 0.02958759565375807,
"loss": 5.4725380323361605e-05,
"test_loss": 3.366063901921734e-05
},
{
"iter": 76000,
"lr": 0.02957654761424194,
"loss": 0.0009836836252361536,
"test_loss": 0.0005578318377956748
},
{
"iter": 77000,
"lr": 0.02956535565745934,
"loss": 0.00022700421686749905,
"test_loss": 0.0016809571534395218
},
{
"iter": 78000,
"lr": 0.02955401989391456,
"loss": 9.005140782392118e-06,
"test_loss": 0.0001240746641997248
},
{
"iter": 79000,
"lr": 0.02954254043553179,
"loss": 0.00356005085632205,
"test_loss": 0.021294262260198593
},
{
"iter": 80000,
"lr": 0.029530917395653965,
"loss": 0.0020755967125296593,
"test_loss": 0.0011172222439199686
},
{
"iter": 81000,
"lr": 0.02951915088904171,
"loss": 0.00047674868255853653,
"test_loss": 0.00018403143621981144
},
{
"iter": 82000,
"lr": 0.02950724103187215,
"loss": 0.0009484861511737108,
"test_loss": 0.00034782756119966507
},
{
"iter": 83000,
"lr": 0.02949518794173781,
"loss": 0.0010415322612971067,
"test_loss": 2.6095975044881925e-05
},
{
"iter": 84000,
"lr": 0.02948299173764541,
"loss": 0.0019430904649198055,
"test_loss": 0.0018973937258124352
},
{
"iter": 85000,
"lr": 0.02947065254001473,
"loss": 0.00043586594983935356,
"test_loss": 3.3344509574817494e-05
},
{
"iter": 86000,
"lr": 0.0294581704706774,
"loss": 0.0026760578621178865,
"test_loss": 0.00023115577641874552
},
{
"iter": 87000,
"lr": 0.029445545652875695,
"loss": 0.0005670686950907111,
"test_loss": 0.001024324563331902
},
{
"iter": 88000,
"lr": 0.029432778211261317,
"loss": 0.0022992314770817757,
"test_loss": 0.0014907981967553496
},
{
"iter": 89000,
"lr": 0.02941986827189419,
"loss": 0.0003089222591370344,
"test_loss": 0.0017780089983716607
},
{
"iter": 90000,
"lr": 0.02940681596224118,
"loss": 0.0008599871071055532,
"test_loss": 0.0021578308660537004
},
{
"iter": 91000,
"lr": 0.029393621411174853,
"loss": 0.0028714954387396574,
"test_loss": 0.0016358887078240514
},
{
"iter": 92000,
"lr": 0.02938028474897222,
"loss": 0.00036192702827975154,
"test_loss": 0.00017050963651854545
},
{
"iter": 93000,
"lr": 0.029366806107313414,
"loss": 0.0012631320860236883,
"test_loss": 2.577611849119421e-05
},
{
"iter": 94000,
"lr": 0.029353185619280405,
"loss": 0.004303206689655781,
"test_loss": 0.003471080679446459
},
{
"iter": 95000,
"lr": 0.029339423419355713,
"loss": 2.8697912057396024e-05,
"test_loss": 0.0004158954252488911
},
{
"iter": 96000,
"lr": 0.02932551964342103,
"loss": 0.0001660243869991973,
"test_loss": 5.906213482376188e-05
},
{
"iter": 97000,
"lr": 0.029311474428755924,
"loss": 0.0017301312182098627,
"test_loss": 0.0026456094346940517
},
{
"iter": 98000,
"lr": 0.02929728791403646,
"loss": 0.0009389626211486757,
"test_loss": 0.0030357050709426403
},
{
"iter": 99000,
"lr": 0.029282960239333824,
"loss": 0.0008112811483442783,
"test_loss": 0.0004201643751002848
},
{
"iter": 100000,
"lr": 0.02926849154611297,
"loss": 4.2298794141970575e-05,
"test_loss": 0.0001234379888046533
},
{
"iter": 101000,
"lr": 0.0292538819772312,
"loss": 0.0009970646351575851,
"test_loss": 0.0004125392879359424
},
{
"iter": 102000,
"lr": 0.02923913167693674,
"loss": 7.432238635374233e-05,
"test_loss": 0.00012762525875587016
},
{
"iter": 103000,
"lr": 0.029224240790867363,
"loss": 0.0014614630490541458,
"test_loss": 0.003949446603655815
},
{
"iter": 104000,
"lr": 0.0292092094660489,
"loss": 0.00012159409379819408,
"test_loss": 0.00012510902888607234
},
{
"iter": 105000,
"lr": 0.029194037850893816,
"loss": 0.0011255019344389439,
"test_loss": 0.00042938615661114454
},
{
"iter": 106000,
"lr": 0.029178726095199746,
"loss": 0.00037009609513916075,
"test_loss": 0.006013224832713604
},
{
"iter": 107000,
"lr": 0.029163274350147997,
"loss": 0.0009672853047959507,
"test_loss": 0.0006766193546354771
},
{
"iter": 108000,
"lr": 0.029147682768302076,
"loss": 0.004114079289138317,
"test_loss": 0.010924482718110085
},
{
"iter": 109000,
"lr": 0.02913195150360618,
"loss": 0.006451473571360111,
"test_loss": 0.012044638395309448
},
{
"iter": 110000,
"lr": 0.029116080711383652,
"loss": 0.0031763166189193726,
"test_loss": 0.0016330855432897806
},
{
"iter": 111000,
"lr": 0.029100070548335483,
"loss": 0.005331407301127911,
"test_loss": 0.004954859614372253
},
{
"iter": 112000,
"lr": 0.02908392117253875,
"loss": 0.0011283056810498238,
"test_loss": 0.00014881588867865503
},
{
"iter": 113000,
"lr": 0.029067632743445034,
"loss": 0.002038228325545788,
"test_loss": 0.00265526887960732
},
{
"iter": 114000,
"lr": 0.029051205421878886,
"loss": 0.003950613550841808,
"test_loss": 0.0003795516095124185
},
{
"iter": 115000,
"lr": 0.029034639370036208,
"loss": 0.0012936361599713564,
"test_loss": 0.0015910060610622168
},
{
"iter": 116000,
"lr": 0.029017934751482663,
"loss": 0.008529255166649818,
"test_loss": 0.008688698522746563
},
{
"iter": 117000,
"lr": 0.02900109173115206,
"loss": 0.0012397072277963161,
"test_loss": 0.0006463420577347279
},
{
"iter": 118000,
"lr": 0.02898411047534472,
"loss": 0.038918688893318176,
"test_loss": 0.05722200497984886
},
{
"iter": 119000,
"lr": 0.028966991151725845,
"loss": 0.006451927591115236,
"test_loss": 0.007227016147226095
},
{
"iter": 120000,
"lr": 0.02894973392932385,
"loss": 0.003611186519265175,
"test_loss": 0.0008724697981961071
},
{
"iter": 121000,
"lr": 0.028932338978528704,
"loss": 0.005443987902253866,
"test_loss": 0.005751044023782015
},
{
"iter": 122000,
"lr": 0.028914806471090237,
"loss": 0.010784897021949291,
"test_loss": 0.008434824645519257
},
{
"iter": 123000,
"lr": 0.028897136580116466,
"loss": 0.05031467229127884,
"test_loss": 0.04758216440677643
},
{
"iter": 124000,
"lr": 0.028879329480071853,
"loss": 0.005141451954841614,
"test_loss": 0.0022348552010953426
},
{
"iter": 125000,
"lr": 0.028861385346775605,
"loss": 0.008585900068283081,
"test_loss": 0.011862917803227901
},
{
"iter": 126000,
"lr": 0.028843304357399936,
"loss": 0.02390182763338089,
"test_loss": 0.017609553411602974
},
{
"iter": 127000,
"lr": 0.028825086690468318,
"loss": 0.0156545452773571,
"test_loss": 0.010482419282197952
},
{
"iter": 128000,
"lr": 0.02880673252585371,
"loss": 0.029937002807855606,
"test_loss": 0.035524651408195496
},
{
"iter": 129000,
"lr": 0.02878824204477678,
"loss": 0.013299585320055485,
"test_loss": 0.005939376074820757
},
{
"iter": 130000,
"lr": 0.028769615429804146,
"loss": 0.011156000196933746,
"test_loss": 0.017653973773121834
},
{
"iter": 131000,
"lr": 0.028750852864846518,
"loss": 0.006514297798275948,
"test_loss": 0.008974754251539707
},
{
"iter": 132000,
"lr": 0.02873195453515694,
"loss": 0.02357827126979828,
"test_loss": 0.026947323232889175
},
{
"iter": 133000,
"lr": 0.028712920627328924,
"loss": 0.0075813643634319305,
"test_loss": 0.006107478868216276
},
{
"iter": 134000,
"lr": 0.028693751329294623,
"loss": 0.016182970255613327,
"test_loss": 0.013855169527232647
},
{
"iter": 135000,
"lr": 0.028674446830322966,
"loss": 0.01896003633737564,
"test_loss": 0.021220946684479713
},
{
"iter": 136000,
"lr": 0.028655007321017806,
"loss": 0.020756855607032776,
"test_loss": 0.013010598719120026
},
{
"iter": 137000,
"lr": 0.02863543299331601,
"loss": 0.019164541736245155,
"test_loss": 0.017986319959163666
},
{
"iter": 138000,
"lr": 0.028615724040485593,
"loss": 0.008877967484295368,
"test_loss": 0.02549726888537407
},
{
"iter": 139000,
"lr": 0.028595880657123793,
"loss": 0.0042451415210962296,
"test_loss": 0.003108325647190213
},
{
"iter": 140000,
"lr": 0.02857590303915516,
"loss": 0.016433309763669968,
"test_loss": 0.009964171797037125
},
{
"iter": 141000,
"lr": 0.0285557913838296,
"loss": 0.0028391436208039522,
"test_loss": 0.006361861247569323
},
{
"iter": 142000,
"lr": 0.028535545889720463,
"loss": 0.0048980629071593285,
"test_loss": 0.0037613483145833015
},
{
"iter": 143000,
"lr": 0.028515166756722547,
"loss": 0.011203103698790073,
"test_loss": 0.007850386202335358
},
{
"iter": 144000,
"lr": 0.028494654186050142,
"loss": 0.003986678086221218,
"test_loss": 0.005661428906023502
},
{
"iter": 145000,
"lr": 0.02847400838023505,
"loss": 0.015594959259033203,
"test_loss": 0.009820223785936832
},
{
"iter": 146000,
"lr": 0.028453229543124563,
"loss": 0.006637849844992161,
"test_loss": 0.00879084412008524
},
{
"iter": 147000,
"lr": 0.028432317879879477,
"loss": 0.012278251349925995,
"test_loss": 0.009384680539369583
},
{
"iter": 148000,
"lr": 0.02841127359697205,
"loss": 0.029495524242520332,
"test_loss": 0.03286384791135788
},
{
"iter": 149000,
"lr": 0.02839009690218395,
"loss": 0.0020807762630283833,
"test_loss": 0.004195379093289375
},
{
"iter": 150000,
"lr": 0.02836878800460424,
"loss": 0.0026313485577702522,
"test_loss": 0.00771433487534523
},
{
"iter": 151000,
"lr": 0.02834734711462729,
"loss": 0.003208052832633257,
"test_loss": 0.002173841930925846
},
{
"iter": 152000,
"lr": 0.028325774443950683,
"loss": 0.004879931919276714,
"test_loss": 0.006381724961102009
},
{
"iter": 153000,
"lr": 0.028304070205573177,
"loss": 0.005067159421741962,
"test_loss": 0.0038414141163229942
},
{
"iter": 154000,
"lr": 0.02828223461379255,
"loss": 0.017109381034970284,
"test_loss": 0.0076220398768782616
},
{
"iter": 155000,
"lr": 0.0282602678842035,
"loss": 0.0049171606078743935,
"test_loss": 0.0031963633373379707
},
{
"iter": 156000,
"lr": 0.028238170233695535,
"loss": 0.003127795411273837,
"test_loss": 0.003430670592933893
},
{
"iter": 157000,
"lr": 0.028215941880450797,
"loss": 0.0034541976638138294,
"test_loss": 0.0032552520278841257
},
{
"iter": 158000,
"lr": 0.02819358304394195,
"loss": 0.0018731520976871252,
"test_loss": 0.00224409275688231
},
{
"iter": 159000,
"lr": 0.02817109394492997,
"loss": 0.007337294984608889,
"test_loss": 0.007232898846268654
},
{
"iter": 160000,
"lr": 0.028148474805462002,
"loss": 0.00681578554213047,
"test_loss": 0.004005147144198418
},
{
"iter": 161000,
"lr": 0.02812572584886914,
"loss": 0.028274931013584137,
"test_loss": 0.009157809428870678
},
{
"iter": 162000,
"lr": 0.028102847299764238,
"loss": 0.00524199428036809,
"test_loss": 0.003932656720280647
},
{
"iter": 163000,
"lr": 0.02807983938403969,
"loss": 0.003872151020914316,
"test_loss": 0.0028623794205486774
},
{
"iter": 164000,
"lr": 0.028056702328865195,
"loss": 0.001210351474583149,
"test_loss": 0.0008379850769415498
},
{
"iter": 165000,
"lr": 0.028033436362685512,
"loss": 0.002097975229844451,
"test_loss": 0.0027224509976804256
},
{
"iter": 166000,
"lr": 0.028010041715218214,
"loss": 0.005084976553916931,
"test_loss": 0.007190586067736149
},
{
"iter": 167000,
"lr": 0.027986518617451408,
"loss": 0.0023271595127880573,
"test_loss": 0.000907504465430975
},
{
"iter": 168000,
"lr": 0.02796286730164147,
"loss": 0.001695204759016633,
"test_loss": 0.002770280232653022
},
{
"iter": 169000,
"lr": 0.02793908800131074,
"loss": 0.0037577603943645954,
"test_loss": 0.008116018958389759
},
{
"iter": 170000,
"lr": 0.027915180951245212,
"loss": 0.0016152429161593318,
"test_loss": 0.00045253714779391885
},
{
"iter": 171000,
"lr": 0.027891146387492235,
"loss": 0.0016916058957576752,
"test_loss": 0.0018121148459613323
},
{
"iter": 172000,
"lr": 0.027866984547358153,
"loss": 0.002640731167048216,
"test_loss": 0.0016402374021708965
},
{
"iter": 173000,
"lr": 0.027842695669405993,
"loss": 0.004582331050187349,
"test_loss": 0.003638762980699539
},
{
"iter": 174000,
"lr": 0.0278182799934531,
"loss": 0.0025481977500021458,
"test_loss": 0.0007963242242112756
},
{
"iter": 175000,
"lr": 0.02779373776056875,
"loss": 0.0014466342981904745,
"test_loss": 0.0008588299388065934
},
{
"iter": 176000,
"lr": 0.027769069213071783,
"loss": 0.002241849899291992,
"test_loss": 0.0015434545930474997
},
{
"iter": 177000,
"lr": 0.027744274594528235,
"loss": 0.0038108571898192167,
"test_loss": 0.0035817385651171207
},
{
"iter": 178000,
"lr": 0.02771935414974889,
"loss": 0.0029787179082632065,
"test_loss": 0.001269749365746975
},
{
"iter": 179000,
"lr": 0.027694308124786883,
"loss": 0.0016144576948136091,
"test_loss": 0.002594810212031007
},
{
"iter": 180000,
"lr": 0.027669136766935283,
"loss": 0.01568378321826458,
"test_loss": 0.011610452085733414
},
{
"iter": 181000,
"lr": 0.027643840324724632,
"loss": 0.004004272632300854,
"test_loss": 0.003277471289038658
},
{
"iter": 182000,
"lr": 0.027618419047920492,
"loss": 0.00180589419323951,
"test_loss": 0.0006558397435583174
},
{
"iter": 183000,
"lr": 0.027592873187521,
"loss": 0.0019884267821907997,
"test_loss": 0.0017487561563029885
},
{
"iter": 184000,
"lr": 0.027567202995754356,
"loss": 0.008319799788296223,
"test_loss": 0.015586787834763527
},
{
"iter": 185000,
"lr": 0.02754140872607637,
"loss": 0.0009156313026323915,
"test_loss": 0.0008562610018998384
},
{
"iter": 186000,
"lr": 0.027515490633167924,
"loss": 0.0006645068642683327,
"test_loss": 0.0002475435903761536
},
{
"iter": 187000,
"lr": 0.027489448972932495,
"loss": 0.003239435376599431,
"test_loss": 0.0030319164507091045
},
{
"iter": 188000,
"lr": 0.027463284002493583,
"loss": 0.002974236849695444,
"test_loss": 0.005696661304682493
},
{
"iter": 189000,
"lr": 0.027436995980192214,
"loss": 0.002773429499939084,
"test_loss": 0.004185836296528578
},
{
"iter": 190000,
"lr": 0.027410585165584367,
"loss": 0.0075587122701108456,
"test_loss": 0.006252805236726999
},
{
"iter": 191000,
"lr": 0.027384051819438416,
"loss": 0.008997881785035133,
"test_loss": 0.008614677004516125
},
{
"iter": 192000,
"lr": 0.027357396203732554,
"loss": 0.010975779965519905,
"test_loss": 0.019135724753141403
},
{
"iter": 193000,
"lr": 0.027330618581652213,
"loss": 0.010834279470145702,
"test_loss": 0.008247069083154202
},
{
"iter": 194000,
"lr": 0.02730371921758746,
"loss": 0.003223707899451256,
"test_loss": 0.00592515803873539
},
{
"iter": 195000,
"lr": 0.02727669837713038,
"loss": 0.006697945296764374,
"test_loss": 0.004159124568104744
},
{
"iter": 196000,
"lr": 0.027249556327072464,
"loss": 0.0010288299527019262,
"test_loss": 0.0017243127804249525
},
{
"iter": 197000,
"lr": 0.027222293335401982,
"loss": 0.0030477200634777546,
"test_loss": 0.0026654077228158712
},
{
"iter": 198000,
"lr": 0.02719490967130131,
"loss": 0.0032533612102270126,
"test_loss": 0.002175636123865843
},
{
"iter": 199000,
"lr": 0.027167405605144298,
"loss": 0.0037997192703187466,
"test_loss": 0.0012982346815988421
},
{
"iter": 200000,
"lr": 0.02713978140849359,
"loss": 0.0018231956055387855,
"test_loss": 0.0018179294420406222
},
{
"iter": 201000,
"lr": 0.027112037354097944,
"loss": 0.0016209282912313938,
"test_loss": 0.017513517290353775
},
{
"iter": 202000,
"lr": 0.02708417371588953,
"loss": 0.003704036818817258,
"test_loss": 0.00375428912229836
},
{
"iter": 203000,
"lr": 0.02705619076898125,
"loss": 0.013147672638297081,
"test_loss": 0.01016729325056076
},
{
"iter": 204000,
"lr": 0.027028088789663996,
"loss": 0.003172150580212474,
"test_loss": 0.0017637547571212053
},
{
"iter": 205000,
"lr": 0.026999868055403935,
"loss": 0.0029970044270157814,
"test_loss": 0.004906327463686466
},
{
"iter": 206000,
"lr": 0.02697152884483977,
"loss": 0.002943827770650387,
"test_loss": 0.003670147620141506
},
{
"iter": 207000,
"lr": 0.02694307143777997,
"loss": 0.005224711261689663,
"test_loss": 0.0037015387788414955
},
{
"iter": 208000,
"lr": 0.026914496115200037,
"loss": 0.0111452117562294,
"test_loss": 0.010410155169665813
},
{
"iter": 209000,
"lr": 0.02688580315923971,
"loss": 0.004208044148981571,
"test_loss": 0.003291388973593712
},
{
"iter": 210000,
"lr": 0.026856992853200198,
"loss": 0.0014585935277864337,
"test_loss": 0.0011729426914826035
},
{
"iter": 211000,
"lr": 0.02682806548154136,
"loss": 0.0013480978086590767,
"test_loss": 0.0032471115700900555
},
{
"iter": 212000,
"lr": 0.026799021329878905,
"loss": 0.012472687289118767,
"test_loss": 0.015618221834301949
},
{
"iter": 213000,
"lr": 0.02676986068498159,
"loss": 0.009718325920403004,
"test_loss": 0.010203873738646507
},
{
"iter": 214000,
"lr": 0.02674058383476835,
"loss": 0.0032009705901145935,
"test_loss": 0.004933621734380722
},
{
"iter": 215000,
"lr": 0.0267111910683055,
"loss": 0.007160776294767857,
"test_loss": 0.00994201935827732
},
{
"iter": 216000,
"lr": 0.026681682675803852,
"loss": 0.003271687775850296,
"test_loss": 0.004862448200583458
},
{
"iter": 217000,
"lr": 0.02665205894861586,
"loss": 0.003876295406371355,
"test_loss": 0.0014560327399522066
},
{
"iter": 218000,
"lr": 0.02662232017923272,
"loss": 0.009912321344017982,
"test_loss": 0.014334676787257195
},
{
"iter": 219000,
"lr": 0.02659246666128154,
"loss": 0.006082275882363319,
"test_loss": 0.0057898880913853645
},
{
"iter": 220000,
"lr": 0.026562498689522367,
"loss": 0.0020288927480578423,
"test_loss": 0.005537952296435833
},
{
"iter": 221000,
"lr": 0.026532416559845333,
"loss": 0.006171380169689655,
"test_loss": 0.008454486727714539
},
{
"iter": 222000,
"lr": 0.02650222056926771,
"loss": 0.002694549039006233,
"test_loss": 0.0015573103446513414
},
{
"iter": 223000,
"lr": 0.026471911015930976,
"loss": 0.0031362446025013924,
"test_loss": 0.0031584962271153927
},
{
"iter": 224000,
"lr": 0.026441488199097887,
"loss": 0.0038221648428589106,
"test_loss": 0.0031443117186427116
},
{
"iter": 225000,
"lr": 0.026410952419149487,
"loss": 0.004907033406198025,
"test_loss": 0.0032492754980921745
},
{
"iter": 226000,
"lr": 0.026380303977582193,
"loss": 0.0018036147812381387,
"test_loss": 0.003828649874776602
},
{
"iter": 227000,
"lr": 0.026349543177004785,
"loss": 0.001066069584339857,
"test_loss": 0.0014874342596158385
},
{
"iter": 228000,
"lr": 0.026318670321135412,
"loss": 0.0035194093361496925,
"test_loss": 0.003042072057723999
},
{
"iter": 229000,
"lr": 0.026287685714798618,
"loss": 0.009114778600633144,
"test_loss": 0.006110726855695248
},
{
"iter": 230000,
"lr": 0.026256589663922324,
"loss": 0.00380698312073946,
"test_loss": 0.011846048757433891
},
{
"iter": 231000,
"lr": 0.02622538247553479,
"loss": 0.0034530917182564735,
"test_loss": 0.002706685569137335
},
{
"iter": 232000,
"lr": 0.026194064457761606,
"loss": 0.005602722056210041,
"test_loss": 0.0059903510846197605
},
{
"iter": 233000,
"lr": 0.026162635919822635,
"loss": 0.009672198444604874,
"test_loss": 0.008974193595349789
},
{
"iter": 234000,
"lr": 0.02613109717202898,
"loss": 0.024900667369365692,
"test_loss": 0.02461247146129608
},
{
"iter": 235000,
"lr": 0.02609944852577989,
"loss": 0.009276055730879307,
"test_loss": 0.010469124652445316
},
{
"iter": 236000,
"lr": 0.026067690293559712,
"loss": 0.008351858705282211,
"test_loss": 0.00900268740952015
},
{
"iter": 237000,
"lr": 0.026035822788934782,
"loss": 0.005251324735581875,
"test_loss": 0.007232215721160173
},
{
"iter": 238000,
"lr": 0.026003846326550353,
"loss": 0.0036761255469173193,
"test_loss": 0.0038605486042797565
},
{
"iter": 239000,
"lr": 0.025971761222127483,
"loss": 0.0038110241293907166,
"test_loss": 0.003158943261951208
},
{
"iter": 240000,
"lr": 0.025939567792459896,
"loss": 0.003796353004872799,
"test_loss": 0.007506145630031824
},
{
"iter": 241000,
"lr": 0.025907266355410886,
"loss": 0.007820069789886475,
"test_loss": 0.011313961818814278
},
{
"iter": 242000,
"lr": 0.025874857229910144,
"loss": 0.009549151174724102,
"test_loss": 0.01569555141031742
},
{
"iter": 243000,
"lr": 0.02584234073595065,
"loss": 0.02349958010017872,
"test_loss": 0.0326787531375885
},
{
"iter": 244000,
"lr": 0.02580971719458547,
"loss": 0.011202016845345497,
"test_loss": 0.011364019475877285
},
{
"iter": 245000,
"lr": 0.025776986927924624,
"loss": 0.007761344313621521,
"test_loss": 0.003998031839728355
},
{
"iter": 246000,
"lr": 0.025744150259131883,
"loss": 0.008733600378036499,
"test_loss": 0.003168123308569193
},
{
"iter": 247000,
"lr": 0.02571120751242158,
"loss": 0.005032610148191452,
"test_loss": 0.006757295690476894
},
{
"iter": 248000,
"lr": 0.025678159013055427,
"loss": 0.004061665385961533,
"test_loss": 0.002719667972996831
},
{
"iter": 249000,
"lr": 0.025645005087339263,
"loss": 0.004180450923740864,
"test_loss": 0.00430157408118248
},
{
"iter": 250000,
"lr": 0.025611746062619893,
"loss": 0.004622316919267178,
"test_loss": 0.003972124308347702
},
{
"iter": 251000,
"lr": 0.02557838226728179,
"loss": 0.0027732967864722013,
"test_loss": 0.0025357636623084545
},
{
"iter": 252000,
"lr": 0.025544914030743906,
"loss": 0.009181534871459007,
"test_loss": 0.00789961963891983
},
{
"iter": 253000,
"lr": 0.02551134168345639,
"loss": 0.012753221206367016,
"test_loss": 0.012441668659448624
},
{
"iter": 254000,
"lr": 0.025477665556897334,
"loss": 0.010536564514040947,
"test_loss": 0.005048907361924648
},
{
"iter": 255000,
"lr": 0.025443885983569496,
"loss": 0.003478358732536435,
"test_loss": 0.0020251194946467876
},
{
"iter": 256000,
"lr": 0.025410003296997028,
"loss": 0.0024845139123499393,
"test_loss": 0.00321107916533947
},
{
"iter": 257000,
"lr": 0.02537601783172217,
"loss": 0.001314252382144332,
"test_loss": 0.0010274284286424518
},
{
"iter": 258000,
"lr": 0.02534192992330195,
"loss": 0.004131457768380642,
"test_loss": 0.004498985596001148
},
{
"iter": 259000,
"lr": 0.025307739908304882,
"loss": 0.004664195701479912,
"test_loss": 0.0030648433603346348
},
{
"iter": 260000,
"lr": 0.025273448124307624,
"loss": 0.00871725007891655,
"test_loss": 0.013529743067920208
},
{
"iter": 261000,
"lr": 0.025239054909891655,
"loss": 0.009320715442299843,
"test_loss": 0.01604446768760681
},
{
"iter": 262000,
"lr": 0.025204560604639943,
"loss": 0.0040467833168804646,
"test_loss": 0.004220261238515377
},
{
"iter": 263000,
"lr": 0.02516996554913357,
"loss": 0.005600417964160442,
"test_loss": 0.009918153285980225
},
{
"iter": 264000,
"lr": 0.025135270084948383,
"loss": 0.002370871603488922,
"test_loss": 0.002101703779771924
},
{
"iter": 265000,
"lr": 0.02510047455465162,
"loss": 0.012270070612430573,
"test_loss": 0.009733596816658974
},
{
"iter": 266000,
"lr": 0.02506557930179853,
"loss": 0.004519831854850054,
"test_loss": 0.003118803258985281
},
{
"iter": 267000,
"lr": 0.025030584670928967,
"loss": 0.01339467242360115,
"test_loss": 0.014820907264947891
},
{
"iter": 268000,
"lr": 0.024995491007564003,
"loss": 0.003758954117074609,
"test_loss": 0.0056359656155109406
},
{
"iter": 269000,
"lr": 0.024960298658202523,
"loss": 0.001641460694372654,
"test_loss": 0.004405388608574867
},
{
"iter": 270000,
"lr": 0.024925007970317777,
"loss": 0.00873821321874857,
"test_loss": 0.00486126821488142
},
{
"iter": 271000,
"lr": 0.02488961929235397,
"loss": 0.004769525025039911,
"test_loss": 0.005883777979761362
},
{
"iter": 272000,
"lr": 0.024854132973722808,
"loss": 0.0058099958114326,
"test_loss": 0.00522029772400856
},
{
"iter": 273000,
"lr": 0.02481854936480008,
"loss": 0.0031291497871279716,
"test_loss": 0.0036910707131028175
},
{
"iter": 274000,
"lr": 0.02478286881692216,
"loss": 0.001098710810765624,
"test_loss": 0.0014021608512848616
},
{
"iter": 275000,
"lr": 0.02474709168238255,
"loss": 0.004439540207386017,
"test_loss": 0.00451246090233326
},
{
"iter": 276000,
"lr": 0.024711218314428404,
"loss": 0.006433282047510147,
"test_loss": 0.009515691548585892
},
{
"iter": 277000,
"lr": 0.02467524906725705,
"loss": 0.0039498996920883656,
"test_loss": 0.0019493245054036379
},
{
"iter": 278000,
"lr": 0.02463918429601248,
"loss": 0.0026055516209453344,
"test_loss": 0.003371638245880604
},
{
"iter": 279000,
"lr": 0.024603024356781848,
"loss": 0.004473382607102394,
"test_loss": 0.0025877654552459717
},
{
"iter": 280000,
"lr": 0.02456676960659195,
"loss": 0.0044031767174601555,
"test_loss": 0.0025896199513226748
},
{
"iter": 281000,
"lr": 0.024530420403405702,
"loss": 0.007547914050519466,
"test_loss": 0.006386089604347944
},
{
"iter": 282000,
"lr": 0.02449397710611861,
"loss": 0.00314199086278677,
"test_loss": 0.0024068360216915607
},
{
"iter": 283000,
"lr": 0.024457440074555234,
"loss": 0.006031259428709745,
"test_loss": 0.004548929166048765
},
{
"iter": 284000,
"lr": 0.02442080966946559,
"loss": 0.0019232046324759722,
"test_loss": 0.003923590295016766
},
{
"iter": 285000,
"lr": 0.02438408625252165,
"loss": 0.005979673005640507,
"test_loss": 0.005767210852354765
},
{
"iter": 286000,
"lr": 0.024347270186313733,
"loss": 0.006389237940311432,
"test_loss": 0.007830338552594185
},
{
"iter": 287000,
"lr": 0.02431036183434694,
"loss": 0.00721075851470232,
"test_loss": 0.012150455266237259
},
{
"iter": 288000,
"lr": 0.024273361561037557,
"loss": 0.004674108698964119,
"test_loss": 0.005389980040490627
},
{
"iter": 289000,
"lr": 0.024236269731709458,
"loss": 0.0066370535641908646,
"test_loss": 0.004767067730426788
},
{
"iter": 290000,
"lr": 0.0241990867125905,
"loss": 0.005096702836453915,
"test_loss": 0.005722790956497192
},
{
"iter": 291000,
"lr": 0.024161812870808902,
"loss": 0.004534249193966389,
"test_loss": 0.008508238941431046
},
{
"iter": 292000,
"lr": 0.024124448574389636,
"loss": 0.002413136651739478,
"test_loss": 0.0034640957601368427
},
{
"iter": 293000,
"lr": 0.024086994192250775,
"loss": 0.0031674334313720465,
"test_loss": 0.0035344602074474096
},
{
"iter": 294000,
"lr": 0.024049450094199856,
"loss": 0.0023323099594563246,
"test_loss": 0.005762317683547735
},
{
"iter": 295000,
"lr": 0.02401181665093023,
"loss": 0.0030240134801715612,
"test_loss": 0.0032650367356836796
},
{
"iter": 296000,
"lr": 0.023974094234017407,
"loss": 0.0014272239059209824,
"test_loss": 0.006906958296895027
},
{
"iter": 297000,
"lr": 0.02393628321591538,
"loss": 0.0013781699817627668,
"test_loss": 0.002446200931444764
},
{
"iter": 298000,
"lr": 0.02389838396995294,
"loss": 0.005329154431819916,
"test_loss": 0.004246043972671032
},
{
"iter": 299000,
"lr": 0.023860396870330022,
"loss": 0.0019448443781584501,
"test_loss": 0.0010329644428566098
},
{
"iter": 300000,
"lr": 0.023822322292113972,
"loss": 0.008393359370529652,
"test_loss": 0.005630714353173971
},
{
"iter": 301000,
"lr": 0.02378416061123586,
"loss": 0.0014907442964613438,
"test_loss": 0.001707607414573431
},
{
"iter": 302000,
"lr": 0.023745912204486765,
"loss": 0.017736928537487984,
"test_loss": 0.02176503837108612
},
{
"iter": 303000,
"lr": 0.023707577449514072,
"loss": 0.001970216166228056,
"test_loss": 0.0036807935684919357
},
{
"iter": 304000,
"lr": 0.023669156724817723,
"loss": 0.006412023678421974,
"test_loss": 0.011694186367094517
},
{
"iter": 305000,
"lr": 0.023630650409746486,
"loss": 0.005007663741707802,
"test_loss": 0.0037637734785676003
},
{
"iter": 306000,
"lr": 0.023592058884494192,
"loss": 0.002266363240778446,
"test_loss": 0.0025780838914215565
},
{
"iter": 307000,
"lr": 0.023553382530096027,
"loss": 0.002736572176218033,
"test_loss": 0.0032588704489171505
},
{
"iter": 308000,
"lr": 0.023514621728424723,
"loss": 0.0026423560921102762,
"test_loss": 0.0018260593060404062
},
{
"iter": 309000,
"lr": 0.023475776862186812,
"loss": 0.005027745850384235,
"test_loss": 0.006777969654649496
},
{
"iter": 310000,
"lr": 0.023436848314918848,
"loss": 0.0022937036119401455,
"test_loss": 0.0031273523345589638
},
{
"iter": 311000,
"lr": 0.023397836470983594,
"loss": 0.003965223208069801,
"test_loss": 0.0023642058949917555
},
{
"iter": 312000,
"lr": 0.02335874171556626,
"loss": 0.005313948728144169,
"test_loss": 0.005365452729165554
},
{
"iter": 313000,
"lr": 0.023319564434670696,
"loss": 0.0024826303124427795,
"test_loss": 0.003409608732908964
},
{
"iter": 314000,
"lr": 0.023280305015115552,
"loss": 0.0020392960868775845,
"test_loss": 0.004671364091336727
},
{
"iter": 315000,
"lr": 0.023240963844530484,
"loss": 0.001961235422641039,
"test_loss": 0.026694834232330322
},
{
"iter": 316000,
"lr": 0.023201541311352325,
"loss": 0.0010364726185798645,
"test_loss": 0.0010819952003657818
},
{
"iter": 317000,
"lr": 0.023162037804821244,
"loss": 0.0017599717248231173,
"test_loss": 0.0038418557960540056
},
{
"iter": 318000,
"lr": 0.0231224537149769,
"loss": 0.001057835528627038,
"test_loss": 0.0010505085811018944
},
{
"iter": 319000,
"lr": 0.023082789432654596,
"loss": 0.002106625586748123,
"test_loss": 0.004606937523931265
},
{
"iter": 320000,
"lr": 0.023043045349481418,
"loss": 0.004333317745476961,
"test_loss": 0.0009624625090509653
},
{
"iter": 321000,
"lr": 0.02300322185787238,
"loss": 0.004252217710018158,
"test_loss": 0.0018453216180205345
},
{
"iter": 322000,
"lr": 0.022963319351026527,
"loss": 0.0023403784725815058,
"test_loss": 0.00273308833129704
},
{
"iter": 323000,
"lr": 0.022923338222923063,
"loss": 0.0022133588790893555,
"test_loss": 0.0019295017700642347
},
{
"iter": 324000,
"lr": 0.022883278868317473,
"loss": 0.0127000967040658,
"test_loss": 0.008353522047400475
},
{
"iter": 325000,
"lr": 0.02284314168273761,
"loss": 0.005515168886631727,
"test_loss": 0.007600512355566025
},
{
"iter": 326000,
"lr": 0.022802927062479796,
"loss": 0.004449785687029362,
"test_loss": 0.005663862451910973
},
{
"iter": 327000,
"lr": 0.022762635404604898,
"loss": 0.0033371560275554657,
"test_loss": 0.001621014322154224
},
{
"iter": 328000,
"lr": 0.02272226710693443,
"loss": 0.0029605210293084383,
"test_loss": 0.0042740521021187305
},
{
"iter": 329000,
"lr": 0.02268182256804661,
"loss": 0.005739983171224594,
"test_loss": 0.0063252379186451435
},
{
"iter": 330000,
"lr": 0.022641302187272422,
"loss": 0.003278180491179228,
"test_loss": 0.0020751701667904854
},
{
"iter": 331000,
"lr": 0.02260070636469168,
"loss": 0.0038942010141909122,
"test_loss": 0.007130652666091919
},
{
"iter": 332000,
"lr": 0.022560035501129085,
"loss": 0.004581931978464127,
"test_loss": 0.001929939491674304
},
{
"iter": 333000,
"lr": 0.022519289998150244,
"loss": 0.0024493923410773277,
"test_loss": 0.003575567388907075
},
{
"iter": 334000,
"lr": 0.022478470258057725,
"loss": 0.002172841690480709,
"test_loss": 0.0011024491395801306
},
{
"iter": 335000,
"lr": 0.022437576683887083,
"loss": 0.003154472913593054,
"test_loss": 0.0020468891598284245
},
{
"iter": 336000,
"lr": 0.02239660967940288,
"loss": 0.003386006224900484,
"test_loss": 0.002800632268190384
},
{
"iter": 337000,
"lr": 0.022355569649094686,
"loss": 0.007896492257714272,
"test_loss": 0.001382704358547926
},
{
"iter": 338000,
"lr": 0.0223144569981731,
"loss": 0.005629195831716061,
"test_loss": 0.00553442258387804
},
{
"iter": 339000,
"lr": 0.022273272132565743,
"loss": 0.004258297383785248,
"test_loss": 0.001613761531189084
},
{
"iter": 340000,
"lr": 0.022232015458913255,
"loss": 0.004461368545889854,
"test_loss": 0.0010750286746770144
},
{
"iter": 341000,
"lr": 0.02219068738456527,
"loss": 0.006841880269348621,
"test_loss": 0.005424811504781246
},
{
"iter": 342000,
"lr": 0.022149288317576395,
"loss": 0.003427179530262947,
"test_loss": 0.004023235756903887
},
{
"iter": 343000,
"lr": 0.02210781866670221,
"loss": 0.003179234219714999,
"test_loss": 0.003170567797496915
},
{
"iter": 344000,
"lr": 0.022066278841395174,
"loss": 0.003925511613488197,
"test_loss": 0.003508116817101836
},
{
"iter": 345000,
"lr": 0.022024669251800646,
"loss": 0.005033682566136122,
"test_loss": 0.0039046197198331356
},
{
"iter": 346000,
"lr": 0.02198299030875279,
"loss": 0.005603437777608633,
"test_loss": 0.002058255486190319
},
{
"iter": 347000,
"lr": 0.02194124242377054,
"loss": 0.006487406324595213,
"test_loss": 0.005847100634127855
},
{
"iter": 348000,
"lr": 0.021899426009053525,
"loss": 0.005823981016874313,
"test_loss": 0.0036564976908266544
},
{
"iter": 349000,
"lr": 0.021857541477478017,
"loss": 0.001821751706302166,
"test_loss": 0.0013244403526186943
},
{
"iter": 350000,
"lr": 0.02181558924259283,
"loss": 0.0029425914399325848,
"test_loss": 0.004246935714036226
},
{
"iter": 351000,
"lr": 0.021773569718615257,
"loss": 0.0044395774602890015,
"test_loss": 0.002581089735031128
},
{
"iter": 352000,
"lr": 0.021731483320426976,
"loss": 0.004286543466150761,
"test_loss": 0.0032992076594382524
},
{
"iter": 353000,
"lr": 0.021689330463569943,
"loss": 0.003387096803635359,
"test_loss": 0.004971416667103767
},
{
"iter": 354000,
"lr": 0.0216471115642423,
"loss": 0.0020806859247386456,
"test_loss": 0.003832163056358695
},
{
"iter": 355000,
"lr": 0.02160482703929426,
"loss": 0.0021562210749834776,
"test_loss": 0.001426595845259726
},
{
"iter": 356000,
"lr": 0.021562477306224,
"loss": 0.003053523600101471,
"test_loss": 0.0029009408317506313
},
{
"iter": 357000,
"lr": 0.021520062783173526,
"loss": 0.0032427823171019554,
"test_loss": 0.004624674096703529
},
{
"iter": 358000,
"lr": 0.02147758388892455,
"loss": 0.0012938822619616985,
"test_loss": 0.00364934210665524
},
{
"iter": 359000,
"lr": 0.021435041042894364,
"loss": 0.0014421942178159952,
"test_loss": 0.0016871215775609016
},
{
"iter": 360000,
"lr": 0.02139243466513168,
"loss": 0.003954396583139896,
"test_loss": 0.003178955987095833
},
{
"iter": 361000,
"lr": 0.021349765176312506,
"loss": 0.0009196070022881031,
"test_loss": 0.0026779184117913246
},
{
"iter": 362000,
"lr": 0.021307032997735967,
"loss": 0.0022866155486553907,
"test_loss": 0.0014379071071743965
},
{
"iter": 363000,
"lr": 0.021264238551320164,
"loss": 0.0028034988790750504,
"test_loss": 0.0038171708583831787
},
{
"iter": 364000,
"lr": 0.02122138225959801,
"loss": 0.00331479636952281,
"test_loss": 0.0025309016928076744
},
{
"iter": 365000,
"lr": 0.02117846454571303,
"loss": 0.0028660704847425222,
"test_loss": 0.005081166513264179
},
{
"iter": 366000,
"lr": 0.02113548583341523,
"loss": 0.002766562160104513,
"test_loss": 0.003085349453613162
},
{
"iter": 367000,
"lr": 0.021092446547056866,
"loss": 0.0020738416351377964,
"test_loss": 0.0011017649667337537
},
{
"iter": 368000,
"lr": 0.02104934711158828,
"loss": 0.002023151144385338,
"test_loss": 0.0017363816732540727
},
{
"iter": 369000,
"lr": 0.021006187952553705,
"loss": 0.009654244408011436,
"test_loss": 0.0074168178252875805
},
{
"iter": 370000,
"lr": 0.02096296949608705,
"loss": 0.001865508733317256,
"test_loss": 0.0016607609577476978
},
{
"iter": 371000,
"lr": 0.020919692168907704,
"loss": 0.0017585232853889465,
"test_loss": 0.0017329211113974452
},
{
"iter": 372000,
"lr": 0.02087635639831632,
"loss": 0.0013483911752700806,
"test_loss": 0.001445314264856279
},
{
"iter": 373000,
"lr": 0.020832962612190586,
"loss": 0.0010248161852359772,
"test_loss": 0.0011386662954464555
},
{
"iter": 374000,
"lr": 0.020789511238981023,
"loss": 0.0037165952380746603,
"test_loss": 0.004814023617655039
},
{
"iter": 375000,
"lr": 0.020746002707706726,
"loss": 0.0014297252055257559,
"test_loss": 0.0023714161943644285
},
{
"iter": 376000,
"lr": 0.020702437447951152,
"loss": 0.002895237412303686,
"test_loss": 0.005415003746747971
},
{
"iter": 377000,
"lr": 0.02065881588985787,
"loss": 0.0011381172807887197,
"test_loss": 0.0009007496992126107
},
{
"iter": 378000,
"lr": 0.02061513846412631,
"loss": 0.0038409209810197353,
"test_loss": 0.0014597245026379824
},
{
"iter": 379000,
"lr": 0.020571405602007504,
"loss": 0.002149030566215515,
"test_loss": 0.001826093764975667
},
{
"iter": 380000,
"lr": 0.02052761773529986,
"loss": 0.0017281027976423502,
"test_loss": 0.0010900819906964898
},
{
"iter": 381000,
"lr": 0.02048377529634486,
"loss": 0.0008142647566273808,
"test_loss": 0.0012082929024472833
},
{
"iter": 382000,
"lr": 0.020439878718022803,
"loss": 0.0013281453866511583,
"test_loss": 0.00039479410042986274
},
{
"iter": 383000,
"lr": 0.02039592843374855,
"loss": 0.0015743995318189263,
"test_loss": 0.0018233570735901594
},
{
"iter": 384000,
"lr": 0.020351924877467228,
"loss": 0.003327306592836976,
"test_loss": 0.0007659384282305837
},
{
"iter": 385000,
"lr": 0.02030786848364994,
"loss": 0.0014527408638969064,
"test_loss": 0.0002966596803162247
},
{
"iter": 386000,
"lr": 0.020263759687289485,
"loss": 0.0019077076576650143,
"test_loss": 0.0013225534930825233
},
{
"iter": 387000,
"lr": 0.02021959892389606,
"loss": 0.0012876775581389666,
"test_loss": 0.002673704642802477
},
{
"iter": 388000,
"lr": 0.020175386629492968,
"loss": 0.0008654642151668668,
"test_loss": 0.0011580318678170443
},
{
"iter": 389000,
"lr": 0.020131123240612298,
"loss": 0.0017032746691256762,
"test_loss": 0.0012502613244578242
},
{
"iter": 390000,
"lr": 0.02008680919429063,
"loss": 0.002843728056177497,
"test_loss": 0.006892813369631767
},
{
"iter": 391000,
"lr": 0.0200424449280647,
"loss": 0.0021212929859757423,
"test_loss": 0.0033796564675867558
},
{
"iter": 392000,
"lr": 0.01999803087996711,
"loss": 0.0005293131107464433,
"test_loss": 0.0013081841170787811
},
{
"iter": 393000,
"lr": 0.019953567488521964,
"loss": 0.0015701663214713335,
"test_loss": 0.0016504100058227777
},
{
"iter": 394000,
"lr": 0.01990905519274058,
"loss": 0.0017204233445227146,
"test_loss": 0.001071484643034637
},
{
"iter": 395000,
"lr": 0.019864494432117123,
"loss": 0.0028193271718919277,
"test_loss": 0.0013575383927673101
},
{
"iter": 396000,
"lr": 0.019819885646624288,
"loss": 0.002082481747493148,
"test_loss": 0.0012683767126873136
},
{
"iter": 397000,
"lr": 0.019775229276708935,
"loss": 0.004446134436875582,
"test_loss": 0.0052950941026210785
},
{
"iter": 398000,
"lr": 0.019730525763287755,
"loss": 0.0022772776428610086,
"test_loss": 0.0011805309914052486
},
{
"iter": 399000,
"lr": 0.019685775547742913,
"loss": 0.0015102208126336336,
"test_loss": 0.0007366648060269654
},
{
"iter": 400000,
"lr": 0.01964097907191769,
"loss": 0.001994397956877947,
"test_loss": 0.000783414114266634
},
{
"iter": 401000,
"lr": 0.019596136778112123,
"loss": 0.0009458464337512851,
"test_loss": 0.00042463955469429493
},
{
"iter": 402000,
"lr": 0.019551249109078628,
"loss": 0.001247018575668335,
"test_loss": 0.00026821557548828423
},
{
"iter": 403000,
"lr": 0.019506316508017638,
"loss": 0.00021781015675514936,
"test_loss": 0.00042301128269173205
},
{
"iter": 404000,
"lr": 0.019461339418573222,
"loss": 0.0007367624202743173,
"test_loss": 0.0024472419172525406
},
{
"iter": 405000,
"lr": 0.019416318284828725,
"loss": 0.0020251956302672625,
"test_loss": 0.001079440931789577
},
{
"iter": 406000,
"lr": 0.019371253551302335,
"loss": 0.0012915844563394785,
"test_loss": 0.0035742090549319983
},
{
"iter": 407000,
"lr": 0.019326145662942742,
"loss": 0.0074498835019767284,
"test_loss": 0.0021352190524339676
},
{
"iter": 408000,
"lr": 0.019280995065124734,
"loss": 0.0018002715660259128,
"test_loss": 0.0008934105280786753
},
{
"iter": 409000,
"lr": 0.019235802203644774,
"loss": 0.0015140729956328869,
"test_loss": 0.002051664050668478
},
{
"iter": 410000,
"lr": 0.019190567524716633,
"loss": 0.0008876629290170968,
"test_loss": 0.00045265594962984324
},
{
"iter": 411000,
"lr": 0.019145291474966963,
"loss": 0.002150661312043667,
"test_loss": 0.0008878207299858332
},
{
"iter": 412000,
"lr": 0.019099974501430892,
"loss": 0.0022444911301136017,
"test_loss": 0.0040635885670781136
},
{
"iter": 413000,
"lr": 0.01905461705154761,
"loss": 0.002123081823810935,
"test_loss": 0.0013356831623241305
},
{
"iter": 414000,
"lr": 0.01900921957315595,
"loss": 0.0016920199850574136,
"test_loss": 0.0024555742274969816
},
{
"iter": 415000,
"lr": 0.018963782514489977,
"loss": 0.00044727715430781245,
"test_loss": 0.0011314463336020708
},
{
"iter": 416000,
"lr": 0.018918306324174548,
"loss": 0.0012349702883511782,
"test_loss": 0.0006494345725513995
},
{
"iter": 417000,
"lr": 0.018872791451220883,
"loss": 0.000871861120685935,
"test_loss": 0.0026833824813365936
},
{
"iter": 418000,
"lr": 0.018827238345022153,
"loss": 0.00045165891060605645,
"test_loss": 0.0018681623041629791
},
{
"iter": 419000,
"lr": 0.018781647455349,
"loss": 0.000649906462058425,
"test_loss": 0.0013825923670083284
},
{
"iter": 420000,
"lr": 0.018736019232345153,
"loss": 0.001726906863041222,
"test_loss": 0.0013884902000427246
},
{
"iter": 421000,
"lr": 0.018690354126522927,
"loss": 0.0008551835198886693,
"test_loss": 0.0014136084355413914
},
{
"iter": 422000,
"lr": 0.01864465258875882,
"loss": 0.001413583057001233,
"test_loss": 0.00156830670312047
},
{
"iter": 423000,
"lr": 0.01859891507028904,
"loss": 0.000784430536441505,
"test_loss": 0.0010985585395246744
},
{
"iter": 424000,
"lr": 0.018553142022705037,
"loss": 0.00045206694630905986,
"test_loss": 0.0006883598398417234
},
{
"iter": 425000,
"lr": 0.018507333897949077,
"loss": 0.0011310284025967121,
"test_loss": 0.004156462848186493
},
{
"iter": 426000,
"lr": 0.018461491148309753,
"loss": 0.0010064819362014532,
"test_loss": 0.0005030919564887881
},
{
"iter": 427000,
"lr": 0.018415614226417534,
"loss": 0.0007148656877689064,
"test_loss": 0.00019564271497074515
},
{
"iter": 428000,
"lr": 0.018369703585240277,
"loss": 0.0017797250766307116,
"test_loss": 0.0014324643416330218
},
{
"iter": 429000,
"lr": 0.018323759678078793,
"loss": 0.0005678959423676133,
"test_loss": 0.0004587931907735765
},
{
"iter": 430000,
"lr": 0.01827778295856232,
"loss": 0.0021604886278510094,
"test_loss": 0.0010707334149628878
},
{
"iter": 431000,
"lr": 0.018231773880644078,
"loss": 0.0011422473471611738,
"test_loss": 0.001102776499465108
},
{
"iter": 432000,
"lr": 0.018185732898596787,
"loss": 0.0014112507924437523,
"test_loss": 0.00016971587319858372
},
{
"iter": 433000,
"lr": 0.01813966046700817,
"loss": 0.0008836248307488859,
"test_loss": 0.0027075218968093395
},
{
"iter": 434000,
"lr": 0.018093557040776472,
"loss": 0.00029551045736297965,
"test_loss": 0.001216703443787992
},
{
"iter": 435000,
"lr": 0.01804742307510595,
"loss": 0.002235500607639551,
"test_loss": 0.00024242306244559586
},
{
"iter": 436000,
"lr": 0.01800125902550241,
"loss": 0.001060995040461421,
"test_loss": 0.001033919514156878
},
{
"iter": 437000,
"lr": 0.017955065347768688,
"loss": 0.0012554036220535636,
"test_loss": 0.0012063629692420363
},
{
"iter": 438000,
"lr": 0.01790884249800015,
"loss": 0.001961404923349619,
"test_loss": 0.00019972448353655636
},
{
"iter": 439000,
"lr": 0.0178625909325802,
"loss": 0.0018396172672510147,
"test_loss": 0.004008515737950802
},
{
"iter": 440000,
"lr": 0.01781631110817577,
"loss": 0.006894783116877079,
"test_loss": 0.0034180080983787775
},
{
"iter": 441000,
"lr": 0.01777000348173279,
"loss": 0.002610748866572976,
"test_loss": 0.0025454512797296047
},
{
"iter": 442000,
"lr": 0.017723668510471715,
"loss": 0.0011392002925276756,
"test_loss": 0.004870769567787647
},
{
"iter": 443000,
"lr": 0.017677306651882985,
"loss": 0.001616138033568859,
"test_loss": 0.001309181796386838
},
{
"iter": 444000,
"lr": 0.017630918363722506,
"loss": 0.0008581280708312988,
"test_loss": 0.0006332147167995572
},
{
"iter": 445000,
"lr": 0.01758450410400715,
"loss": 0.0005998535780236125,
"test_loss": 0.0006870012730360031
},
{
"iter": 446000,
"lr": 0.017538064331010204,
"loss": 0.0009828031761571765,
"test_loss": 0.0007571580354124308
},
{
"iter": 447000,
"lr": 0.01749159950325688,
"loss": 0.001355904620140791,
"test_loss": 0.0019973833113908768
},
{
"iter": 448000,
"lr": 0.01744511007951975,
"loss": 0.0004578658554237336,
"test_loss": 0.0018023262964561582
},
{
"iter": 449000,
"lr": 0.017398596518814258,
"loss": 0.002621842548251152,
"test_loss": 0.002531354781240225
},
{
"iter": 450000,
"lr": 0.017352059280394135,
"loss": 0.0003939744201488793,
"test_loss": 0.0006794952787458897
},
{
"iter": 451000,
"lr": 0.017305498823746927,
"loss": 0.0010835808934643865,
"test_loss": 0.0016679420368745923
},
{
"iter": 452000,
"lr": 0.017258915608589408,
"loss": 0.0009043310419656336,
"test_loss": 0.0008867436554282904
},
{
"iter": 453000,
"lr": 0.017212310094863067,
"loss": 0.0005586008192040026,
"test_loss": 0.0012618150794878602
},
{
"iter": 454000,
"lr": 0.017165682742729546,
"loss": 0.001658054068684578,
"test_loss": 0.0010470612905919552
},
{
"iter": 455000,
"lr": 0.017119034012566127,
"loss": 0.001162797212600708,
"test_loss": 0.0005646627396345139
},
{
"iter": 456000,
"lr": 0.017072364364961155,
"loss": 0.0012168282410129905,
"test_loss": 0.0005882377154193819
},
{
"iter": 457000,
"lr": 0.017025674260709514,
"loss": 0.0013401043834164739,
"test_loss": 0.00016164191765710711
},
{
"iter": 458000,
"lr": 0.01697896416080806,
"loss": 0.001002814038656652,
"test_loss": 0.0006601196946576238
},
{
"iter": 459000,
"lr": 0.016932234526451085,
"loss": 0.0006279475055634975,
"test_loss": 0.0008444065460935235
},
{
"iter": 460000,
"lr": 0.01688548581902575,
"loss": 0.0016093496233224869,
"test_loss": 0.0009688998106867075
},
{
"iter": 461000,
"lr": 0.01683871850010753,
"loss": 0.0008121808641590178,
"test_loss": 0.0008685288485139608
},
{
"iter": 462000,
"lr": 0.016791933031455677,
"loss": 0.0010969492141157389,
"test_loss": 0.0006457250565290451
},
{
"iter": 463000,
"lr": 0.016745129875008626,
"loss": 0.0019472987623885274,
"test_loss": 0.0027446704916656017
},
{
"iter": 464000,
"lr": 0.016698309492879468,
"loss": 0.0003577872703317553,
"test_loss": 0.00023929146118462086
},
{
"iter": 465000,
"lr": 0.01665147234735136,
"loss": 0.0002801507944241166,
"test_loss": 0.0004314736870583147
},
{
"iter": 466000,
"lr": 0.016604618900872992,
"loss": 0.0018715329933911562,
"test_loss": 0.0026305760256946087
},
{
"iter": 467000,
"lr": 0.01655774961605398,
"loss": 0.0009736770298331976,
"test_loss": 0.0014222455210983753
},
{
"iter": 468000,
"lr": 0.016510864955660336,
"loss": 0.002256464445963502,
"test_loss": 0.000341863720677793
},
{
"iter": 469000,
"lr": 0.016463965382609875,
"loss": 0.0013059449847787619,
"test_loss": 0.0005914373905397952
},
{
"iter": 470000,
"lr": 0.016417051359967662,
"loss": 0.0007435351144522429,
"test_loss": 0.0007491387077607214
},
{
"iter": 471000,
"lr": 0.016370123350941422,
"loss": 0.0016935465391725302,
"test_loss": 0.00019898773462045938
},
{
"iter": 472000,
"lr": 0.016323181818876972,
"loss": 0.000956690520979464,
"test_loss": 0.0008758006151765585
},
{
"iter": 473000,
"lr": 0.01627622722725367,
"loss": 0.0005887510487809777,
"test_loss": 0.0008168969070538878
},
{
"iter": 474000,
"lr": 0.01622926003967979,
"loss": 0.0018150035757571459,
"test_loss": 0.0010191992623731494
},
{
"iter": 475000,
"lr": 0.01618228071988799,
"loss": 0.001426883041858673,
"test_loss": 0.00043500089668668807
},
{
"iter": 476000,
"lr": 0.016135289731730715,
"loss": 0.0002781851217150688,
"test_loss": 0.0008035525097511709
},
{
"iter": 477000,
"lr": 0.016088287539175614,
"loss": 0.0010025199735537171,
"test_loss": 0.0002377173223067075
},
{
"iter": 478000,
"lr": 0.016041274606300962,
"loss": 0.001877885195426643,
"test_loss": 0.0007670074701309204
},
{
"iter": 479000,
"lr": 0.015994251397291086,
"loss": 0.0003341192496009171,
"test_loss": 0.0005114746745675802
},
{
"iter": 480000,
"lr": 0.015947218376431767,
"loss": 0.0011178376153111458,
"test_loss": 0.00024691203725524247
},
{
"iter": 481000,
"lr": 0.015900176008105667,
"loss": 0.001542575191706419,
"test_loss": 0.0035214137751609087
},
{
"iter": 482000,
"lr": 0.015853124756787747,
"loss": 0.0008141195285134017,
"test_loss": 6.874567770864815e-05
},
{
"iter": 483000,
"lr": 0.01580606508704066,
"loss": 0.0006352186901494861,
"test_loss": 0.0009114991407841444
},
{
"iter": 484000,
"lr": 0.015758997463510192,
"loss": 0.0003278875374235213,
"test_loss": 0.00019279788830317557
},
{
"iter": 485000,
"lr": 0.015711922350920653,
"loss": 0.002054064068943262,
"test_loss": 0.0005524063017219305
},
{
"iter": 486000,
"lr": 0.015664840214070302,
"loss": 0.0012821103446185589,
"test_loss": 0.0013239753898233175
},
{
"iter": 487000,
"lr": 0.015617751517826755,
"loss": 0.0009265710250474513,
"test_loss": 0.00040389690548181534
},
{
"iter": 488000,
"lr": 0.01557065672712238,
"loss": 0.00154742575250566,
"test_loss": 0.0014085073489695787
},
{
"iter": 489000,
"lr": 0.015523556306949729,
"loss": 0.0010090741561725736,
"test_loss": 0.0004286096664145589
},
{
"iter": 490000,
"lr": 0.015476450722356937,
"loss": 0.0003911459643859416,
"test_loss": 0.0011356179602444172
},
{
"iter": 491000,
"lr": 0.015429340438443125,
"loss": 0.0017186534823849797,
"test_loss": 0.0007090962026268244
},
{
"iter": 492000,
"lr": 0.015382225920353819,
"loss": 0.0009289293666370213,
"test_loss": 0.0002737371833063662
},
{
"iter": 493000,
"lr": 0.015335107633276342,
"loss": 0.0006876366678625345,
"test_loss": 0.0004160284879617393
},
{
"iter": 494000,
"lr": 0.015287986042435236,
"loss": 0.0012115961872041225,
"test_loss": 0.0004916189936921
},
{
"iter": 495000,
"lr": 0.015240861613087669,
"loss": 0.0005784963723272085,
"test_loss": 0.00066507508745417
},
{
"iter": 496000,
"lr": 0.015193734810518826,
"loss": 0.0006595265585929155,
"test_loss": 0.0011432294268161058
},
{
"iter": 497000,
"lr": 0.015146606100037329,
"loss": 0.00028376447153277695,
"test_loss": 0.002093046437948942
},
{
"iter": 498000,
"lr": 0.015099475946970633,
"loss": 0.000990218250080943,
"test_loss": 0.002114306204020977
},
{
"iter": 499000,
"lr": 0.01505234481666044,
"loss": 0.0005279307952150702,
"test_loss": 0.0020383098162710667
},
{
"iter": 500000,
"lr": 0.015005213174458099,
"loss": 0.0012892737286165357,
"test_loss": 0.0008001800742931664
},
{
"iter": 501000,
"lr": 0.014958081485720018,
"loss": 0.0006455975817516446,
"test_loss": 0.00028686627047136426
},
{
"iter": 502000,
"lr": 0.014910950215803059,
"loss": 0.0010355450212955475,
"test_loss": 0.00039976462721824646
},
{
"iter": 503000,
"lr": 0.014863819830059952,
"loss": 0.0004513832973316312,
"test_loss": 0.0010389594826847315
},
{
"iter": 504000,
"lr": 0.014816690793834693,
"loss": 0.0008465172722935677,
"test_loss": 0.002259437693282962
},
{
"iter": 505000,
"lr": 0.01476956357245796,
"loss": 0.0003712764009833336,
"test_loss": 0.0035667777992784977
},
{
"iter": 506000,
"lr": 0.014722438631242507,
"loss": 0.0002872837067116052,
"test_loss": 0.0007826737128198147
},
{
"iter": 507000,
"lr": 0.014675316435478576,
"loss": 0.000687014835420996,
"test_loss": 0.0026312407571822405
},
{
"iter": 508000,
"lr": 0.014628197450429299,
"loss": 0.0005929861217737198,
"test_loss": 0.00021763748372904956
},
{
"iter": 509000,
"lr": 0.014581082141326113,
"loss": 0.0027408648747950792,
"test_loss": 0.0006975308060646057
},
{
"iter": 510000,
"lr": 0.014533970973364155,
"loss": 0.0011070272885262966,
"test_loss": 0.00016097421757876873
},
{
"iter": 511000,
"lr": 0.014486864411697678,
"loss": 0.0005041176918894053,
"test_loss": 0.0002846837160177529
},
{
"iter": 512000,
"lr": 0.014439762921435452,
"loss": 0.0010332193924114108,
"test_loss": 0.0006721330573782325
},
{
"iter": 513000,
"lr": 0.014392666967636174,
"loss": 0.0007505768444389105,
"test_loss": 0.0003510648966766894
},
{
"iter": 514000,
"lr": 0.014345577015303878,
"loss": 0.0007509069982916117,
"test_loss": 0.0008840748923830688
},
{
"iter": 515000,
"lr": 0.01429849352938334,
"loss": 0.0018233577720820904,
"test_loss": 0.00027079787105321884
},
{
"iter": 516000,
"lr": 0.014251416974755496,
"loss": 0.0004419066826812923,
"test_loss": 0.0020575181115418673
},
{
"iter": 517000,
"lr": 0.014204347816232839,
"loss": 0.0004147517611272633,
"test_loss": 0.004220424219965935
},
{
"iter": 518000,
"lr": 0.01415728651855484,
"loss": 0.00011157682456541806,
"test_loss": 0.0004126974963583052
},
{
"iter": 519000,
"lr": 0.014110233546383345,
"loss": 0.001831643283367157,
"test_loss": 0.0011785029200837016
},
{
"iter": 520000,
"lr": 0.014063189364298012,
"loss": 0.0016237555537372828,
"test_loss": 0.0005322147044353187
},
{
"iter": 521000,
"lr": 0.014016154436791705,
"loss": 0.0005503818392753601,
"test_loss": 0.00010657223901944235
},
{
"iter": 522000,
"lr": 0.013969129228265912,
"loss": 0.0007592215551994741,
"test_loss": 0.00048010385944508016
},
{
"iter": 523000,
"lr": 0.013922114203026154,
"loss": 0.0005761296488344669,
"test_loss": 8.232181426137686e-05
},
{
"iter": 524000,
"lr": 0.013875109825277421,
"loss": 0.0009733953629620373,
"test_loss": 7.630998152308166e-05
},
{
"iter": 525000,
"lr": 0.013828116559119566,
"loss": 0.00131307914853096,
"test_loss": 0.0027507462073117495
},
{
"iter": 526000,
"lr": 0.013781134868542723,
"loss": 0.0010201893746852875,
"test_loss": 0.0008117129909805954
},
{
"iter": 527000,
"lr": 0.013734165217422746,
"loss": 0.0004323165921960026,
"test_loss": 0.0010531311854720116
},
{
"iter": 528000,
"lr": 0.013687208069516616,
"loss": 0.0009642827790230513,
"test_loss": 0.001371166668832302
},
{
"iter": 529000,
"lr": 0.013640263888457857,
"loss": 0.0006040302105247974,
"test_loss": 0.0005374707980081439
},
{
"iter": 530000,
"lr": 0.01359333313775197,
"loss": 0.0014848463470116258,
"test_loss": 0.0007040203199721873
},
{
"iter": 531000,
"lr": 0.013546416280771849,
"loss": 0.000378171622287482,
"test_loss": 0.0008174966205842793
},
{
"iter": 532000,
"lr": 0.013499513780753203,
"loss": 0.0023019046057015657,
"test_loss": 0.00035232288064435124
},
{
"iter": 533000,
"lr": 0.013452626100789991,
"loss": 0.0003324197023175657,
"test_loss": 0.0016174387419596314
},
{
"iter": 534000,
"lr": 0.01340575370382985,
"loss": 0.00038826907984912395,
"test_loss": 0.0018026139587163925
},
{
"iter": 535000,
"lr": 0.013358897052669511,
"loss": 0.00048767600674182177,
"test_loss": 9.470780787523836e-05
},
{
"iter": 536000,
"lr": 0.013312056609950242,
"loss": 0.0014404880348592997,
"test_loss": 0.0018513526301831007
},
{
"iter": 537000,
"lr": 0.013265232838153278,
"loss": 0.0004743087920360267,
"test_loss": 9.381012932863086e-05
},
{
"iter": 538000,
"lr": 0.013218426199595252,
"loss": 0.0012038422282785177,
"test_loss": 0.0001999441592488438
},
{
"iter": 539000,
"lr": 0.013171637156423627,
"loss": 0.001045291661284864,
"test_loss": 0.001166196190752089
},
{
"iter": 540000,
"lr": 0.013124866170612141,
"loss": 0.002651712391525507,
"test_loss": 0.0014898314839228988
},
{
"iter": 541000,
"lr": 0.013078113703956245,
"loss": 0.0006866821786388755,
"test_loss": 0.0010755910770967603
},
{
"iter": 542000,
"lr": 0.013031380218068532,
"loss": 0.0016219114186242223,
"test_loss": 0.0003577709139790386
},
{
"iter": 543000,
"lr": 0.012984666174374195,
"loss": 0.0003397889086045325,
"test_loss": 0.0005465522408485413
},
{
"iter": 544000,
"lr": 0.01293797203410646,
"loss": 0.0013826616341248155,
"test_loss": 0.0004678067343775183
},
{
"iter": 545000,
"lr": 0.012891298258302038,
"loss": 0.0020455028861761093,
"test_loss": 0.0005912315100431442
},
{
"iter": 546000,
"lr": 0.012844645307796566,
"loss": 0.001781894825398922,
"test_loss": 0.00010303789167664945
},
{
"iter": 547000,
"lr": 0.012798013643220064,
"loss": 0.000538290711119771,
"test_loss": 0.000440761010395363
},
{
"iter": 548000,
"lr": 0.012751403724992387,
"loss": 0.0009532846743240952,
"test_loss": 0.00032193068182095885
},
{
"iter": 549000,
"lr": 0.012704816013318672,
"loss": 0.0006129799876362085,
"test_loss": 0.0017110361950471997
},
{
"iter": 550000,
"lr": 0.012658250968184804,
"loss": 0.0009158900356851518,
"test_loss": 0.00028641123208217323
},
{
"iter": 551000,
"lr": 0.012611709049352864,
"loss": 0.0003188929404132068,
"test_loss": 0.000307373033137992
},
{
"iter": 552000,
"lr": 0.012565190716356596,
"loss": 0.0006597063620574772,
"test_loss": 0.00047615464427508414
},
{
"iter": 553000,
"lr": 0.012518696428496866,
"loss": 0.0004818353627342731,
"test_loss": 0.0011267950758337975
},
{
"iter": 554000,
"lr": 0.012472226644837135,
"loss": 0.0008072013733908534,
"test_loss": 0.0025269677862524986
},
{
"iter": 555000,
"lr": 0.012425781824198916,
"loss": 0.003020527772605419,
"test_loss": 0.0006349066970869899
},
{
"iter": 556000,
"lr": 0.012379362425157251,
"loss": 0.0004567653522826731,
"test_loss": 6.47614651825279e-05
},
{
"iter": 557000,
"lr": 0.012332968906036178,
"loss": 0.0009270739392377436,
"test_loss": 8.918115781852975e-05
},
{
"iter": 558000,
"lr": 0.012286601724904209,
"loss": 0.0008365680114366114,
"test_loss": 0.002986628795042634
},
{
"iter": 559000,
"lr": 0.01224026133956981,
"loss": 0.0005223011830821633,
"test_loss": 0.0033248355612158775
},
{
"iter": 560000,
"lr": 0.012193948207576872,
"loss": 0.0006891837692819536,
"test_loss": 0.000723143748473376
},
{
"iter": 561000,
"lr": 0.012147662786200204,
"loss": 0.0002181071467930451,
"test_loss": 0.00045972398947924376
},
{
"iter": 562000,
"lr": 0.01210140553244101,
"loss": 0.0006067493231967092,
"test_loss": 8.953656652010977e-05
},
{
"iter": 563000,
"lr": 0.012055176903022382,
"loss": 0.0005697174347005785,
"test_loss": 0.000464151642518118
},
{
"iter": 564000,
"lr": 0.012008977354384784,
"loss": 0.0003945131611544639,
"test_loss": 0.00042847348959185183
},
{
"iter": 565000,
"lr": 0.011962807342681557,
"loss": 0.0006984459469094872,
"test_loss": 0.0008577359840273857
},
{
"iter": 566000,
"lr": 0.0119166673237744,
"loss": 0.00025238897069357336,
"test_loss": 0.0012229797430336475
},
{
"iter": 567000,
"lr": 0.011870557753228879,
"loss": 0.001797222881577909,
"test_loss": 0.00022345277830027044
},
{
"iter": 568000,
"lr": 0.011824479086309929,
"loss": 0.0013131401501595974,
"test_loss": 0.0011669655796140432
},
{
"iter": 569000,
"lr": 0.011778431777977355,
"loss": 0.001468952395953238,
"test_loss": 0.0005825070547871292
},
{
"iter": 570000,
"lr": 0.011732416282881344,
"loss": 0.00032668566564098,
"test_loss": 0.0008958480320870876
},
{
"iter": 571000,
"lr": 0.011686433055357968,
"loss": 0.00044076511403545737,
"test_loss": 0.0022129560820758343
},
{
"iter": 572000,
"lr": 0.011640482549424711,
"loss": 0.0003078072622884065,
"test_loss": 0.00015087041538208723
},
{
"iter": 573000,
"lr": 0.01159456521877597,
"loss": 0.000491248385515064,
"test_loss": 0.001402691937983036
},
{
"iter": 574000,
"lr": 0.011548681516778602,
"loss": 0.0019348680507391691,
"test_loss": 0.0016335069667547941
},
{
"iter": 575000,
"lr": 0.0115028318964674,
"loss": 0.0003160156775265932,
"test_loss": 0.0003107008524239063
},
{
"iter": 576000,
"lr": 0.011457016810540677,
"loss": 0.0003186331014148891,
"test_loss": 0.0015827221795916557
},
{
"iter": 577000,
"lr": 0.011411236711355755,
"loss": 0.0010675948578864336,
"test_loss": 0.0005534673109650612
},
{
"iter": 578000,
"lr": 0.011365492050924523,
"loss": 0.0003086884680669755,
"test_loss": 0.0015667371917515993
},
{
"iter": 579000,
"lr": 0.011319783280908954,
"loss": 0.000701546436175704,
"test_loss": 0.0003413469821680337
},
{
"iter": 580000,
"lr": 0.011274110852616658,
"loss": 0.0004716732364613563,
"test_loss": 0.0022530690766870975
},
{
"iter": 581000,
"lr": 0.011228475216996431,
"loss": 0.004853188060224056,
"test_loss": 0.0008644365589134395
},
{
"iter": 582000,
"lr": 0.011182876824633783,
"loss": 0.0009480512235313654,
"test_loss": 0.0003157789178658277
},
{
"iter": 583000,
"lr": 0.011137316125746512,
"loss": 0.0008055985672399402,
"test_loss": 0.0003489110677037388
},
{
"iter": 584000,
"lr": 0.011091793570180237,
"loss": 0.0003441110020503402,
"test_loss": 0.00014654593542218208
},
{
"iter": 585000,
"lr": 0.011046309607403975,
"loss": 0.0005082832649350166,
"test_loss": 0.00017857991042546928
},
{
"iter": 586000,
"lr": 0.011000864686505693,
"loss": 0.0009060876909643412,
"test_loss": 1.7044640117092058e-05
},
{
"iter": 587000,
"lr": 0.01095545925618788,
"loss": 0.00039040943374857306,
"test_loss": 0.00042166811181232333
},
{
"iter": 588000,
"lr": 0.010910093764763103,
"loss": 0.0004096267803106457,
"test_loss": 0.0004237088141962886
},
{
"iter": 589000,
"lr": 0.010864768660149602,
"loss": 0.0006679316284134984,
"test_loss": 0.00032463035313412547
},
{
"iter": 590000,
"lr": 0.010819484389866848,
"loss": 0.0002243861381430179,
"test_loss": 0.0005250261747278273
},
{
"iter": 591000,
"lr": 0.010774241401031134,
"loss": 0.0011987112229689956,
"test_loss": 0.001292552798986435
},
{
"iter": 592000,
"lr": 0.010729040140351162,
"loss": 0.0007533092284575105,
"test_loss": 0.0005736892344430089
},
{
"iter": 593000,
"lr": 0.01068388105412363,
"loss": 0.0013655164511874318,
"test_loss": 0.0001333851832896471
},
{
"iter": 594000,
"lr": 0.010638764588228817,
"loss": 0.0007195626385509968,
"test_loss": 0.00038202526047825813
},
{
"iter": 595000,
"lr": 0.010593691188126192,
"loss": 0.00010935480531770736,
"test_loss": 0.0009176620515063405
},
{
"iter": 596000,
"lr": 0.010548661298850017,
"loss": 0.0010547854471951723,
"test_loss": 0.0008620707085356116
},
{
"iter": 597000,
"lr": 0.010503675365004942,
"loss": 0.0002224130294052884,
"test_loss": 0.0007377410656772554
},
{
"iter": 598000,
"lr": 0.01045873383076162,
"loss": 0.0009394345106557012,
"test_loss": 0.001116321887820959
},
{
"iter": 599000,
"lr": 0.010413837139852333,
"loss": 0.0009001733269542456,
"test_loss": 0.0018045573960989714
},
{
"iter": 600000,
"lr": 0.010368985735566586,
"loss": 0.002757147653028369,
"test_loss": 0.006506178993731737
},
{
"iter": 601000,
"lr": 0.010324180060746754,
"loss": 0.00013280635175760835,
"test_loss": 0.00027354108169674873
},
{
"iter": 602000,
"lr": 0.010279420557783693,
"loss": 0.0005230330862104893,
"test_loss": 0.0017191506922245026
},
{
"iter": 603000,
"lr": 0.01023470766861239,
"loss": 0.00023588690964970738,
"test_loss": 0.0009780528489500284
},
{
"iter": 604000,
"lr": 0.010190041834707578,
"loss": 0.0005233339034020901,
"test_loss": 0.0015935801202431321
},
{
"iter": 605000,
"lr": 0.01014542349707939,
"loss": 0.0009236594196408987,
"test_loss": 0.0004019607149530202
},
{
"iter": 606000,
"lr": 0.010100853096269008,
"loss": 0.0007024857914075255,
"test_loss": 0.00026160822017118335
},
{
"iter": 607000,
"lr": 0.0100563310723443,
"loss": 0.00034118883195333183,
"test_loss": 0.0012122015468776226
},
{
"iter": 608000,
"lr": 0.010011857864895491,
"loss": 0.0013319621793925762,
"test_loss": 0.0008541626739315689
},
{
"iter": 609000,
"lr": 0.009967433913030803,
"loss": 6.858102278783917e-05,
"test_loss": 0.0009914751863107085
},
{
"iter": 610000,
"lr": 0.009923059655372143,
"loss": 0.000533860526047647,
"test_loss": 3.093391205766238e-05
},
{
"iter": 611000,
"lr": 0.009878735530050751,
"loss": 0.00012268716818653047,
"test_loss": 0.00011144612653879449
},
{
"iter": 612000,
"lr": 0.009834461974702889,
"loss": 0.0013026760425418615,
"test_loss": 0.00022565870312973857
},
{
"iter": 613000,
"lr": 0.009790239426465511,
"loss": 0.0006563797942362726,
"test_loss": 0.0001582685945322737
},
{
"iter": 614000,
"lr": 0.009746068321971947,
"loss": 0.0001245627790922299,
"test_loss": 0.0009426868637092412
},
{
"iter": 615000,
"lr": 0.009701949097347602,
"loss": 0.00047358626034110785,
"test_loss": 0.0006730449385941029
},
{
"iter": 616000,
"lr": 0.009657882188205636,
"loss": 0.00038315964047797024,
"test_loss": 0.0005483478889800608
},
{
"iter": 617000,
"lr": 0.009613868029642673,
"loss": 6.555605796165764e-05,
"test_loss": 0.0001472670555813238
},
{
"iter": 618000,
"lr": 0.009569907056234506,
"loss": 0.0003721877292264253,
"test_loss": 0.0009639491327106953
},
{
"iter": 619000,
"lr": 0.009525999702031794,
"loss": 0.0002539389824960381,
"test_loss": 0.0005925237783230841
},
{
"iter": 620000,
"lr": 0.009482146400555787,
"loss": 0.000683964928612113,
"test_loss": 5.248585875960998e-05
},
{
"iter": 621000,
"lr": 0.009438347584794048,
"loss": 0.0004773076216224581,
"test_loss": 0.0001189803151646629
},
{
"iter": 622000,
"lr": 0.009394603687196164,
"loss": 0.00013578360085375607,
"test_loss": 0.0008651628158986568
},
{
"iter": 623000,
"lr": 0.009350915139669493,
"loss": 0.00024061123258434236,
"test_loss": 0.0009920442244037986
},
{
"iter": 624000,
"lr": 0.009307282373574886,
"loss": 0.00038744136691093445,
"test_loss": 0.0003832645888905972
},
{
"iter": 625000,
"lr": 0.009263705819722438,
"loss": 0.0001734234974719584,
"test_loss": 0.0005889477324672043
},
{
"iter": 626000,
"lr": 0.009220185908367224,
"loss": 0.0003031865053344518,
"test_loss": 0.000554343918338418
},
{
"iter": 627000,
"lr": 0.009176723069205067,
"loss": 0.00018117844592779875,
"test_loss": 4.5028573367744684e-05
},
{
"iter": 628000,
"lr": 0.009133317731368272,
"loss": 0.0004718296113424003,
"test_loss": 0.0001814178831409663
},
{
"iter": 629000,
"lr": 0.009089970323421409,
"loss": 0.000236018662690185,
"test_loss": 7.713556988164783e-05
},
{
"iter": 630000,
"lr": 0.009046681273357077,
"loss": 0.0010963089298456907,
"test_loss": 0.00042849063174799085
},
{
"iter": 631000,
"lr": 0.00900345100859168,
"loss": 0.00032940827077254653,
"test_loss": 0.0003561262274160981
},
{
"iter": 632000,
"lr": 0.00896027995596118,
"loss": 0.00023012531164567918,
"test_loss": 0.0006929393857717514
},
{
"iter": 633000,
"lr": 0.008917168541716928,
"loss": 0.0001751006639096886,
"test_loss": 0.0007037872564978898
},
{
"iter": 634000,
"lr": 0.008874117191521426,
"loss": 0.00013767457858193666,
"test_loss": 0.0003049746446777135
},
{
"iter": 635000,
"lr": 0.00883112633044413,
"loss": 0.0009521713363938034,
"test_loss": 0.000354320858605206
},
{
"iter": 636000,
"lr": 0.008788196382957258,
"loss": 0.0003043506876565516,
"test_loss": 7.10361564415507e-05
},
{
"iter": 637000,
"lr": 0.008745327772931587,
"loss": 0.000953107897657901,
"test_loss": 9.117537410929799e-05
},
{
"iter": 638000,
"lr": 0.008702520923632282,
"loss": 9.412868530489504e-05,
"test_loss": 0.0004087283159606159
},
{
"iter": 639000,
"lr": 0.008659776257714708,
"loss": 0.0006191434222273529,
"test_loss": 0.0011739606270566583
},
{
"iter": 640000,
"lr": 0.008617094197220261,
"loss": 0.00046630934230051935,
"test_loss": 6.900281005073339e-05
},
{
"iter": 641000,
"lr": 0.0085744751635722,
"loss": 0.0002344609092688188,
"test_loss": 0.0001870036358013749
},
{
"iter": 642000,
"lr": 0.008531919577571483,
"loss": 7.535194890806451e-05,
"test_loss": 0.0014849761500954628
},
{
"iter": 643000,
"lr": 0.008489427859392617,
"loss": 0.0002256140433019027,
"test_loss": 0.0008647762006148696
},
{
"iter": 644000,
"lr": 0.008447000428579507,
"loss": 0.00045717298053205013,
"test_loss": 0.00023732254339847714
},
{
"iter": 645000,
"lr": 0.008404637704041313,
"loss": 0.00016825359489303082,
"test_loss": 0.00043780734995380044
},
{
"iter": 646000,
"lr": 0.008362340104048313,
"loss": 7.72785278968513e-05,
"test_loss": 0.0001533004833618179
},
{
"iter": 647000,
"lr": 0.008320108046227778,
"loss": 0.0005080492701381445,
"test_loss": 0.00010740502330008894
},
{
"iter": 648000,
"lr": 0.008277941947559845,
"loss": 0.001218202756717801,
"test_loss": 0.000172010826645419
},
{
"iter": 649000,
"lr": 0.008235842224373398,
"loss": 0.0007862054626457393,
"test_loss": 0.0010570450685918331
},
{
"iter": 650000,
"lr": 0.008193809292341963,
"loss": 0.0004157691146247089,
"test_loss": 0.00010228406608803198
},
{
"iter": 651000,
"lr": 0.008151843566479597,
"loss": 0.00012982070620637387,
"test_loss": 7.736915904388297e-06
},
{
"iter": 652000,
"lr": 0.008109945461136803,
"loss": 0.00047562882537022233,
"test_loss": 0.00024827325250953436
},
{
"iter": 653000,
"lr": 0.00806811538999641,
"loss": 9.72490306594409e-05,
"test_loss": 0.0008120188722386956
},
{
"iter": 654000,
"lr": 0.008026353766069524,
"loss": 0.0002877913066186011,
"test_loss": 0.0010482347570359707
},
{
"iter": 655000,
"lr": 0.007984661001691432,
"loss": 0.000712985813152045,
"test_loss": 0.00013668768224306405
},
{
"iter": 656000,
"lr": 0.007943037508517534,
"loss": 0.002328993286937475,
"test_loss": 0.0021568811498582363
},
{
"iter": 657000,
"lr": 0.007901483697519274,
"loss": 0.00014240664313547313,
"test_loss": 0.00020754309662152082
},
{
"iter": 658000,
"lr": 0.00785999997898009,
"loss": 0.000636913173366338,
"test_loss": 6.605694943573326e-05
},
{
"iter": 659000,
"lr": 0.00781858676249135,
"loss": 0.018876513466238976,
"test_loss": 0.018992874771356583
},
{
"iter": 660000,
"lr": 0.007777244456948329,
"loss": 0.00015534149133600295,
"test_loss": 8.493806672049686e-05
},
{
"iter": 661000,
"lr": 0.007735973470546151,
"loss": 0.001094334525987506,
"test_loss": 0.00014982414722908288
},
{
"iter": 662000,
"lr": 0.007694774210775771,
"loss": 5.4884982091607526e-05,
"test_loss": 0.002017006743699312
},
{
"iter": 663000,
"lr": 0.007653647084419946,
"loss": 0.0005890895845368505,
"test_loss": 8.296010491903871e-05
},
{
"iter": 664000,
"lr": 0.007612592497549223,
"loss": 0.0004882353823632002,
"test_loss": 0.0002981507277581841
},
{
"iter": 665000,
"lr": 0.007571610855517924,
"loss": 0.0011987258912995458,
"test_loss": 7.434636063408107e-05
},
{
"iter": 666000,
"lr": 0.007530702562960149,
"loss": 0.002394667826592922,
"test_loss": 0.0011622675228863955
},
{
"iter": 667000,
"lr": 0.0074898680237857765,
"loss": 0.0005991871003061533,
"test_loss": 0.00038514871266670525
},
{
"iter": 668000,
"lr": 0.00744910764117648,
"loss": 0.013577697798609734,
"test_loss": 0.013052081689238548
},
{
"iter": 669000,
"lr": 0.007408421817581744,
"loss": 0.0010074659949168563,
"test_loss": 0.001454031909815967
},
{
"iter": 670000,
"lr": 0.0073678109547148886,
"loss": 0.0020081778056919575,
"test_loss": 0.001295184949412942
},
{
"iter": 671000,
"lr": 0.007327275453549112,
"loss": 0.0017324460204690695,
"test_loss": 0.00046670984011143446
},
{
"iter": 672000,
"lr": 0.007286815714313518,
"loss": 0.0007549117435701191,
"test_loss": 0.00044920400250703096
},
{
"iter": 673000,
"lr": 0.007246432136489179,
"loss": 0.0011420168448239565,
"test_loss": 0.0003282500256318599
},
{
"iter": 674000,
"lr": 0.007206125118805176,
"loss": 0.0005538839031942189,
"test_loss": 0.0018635225715115666
},
{
"iter": 675000,
"lr": 0.007165895059234675,
"loss": 0.0005427796859294176,
"test_loss": 0.0006577699678018689
},
{
"iter": 676000,
"lr": 0.007125742354990993,
"loss": 0.00030612098635174334,
"test_loss": 0.0008050508913584054
},
{
"iter": 677000,
"lr": 0.007085667402523675,
"loss": 0.00044765332131646574,
"test_loss": 0.001523069222457707
},
{
"iter": 678000,
"lr": 0.007045670597514577,
"loss": 0.0005792126758024096,
"test_loss": 0.0019303439185023308
},
{
"iter": 679000,
"lr": 0.0070057523348739685,
"loss": 0.0005485191941261292,
"test_loss": 0.0006543839699588716
},
{
"iter": 680000,
"lr": 0.00696591300873662,
"loss": 0.000358588615199551,
"test_loss": 0.00041224728920497
},
{
"iter": 681000,
"lr": 0.006926153012457927,
"loss": 0.00036718026967719197,
"test_loss": 0.0006798094254918396
},
{
"iter": 682000,
"lr": 0.006886472738610012,
"loss": 0.0003204848326276988,
"test_loss": 0.00017404546088073403
},
{
"iter": 683000,
"lr": 0.006846872578977857,
"loss": 0.0008089168695732951,
"test_loss": 0.00010651150660123676
},
{
"iter": 684000,
"lr": 0.006807352924555434,
"loss": 0.0006770688341930509,
"test_loss": 0.00029859121423214674
},
{
"iter": 685000,
"lr": 0.006767914165541838,
"loss": 0.000999291194602847,
"test_loss": 0.002608596347272396
},
{
"iter": 686000,
"lr": 0.006728556691337444,
"loss": 0.0001479576458223164,
"test_loss": 0.0008598893182352185
},
{
"iter": 687000,
"lr": 0.006689280890540057,
"loss": 0.00250047305598855,
"test_loss": 9.035238326760009e-05
},
{
"iter": 688000,
"lr": 0.006650087150941081,
"loss": 0.0006713169859722257,
"test_loss": 0.0009461415465921164
},
{
"iter": 689000,
"lr": 0.006610975859521669,
"loss": 0.0002004460693569854,
"test_loss": 0.0003148822288494557
},
{
"iter": 690000,
"lr": 0.0065719474024489325,
"loss": 0.0002764951204881072,
"test_loss": 4.1546838474459946e-05
},
{
"iter": 691000,
"lr": 0.006533002165072111,
"loss": 0.00027048116317018867,
"test_loss": 0.00039523636223748326
},
{
"iter": 692000,
"lr": 0.006494140531918773,
"loss": 0.0003055687411688268,
"test_loss": 0.00031629251316189766
},
{
"iter": 693000,
"lr": 0.00645536288669101,
"loss": 0.0008974722004495561,
"test_loss": 4.016832463094033e-05
},
{
"iter": 694000,
"lr": 0.006416669612261663,
"loss": 0.0006815840606577694,
"test_loss": 0.005000988487154245
},
{
"iter": 695000,
"lr": 0.006378061090670526,
"loss": 0.0007683028234168887,
"test_loss": 0.0004241243004798889
},
{
"iter": 696000,
"lr": 0.006339537703120588,
"loss": 0.0002078249235637486,
"test_loss": 0.0001756464334903285
},
{
"iter": 697000,
"lr": 0.006301099829974262,
"loss": 0.00035508774453774095,
"test_loss": 0.00019619052181951702
},
{
"iter": 698000,
"lr": 0.006262747850749628,
"loss": 0.0004675464006140828,
"test_loss": 0.00051696109585464
},
{
"iter": 699000,
"lr": 0.00622448214411669,
"loss": 0.0007464250084012747,
"test_loss": 0.0012356519000604749
},
{
"iter": 700000,
"lr": 0.006186303087893644,
"loss": 0.0003026399062946439,
"test_loss": 0.00042836545617319643
},
{
"iter": 701000,
"lr": 0.00614821105904312,
"loss": 4.703604645328596e-05,
"test_loss": 0.0022145211696624756
},
{
"iter": 702000,
"lr": 0.006110206433668494,
"loss": 0.00041446040268056095,
"test_loss": 0.00029782368801534176
},
{
"iter": 703000,
"lr": 0.006072289587010157,
"loss": 0.00013254470832180232,
"test_loss": 0.0005287069361656904
},
{
"iter": 704000,
"lr": 0.006034460893441813,
"loss": 0.0012548124650493264,
"test_loss": 8.99676961125806e-05
},
{
"iter": 705000,
"lr": 0.005996720726466783,
"loss": 0.00034251948818564415,
"test_loss": 0.0001108428041334264
},
{
"iter": 706000,
"lr": 0.005959069458714312,
"loss": 0.0008773178560659289,
"test_loss": 8.607211202615872e-05
},
{
"iter": 707000,
"lr": 0.0059215074619359,
"loss": 0.00028212033794261515,
"test_loss": 0.0009132612030953169
},
{
"iter": 708000,
"lr": 0.005884035107001625,
"loss": 0.0003156496968585998,
"test_loss": 7.403876224998385e-05
},
{
"iter": 709000,
"lr": 0.005846652763896478,
"loss": 0.00043570122215896845,
"test_loss": 0.00094130594516173
},
{
"iter": 710000,
"lr": 0.0058093608017167194,
"loss": 0.0005302815698087215,
"test_loss": 0.0025161111261695623
},
{
"iter": 711000,
"lr": 0.0057721595886662275,
"loss": 0.0009098786395043135,
"test_loss": 0.0008282344788312912
},
{
"iter": 712000,
"lr": 0.005735049492052863,
"loss": 0.0012772809714078903,
"test_loss": 0.000279176514595747
},
{
"iter": 713000,
"lr": 0.005698030878284847,
"loss": 0.00033539149444550276,
"test_loss": 0.0009443502058275044
},
{
"iter": 714000,
"lr": 0.005661104112867139,
"loss": 0.00030596807482652366,
"test_loss": 0.0006685437401756644
},
{
"iter": 715000,
"lr": 0.005624269560397833,
"loss": 0.00015325126878451556,
"test_loss": 0.00040271395118907094
},
{
"iter": 716000,
"lr": 0.005587527584564549,
"loss": 9.53778435359709e-05,
"test_loss": 0.0007819866295903921
},
{
"iter": 717000,
"lr": 0.005550878548140849,
"loss": 0.0013228713069111109,
"test_loss": 0.00043525395449250937
},
{
"iter": 718000,
"lr": 0.005514322812982656,
"loss": 0.00047959655057638884,
"test_loss": 0.0004038755432702601
},
{
"iter": 719000,
"lr": 0.005477860740024678,
"loss": 0.0006594113074243069,
"test_loss": 0.001303842756897211
},
{
"iter": 720000,
"lr": 0.005441492689276842,
"loss": 0.00011169565550517291,
"test_loss": 0.0036835926584899426
},
{
"iter": 721000,
"lr": 0.005405219019820747,
"loss": 0.0011432378087192774,
"test_loss": 0.0017841916996985674
},
{
"iter": 722000,
"lr": 0.00536904008980611,
"loss": 0.0006839287816546857,
"test_loss": 5.892757690162398e-05
},
{
"iter": 723000,
"lr": 0.005332956256447235,
"loss": 0.00028997764457017183,
"test_loss": 0.0005914493231102824
},
{
"iter": 724000,
"lr": 0.0052969678760194875,
"loss": 0.00019233681086916476,
"test_loss": 0.00025373350945301354
},
{
"iter": 725000,
"lr": 0.005261075303855772,
"loss": 0.00032090063905343413,
"test_loss": 0.00039198691956698895
},
{
"iter": 726000,
"lr": 0.005225278894343024,
"loss": 0.00023240596055984497,
"test_loss": 0.0010119992075487971
},
{
"iter": 727000,
"lr": 0.005189579000918714,
"loss": 0.0002789186255540699,
"test_loss": 0.00013308043708093464
},
{
"iter": 728000,
"lr": 0.0051539759760673605,
"loss": 0.00023468321887776256,
"test_loss": 0.00027097263955511153
},
{
"iter": 729000,
"lr": 0.0051184701713170395,
"loss": 0.0007189432508312166,
"test_loss": 8.151790825650096e-05
},
{
"iter": 730000,
"lr": 0.005083061937235923,
"loss": 3.444700632826425e-05,
"test_loss": 0.00029171566711738706
},
{
"iter": 731000,
"lr": 0.005047751623428816,
"loss": 0.0002939694677479565,
"test_loss": 0.00013575618504546583
},
{
"iter": 732000,
"lr": 0.0050125395785337,
"loss": 0.00030716467881575227,
"test_loss": 0.00032672579982317984
},
{
"iter": 733000,
"lr": 0.004977426150218296,
"loss": 9.459215652896091e-05,
"test_loss": 0.00012511668319348246
},
{
"iter": 734000,
"lr": 0.004942411685176629,
"loss": 3.510117676341906e-05,
"test_loss": 0.0005697406595572829
},
{
"iter": 735000,
"lr": 0.004907496529125605,
"loss": 0.0003277510404586792,
"test_loss": 0.00029067799914628267
},
{
"iter": 736000,
"lr": 0.004872681026801602,
"loss": 0.001335246954113245,
"test_loss": 0.00017261027824133635
},
{
"iter": 737000,
"lr": 0.004837965521957057,
"loss": 0.00021075968106742948,
"test_loss": 0.0003607178514357656
},
{
"iter": 738000,
"lr": 0.004803350357357079,
"loss": 0.0003023139724973589,
"test_loss": 9.95629743556492e-05
},
{
"iter": 739000,
"lr": 0.004768835874776071,
"loss": 0.000234548730077222,
"test_loss": 1.7148289771284908e-05
},
{
"iter": 740000,
"lr": 0.00473442241499433,
"loss": 0.0006361486739479005,
"test_loss": 0.000685411156155169
},
{
"iter": 741000,
"lr": 0.004700110317794714,
"loss": 0.0004211427003610879,
"test_loss": 8.993875235319138e-05
},
{
"iter": 742000,
"lr": 0.004665899921959271,
"loss": 3.0771254387218505e-05,
"test_loss": 0.00030732559389434755
},
{
"iter": 743000,
"lr": 0.004631791565265894,
"loss": 0.00024712245794944465,
"test_loss": 0.00012730207527056336
},
{
"iter": 744000,
"lr": 0.004597785584484984,
"loss": 0.0003255722695030272,
"test_loss": 8.118983532767743e-05
},
{
"iter": 745000,
"lr": 0.004563882315376139,
"loss": 8.785341924522072e-05,
"test_loss": 0.0016193846240639687
},
{
"iter": 746000,
"lr": 0.0045300820926848185,
"loss": 0.00024154374841600657,
"test_loss": 0.0005729191470891237
},
{
"iter": 747000,
"lr": 0.004496385250139053,
"loss": 0.0016036672750487924,
"test_loss": 6.0443249822128564e-05
},
{
"iter": 748000,
"lr": 0.004462792120446149,
"loss": 0.00038341747131198645,
"test_loss": 3.324146382510662e-05
},
{
"iter": 749000,
"lr": 0.004429303035289386,
"loss": 0.0012969729723408818,
"test_loss": 8.851135498844087e-05
},
{
"iter": 750000,
"lr": 0.0043959183253247675,
"loss": 0.0001292884990107268,
"test_loss": 4.940944199915975e-05
},
{
"iter": 751000,
"lr": 0.004362638320177739,
"loss": 0.00013666824088431895,
"test_loss": 3.109317185590044e-05
},
{
"iter": 752000,
"lr": 0.00432946334843994,
"loss": 0.000945383682847023,
"test_loss": 0.000647810404188931
},
{
"iter": 753000,
"lr": 0.004296393737665955,
"loss": 0.00022100156638771296,
"test_loss": 0.00013249123003333807
},
{
"iter": 754000,
"lr": 0.004263429814370087,
"loss": 0.0003365427255630493,
"test_loss": 4.934730168315582e-05
},
{
"iter": 755000,
"lr": 0.004230571904023125,
"loss": 0.00036613247357308865,
"test_loss": 0.0031186738051474094
},
{
"iter": 756000,
"lr": 0.004197820331049135,
"loss": 0.00020041156676597893,
"test_loss": 0.0003211932780686766
},
{
"iter": 757000,
"lr": 0.004165175418822256,
"loss": 0.0014086413430050015,
"test_loss": 0.00025882862973958254
},
{
"iter": 758000,
"lr": 0.004132637489663509,
"loss": 0.0003959703026339412,
"test_loss": 0.0003597394097596407
},
{
"iter": 759000,
"lr": 0.004100206864837612,
"loss": 0.00016228266758844256,
"test_loss": 0.0008841356611810625
},
{
"iter": 760000,
"lr": 0.0040678838645498054,
"loss": 0.0003754801582545042,
"test_loss": 0.0004331124946475029
},
{
"iter": 761000,
"lr": 0.004035668807942701,
"loss": 6.874233076814562e-05,
"test_loss": 0.00014139863196760416
},
{
"iter": 762000,
"lr": 0.0040035620130931164,
"loss": 0.0014717577723786235,
"test_loss": 7.96977928985143e-06
},
{
"iter": 763000,
"lr": 0.0039715637970089476,
"loss": 0.0005845490377396345,
"test_loss": 0.00012191086716484278
},
{
"iter": 764000,
"lr": 0.003939674475626029,
"loss": 0.0003126713272649795,
"test_loss": 0.0001681185094639659
},
{
"iter": 765000,
"lr": 0.003907894363805021,
"loss": 0.0011262851767241955,
"test_loss": 7.983873365446925e-05
},
{
"iter": 766000,
"lr": 0.003876223775328296,
"loss": 0.00021683804516214877,
"test_loss": 2.9906490453868173e-05
},
{
"iter": 767000,
"lr": 0.003844663022896845,
"loss": 0.0005589034408330917,
"test_loss": 0.0006298614316619933
},
{
"iter": 768000,
"lr": 0.003813212418127187,
"loss": 0.0002333608572371304,
"test_loss": 0.0004918933846056461
},
{
"iter": 769000,
"lr": 0.0037818722715482933,
"loss": 0.0003828414482995868,
"test_loss": 0.001677652820944786
},
{
"iter": 770000,
"lr": 0.0037506428925985213,
"loss": 0.0003410539939068258,
"test_loss": 9.751989273354411e-05
},
{
"iter": 771000,
"lr": 0.003719524589622557,
"loss": 4.785457713296637e-05,
"test_loss": 6.687653512926772e-05
},
{
"iter": 772000,
"lr": 0.0036885176698683774,
"loss": 5.114313171361573e-05,
"test_loss": 4.5651082473341376e-05
},
{
"iter": 773000,
"lr": 0.0036576224394842074,
"loss": 0.00016491388669237494,
"test_loss": 0.0003995895094703883
},
{
"iter": 774000,
"lr": 0.003626839203515503,
"loss": 0.00016464140207972378,
"test_loss": 0.00047633241047151387
},
{
"iter": 775000,
"lr": 0.003596168265901942,
"loss": 0.00013418863818515092,
"test_loss": 4.681738209910691e-05
},
{
"iter": 776000,
"lr": 0.003565609929474414,
"loss": 0.0006716088973917067,
"test_loss": 0.00017610503709875047
},
{
"iter": 777000,
"lr": 0.00353516449595204,
"loss": 0.0002365962864132598,
"test_loss": 3.8804166251793504e-05
},
{
"iter": 778000,
"lr": 0.0035048322659391846,
"loss": 0.00029646483017131686,
"test_loss": 0.0005965767777524889
},
{
"iter": 779000,
"lr": 0.0034746135389224987,
"loss": 0.00011969543993473053,
"test_loss": 6.227897392818704e-05
},
{
"iter": 780000,
"lr": 0.0034445086132679483,
"loss": 4.0311977500095963e-05,
"test_loss": 4.282890586182475e-05
},
{
"iter": 781000,
"lr": 0.003414517786217885,
"loss": 5.338907067198306e-05,
"test_loss": 0.0002733458823058754
},
{
"iter": 782000,
"lr": 0.0033846413538880945,
"loss": 0.00010520615614950657,
"test_loss": 1.8110411474481225e-05
},
{
"iter": 783000,
"lr": 0.0033548796112648866,
"loss": 0.0002137995616067201,
"test_loss": 0.0004651027265936136
},
{
"iter": 784000,
"lr": 0.0033252328522021765,
"loss": 0.00030850665643811226,
"test_loss": 8.391511801164597e-05
},
{
"iter": 785000,
"lr": 0.0032957013694185806,
"loss": 0.0003874555986840278,
"test_loss": 0.0001889062114059925
},
{
"iter": 786000,
"lr": 0.003266285454494533,
"loss": 0.0005587927298620343,
"test_loss": 4.337891732575372e-05
},
{
"iter": 787000,
"lr": 0.003236985397869404,
"loss": 0.00035468488931655884,
"test_loss": 0.00046475647832266986
},
{
"iter": 788000,
"lr": 0.003207801488838633,
"loss": 3.681732414406724e-05,
"test_loss": 2.351371949771419e-05
},
{
"iter": 789000,
"lr": 0.0031787340155508582,
"loss": 0.0013139687944203615,
"test_loss": 2.3141228666645475e-05
},
{
"iter": 790000,
"lr": 0.003149783265005099,
"loss": 0.0007538029458373785,
"test_loss": 0.0005501474952325225
},
{
"iter": 791000,
"lr": 0.003120949523047905,
"loss": 0.00017734929861035198,
"test_loss": 0.0003675412735901773
},
{
"iter": 792000,
"lr": 0.0030922330743705304,
"loss": 0.00020882046374026686,
"test_loss": 0.0009912648238241673
},
{
"iter": 793000,
"lr": 0.0030636342025061325,
"loss": 5.890374450245872e-05,
"test_loss": 0.0011899934615939856
},
{
"iter": 794000,
"lr": 0.0030351531898269706,
"loss": 4.894568701274693e-05,
"test_loss": 0.0005241618491709232
},
{
"iter": 795000,
"lr": 0.0030067903175416124,
"loss": 0.0018501813756302,
"test_loss": 0.00018937885761260986
},
{
"iter": 796000,
"lr": 0.0029785458656921607,
"loss": 3.880121948895976e-05,
"test_loss": 0.0002543677401263267
},
{
"iter": 797000,
"lr": 0.002950420113151492,
"loss": 5.280700861476362e-05,
"test_loss": 7.015364826656878e-05
},
{
"iter": 798000,
"lr": 0.0029224133376204997,
"loss": 0.00046325253788381815,
"test_loss": 3.1149575079325587e-05
},
{
"iter": 799000,
"lr": 0.0028945258156253483,
"loss": 8.62869419506751e-05,
"test_loss": 2.1589947209577076e-05
},
{
"iter": 800000,
"lr": 0.002866757822514749,
"loss": 0.00027410752954892814,
"test_loss": 0.00010998256038874388
},
{
"iter": 801000,
"lr": 0.0028391096324572435,
"loss": 2.120648423442617e-05,
"test_loss": 4.991244350094348e-05
},
{
"iter": 802000,
"lr": 0.00281158151843849,
"loss": 7.631343032699078e-05,
"test_loss": 7.268734771059826e-05
},
{
"iter": 803000,
"lr": 0.0027841737522585623,
"loss": 0.0006091410759836435,
"test_loss": 0.0009268511203117669
},
{
"iter": 804000,
"lr": 0.0027568866045292848,
"loss": 2.3472985049011186e-05,
"test_loss": 2.365170803386718e-05
},
{
"iter": 805000,
"lr": 0.002729720344671547,
"loss": 0.0003594857989810407,
"test_loss": 0.00020125643641222268
},
{
"iter": 806000,
"lr": 0.0027026752409126473,
"loss": 0.009193153120577335,
"test_loss": 0.0006944616325199604
},
{
"iter": 807000,
"lr": 0.0026757515602836416,
"loss": 0.00025091992574743927,
"test_loss": 0.00018026397447101772
},
{
"iter": 808000,
"lr": 0.002648949568616711,
"loss": 8.148832421284169e-05,
"test_loss": 1.5608680769219063e-05
},
{
"iter": 809000,
"lr": 0.0026222695305425335,
"loss": 0.00013469471014104784,
"test_loss": 0.001521756174042821
},
{
"iter": 810000,
"lr": 0.002595711709487676,
"loss": 0.0005708974786102772,
"test_loss": 0.00019854224228765815
},
{
"iter": 811000,
"lr": 0.0025692763676719863,
"loss": 0.00023888761643320322,
"test_loss": 4.6917932195356116e-05
},
{
"iter": 812000,
"lr": 0.0025429637661060094,
"loss": 0.00028354045934975147,
"test_loss": 8.254782005678862e-05
},
{
"iter": 813000,
"lr": 0.002516774164588409,
"loss": 0.000508604571223259,
"test_loss": 7.501007348764688e-05
},
{
"iter": 814000,
"lr": 0.0024907078217034015,
"loss": 3.240957448724657e-05,
"test_loss": 2.0139301341259852e-05
},
{
"iter": 815000,
"lr": 0.002464764994818206,
"loss": 7.75083972257562e-05,
"test_loss": 2.4329365260200575e-05
},
{
"iter": 816000,
"lr": 0.0024389459400804975,
"loss": 2.5860583264147863e-05,
"test_loss": 1.0080298125103582e-05
},
{
"iter": 817000,
"lr": 0.0024132509124158833,
"loss": 9.857260738499463e-05,
"test_loss": 0.00104460958391428
},
{
"iter": 818000,
"lr": 0.002387680165525383,
"loss": 0.0003853709786199033,
"test_loss": 0.0003412032383494079
},
{
"iter": 819000,
"lr": 0.0023622339518829263,
"loss": 0.0008270180551335216,
"test_loss": 7.953643944347277e-05
},
{
"iter": 820000,
"lr": 0.0023369125227328522,
"loss": 0.0004488629347179085,
"test_loss": 0.000880400009918958
},
{
"iter": 821000,
"lr": 0.0023117161280874422,
"loss": 0.0001996172359213233,
"test_loss": 0.00013713251973968
},
{
"iter": 822000,
"lr": 0.0022866450167244395,
"loss": 1.896937465062365e-05,
"test_loss": 7.428220851579681e-05
},
{
"iter": 823000,
"lr": 0.002261699436184597,
"loss": 0.00013456163287628442,
"test_loss": 0.00029024758259765804
},
{
"iter": 824000,
"lr": 0.002236879632769234,
"loss": 0.0004284908645786345,
"test_loss": 6.611862045247108e-05
},
{
"iter": 825000,
"lr": 0.002212185851537805,
"loss": 1.1459032066341024e-05,
"test_loss": 0.0003108781238552183
},
{
"iter": 826000,
"lr": 0.002187618336305478,
"loss": 0.00037317111855372787,
"test_loss": 5.880569005967118e-06
},
{
"iter": 827000,
"lr": 0.0021631773296407284,
"loss": 0.00032713141990825534,
"test_loss": 1.9254655853728764e-05
},
{
"iter": 828000,
"lr": 0.0021388630728629396,
"loss": 0.0005525414599105716,
"test_loss": 0.000852710974868387
},
{
"iter": 829000,
"lr": 0.00211467580604003,
"loss": 0.0003025742480531335,
"test_loss": 4.266275482223136e-06
},
{
"iter": 830000,
"lr": 0.0020906157679860733,
"loss": 0.00014817573537584394,
"test_loss": 0.000290561409201473
},
{
"iter": 831000,
"lr": 0.0020666831962589467,
"loss": 0.00029073780751787126,
"test_loss": 3.791091148741543e-05
},
{
"iter": 832000,
"lr": 0.0020428783271579792,
"loss": 5.9674006479326636e-05,
"test_loss": 3.781837222049944e-05
},
{
"iter": 833000,
"lr": 0.002019201395721627,
"loss": 0.0001753699907567352,
"test_loss": 0.0004482464864850044
},
{
"iter": 834000,
"lr": 0.0019956526357251415,
"loss": 5.6943237723317e-05,
"test_loss": 0.00015464822354260832
},
{
"iter": 835000,
"lr": 0.0019722322796782753,
"loss": 4.277301923139021e-05,
"test_loss": 0.0001293517416343093
},
{
"iter": 836000,
"lr": 0.0019489405588229754,
"loss": 0.0006003423477523029,
"test_loss": 0.00025099271442741156
},
{
"iter": 837000,
"lr": 0.0019257777031310974,
"loss": 0.00028466215007938445,
"test_loss": 4.738118150271475e-05
},
{
"iter": 838000,
"lr": 0.0019027439413021497,
"loss": 0.00013970420695841312,
"test_loss": 0.0002945093729067594
},
{
"iter": 839000,
"lr": 0.0018798395007610235,
"loss": 3.3790340239647776e-05,
"test_loss": 4.484365854295902e-05
},
{
"iter": 840000,
"lr": 0.001857064607655748,
"loss": 3.1816169212106615e-05,
"test_loss": 2.9099588573444635e-05
},
{
"iter": 841000,
"lr": 0.0018344194868552654,
"loss": 3.3000458643073216e-05,
"test_loss": 6.595349077542778e-06
},
{
"iter": 842000,
"lr": 0.001811904361947201,
"loss": 0.00027465858147479594,
"test_loss": 1.0659949111868627e-05
},
{
"iter": 843000,
"lr": 0.0017895194552356572,
"loss": 3.514915442792699e-05,
"test_loss": 2.9089815143379383e-05
},
{
"iter": 844000,
"lr": 0.001767264987739029,
"loss": 0.0005240679020062089,
"test_loss": 1.8339917005505413e-05
},
{
"iter": 845000,
"lr": 0.0017451411791878065,
"loss": 0.0002651929680723697,
"test_loss": 0.00020296570437494665
},
{
"iter": 846000,
"lr": 0.0017231482480224182,
"loss": 1.0721685612224974e-05,
"test_loss": 6.359841790981591e-05
},
{
"iter": 847000,
"lr": 0.001701286411391064,
"loss": 6.2940634961705655e-06,
"test_loss": 6.991222107899375e-06
},
{
"iter": 848000,
"lr": 0.0016795558851475777,
"loss": 8.735109440749511e-05,
"test_loss": 0.0006877071573399007
},
{
"iter": 849000,
"lr": 0.0016579568838492984,
"loss": 1.6430862160632387e-05,
"test_loss": 8.976415119832382e-05
},
{
"iter": 850000,
"lr": 0.0016364896207549404,
"loss": 0.0003578809555619955,
"test_loss": 4.800086117029423e-06
},
{
"iter": 851000,
"lr": 0.0016151543078225005,
"loss": 0.00047125632409006357,
"test_loss": 0.00010609527816995978
},
{
"iter": 852000,
"lr": 0.0015939511557071559,
"loss": 2.165045589208603e-05,
"test_loss": 8.746737876208499e-06
},
{
"iter": 853000,
"lr": 0.001572880373759191,
"loss": 0.0011302112834528089,
"test_loss": 4.703798822447425e-06
},
{
"iter": 854000,
"lr": 0.0015519421700219249,
"loss": 8.221966709243134e-05,
"test_loss": 2.402101017651148e-05
},
{
"iter": 855000,
"lr": 0.0015311367512296603,
"loss": 6.909555668244138e-05,
"test_loss": 5.137875268701464e-05
},
{
"iter": 856000,
"lr": 0.0015104643228056438,
"loss": 8.623114990768954e-05,
"test_loss": 7.059338531689718e-05
},
{
"iter": 857000,
"lr": 0.0014899250888600335,
"loss": 0.00018331459432374686,
"test_loss": 0.00021130547975189984
},
{
"iter": 858000,
"lr": 0.0014695192521878896,
"loss": 2.208674413850531e-05,
"test_loss": 4.7459757297474425e-06
},
{
"iter": 859000,
"lr": 0.0014492470142671583,
"loss": 4.464257654035464e-05,
"test_loss": 4.156459908699617e-06
},
{
"iter": 860000,
"lr": 0.0014291085752567013,
"loss": 0.00012647236871998757,
"test_loss": 1.270379561901791e-05
},
{
"iter": 861000,
"lr": 0.0014091041339943083,
"loss": 1.5184614312602207e-05,
"test_loss": 1.725301808619406e-05
},
{
"iter": 862000,
"lr": 0.0013892338879947395,
"loss": 0.0002790640573948622,
"test_loss": 0.000454367371276021
},
{
"iter": 863000,
"lr": 0.0013694980334477656,
"loss": 4.954707401338965e-05,
"test_loss": 7.141205514926696e-06
},
{
"iter": 864000,
"lr": 0.0013498967652162438,
"loss": 0.0001272451045224443,
"test_loss": 0.00024000742996577173
},
{
"iter": 865000,
"lr": 0.0013304302768341793,
"loss": 1.345604960079072e-05,
"test_loss": 0.00028391738305799663
},
{
"iter": 866000,
"lr": 0.001311098760504832,
"loss": 2.108882472384721e-05,
"test_loss": 1.2611117199412547e-05
},
{
"iter": 867000,
"lr": 0.0012919024070988017,
"loss": 3.0207815143512562e-05,
"test_loss": 1.4785734492761549e-05
},
{
"iter": 868000,
"lr": 0.0012728414061521536,
"loss": 0.0003364590520504862,
"test_loss": 1.116009570978349e-05
},
{
"iter": 869000,
"lr": 0.0012539159458645436,
"loss": 2.2847414584248327e-05,
"test_loss": 3.099195600952953e-05
},
{
"iter": 870000,
"lr": 0.0012351262130973625,
"loss": 4.173811248620041e-05,
"test_loss": 5.257342127151787e-05
},
{
"iter": 871000,
"lr": 0.0012164723933718875,
"loss": 0.00012329079618211836,
"test_loss": 5.137546395417303e-06
},
{
"iter": 872000,
"lr": 0.0011979546708674512,
"loss": 1.4191511581884697e-05,
"test_loss": 0.0008924142457544804
},
{
"iter": 873000,
"lr": 0.001179573228419629,
"loss": 8.65324091137154e-06,
"test_loss": 1.5654064554837532e-05
},
{
"iter": 874000,
"lr": 0.0011613282475184225,
"loss": 1.581216201884672e-05,
"test_loss": 7.2268662734131794e-06
},
{
"iter": 875000,
"lr": 0.0011432199083064778,
"loss": 0.0005633010296151042,
"test_loss": 5.085852080810582e-06
},
{
"iter": 876000,
"lr": 0.0011252483895773052,
"loss": 0.00011907926818821579,
"test_loss": 1.649415207793936e-05
},
{
"iter": 877000,
"lr": 0.0011074138687735054,
"loss": 7.952123996801674e-05,
"test_loss": 1.5155103028519079e-05
},
{
"iter": 878000,
"lr": 0.00108971652198503,
"loss": 5.916960617469158e-06,
"test_loss": 2.5194585759891197e-05
},
{
"iter": 879000,
"lr": 0.0010721565239474322,
"loss": 5.152490484761074e-05,
"test_loss": 1.0781694072647952e-05
},
{
"iter": 880000,
"lr": 0.0010547340480401503,
"loss": 6.890996883157641e-05,
"test_loss": 0.0004860750923398882
},
{
"iter": 881000,
"lr": 0.0010374492662847876,
"loss": 5.443764530355111e-05,
"test_loss": 0.0005180255393497646
},
{
"iter": 882000,
"lr": 0.0010203023493434219,
"loss": 1.0066329195979051e-05,
"test_loss": 3.512095645419322e-05
},
{
"iter": 883000,
"lr": 0.0010032934665169114,
"loss": 6.574297731276602e-05,
"test_loss": 0.00018978955631610006
},
{
"iter": 884000,
"lr": 0.0009864227857432372,
"loss": 4.9753864004742354e-05,
"test_loss": 1.3553080862038769e-05
},
{
"iter": 885000,
"lr": 0.0009696904735958241,
"loss": 4.891739990853239e-06,
"test_loss": 1.5957295545376837e-05
},
{
"iter": 886000,
"lr": 0.0009530966952819148,
"loss": 3.5550408938433975e-05,
"test_loss": 0.00014296772133093327
},
{
"iter": 887000,
"lr": 0.0009366416146409324,
"loss": 0.00018393978825770319,
"test_loss": 1.9510920537868515e-05
},
{
"iter": 888000,
"lr": 0.0009203253941428609,
"loss": 0.0006755493814125657,
"test_loss": 3.0341275305545423e-06
},
{
"iter": 889000,
"lr": 0.0009041481948866449,
"loss": 0.0004200747353024781,
"test_loss": 6.081018000259064e-05
},
{
"iter": 890000,
"lr": 0.0008881101765985913,
"loss": 0.0005278442986309528,
"test_loss": 6.723521073581651e-05
},
{
"iter": 891000,
"lr": 0.0008722114976308004,
"loss": 2.335923090868164e-05,
"test_loss": 4.614891440724023e-05
},
{
"iter": 892000,
"lr": 0.0008564523149596006,
"loss": 1.2066566341673024e-05,
"test_loss": 0.0005126264877617359
},
{
"iter": 893000,
"lr": 0.0008408327841839946,
"loss": 6.017923624312971e-06,
"test_loss": 4.03363628720399e-05
},
{
"iter": 894000,
"lr": 0.000825353059524129,
"loss": 0.0003033427055925131,
"test_loss": 1.6842457625898533e-05
},
{
"iter": 895000,
"lr": 0.0008100132938197644,
"loss": 1.5553920093225315e-05,
"test_loss": 1.5987581718945876e-05
},
{
"iter": 896000,
"lr": 0.0007948136385287738,
"loss": 0.0005272008129395545,
"test_loss": 0.00016645963478367776
},
{
"iter": 897000,
"lr": 0.000779754243725642,
"loss": 0.0002830813464242965,
"test_loss": 3.013761670445092e-06
},
{
"iter": 898000,
"lr": 0.0007648352580999858,
"loss": 8.423028339166194e-05,
"test_loss": 3.5929133446188644e-05
},
{
"iter": 899000,
"lr": 0.0007500568289550856,
"loss": 9.4511968200095e-05,
"test_loss": 0.0001721340959193185
},
{
"iter": 900000,
"lr": 0.0007354191022064297,
"loss": 1.1183694368810393e-05,
"test_loss": 0.0008018710650503635
},
{
"iter": 901000,
"lr": 0.0007209222223802793,
"loss": 4.57848836958874e-05,
"test_loss": 3.749586085177725e-06
},
{
"iter": 902000,
"lr": 0.0007065663326122326,
"loss": 6.750726697646314e-06,
"test_loss": 8.288851677207276e-05
},
{
"iter": 903000,
"lr": 0.0006923515746458161,
"loss": 0.00034657781361602247,
"test_loss": 3.340317789479741e-06
},
{
"iter": 904000,
"lr": 0.0006782780888310891,
"loss": 7.161756911955308e-06,
"test_loss": 1.7308414044236997e-06
},
{
"iter": 905000,
"lr": 0.0006643460141232501,
"loss": 4.136999632464722e-05,
"test_loss": 0.00010594076593406498
},
{
"iter": 906000,
"lr": 0.0006505554880812706,
"loss": 0.00025627820286899805,
"test_loss": 1.1893820555997081e-05
},
{
"iter": 907000,
"lr": 0.0006369066468665321,
"loss": 9.961667274183128e-06,
"test_loss": 0.00023488559236284345
},
{
"iter": 908000,
"lr": 0.0006233996252414899,
"loss": 0.00015723236720077693,
"test_loss": 4.733757577923825e-06
},
{
"iter": 909000,
"lr": 0.0006100345565683313,
"loss": 0.00033518910640850663,
"test_loss": 2.8449994715629146e-06
},
{
"iter": 910000,
"lr": 0.000596811572807668,
"loss": 2.0492127077886835e-05,
"test_loss": 2.274215148645453e-06
},
{
"iter": 911000,
"lr": 0.0005837308045172307,
"loss": 4.3859736251761205e-06,
"test_loss": 4.082681334693916e-05
},
{
"iter": 912000,
"lr": 0.0005707923808505752,
"loss": 0.000343496649293229,
"test_loss": 8.09923221822828e-05
},
{
"iter": 913000,
"lr": 0.0005579964295558151,
"loss": 4.502659976424184e-06,
"test_loss": 0.0006849374040029943
},
{
"iter": 914000,
"lr": 0.0005453430769743563,
"loss": 9.261580999009311e-06,
"test_loss": 1.3452558050630614e-05
},
{
"iter": 915000,
"lr": 0.0005328324480396492,
"loss": 1.7644626495894045e-05,
"test_loss": 0.0007716813706792891
},
{
"iter": 916000,
"lr": 0.0005204646662759524,
"loss": 5.989650617266307e-06,
"test_loss": 4.778150923812063e-06
},
{
"iter": 917000,
"lr": 0.0005082398537971191,
"loss": 6.039868458174169e-05,
"test_loss": 4.847549917030847e-06
},
{
"iter": 918000,
"lr": 0.0004961581313053927,
"loss": 8.25791503302753e-05,
"test_loss": 1.0734435818449128e-05
},
{
"iter": 919000,
"lr": 0.000484219618090205,
"loss": 0.0003194988239556551,
"test_loss": 8.774680281931069e-06
},
{
"iter": 920000,
"lr": 0.00047242443202700796,
"loss": 0.00022832464310340583,
"test_loss": 1.964176590263378e-05
},
{
"iter": 921000,
"lr": 0.0004607726895761045,
"loss": 0.00033203387283720076,
"test_loss": 4.22712582803797e-06
},
{
"iter": 922000,
"lr": 0.0004492645057815043,
"loss": 8.524995064362884e-05,
"test_loss": 0.0013903349172323942
},
{
"iter": 923000,
"lr": 0.000437899994269778,
"loss": 2.0461860913201235e-05,
"test_loss": 3.845985247608041e-06
},
{
"iter": 924000,
"lr": 0.0004266792672489469,
"loss": 5.635166235151701e-05,
"test_loss": 1.5701800293754786e-05
},
{
"iter": 925000,
"lr": 0.0004156024355073667,
"loss": 5.627243353956146e-06,
"test_loss": 0.0003363931318745017
},
{
"iter": 926000,
"lr": 0.0004046696084126388,
"loss": 6.8001972977072e-06,
"test_loss": 2.2508485926664434e-05
},
{
"iter": 927000,
"lr": 0.000393880893910526,
"loss": 0.0003149032418150455,
"test_loss": 3.1790641514817253e-06
},
{
"iter": 928000,
"lr": 0.00038323639852388844,
"loss": 0.00039288634434342384,
"test_loss": 4.5199394662631676e-06
},
{
"iter": 929000,
"lr": 0.0003727362273516361,
"loss": 8.490125765092671e-06,
"test_loss": 1.262229670828674e-05
},
{
"iter": 930000,
"lr": 0.00036238048406768316,
"loss": 5.076874913356733e-06,
"test_loss": 3.4755064461933216e-06
},
{
"iter": 931000,
"lr": 0.0003521692709199303,
"loss": 6.071407187846489e-05,
"test_loss": 1.5660383496651775e-06
},
{
"iter": 932000,
"lr": 0.000342102688729254,
"loss": 3.4121158023481257e-06,
"test_loss": 5.974631676508579e-06
},
{
"iter": 933000,
"lr": 0.0003321808368885074,
"loss": 9.25468611967517e-06,
"test_loss": 3.3887927202158608e-06
},
{
"iter": 934000,
"lr": 0.00032240381336154426,
"loss": 1.1478377928142436e-05,
"test_loss": 2.8369368010316975e-06
},
{
"iter": 935000,
"lr": 0.0003127717146822517,
"loss": 1.9028684619115666e-05,
"test_loss": 1.6014113498385996e-05
},
{
"iter": 936000,
"lr": 0.00030328463595359086,
"loss": 4.904146771878004e-05,
"test_loss": 3.839561395579949e-05
},
{
"iter": 937000,
"lr": 0.0002939426708466642,
"loss": 7.962711606523953e-06,
"test_loss": 7.902066863607615e-05
},
{
"iter": 938000,
"lr": 0.00028474591159978664,
"loss": 1.625324694032315e-05,
"test_loss": 4.6168966036930215e-06
},
{
"iter": 939000,
"lr": 0.0002756944490175776,
"loss": 4.550354333332507e-06,
"test_loss": 2.7188445528736338e-05
},
{
"iter": 940000,
"lr": 0.0002667883724700637,
"loss": 0.00017539634427521378,
"test_loss": 0.0001001652199192904
},
{
"iter": 941000,
"lr": 0.0002580277698917926,
"loss": 1.7185160686494783e-05,
"test_loss": 2.5357696358696558e-05
},
{
"iter": 942000,
"lr": 0.0002494127277809739,
"loss": 7.3880082709365524e-06,
"test_loss": 2.1761927200714126e-05
},
{
"iter": 943000,
"lr": 0.00024094333119861473,
"loss": 3.6780188565899152e-06,
"test_loss": 2.6281165901309578e-06
},
{
"iter": 944000,
"lr": 0.00023261966376768566,
"loss": 8.227321814047173e-06,
"test_loss": 3.912461579602677e-06
},
{
"iter": 945000,
"lr": 0.0002244418076722944,
"loss": 2.888506423914805e-05,
"test_loss": 0.00014227665087673813
},
{
"iter": 946000,
"lr": 0.00021640984365687335,
"loss": 1.9348353816894814e-05,
"test_loss": 0.0007827307563275099
},
{
"iter": 947000,
"lr": 0.00020852385102538355,
"loss": 3.792852658079937e-05,
"test_loss": 1.3585070519184228e-05
},
{
"iter": 948000,
"lr": 0.00020078390764053045,
"loss": 0.00022314030502457172,
"test_loss": 5.15370411449112e-05
},
{
"iter": 949000,
"lr": 0.00019319008992299596,
"loss": 5.887927272851812e-06,
"test_loss": 4.1903120290953666e-05
},
{
"iter": 950000,
"lr": 0.00018574247285068428,
"loss": 9.919288459059317e-06,
"test_loss": 3.818649929598905e-06
},
{
"iter": 951000,
"lr": 0.0001784411299579775,
"loss": 5.246303408057429e-05,
"test_loss": 9.928096915245987e-06
},
{
"iter": 952000,
"lr": 0.0001712861333350161,
"loss": 5.6578023759357166e-06,
"test_loss": 2.8946558359166374e-06
},
{
"iter": 953000,
"lr": 0.0001642775536269847,
"loss": 2.8398319500411162e-06,
"test_loss": 3.4058761229971424e-05
},
{
"iter": 954000,
"lr": 0.00015741546003341246,
"loss": 6.617196777369827e-05,
"test_loss": 2.911276533268392e-05
},
{
"iter": 955000,
"lr": 0.00015069992030749047,
"loss": 2.8424505217117257e-05,
"test_loss": 1.6483627405250445e-05
},
{
"iter": 956000,
"lr": 0.00014413100075540386,
"loss": 3.826751708402298e-06,
"test_loss": 4.1245537431677803e-05
},
{
"iter": 957000,
"lr": 0.00013770876623567913,
"loss": 2.6849127607420087e-05,
"test_loss": 2.937400495284237e-06
},
{
"iter": 958000,
"lr": 0.00013143328015853792,
"loss": 0.00010185006249230355,
"test_loss": 0.00030261732172220945
},
{
"iter": 959000,
"lr": 0.0001253046044852775,
"loss": 3.1075498554855585e-05,
"test_loss": 6.723819751641713e-06
},
{
"iter": 960000,
"lr": 0.0001193227997276548,
"loss": 7.052519322314765e-06,
"test_loss": 6.038361243554391e-05
},
{
"iter": 961000,
"lr": 0.00011348792494729004,
"loss": 0.00010120654769707471,
"test_loss": 5.2386699280759785e-06
},
{
"iter": 962000,
"lr": 0.00010780003775508396,
"loss": 8.87551959749544e-06,
"test_loss": 3.0359337870322634e-06
},
{
"iter": 963000,
"lr": 0.00010225919431064833,
"loss": 3.739465682883747e-06,
"test_loss": 2.2930753402761184e-05
},
{
"iter": 964000,
"lr": 9.686544932174965e-05,
"loss": 6.809431397414301e-06,
"test_loss": 5.255215000943281e-06
},
{
"iter": 965000,
"lr": 9.161885604377805e-05,
"loss": 1.1975382221862674e-05,
"test_loss": 0.00015044203610159457
},
{
"iter": 966000,
"lr": 8.651946627920598e-05,
"loss": 9.873991803033277e-05,
"test_loss": 1.9049507500312757e-06
},
{
"iter": 967000,
"lr": 8.156733037709032e-05,
"loss": 0.00013476998719852418,
"test_loss": 2.3277038962987717e-06
},
{
"iter": 968000,
"lr": 7.676249723256951e-05,
"loss": 1.687855001364369e-05,
"test_loss": 1.2148187124694232e-05
},
{
"iter": 969000,
"lr": 7.210501428638054e-05,
"loss": 5.662288094754331e-05,
"test_loss": 3.639381930042873e-06
},
{
"iter": 970000,
"lr": 6.759492752439434e-05,
"loss": 0.00020329163817223161,
"test_loss": 6.568419485120103e-05
},
{
"iter": 971000,
"lr": 6.32322814771563e-05,
"loss": 0.00015618573524989188,
"test_loss": 1.5959316442604177e-05
},
{
"iter": 972000,
"lr": 5.901711921944809e-05,
"loss": 0.00027873486396856606,
"test_loss": 1.3292824405652937e-06
},
{
"iter": 973000,
"lr": 5.494948236986652e-05,
"loss": 0.0023992196656763554,
"test_loss": 4.828254532185383e-06
},
{
"iter": 974000,
"lr": 5.1029411090407147e-05,
"loss": 9.959682211047038e-05,
"test_loss": 2.803298684739275e-06
},
{
"iter": 975000,
"lr": 4.7256944086072925e-05,
"loss": 0.00010963205568259582,
"test_loss": 3.7992108445905615e-06
},
{
"iter": 976000,
"lr": 4.363211860448621e-05,
"loss": 8.675256685819477e-05,
"test_loss": 1.3235597862149007e-06
},
{
"iter": 977000,
"lr": 4.0154970435527417e-05,
"loss": 2.451550699333893e-06,
"test_loss": 1.5176030956354225e-06
},
{
"iter": 978000,
"lr": 3.682553391097527e-05,
"loss": 1.7485963326180354e-06,
"test_loss": 1.9054164113185834e-06
},
{
"iter": 979000,
"lr": 3.364384190417215e-05,
"loss": 1.5184309631877113e-05,
"test_loss": 5.056808004155755e-05
},
{
"iter": 980000,
"lr": 3.060992582969929e-05,
"loss": 0.00023750533000566065,
"test_loss": 3.626388433985994e-06
},
{
"iter": 981000,
"lr": 2.7723815643062072e-05,
"loss": 0.0002798773057293147,
"test_loss": 0.00029111039475537837
},
{
"iter": 982000,
"lr": 2.4985539840403623e-05,
"loss": 1.186399458674714e-05,
"test_loss": 6.133056558610406e-06
},
{
"iter": 983000,
"lr": 2.239512545821003e-05,
"loss": 7.101956725819036e-06,
"test_loss": 1.3834019227942917e-05
},
{
"iter": 984000,
"lr": 1.9952598073058872e-05,
"loss": 0.0002528270415496081,
"test_loss": 0.00018363670096732676
},
{
"iter": 985000,
"lr": 1.7657981801352824e-05,
"loss": 7.170325261540711e-06,
"test_loss": 5.4830943554406986e-06
},
{
"iter": 986000,
"lr": 1.5511299299089786e-05,
"loss": 0.00016129027062561363,
"test_loss": 2.3034147034195485e-06
},
{
"iter": 987000,
"lr": 1.3512571761638129e-05,
"loss": 7.088255188136827e-06,
"test_loss": 8.106122550088912e-06
},
{
"iter": 988000,
"lr": 1.1661818923523495e-05,
"loss": 2.8824793844250962e-05,
"test_loss": 1.2851400242652744e-05
},
{
"iter": 989000,
"lr": 9.959059058237314e-06,
"loss": 4.9114441935671493e-05,
"test_loss": 3.792488996623433e-06
},
{
"iter": 990000,
"lr": 8.404308978056947e-06,
"loss": 4.560325760394335e-05,
"test_loss": 2.776517612801399e-05
},
{
"iter": 991000,
"lr": 6.9975840338774945e-06,
"loss": 0.0001276397961191833,
"test_loss": 1.8969069060403854e-05
},
{
"iter": 992000,
"lr": 5.738898115063581e-06,
"loss": 9.210954885929823e-06,
"test_loss": 2.034863655353547e-06
},
{
"iter": 993000,
"lr": 4.6282636493044854e-06,
"loss": 4.193899076199159e-05,
"test_loss": 3.7138702282391023e-06
},
{
"iter": 994000,
"lr": 3.6656916025008922e-06,
"loss": 4.066589826834388e-05,
"test_loss": 3.4758181755023543e-06
},
{
"iter": 995000,
"lr": 2.8511914786516586e-06,
"loss": 6.010940978740109e-06,
"test_loss": 1.6219426015595673e-06
},
{
"iter": 996000,
"lr": 2.1847713197622234e-06,
"loss": 3.000273682118859e-05,
"test_loss": 2.5010400349856354e-05
},
{
"iter": 997000,
"lr": 1.6664377057596756e-06,
"loss": 8.361146319657564e-05,
"test_loss": 3.075581162192975e-06
},
{
"iter": 998000,
"lr": 1.296195754436137e-06,
"loss": 6.416995893232524e-05,
"test_loss": 8.637872815597802e-05
},
{
"iter": 999000,
"lr": 1.0740491213904765e-06,
"loss": 5.448848696687492e-06,
"test_loss": 1.3696559108211659e-05
}
]