diff --git "a/experiments/sft_gpt2-120m/20251209_070038/sft_gpt2-120m_metrics.jsonl" "b/experiments/sft_gpt2-120m/20251209_070038/sft_gpt2-120m_metrics.jsonl" --- "a/experiments/sft_gpt2-120m/20251209_070038/sft_gpt2-120m_metrics.jsonl" +++ "b/experiments/sft_gpt2-120m/20251209_070038/sft_gpt2-120m_metrics.jsonl" @@ -23211,3 +23211,1117 @@ {"epoch": 16, "step": 23194, "loss": 0.029489798471331596, "nll_loss": 0.029489798471331596} {"epoch": 16, "step": 23195, "loss": 0.05000549927353859, "nll_loss": 0.05000549927353859} {"epoch": 16, "step": 23196, "loss": 0.01674886792898178, "nll_loss": 0.01674886792898178} +{"epoch": 16, "step": 23197, "loss": 0.01741219125688076, "nll_loss": 0.01741219125688076} +{"epoch": 16, "step": 23198, "loss": 0.020566139370203018, "nll_loss": 0.020566139370203018} +{"epoch": 16, "step": 23199, "loss": 0.030263271182775497, "nll_loss": 0.030263271182775497} +{"epoch": 16, "step": 23200, "loss": 0.023728974163532257, "nll_loss": 0.023728974163532257} +{"epoch": 16, "step": 23201, "loss": 0.03734159097075462, "nll_loss": 0.03734159097075462} +{"epoch": 16, "step": 23202, "loss": 0.027458064258098602, "nll_loss": 0.027458064258098602} +{"epoch": 16, "step": 23203, "loss": 0.01594671793282032, "nll_loss": 0.01594671793282032} +{"epoch": 16, "step": 23204, "loss": 0.023844201117753983, "nll_loss": 0.023844201117753983} +{"epoch": 16, "step": 23205, "loss": 0.02949720248579979, "nll_loss": 0.02949720248579979} +{"epoch": 16, "step": 23206, "loss": 0.018290484324097633, "nll_loss": 0.018290484324097633} +{"epoch": 16, "step": 23207, "loss": 0.01974952220916748, "nll_loss": 0.01974952220916748} +{"epoch": 16, "step": 23208, "loss": 0.026474062353372574, "nll_loss": 0.026474062353372574} +{"epoch": 16, "step": 23209, "loss": 0.013686933554708958, "nll_loss": 0.013686933554708958} +{"epoch": 16, "step": 23210, "loss": 0.016168758273124695, "nll_loss": 0.016168758273124695} +{"epoch": 16, "step": 23211, "loss": 0.03942481800913811, "nll_loss": 0.03942481800913811} +{"epoch": 16, "step": 23212, "loss": 0.02837376482784748, "nll_loss": 0.02837376482784748} +{"epoch": 16, "step": 23213, "loss": 0.013582240790128708, "nll_loss": 0.013582240790128708} +{"epoch": 16, "step": 23214, "loss": 0.03059607744216919, "nll_loss": 0.03059607744216919} +{"epoch": 16, "step": 23215, "loss": 0.021811021491885185, "nll_loss": 0.021811021491885185} +{"epoch": 16, "step": 23216, "loss": 0.02740534394979477, "nll_loss": 0.02740534394979477} +{"epoch": 16, "step": 23217, "loss": 0.017767667770385742, "nll_loss": 0.017767667770385742} +{"epoch": 16, "step": 23218, "loss": 0.038821741938591, "nll_loss": 0.038821741938591} +{"epoch": 16, "step": 23219, "loss": 0.032569561153650284, "nll_loss": 0.032569561153650284} +{"epoch": 16, "step": 23220, "loss": 0.0277095939964056, "nll_loss": 0.0277095939964056} +{"epoch": 16, "step": 23221, "loss": 0.019318880513310432, "nll_loss": 0.019318880513310432} +{"epoch": 16, "step": 23222, "loss": 0.018630189821124077, "nll_loss": 0.018630189821124077} +{"epoch": 16, "step": 23223, "loss": 0.026202475652098656, "nll_loss": 0.026202475652098656} +{"epoch": 16, "step": 23224, "loss": 0.026907676830887794, "nll_loss": 0.026907676830887794} +{"epoch": 16, "step": 23225, "loss": 0.0242349561303854, "nll_loss": 0.0242349561303854} +{"epoch": 16, "step": 23226, "loss": 0.03452429920434952, "nll_loss": 0.03452429920434952} +{"epoch": 16, "step": 23227, "loss": 0.03563334792852402, "nll_loss": 0.03563334792852402} +{"epoch": 16, "step": 23228, "loss": 0.022237904369831085, "nll_loss": 0.022237904369831085} +{"epoch": 16, "step": 23229, "loss": 0.027575740590691566, "nll_loss": 0.027575740590691566} +{"epoch": 16, "step": 23230, "loss": 0.03366535156965256, "nll_loss": 0.03366535156965256} +{"epoch": 16, "step": 23231, "loss": 0.019782230257987976, "nll_loss": 0.019782230257987976} +{"epoch": 16, "step": 23232, "loss": 0.031191321089863777, "nll_loss": 0.031191321089863777} +{"epoch": 16, "step": 23233, "loss": 0.012404962442815304, "nll_loss": 0.012404962442815304} +{"epoch": 16, "step": 23234, "loss": 0.04730970412492752, "nll_loss": 0.04730970412492752} +{"epoch": 16, "step": 23235, "loss": 0.0166628398001194, "nll_loss": 0.0166628398001194} +{"epoch": 16, "step": 23236, "loss": 0.043164946138858795, "nll_loss": 0.043164946138858795} +{"epoch": 16, "step": 23237, "loss": 0.06797807663679123, "nll_loss": 0.06797807663679123} +{"epoch": 16, "step": 23238, "loss": 0.01731162704527378, "nll_loss": 0.01731162704527378} +{"epoch": 16, "step": 23239, "loss": 0.03685220703482628, "nll_loss": 0.03685220703482628} +{"epoch": 16, "step": 23240, "loss": 0.04831928014755249, "nll_loss": 0.04831928014755249} +{"epoch": 16, "step": 23241, "loss": 0.022399459034204483, "nll_loss": 0.022399459034204483} +{"epoch": 16, "step": 23242, "loss": 0.02761002816259861, "nll_loss": 0.02761002816259861} +{"epoch": 16, "step": 23243, "loss": 0.01621306501328945, "nll_loss": 0.01621306501328945} +{"epoch": 16, "step": 23244, "loss": 0.02762153372168541, "nll_loss": 0.02762153372168541} +{"epoch": 16, "step": 23245, "loss": 0.01824609935283661, "nll_loss": 0.01824609935283661} +{"epoch": 16, "step": 23246, "loss": 0.01452239602804184, "nll_loss": 0.01452239602804184} +{"epoch": 16, "step": 23247, "loss": 0.014697253704071045, "nll_loss": 0.014697253704071045} +{"epoch": 16, "step": 23248, "loss": 0.02913731150329113, "nll_loss": 0.02913731150329113} +{"epoch": 16, "step": 23249, "loss": 0.013916975818574429, "nll_loss": 0.013916975818574429} +{"epoch": 16, "step": 23250, "loss": 0.020143471658229828, "nll_loss": 0.020143471658229828} +{"epoch": 16, "step": 23251, "loss": 0.028228404000401497, "nll_loss": 0.028228404000401497} +{"epoch": 16, "step": 23252, "loss": 0.015762660652399063, "nll_loss": 0.015762660652399063} +{"epoch": 16, "step": 23253, "loss": 0.011919372715055943, "nll_loss": 0.011919372715055943} +{"epoch": 16, "step": 23254, "loss": 0.020898722112178802, "nll_loss": 0.020898722112178802} +{"epoch": 16, "step": 23255, "loss": 0.015814267098903656, "nll_loss": 0.015814267098903656} +{"epoch": 16, "step": 23256, "loss": 0.03611059859395027, "nll_loss": 0.03611059859395027} +{"epoch": 16, "step": 23257, "loss": 0.030072277411818504, "nll_loss": 0.030072277411818504} +{"epoch": 16, "step": 23258, "loss": 0.03863447532057762, "nll_loss": 0.03863447532057762} +{"epoch": 16, "step": 23259, "loss": 0.04983803257346153, "nll_loss": 0.04983803257346153} +{"epoch": 16, "step": 23260, "loss": 0.02171044982969761, "nll_loss": 0.02171044982969761} +{"epoch": 16, "step": 23261, "loss": 0.02228916995227337, "nll_loss": 0.02228916995227337} +{"epoch": 16, "step": 23262, "loss": 0.018136588856577873, "nll_loss": 0.018136588856577873} +{"epoch": 16, "step": 23263, "loss": 0.024317938834428787, "nll_loss": 0.024317938834428787} +{"epoch": 16, "step": 23264, "loss": 0.017251282930374146, "nll_loss": 0.017251282930374146} +{"epoch": 16, "step": 23265, "loss": 0.027902988716959953, "nll_loss": 0.027902988716959953} +{"epoch": 16, "step": 23266, "loss": 0.04231742396950722, "nll_loss": 0.04231742396950722} +{"epoch": 16, "step": 23267, "loss": 0.029166119173169136, "nll_loss": 0.029166119173169136} +{"epoch": 16, "step": 23268, "loss": 0.025594918057322502, "nll_loss": 0.025594918057322502} +{"epoch": 16, "step": 23269, "loss": 0.03144733980298042, "nll_loss": 0.03144733980298042} +{"epoch": 16, "step": 23270, "loss": 0.017773235216736794, "nll_loss": 0.017773235216736794} +{"epoch": 16, "step": 23271, "loss": 0.01569157838821411, "nll_loss": 0.01569157838821411} +{"epoch": 16, "step": 23272, "loss": 0.028642237186431885, "nll_loss": 0.028642237186431885} +{"epoch": 16, "step": 23273, "loss": 0.015018677338957787, "nll_loss": 0.015018677338957787} +{"epoch": 16, "step": 23274, "loss": 0.029490012675523758, "nll_loss": 0.029490012675523758} +{"epoch": 16, "step": 23275, "loss": 0.021629735827445984, "nll_loss": 0.021629735827445984} +{"epoch": 16, "step": 23276, "loss": 0.02446805126965046, "nll_loss": 0.02446805126965046} +{"epoch": 16, "step": 23277, "loss": 0.01927281729876995, "nll_loss": 0.01927281729876995} +{"epoch": 16, "step": 23278, "loss": 0.011350991204380989, "nll_loss": 0.011350991204380989} +{"epoch": 16, "step": 23279, "loss": 0.03569064289331436, "nll_loss": 0.03569064289331436} +{"epoch": 16, "step": 23280, "loss": 0.01210506446659565, "nll_loss": 0.01210506446659565} +{"epoch": 16, "step": 23281, "loss": 0.014901017770171165, "nll_loss": 0.014901017770171165} +{"epoch": 16, "step": 23282, "loss": 0.03096536360681057, "nll_loss": 0.03096536360681057} +{"epoch": 16, "step": 23283, "loss": 0.04236762970685959, "nll_loss": 0.04236762970685959} +{"epoch": 16, "step": 23284, "loss": 0.019553693011403084, "nll_loss": 0.019553693011403084} +{"epoch": 16, "step": 23285, "loss": 0.02543838880956173, "nll_loss": 0.02543838880956173} +{"epoch": 16, "step": 23286, "loss": 0.04190603271126747, "nll_loss": 0.04190603271126747} +{"epoch": 16, "step": 23287, "loss": 0.019405614584684372, "nll_loss": 0.019405614584684372} +{"epoch": 16, "step": 23288, "loss": 0.022174082696437836, "nll_loss": 0.022174082696437836} +{"epoch": 16, "step": 23289, "loss": 0.023330044001340866, "nll_loss": 0.023330044001340866} +{"epoch": 16, "step": 23290, "loss": 0.01576499082148075, "nll_loss": 0.01576499082148075} +{"epoch": 16, "step": 23291, "loss": 0.01799789071083069, "nll_loss": 0.01799789071083069} +{"epoch": 16, "step": 23292, "loss": 0.01532019767910242, "nll_loss": 0.01532019767910242} +{"epoch": 16, "step": 23293, "loss": 0.018000798299908638, "nll_loss": 0.018000798299908638} +{"epoch": 16, "step": 23294, "loss": 0.029163748025894165, "nll_loss": 0.029163748025894165} +{"epoch": 16, "step": 23295, "loss": 0.020093420520424843, "nll_loss": 0.020093420520424843} +{"epoch": 16, "step": 23296, "loss": 0.030149059370160103, "nll_loss": 0.030149059370160103} +{"epoch": 16, "step": 23297, "loss": 0.019751200452446938, "nll_loss": 0.019751200452446938} +{"epoch": 16, "step": 23298, "loss": 0.019901160150766373, "nll_loss": 0.019901160150766373} +{"epoch": 16, "step": 23299, "loss": 0.028430840000510216, "nll_loss": 0.028430840000510216} +{"epoch": 16, "step": 23300, "loss": 0.01717720367014408, "nll_loss": 0.01717720367014408} +{"epoch": 16, "step": 23301, "loss": 0.04637725278735161, "nll_loss": 0.04637725278735161} +{"epoch": 16, "step": 23302, "loss": 0.015545804984867573, "nll_loss": 0.015545804984867573} +{"epoch": 16, "step": 23303, "loss": 0.03517654910683632, "nll_loss": 0.03517654910683632} +{"epoch": 16, "step": 23304, "loss": 0.021693652495741844, "nll_loss": 0.021693652495741844} +{"epoch": 16, "step": 23305, "loss": 0.018104637041687965, "nll_loss": 0.018104637041687965} +{"epoch": 16, "step": 23306, "loss": 0.025382865220308304, "nll_loss": 0.025382865220308304} +{"epoch": 16, "step": 23307, "loss": 0.024550195783376694, "nll_loss": 0.024550195783376694} +{"epoch": 16, "step": 23308, "loss": 0.042717915028333664, "nll_loss": 0.042717915028333664} +{"epoch": 16, "step": 23309, "loss": 0.012155749835073948, "nll_loss": 0.012155749835073948} +{"epoch": 16, "step": 23310, "loss": 0.01823868416249752, "nll_loss": 0.01823868416249752} +{"epoch": 16, "step": 23311, "loss": 0.01017204113304615, "nll_loss": 0.01017204113304615} +{"epoch": 16, "step": 23312, "loss": 0.021235119551420212, "nll_loss": 0.021235119551420212} +{"epoch": 16, "step": 23313, "loss": 0.01777292601764202, "nll_loss": 0.01777292601764202} +{"epoch": 16, "step": 23314, "loss": 0.023356448858976364, "nll_loss": 0.023356448858976364} +{"epoch": 16, "step": 23315, "loss": 0.023516472429037094, "nll_loss": 0.023516472429037094} +{"epoch": 16, "step": 23316, "loss": 0.030335135757923126, "nll_loss": 0.030335135757923126} +{"epoch": 16, "step": 23317, "loss": 0.010376404039561749, "nll_loss": 0.010376404039561749} +{"epoch": 16, "step": 23318, "loss": 0.013234680518507957, "nll_loss": 0.013234680518507957} +{"epoch": 16, "step": 23319, "loss": 0.03568737208843231, "nll_loss": 0.03568737208843231} +{"epoch": 16, "step": 23320, "loss": 0.03316739574074745, "nll_loss": 0.03316739574074745} +{"epoch": 16, "step": 23321, "loss": 0.010691633448004723, "nll_loss": 0.010691633448004723} +{"epoch": 16, "step": 23322, "loss": 0.014909012243151665, "nll_loss": 0.014909012243151665} +{"epoch": 16, "step": 23323, "loss": 0.027315903455018997, "nll_loss": 0.027315903455018997} +{"epoch": 16, "step": 23324, "loss": 0.015414620749652386, "nll_loss": 0.015414620749652386} +{"epoch": 16, "step": 23325, "loss": 0.015961218625307083, "nll_loss": 0.015961218625307083} +{"epoch": 16, "step": 23326, "loss": 0.019628912210464478, "nll_loss": 0.019628912210464478} +{"epoch": 16, "step": 23327, "loss": 0.021320890635252, "nll_loss": 0.021320890635252} +{"epoch": 16, "step": 23328, "loss": 0.028991175815463066, "nll_loss": 0.028991175815463066} +{"epoch": 16, "step": 23329, "loss": 0.02684120088815689, "nll_loss": 0.02684120088815689} +{"epoch": 16, "step": 23330, "loss": 0.025613835081458092, "nll_loss": 0.025613835081458092} +{"epoch": 16, "step": 23331, "loss": 0.031721118837594986, "nll_loss": 0.031721118837594986} +{"epoch": 16, "step": 23332, "loss": 0.008454374969005585, "nll_loss": 0.008454374969005585} +{"epoch": 16, "step": 23333, "loss": 0.03404640033841133, "nll_loss": 0.03404640033841133} +{"epoch": 16, "step": 23334, "loss": 0.02664675936102867, "nll_loss": 0.02664675936102867} +{"epoch": 16, "step": 23335, "loss": 0.03792155161499977, "nll_loss": 0.03792155161499977} +{"epoch": 16, "step": 23336, "loss": 0.023439394310116768, "nll_loss": 0.023439394310116768} +{"epoch": 16, "step": 23337, "loss": 0.027642276138067245, "nll_loss": 0.027642276138067245} +{"epoch": 16, "step": 23338, "loss": 0.01361246220767498, "nll_loss": 0.01361246220767498} +{"epoch": 16, "step": 23339, "loss": 0.017377691343426704, "nll_loss": 0.017377691343426704} +{"epoch": 16, "step": 23340, "loss": 0.015700628980994225, "nll_loss": 0.015700628980994225} +{"epoch": 16, "step": 23341, "loss": 0.03369653597474098, "nll_loss": 0.03369653597474098} +{"epoch": 16, "step": 23342, "loss": 0.02551899291574955, "nll_loss": 0.02551899291574955} +{"epoch": 16, "step": 23343, "loss": 0.03017139621078968, "nll_loss": 0.03017139621078968} +{"epoch": 16, "step": 23344, "loss": 0.0395621694624424, "nll_loss": 0.0395621694624424} +{"epoch": 16, "step": 23345, "loss": 0.043813712894916534, "nll_loss": 0.043813712894916534} +{"epoch": 16, "step": 23346, "loss": 0.01805255003273487, "nll_loss": 0.01805255003273487} +{"epoch": 16, "step": 23347, "loss": 0.027458997443318367, "nll_loss": 0.027458997443318367} +{"epoch": 16, "step": 23348, "loss": 0.02459046244621277, "nll_loss": 0.02459046244621277} +{"epoch": 16, "step": 23349, "loss": 0.018084215000271797, "nll_loss": 0.018084215000271797} +{"epoch": 16, "step": 23350, "loss": 0.01663641445338726, "nll_loss": 0.01663641445338726} +{"epoch": 16, "step": 23351, "loss": 0.020683348178863525, "nll_loss": 0.020683348178863525} +{"epoch": 16, "step": 23352, "loss": 0.022812670096755028, "nll_loss": 0.022812670096755028} +{"epoch": 16, "step": 23353, "loss": 0.02519942820072174, "nll_loss": 0.02519942820072174} +{"epoch": 16, "step": 23354, "loss": 0.02704603038728237, "nll_loss": 0.02704603038728237} +{"epoch": 16, "step": 23355, "loss": 0.031062684953212738, "nll_loss": 0.031062684953212738} +{"epoch": 16, "step": 23356, "loss": 0.0515189990401268, "nll_loss": 0.0515189990401268} +{"epoch": 16, "step": 23357, "loss": 0.008828812278807163, "nll_loss": 0.008828812278807163} +{"epoch": 16, "step": 23358, "loss": 0.01885533146560192, "nll_loss": 0.01885533146560192} +{"epoch": 16, "step": 23359, "loss": 0.027982445433735847, "nll_loss": 0.027982445433735847} +{"epoch": 16, "step": 23360, "loss": 0.020602094009518623, "nll_loss": 0.020602094009518623} +{"epoch": 16, "step": 23361, "loss": 0.019411325454711914, "nll_loss": 0.019411325454711914} +{"epoch": 16, "step": 23362, "loss": 0.02427596226334572, "nll_loss": 0.02427596226334572} +{"epoch": 16, "step": 23363, "loss": 0.025001175701618195, "nll_loss": 0.025001175701618195} +{"epoch": 16, "step": 23364, "loss": 0.022697636857628822, "nll_loss": 0.022697636857628822} +{"epoch": 16, "step": 23365, "loss": 0.02429816871881485, "nll_loss": 0.02429816871881485} +{"epoch": 16, "step": 23366, "loss": 0.05833904445171356, "nll_loss": 0.05833904445171356} +{"epoch": 16, "step": 23367, "loss": 0.010784679092466831, "nll_loss": 0.010784679092466831} +{"epoch": 16, "step": 23368, "loss": 0.021702002733945847, "nll_loss": 0.021702002733945847} +{"epoch": 16, "step": 23369, "loss": 0.02370927296578884, "nll_loss": 0.02370927296578884} +{"epoch": 16, "step": 23370, "loss": 0.039089180529117584, "nll_loss": 0.039089180529117584} +{"epoch": 16, "step": 23371, "loss": 0.02471167966723442, "nll_loss": 0.02471167966723442} +{"epoch": 16, "step": 23372, "loss": 0.048146992921829224, "nll_loss": 0.048146992921829224} +{"epoch": 16, "step": 23373, "loss": 0.01726408116519451, "nll_loss": 0.01726408116519451} +{"epoch": 16, "step": 23374, "loss": 0.03803115338087082, "nll_loss": 0.03803115338087082} +{"epoch": 16, "step": 23375, "loss": 0.01797945238649845, "nll_loss": 0.01797945238649845} +{"epoch": 16, "step": 23376, "loss": 0.018842821940779686, "nll_loss": 0.018842821940779686} +{"epoch": 16, "step": 23377, "loss": 0.009749791584908962, "nll_loss": 0.009749791584908962} +{"epoch": 16, "step": 23378, "loss": 0.0222418662160635, "nll_loss": 0.0222418662160635} +{"epoch": 16, "step": 23379, "loss": 0.029461784288287163, "nll_loss": 0.029461784288287163} +{"epoch": 16, "step": 23380, "loss": 0.017170362174510956, "nll_loss": 0.017170362174510956} +{"epoch": 16, "step": 23381, "loss": 0.012607358396053314, "nll_loss": 0.012607358396053314} +{"epoch": 16, "step": 23382, "loss": 0.026916855946183205, "nll_loss": 0.026916855946183205} +{"epoch": 16, "step": 23383, "loss": 0.02139996364712715, "nll_loss": 0.02139996364712715} +{"epoch": 16, "step": 23384, "loss": 0.028126513585448265, "nll_loss": 0.028126513585448265} +{"epoch": 16, "step": 23385, "loss": 0.02209189347922802, "nll_loss": 0.02209189347922802} +{"epoch": 16, "step": 23386, "loss": 0.03662655130028725, "nll_loss": 0.03662655130028725} +{"epoch": 16, "step": 23387, "loss": 0.02271992154419422, "nll_loss": 0.02271992154419422} +{"epoch": 16, "step": 23388, "loss": 0.01353228185325861, "nll_loss": 0.01353228185325861} +{"epoch": 16, "step": 23389, "loss": 0.03754081204533577, "nll_loss": 0.03754081204533577} +{"epoch": 16, "step": 23390, "loss": 0.01939159817993641, "nll_loss": 0.01939159817993641} +{"epoch": 16, "step": 23391, "loss": 0.014813175424933434, "nll_loss": 0.014813175424933434} +{"epoch": 16, "step": 23392, "loss": 0.015653222799301147, "nll_loss": 0.015653222799301147} +{"epoch": 16, "step": 23393, "loss": 0.019358981400728226, "nll_loss": 0.019358981400728226} +{"epoch": 16, "step": 23394, "loss": 0.009939904324710369, "nll_loss": 0.009939904324710369} +{"epoch": 16, "step": 23395, "loss": 0.028781529515981674, "nll_loss": 0.028781529515981674} +{"epoch": 16, "step": 23396, "loss": 0.014079658314585686, "nll_loss": 0.014079658314585686} +{"epoch": 16, "step": 23397, "loss": 0.03745555877685547, "nll_loss": 0.03745555877685547} +{"epoch": 16, "step": 23398, "loss": 0.028294052928686142, "nll_loss": 0.028294052928686142} +{"epoch": 16, "step": 23399, "loss": 0.04334946721792221, "nll_loss": 0.04334946721792221} +{"epoch": 16, "step": 23400, "loss": 0.025800174102187157, "nll_loss": 0.025800174102187157} +{"epoch": 16, "step": 23401, "loss": 0.025149445980787277, "nll_loss": 0.025149445980787277} +{"epoch": 16, "step": 23402, "loss": 0.01881909929215908, "nll_loss": 0.01881909929215908} +{"epoch": 16, "step": 23403, "loss": 0.03316248580813408, "nll_loss": 0.03316248580813408} +{"epoch": 16, "step": 23404, "loss": 0.03436075150966644, "nll_loss": 0.03436075150966644} +{"epoch": 16, "step": 23405, "loss": 0.030681932345032692, "nll_loss": 0.030681932345032692} +{"epoch": 16, "step": 23406, "loss": 0.03597625717520714, "nll_loss": 0.03597625717520714} +{"epoch": 16, "step": 23407, "loss": 0.03027552366256714, "nll_loss": 0.03027552366256714} +{"epoch": 16, "step": 23408, "loss": 0.03896354138851166, "nll_loss": 0.03896354138851166} +{"epoch": 16, "step": 23409, "loss": 0.02088092267513275, "nll_loss": 0.02088092267513275} +{"epoch": 16, "step": 23410, "loss": 0.037812910974025726, "nll_loss": 0.037812910974025726} +{"epoch": 16, "step": 23411, "loss": 0.025105668231844902, "nll_loss": 0.025105668231844902} +{"epoch": 16, "step": 23412, "loss": 0.01929521933197975, "nll_loss": 0.01929521933197975} +{"epoch": 16, "step": 23413, "loss": 0.03641538321971893, "nll_loss": 0.03641538321971893} +{"epoch": 16, "step": 23414, "loss": 0.05213276669383049, "nll_loss": 0.05213276669383049} +{"epoch": 16, "step": 23415, "loss": 0.05415736883878708, "nll_loss": 0.05415736883878708} +{"epoch": 16, "step": 23416, "loss": 0.05261696130037308, "nll_loss": 0.05261696130037308} +{"epoch": 16, "step": 23417, "loss": 0.028347138315439224, "nll_loss": 0.028347138315439224} +{"epoch": 16, "step": 23418, "loss": 0.029714440926909447, "nll_loss": 0.029714440926909447} +{"epoch": 16, "step": 23419, "loss": 0.01119899284094572, "nll_loss": 0.01119899284094572} +{"epoch": 16, "step": 23420, "loss": 0.02712314762175083, "nll_loss": 0.02712314762175083} +{"epoch": 16, "step": 23421, "loss": 0.016395991668105125, "nll_loss": 0.016395991668105125} +{"epoch": 16, "step": 23422, "loss": 0.03831502050161362, "nll_loss": 0.03831502050161362} +{"epoch": 16, "step": 23423, "loss": 0.01408920343965292, "nll_loss": 0.01408920343965292} +{"epoch": 16, "step": 23424, "loss": 0.031148415058851242, "nll_loss": 0.031148415058851242} +{"epoch": 16, "step": 23425, "loss": 0.0170080978423357, "nll_loss": 0.0170080978423357} +{"epoch": 16, "step": 23426, "loss": 0.007345998659729958, "nll_loss": 0.007345998659729958} +{"epoch": 16, "step": 23427, "loss": 0.03497163951396942, "nll_loss": 0.03497163951396942} +{"epoch": 16, "step": 23428, "loss": 0.03491132706403732, "nll_loss": 0.03491132706403732} +{"epoch": 16, "step": 23429, "loss": 0.015331566333770752, "nll_loss": 0.015331566333770752} +{"epoch": 16, "step": 23430, "loss": 0.02223644033074379, "nll_loss": 0.02223644033074379} +{"epoch": 16, "step": 23431, "loss": 0.03167017549276352, "nll_loss": 0.03167017549276352} +{"epoch": 16, "step": 23432, "loss": 0.029458889737725258, "nll_loss": 0.029458889737725258} +{"epoch": 16, "step": 23433, "loss": 0.020431606099009514, "nll_loss": 0.020431606099009514} +{"epoch": 16, "step": 23434, "loss": 0.023784657940268517, "nll_loss": 0.023784657940268517} +{"epoch": 16, "step": 23435, "loss": 0.022938471287488937, "nll_loss": 0.022938471287488937} +{"epoch": 16, "step": 23436, "loss": 0.012656955979764462, "nll_loss": 0.012656955979764462} +{"epoch": 16, "step": 23437, "loss": 0.01018083281815052, "nll_loss": 0.01018083281815052} +{"epoch": 16, "step": 23438, "loss": 0.02222513034939766, "nll_loss": 0.02222513034939766} +{"epoch": 16, "step": 23439, "loss": 0.01500684767961502, "nll_loss": 0.01500684767961502} +{"epoch": 16, "step": 23440, "loss": 0.02676364965736866, "nll_loss": 0.02676364965736866} +{"epoch": 16, "step": 23441, "loss": 0.009413812309503555, "nll_loss": 0.009413812309503555} +{"epoch": 16, "step": 23442, "loss": 0.01889742538332939, "nll_loss": 0.01889742538332939} +{"epoch": 16, "step": 23443, "loss": 0.027958789840340614, "nll_loss": 0.027958789840340614} +{"epoch": 16, "step": 23444, "loss": 0.03070446103811264, "nll_loss": 0.03070446103811264} +{"epoch": 16, "step": 23445, "loss": 0.013581525534391403, "nll_loss": 0.013581525534391403} +{"epoch": 16, "step": 23446, "loss": 0.01774377003312111, "nll_loss": 0.01774377003312111} +{"epoch": 16, "step": 23447, "loss": 0.009576681070029736, "nll_loss": 0.009576681070029736} +{"epoch": 16, "step": 23448, "loss": 0.014030268415808678, "nll_loss": 0.014030268415808678} +{"epoch": 16, "step": 23449, "loss": 0.022771062329411507, "nll_loss": 0.022771062329411507} +{"epoch": 16, "step": 23450, "loss": 0.03129367530345917, "nll_loss": 0.03129367530345917} +{"epoch": 16, "step": 23451, "loss": 0.019364235922694206, "nll_loss": 0.019364235922694206} +{"epoch": 16, "step": 23452, "loss": 0.05092012137174606, "nll_loss": 0.05092012137174606} +{"epoch": 16, "step": 23453, "loss": 0.03389132767915726, "nll_loss": 0.03389132767915726} +{"epoch": 16, "step": 23454, "loss": 0.03474046662449837, "nll_loss": 0.03474046662449837} +{"epoch": 16, "step": 23455, "loss": 0.012924729846417904, "nll_loss": 0.012924729846417904} +{"epoch": 16, "step": 23456, "loss": 0.028655581176280975, "nll_loss": 0.028655581176280975} +{"epoch": 16, "step": 23457, "loss": 0.011658867821097374, "nll_loss": 0.011658867821097374} +{"epoch": 16, "step": 23458, "loss": 0.024796411395072937, "nll_loss": 0.024796411395072937} +{"epoch": 16, "step": 23459, "loss": 0.01408492773771286, "nll_loss": 0.01408492773771286} +{"epoch": 16, "step": 23460, "loss": 0.040497101843357086, "nll_loss": 0.040497101843357086} +{"epoch": 16, "step": 23461, "loss": 0.01923310197889805, "nll_loss": 0.01923310197889805} +{"epoch": 16, "step": 23462, "loss": 0.005347745027393103, "nll_loss": 0.005347745027393103} +{"epoch": 16, "step": 23463, "loss": 0.04256203770637512, "nll_loss": 0.04256203770637512} +{"epoch": 16, "step": 23464, "loss": 0.017574789002537727, "nll_loss": 0.017574789002537727} +{"epoch": 16, "step": 23465, "loss": 0.021428551524877548, "nll_loss": 0.021428551524877548} +{"epoch": 16, "step": 23466, "loss": 0.02906038984656334, "nll_loss": 0.02906038984656334} +{"epoch": 16, "step": 23467, "loss": 0.006021664943546057, "nll_loss": 0.006021664943546057} +{"epoch": 16, "step": 23468, "loss": 0.028806965798139572, "nll_loss": 0.028806965798139572} +{"epoch": 16, "step": 23469, "loss": 0.05472559481859207, "nll_loss": 0.05472559481859207} +{"epoch": 16, "step": 23470, "loss": 0.02450363151729107, "nll_loss": 0.02450363151729107} +{"epoch": 16, "step": 23471, "loss": 0.03988373279571533, "nll_loss": 0.03988373279571533} +{"epoch": 16, "step": 23472, "loss": 0.028174569830298424, "nll_loss": 0.028174569830298424} +{"epoch": 16, "step": 23473, "loss": 0.017011111602187157, "nll_loss": 0.017011111602187157} +{"epoch": 16, "step": 23474, "loss": 0.017549067735671997, "nll_loss": 0.017549067735671997} +{"epoch": 16, "step": 23475, "loss": 0.017501968890428543, "nll_loss": 0.017501968890428543} +{"epoch": 16, "step": 23476, "loss": 0.020558273419737816, "nll_loss": 0.020558273419737816} +{"epoch": 16, "step": 23477, "loss": 0.024008173495531082, "nll_loss": 0.024008173495531082} +{"epoch": 16, "step": 23478, "loss": 0.01960599049925804, "nll_loss": 0.01960599049925804} +{"epoch": 16, "step": 23479, "loss": 0.027067728340625763, "nll_loss": 0.027067728340625763} +{"epoch": 16, "step": 23480, "loss": 0.02792791649699211, "nll_loss": 0.02792791649699211} +{"epoch": 16, "step": 23481, "loss": 0.029054945334792137, "nll_loss": 0.029054945334792137} +{"epoch": 16, "step": 23482, "loss": 0.027077287435531616, "nll_loss": 0.027077287435531616} +{"epoch": 16, "step": 23483, "loss": 0.04678618535399437, "nll_loss": 0.04678618535399437} +{"epoch": 16, "step": 23484, "loss": 0.026149531826376915, "nll_loss": 0.026149531826376915} +{"epoch": 16, "step": 23485, "loss": 0.02284340374171734, "nll_loss": 0.02284340374171734} +{"epoch": 16, "step": 23486, "loss": 0.031870078295469284, "nll_loss": 0.031870078295469284} +{"epoch": 16, "step": 23487, "loss": 0.05184045061469078, "nll_loss": 0.05184045061469078} +{"epoch": 16, "step": 23488, "loss": 0.051826998591423035, "nll_loss": 0.051826998591423035} +{"epoch": 16, "step": 23489, "loss": 0.024809740483760834, "nll_loss": 0.024809740483760834} +{"epoch": 16, "step": 23490, "loss": 0.02599165588617325, "nll_loss": 0.02599165588617325} +{"epoch": 16, "step": 23491, "loss": 0.016917726024985313, "nll_loss": 0.016917726024985313} +{"epoch": 16, "step": 23492, "loss": 0.01933923363685608, "nll_loss": 0.01933923363685608} +{"epoch": 16, "step": 23493, "loss": 0.024975398555397987, "nll_loss": 0.024975398555397987} +{"epoch": 16, "step": 23494, "loss": 0.02938969060778618, "nll_loss": 0.02938969060778618} +{"epoch": 16, "step": 23495, "loss": 0.033612899482250214, "nll_loss": 0.033612899482250214} +{"epoch": 16, "step": 23496, "loss": 0.02001803368330002, "nll_loss": 0.02001803368330002} +{"epoch": 16, "step": 23497, "loss": 0.012512410059571266, "nll_loss": 0.012512410059571266} +{"epoch": 16, "step": 23498, "loss": 0.050826068967580795, "nll_loss": 0.050826068967580795} +{"epoch": 16, "step": 23499, "loss": 0.02079683169722557, "nll_loss": 0.02079683169722557} +{"epoch": 16, "step": 23500, "loss": 0.027419935911893845, "nll_loss": 0.027419935911893845} +{"epoch": 16, "step": 23501, "loss": 0.02912082150578499, "nll_loss": 0.02912082150578499} +{"epoch": 16, "step": 23502, "loss": 0.03669467940926552, "nll_loss": 0.03669467940926552} +{"epoch": 16, "step": 23503, "loss": 0.015237048268318176, "nll_loss": 0.015237048268318176} +{"epoch": 16, "step": 23504, "loss": 0.01831352524459362, "nll_loss": 0.01831352524459362} +{"epoch": 16, "step": 23505, "loss": 0.019971881061792374, "nll_loss": 0.019971881061792374} +{"epoch": 16, "step": 23506, "loss": 0.017988506704568863, "nll_loss": 0.017988506704568863} +{"epoch": 16, "step": 23507, "loss": 0.046086616814136505, "nll_loss": 0.046086616814136505} +{"epoch": 16, "step": 23508, "loss": 0.022770067676901817, "nll_loss": 0.022770067676901817} +{"epoch": 16, "step": 23509, "loss": 0.02162676304578781, "nll_loss": 0.02162676304578781} +{"epoch": 16, "step": 23510, "loss": 0.026430612429976463, "nll_loss": 0.026430612429976463} +{"epoch": 16, "step": 23511, "loss": 0.015165131539106369, "nll_loss": 0.015165131539106369} +{"epoch": 16, "step": 23512, "loss": 0.0416247621178627, "nll_loss": 0.0416247621178627} +{"epoch": 16, "step": 23513, "loss": 0.024053305387496948, "nll_loss": 0.024053305387496948} +{"epoch": 16, "step": 23514, "loss": 0.04462996497750282, "nll_loss": 0.04462996497750282} +{"epoch": 16, "step": 23515, "loss": 0.01965770125389099, "nll_loss": 0.01965770125389099} +{"epoch": 16, "step": 23516, "loss": 0.01987934298813343, "nll_loss": 0.01987934298813343} +{"epoch": 16, "step": 23517, "loss": 0.03381185606122017, "nll_loss": 0.03381185606122017} +{"epoch": 16, "step": 23518, "loss": 0.028161918744444847, "nll_loss": 0.028161918744444847} +{"epoch": 16, "step": 23519, "loss": 0.027782045304775238, "nll_loss": 0.027782045304775238} +{"epoch": 16, "step": 23520, "loss": 0.0204436257481575, "nll_loss": 0.0204436257481575} +{"epoch": 16, "step": 23521, "loss": 0.016922932118177414, "nll_loss": 0.016922932118177414} +{"epoch": 16, "step": 23522, "loss": 0.022961203008890152, "nll_loss": 0.022961203008890152} +{"epoch": 16, "step": 23523, "loss": 0.03068877011537552, "nll_loss": 0.03068877011537552} +{"epoch": 16, "step": 23524, "loss": 0.024379462003707886, "nll_loss": 0.024379462003707886} +{"epoch": 16, "step": 23525, "loss": 0.030689207836985588, "nll_loss": 0.030689207836985588} +{"epoch": 16, "step": 23526, "loss": 0.024550724774599075, "nll_loss": 0.024550724774599075} +{"epoch": 16, "step": 23527, "loss": 0.05232642963528633, "nll_loss": 0.05232642963528633} +{"epoch": 16, "step": 23528, "loss": 0.01953563652932644, "nll_loss": 0.01953563652932644} +{"epoch": 16, "step": 23529, "loss": 0.027282115072011948, "nll_loss": 0.027282115072011948} +{"epoch": 16, "step": 23530, "loss": 0.027462873607873917, "nll_loss": 0.027462873607873917} +{"epoch": 16, "step": 23531, "loss": 0.0172671377658844, "nll_loss": 0.0172671377658844} +{"epoch": 16, "step": 23532, "loss": 0.01343871746212244, "nll_loss": 0.01343871746212244} +{"epoch": 16, "step": 23533, "loss": 0.026518329977989197, "nll_loss": 0.026518329977989197} +{"epoch": 16, "step": 23534, "loss": 0.028409318998456, "nll_loss": 0.028409318998456} +{"epoch": 16, "step": 23535, "loss": 0.027867848053574562, "nll_loss": 0.027867848053574562} +{"epoch": 16, "step": 23536, "loss": 0.026839759200811386, "nll_loss": 0.026839759200811386} +{"epoch": 16, "step": 23537, "loss": 0.01974164880812168, "nll_loss": 0.01974164880812168} +{"epoch": 16, "step": 23538, "loss": 0.014122198335826397, "nll_loss": 0.014122198335826397} +{"epoch": 16, "step": 23539, "loss": 0.02790798805654049, "nll_loss": 0.02790798805654049} +{"epoch": 16, "step": 23540, "loss": 0.018150540068745613, "nll_loss": 0.018150540068745613} +{"epoch": 16, "step": 23541, "loss": 0.036695096641778946, "nll_loss": 0.036695096641778946} +{"epoch": 16, "step": 23542, "loss": 0.01638164557516575, "nll_loss": 0.01638164557516575} +{"epoch": 16, "step": 23543, "loss": 0.023741960525512695, "nll_loss": 0.023741960525512695} +{"epoch": 16, "step": 23544, "loss": 0.008546598255634308, "nll_loss": 0.008546598255634308} +{"epoch": 16, "step": 23545, "loss": 0.05134747177362442, "nll_loss": 0.05134747177362442} +{"epoch": 16, "step": 23546, "loss": 0.024304844439029694, "nll_loss": 0.024304844439029694} +{"epoch": 16, "step": 23547, "loss": 0.04568466171622276, "nll_loss": 0.04568466171622276} +{"epoch": 16, "step": 23548, "loss": 0.014059726148843765, "nll_loss": 0.014059726148843765} +{"epoch": 16, "step": 23549, "loss": 0.016226354986429214, "nll_loss": 0.016226354986429214} +{"epoch": 16, "step": 23550, "loss": 0.033999159932136536, "nll_loss": 0.033999159932136536} +{"epoch": 16, "step": 23551, "loss": 0.04819828271865845, "nll_loss": 0.04819828271865845} +{"epoch": 16, "step": 23552, "loss": 0.04822136089205742, "nll_loss": 0.04822136089205742} +{"epoch": 16, "step": 23553, "loss": 0.007538724225014448, "nll_loss": 0.007538724225014448} +{"epoch": 16, "step": 23554, "loss": 0.023684771731495857, "nll_loss": 0.023684771731495857} +{"epoch": 16, "step": 23555, "loss": 0.02261774241924286, "nll_loss": 0.02261774241924286} +{"epoch": 16, "step": 23556, "loss": 0.01988813653588295, "nll_loss": 0.01988813653588295} +{"epoch": 16, "step": 23557, "loss": 0.02019374445080757, "nll_loss": 0.02019374445080757} +{"epoch": 16, "step": 23558, "loss": 0.019428184255957603, "nll_loss": 0.019428184255957603} +{"epoch": 16, "step": 23559, "loss": 0.01942901499569416, "nll_loss": 0.01942901499569416} +{"epoch": 16, "step": 23560, "loss": 0.04455724358558655, "nll_loss": 0.04455724358558655} +{"epoch": 16, "step": 23561, "loss": 0.016260433942079544, "nll_loss": 0.016260433942079544} +{"epoch": 16, "step": 23562, "loss": 0.039340753108263016, "nll_loss": 0.039340753108263016} +{"epoch": 16, "step": 23563, "loss": 0.018376395106315613, "nll_loss": 0.018376395106315613} +{"epoch": 16, "step": 23564, "loss": 0.024469075724482536, "nll_loss": 0.024469075724482536} +{"epoch": 16, "step": 23565, "loss": 0.016961535438895226, "nll_loss": 0.016961535438895226} +{"epoch": 16, "step": 23566, "loss": 0.016854027286171913, "nll_loss": 0.016854027286171913} +{"epoch": 16, "step": 23567, "loss": 0.03370235115289688, "nll_loss": 0.03370235115289688} +{"epoch": 16, "step": 23568, "loss": 0.024077003821730614, "nll_loss": 0.024077003821730614} +{"epoch": 16, "step": 23569, "loss": 0.013687972910702229, "nll_loss": 0.013687972910702229} +{"epoch": 16, "step": 23570, "loss": 0.027238862589001656, "nll_loss": 0.027238862589001656} +{"epoch": 16, "step": 23571, "loss": 0.023627152666449547, "nll_loss": 0.023627152666449547} +{"epoch": 16, "step": 23572, "loss": 0.025822512805461884, "nll_loss": 0.025822512805461884} +{"epoch": 16, "step": 23573, "loss": 0.01889362931251526, "nll_loss": 0.01889362931251526} +{"epoch": 16, "step": 23574, "loss": 0.05996908247470856, "nll_loss": 0.05996908247470856} +{"epoch": 16, "step": 23575, "loss": 0.015542428940534592, "nll_loss": 0.015542428940534592} +{"epoch": 16, "step": 23576, "loss": 0.022468779236078262, "nll_loss": 0.022468779236078262} +{"epoch": 16, "step": 23577, "loss": 0.03485875576734543, "nll_loss": 0.03485875576734543} +{"epoch": 16, "step": 23578, "loss": 0.03498489037156105, "nll_loss": 0.03498489037156105} +{"epoch": 16, "step": 23579, "loss": 0.03895875811576843, "nll_loss": 0.03895875811576843} +{"epoch": 16, "step": 23580, "loss": 0.012749316170811653, "nll_loss": 0.012749316170811653} +{"epoch": 16, "step": 23581, "loss": 0.025109970942139626, "nll_loss": 0.025109970942139626} +{"epoch": 16, "step": 23582, "loss": 0.012592514045536518, "nll_loss": 0.012592514045536518} +{"epoch": 16, "step": 23583, "loss": 0.02682637609541416, "nll_loss": 0.02682637609541416} +{"epoch": 16, "step": 23584, "loss": 0.02757362462580204, "nll_loss": 0.02757362462580204} +{"epoch": 16, "step": 23585, "loss": 0.023202549666166306, "nll_loss": 0.023202549666166306} +{"epoch": 16, "step": 23586, "loss": 0.03567873314023018, "nll_loss": 0.03567873314023018} +{"epoch": 16, "step": 23587, "loss": 0.029055528342723846, "nll_loss": 0.029055528342723846} +{"epoch": 16, "step": 23588, "loss": 0.028084034100174904, "nll_loss": 0.028084034100174904} +{"epoch": 16, "step": 23589, "loss": 0.006113117560744286, "nll_loss": 0.006113117560744286} +{"epoch": 16, "step": 23590, "loss": 0.019069993868470192, "nll_loss": 0.019069993868470192} +{"epoch": 16, "step": 23591, "loss": 0.02090393751859665, "nll_loss": 0.02090393751859665} +{"epoch": 16, "step": 23592, "loss": 0.02799120359122753, "nll_loss": 0.02799120359122753} +{"epoch": 16, "step": 23593, "loss": 0.022561388090252876, "nll_loss": 0.022561388090252876} +{"epoch": 16, "step": 23594, "loss": 0.030955279245972633, "nll_loss": 0.030955279245972633} +{"epoch": 16, "step": 23595, "loss": 0.017678789794445038, "nll_loss": 0.017678789794445038} +{"epoch": 16, "step": 23596, "loss": 0.03518478572368622, "nll_loss": 0.03518478572368622} +{"epoch": 16, "step": 23597, "loss": 0.019984887912869453, "nll_loss": 0.019984887912869453} +{"epoch": 16, "step": 23598, "loss": 0.01698465645313263, "nll_loss": 0.01698465645313263} +{"epoch": 16, "step": 23599, "loss": 0.029614979401230812, "nll_loss": 0.029614979401230812} +{"epoch": 16, "step": 23600, "loss": 0.008435402996838093, "nll_loss": 0.008435402996838093} +{"epoch": 16, "step": 23601, "loss": 0.02558904141187668, "nll_loss": 0.02558904141187668} +{"epoch": 16, "step": 23602, "loss": 0.03422178328037262, "nll_loss": 0.03422178328037262} +{"epoch": 16, "step": 23603, "loss": 0.015204397030174732, "nll_loss": 0.015204397030174732} +{"epoch": 16, "step": 23604, "loss": 0.030533870682120323, "nll_loss": 0.030533870682120323} +{"epoch": 16, "step": 23605, "loss": 0.022517036646604538, "nll_loss": 0.022517036646604538} +{"epoch": 16, "step": 23606, "loss": 0.014304316602647305, "nll_loss": 0.014304316602647305} +{"epoch": 16, "step": 23607, "loss": 0.012166772037744522, "nll_loss": 0.012166772037744522} +{"epoch": 16, "step": 23608, "loss": 0.0394282341003418, "nll_loss": 0.0394282341003418} +{"epoch": 16, "step": 23609, "loss": 0.01994229108095169, "nll_loss": 0.01994229108095169} +{"epoch": 16, "step": 23610, "loss": 0.02847033180296421, "nll_loss": 0.02847033180296421} +{"epoch": 16, "step": 23611, "loss": 0.034965891391038895, "nll_loss": 0.034965891391038895} +{"epoch": 16, "step": 23612, "loss": 0.03391773998737335, "nll_loss": 0.03391773998737335} +{"epoch": 16, "step": 23613, "loss": 0.02158544585108757, "nll_loss": 0.02158544585108757} +{"epoch": 16, "step": 23614, "loss": 0.01816568523645401, "nll_loss": 0.01816568523645401} +{"epoch": 16, "step": 23615, "loss": 0.022099556401371956, "nll_loss": 0.022099556401371956} +{"epoch": 16, "step": 23616, "loss": 0.006347576156258583, "nll_loss": 0.006347576156258583} +{"epoch": 16, "step": 23617, "loss": 0.008334990590810776, "nll_loss": 0.008334990590810776} +{"epoch": 16, "step": 23618, "loss": 0.0249245073646307, "nll_loss": 0.0249245073646307} +{"epoch": 16, "step": 23619, "loss": 0.021635839715600014, "nll_loss": 0.021635839715600014} +{"epoch": 16, "step": 23620, "loss": 0.022876132279634476, "nll_loss": 0.022876132279634476} +{"epoch": 16, "step": 23621, "loss": 0.04486817866563797, "nll_loss": 0.04486817866563797} +{"epoch": 16, "step": 23622, "loss": 0.011985098011791706, "nll_loss": 0.011985098011791706} +{"epoch": 16, "step": 23623, "loss": 0.02857290953397751, "nll_loss": 0.02857290953397751} +{"epoch": 16, "step": 23624, "loss": 0.013282624073326588, "nll_loss": 0.013282624073326588} +{"epoch": 16, "step": 23625, "loss": 0.035400211811065674, "nll_loss": 0.035400211811065674} +{"epoch": 16, "step": 23626, "loss": 0.0258359145373106, "nll_loss": 0.0258359145373106} +{"epoch": 16, "step": 23627, "loss": 0.03253761678934097, "nll_loss": 0.03253761678934097} +{"epoch": 16, "step": 23628, "loss": 0.026808520779013634, "nll_loss": 0.026808520779013634} +{"epoch": 16, "step": 23629, "loss": 0.021540919318795204, "nll_loss": 0.021540919318795204} +{"epoch": 16, "step": 23630, "loss": 0.02254650928080082, "nll_loss": 0.02254650928080082} +{"epoch": 16, "step": 23631, "loss": 0.027771444991230965, "nll_loss": 0.027771444991230965} +{"epoch": 16, "step": 23632, "loss": 0.008319530636072159, "nll_loss": 0.008319530636072159} +{"epoch": 16, "step": 23633, "loss": 0.02814142405986786, "nll_loss": 0.02814142405986786} +{"epoch": 16, "step": 23634, "loss": 0.024005571380257607, "nll_loss": 0.024005571380257607} +{"epoch": 16, "step": 23635, "loss": 0.03421473130583763, "nll_loss": 0.03421473130583763} +{"epoch": 16, "step": 23636, "loss": 0.03939709812402725, "nll_loss": 0.03939709812402725} +{"epoch": 16, "step": 23637, "loss": 0.021967638283967972, "nll_loss": 0.021967638283967972} +{"epoch": 16, "step": 23638, "loss": 0.02333017997443676, "nll_loss": 0.02333017997443676} +{"epoch": 16, "step": 23639, "loss": 0.031095365062355995, "nll_loss": 0.031095365062355995} +{"epoch": 16, "step": 23640, "loss": 0.020897112786769867, "nll_loss": 0.020897112786769867} +{"epoch": 16, "step": 23641, "loss": 0.0064336820505559444, "nll_loss": 0.0064336820505559444} +{"epoch": 16, "step": 23642, "loss": 0.03658458963036537, "nll_loss": 0.03658458963036537} +{"epoch": 16, "step": 23643, "loss": 0.014289561659097672, "nll_loss": 0.014289561659097672} +{"epoch": 16, "step": 23644, "loss": 0.01077709998935461, "nll_loss": 0.01077709998935461} +{"epoch": 16, "step": 23645, "loss": 0.02470439486205578, "nll_loss": 0.02470439486205578} +{"epoch": 16, "step": 23646, "loss": 0.013001304119825363, "nll_loss": 0.013001304119825363} +{"epoch": 16, "step": 23647, "loss": 0.019298797473311424, "nll_loss": 0.019298797473311424} +{"epoch": 16, "step": 23648, "loss": 0.025552913546562195, "nll_loss": 0.025552913546562195} +{"epoch": 16, "step": 23649, "loss": 0.023564239963889122, "nll_loss": 0.023564239963889122} +{"epoch": 16, "step": 23650, "loss": 0.029763590544462204, "nll_loss": 0.029763590544462204} +{"epoch": 16, "step": 23651, "loss": 0.02315947227180004, "nll_loss": 0.02315947227180004} +{"epoch": 16, "step": 23652, "loss": 0.03409246727824211, "nll_loss": 0.03409246727824211} +{"epoch": 16, "step": 23653, "loss": 0.01622360199689865, "nll_loss": 0.01622360199689865} +{"epoch": 16, "step": 23654, "loss": 0.030306966975331306, "nll_loss": 0.030306966975331306} +{"epoch": 16, "step": 23655, "loss": 0.018050167709589005, "nll_loss": 0.018050167709589005} +{"epoch": 16, "step": 23656, "loss": 0.021638112142682076, "nll_loss": 0.021638112142682076} +{"epoch": 16, "step": 23657, "loss": 0.019860779866576195, "nll_loss": 0.019860779866576195} +{"epoch": 16, "step": 23658, "loss": 0.018571050837635994, "nll_loss": 0.018571050837635994} +{"epoch": 16, "step": 23659, "loss": 0.01916118897497654, "nll_loss": 0.01916118897497654} +{"epoch": 16, "step": 23660, "loss": 0.03261398524045944, "nll_loss": 0.03261398524045944} +{"epoch": 16, "step": 23661, "loss": 0.03571705147624016, "nll_loss": 0.03571705147624016} +{"epoch": 16, "step": 23662, "loss": 0.015375831164419651, "nll_loss": 0.015375831164419651} +{"epoch": 16, "step": 23663, "loss": 0.03647930547595024, "nll_loss": 0.03647930547595024} +{"epoch": 16, "step": 23664, "loss": 0.04171255603432655, "nll_loss": 0.04171255603432655} +{"epoch": 16, "step": 23665, "loss": 0.01634400337934494, "nll_loss": 0.01634400337934494} +{"epoch": 16, "step": 23666, "loss": 0.027997873723506927, "nll_loss": 0.027997873723506927} +{"epoch": 16, "step": 23667, "loss": 0.019452286884188652, "nll_loss": 0.019452286884188652} +{"epoch": 16, "step": 23668, "loss": 0.022987613454461098, "nll_loss": 0.022987613454461098} +{"epoch": 16, "step": 23669, "loss": 0.018221715465188026, "nll_loss": 0.018221715465188026} +{"epoch": 16, "step": 23670, "loss": 0.03022262267768383, "nll_loss": 0.03022262267768383} +{"epoch": 16, "step": 23671, "loss": 0.017972806468605995, "nll_loss": 0.017972806468605995} +{"epoch": 16, "step": 23672, "loss": 0.030230751261115074, "nll_loss": 0.030230751261115074} +{"epoch": 16, "step": 23673, "loss": 0.029103770852088928, "nll_loss": 0.029103770852088928} +{"epoch": 16, "step": 23674, "loss": 0.030507013201713562, "nll_loss": 0.030507013201713562} +{"epoch": 16, "step": 23675, "loss": 0.028003111481666565, "nll_loss": 0.028003111481666565} +{"epoch": 16, "step": 23676, "loss": 0.02268623374402523, "nll_loss": 0.02268623374402523} +{"epoch": 16, "step": 23677, "loss": 0.011811972595751286, "nll_loss": 0.011811972595751286} +{"epoch": 16, "step": 23678, "loss": 0.022758087143301964, "nll_loss": 0.022758087143301964} +{"epoch": 16, "step": 23679, "loss": 0.02390250749886036, "nll_loss": 0.02390250749886036} +{"epoch": 16, "step": 23680, "loss": 0.034108687192201614, "nll_loss": 0.034108687192201614} +{"epoch": 16, "step": 23681, "loss": 0.01151376310735941, "nll_loss": 0.01151376310735941} +{"epoch": 16, "step": 23682, "loss": 0.018861671909689903, "nll_loss": 0.018861671909689903} +{"epoch": 16, "step": 23683, "loss": 0.026656020432710648, "nll_loss": 0.026656020432710648} +{"epoch": 16, "step": 23684, "loss": 0.03467901796102524, "nll_loss": 0.03467901796102524} +{"epoch": 16, "step": 23685, "loss": 0.031182872131466866, "nll_loss": 0.031182872131466866} +{"epoch": 16, "step": 23686, "loss": 0.024260902777314186, "nll_loss": 0.024260902777314186} +{"epoch": 16, "step": 23687, "loss": 0.013202013447880745, "nll_loss": 0.013202013447880745} +{"epoch": 16, "step": 23688, "loss": 0.0500575490295887, "nll_loss": 0.0500575490295887} +{"epoch": 16, "step": 23689, "loss": 0.013637478463351727, "nll_loss": 0.013637478463351727} +{"epoch": 16, "step": 23690, "loss": 0.03306487202644348, "nll_loss": 0.03306487202644348} +{"epoch": 16, "step": 23691, "loss": 0.017227012664079666, "nll_loss": 0.017227012664079666} +{"epoch": 16, "step": 23692, "loss": 0.09770563989877701, "nll_loss": 0.09770563989877701} +{"epoch": 16, "step": 23693, "loss": 0.012191551737487316, "nll_loss": 0.012191551737487316} +{"epoch": 16, "step": 23694, "loss": 0.026758262887597084, "nll_loss": 0.026758262887597084} +{"epoch": 16, "step": 23695, "loss": 0.025796210393309593, "nll_loss": 0.025796210393309593} +{"epoch": 16, "step": 23696, "loss": 0.03418780863285065, "nll_loss": 0.03418780863285065} +{"epoch": 16, "step": 23697, "loss": 0.02367996983230114, "nll_loss": 0.02367996983230114} +{"epoch": 16, "step": 23698, "loss": 0.018828170374035835, "nll_loss": 0.018828170374035835} +{"epoch": 16, "step": 23699, "loss": 0.020908594131469727, "nll_loss": 0.020908594131469727} +{"epoch": 16, "step": 23700, "loss": 0.024819951504468918, "nll_loss": 0.024819951504468918} +{"epoch": 16, "step": 23701, "loss": 0.012362685054540634, "nll_loss": 0.012362685054540634} +{"epoch": 16, "step": 23702, "loss": 0.022279877215623856, "nll_loss": 0.022279877215623856} +{"epoch": 16, "step": 23703, "loss": 0.014784102328121662, "nll_loss": 0.014784102328121662} +{"epoch": 16, "step": 23704, "loss": 0.019277218729257584, "nll_loss": 0.019277218729257584} +{"epoch": 16, "step": 23705, "loss": 0.020734917372465134, "nll_loss": 0.020734917372465134} +{"epoch": 16, "step": 23706, "loss": 0.027471808716654778, "nll_loss": 0.027471808716654778} +{"epoch": 16, "step": 23707, "loss": 0.020142827183008194, "nll_loss": 0.020142827183008194} +{"epoch": 16, "step": 23708, "loss": 0.023563245311379433, "nll_loss": 0.023563245311379433} +{"epoch": 16, "step": 23709, "loss": 0.03220183402299881, "nll_loss": 0.03220183402299881} +{"epoch": 16, "step": 23710, "loss": 0.01860007457435131, "nll_loss": 0.01860007457435131} +{"epoch": 16, "step": 23711, "loss": 0.02768534980714321, "nll_loss": 0.02768534980714321} +{"epoch": 16, "step": 23712, "loss": 0.030966907739639282, "nll_loss": 0.030966907739639282} +{"epoch": 16, "step": 23713, "loss": 0.012462329119443893, "nll_loss": 0.012462329119443893} +{"epoch": 16, "step": 23714, "loss": 0.031856097280979156, "nll_loss": 0.031856097280979156} +{"epoch": 16, "step": 23715, "loss": 0.018873313441872597, "nll_loss": 0.018873313441872597} +{"epoch": 16, "step": 23716, "loss": 0.03320472314953804, "nll_loss": 0.03320472314953804} +{"epoch": 16, "step": 23717, "loss": 0.011525229550898075, "nll_loss": 0.011525229550898075} +{"epoch": 16, "step": 23718, "loss": 0.012020347639918327, "nll_loss": 0.012020347639918327} +{"epoch": 16, "step": 23719, "loss": 0.0213021133095026, "nll_loss": 0.0213021133095026} +{"epoch": 16, "step": 23720, "loss": 0.027974408119916916, "nll_loss": 0.027974408119916916} +{"epoch": 16, "step": 23721, "loss": 0.03893360495567322, "nll_loss": 0.03893360495567322} +{"epoch": 16, "step": 23722, "loss": 0.02991269901394844, "nll_loss": 0.02991269901394844} +{"epoch": 16, "step": 23723, "loss": 0.007071713916957378, "nll_loss": 0.007071713916957378} +{"epoch": 16, "step": 23724, "loss": 0.018117712810635567, "nll_loss": 0.018117712810635567} +{"epoch": 16, "step": 23725, "loss": 0.02290685661137104, "nll_loss": 0.02290685661137104} +{"epoch": 16, "step": 23726, "loss": 0.017284274101257324, "nll_loss": 0.017284274101257324} +{"epoch": 16, "step": 23727, "loss": 0.014358742162585258, "nll_loss": 0.014358742162585258} +{"epoch": 16, "step": 23728, "loss": 0.020135750994086266, "nll_loss": 0.020135750994086266} +{"epoch": 16, "step": 23729, "loss": 0.007823669351637363, "nll_loss": 0.007823669351637363} +{"epoch": 16, "step": 23730, "loss": 0.016396529972553253, "nll_loss": 0.016396529972553253} +{"epoch": 16, "step": 23731, "loss": 0.03128466382622719, "nll_loss": 0.03128466382622719} +{"epoch": 16, "step": 23732, "loss": 0.03210127353668213, "nll_loss": 0.03210127353668213} +{"epoch": 16, "step": 23733, "loss": 0.01537817157804966, "nll_loss": 0.01537817157804966} +{"epoch": 16, "step": 23734, "loss": 0.021066341549158096, "nll_loss": 0.021066341549158096} +{"epoch": 16, "step": 23735, "loss": 0.031441766768693924, "nll_loss": 0.031441766768693924} +{"epoch": 16, "step": 23736, "loss": 0.02001473866403103, "nll_loss": 0.02001473866403103} +{"epoch": 16, "step": 23737, "loss": 0.04507226496934891, "nll_loss": 0.04507226496934891} +{"epoch": 16, "step": 23738, "loss": 0.009889344684779644, "nll_loss": 0.009889344684779644} +{"epoch": 16, "step": 23739, "loss": 0.012452930212020874, "nll_loss": 0.012452930212020874} +{"epoch": 16, "step": 23740, "loss": 0.023740800097584724, "nll_loss": 0.023740800097584724} +{"epoch": 16, "step": 23741, "loss": 0.02218271791934967, "nll_loss": 0.02218271791934967} +{"epoch": 16, "step": 23742, "loss": 0.02478898875415325, "nll_loss": 0.02478898875415325} +{"epoch": 16, "step": 23743, "loss": 0.010904255323112011, "nll_loss": 0.010904255323112011} +{"epoch": 16, "step": 23744, "loss": 0.015567240305244923, "nll_loss": 0.015567240305244923} +{"epoch": 16, "step": 23745, "loss": 0.021951179951429367, "nll_loss": 0.021951179951429367} +{"epoch": 16, "step": 23746, "loss": 0.022477908059954643, "nll_loss": 0.022477908059954643} +{"epoch": 16, "step": 23747, "loss": 0.037644363939762115, "nll_loss": 0.037644363939762115} +{"epoch": 16, "step": 23748, "loss": 0.06165555864572525, "nll_loss": 0.06165555864572525} +{"epoch": 16, "step": 23749, "loss": 0.02444262057542801, "nll_loss": 0.02444262057542801} +{"epoch": 16, "step": 23750, "loss": 0.023931220173835754, "nll_loss": 0.023931220173835754} +{"epoch": 16, "step": 23751, "loss": 0.07563593238592148, "nll_loss": 0.07563593238592148} +{"epoch": 16, "step": 23752, "loss": 0.06424055248498917, "nll_loss": 0.06424055248498917} +{"epoch": 16, "step": 23753, "loss": 0.005877757910639048, "nll_loss": 0.005877757910639048} +{"epoch": 16, "step": 23754, "loss": 0.01557666901499033, "nll_loss": 0.01557666901499033} +{"epoch": 16, "step": 23755, "loss": 0.044105999171733856, "nll_loss": 0.044105999171733856} +{"epoch": 16, "step": 23756, "loss": 0.04439408704638481, "nll_loss": 0.04439408704638481} +{"epoch": 16, "step": 23757, "loss": 0.010559260845184326, "nll_loss": 0.010559260845184326} +{"epoch": 16, "step": 23758, "loss": 0.0261802040040493, "nll_loss": 0.0261802040040493} +{"epoch": 16, "step": 23759, "loss": 0.017574306577444077, "nll_loss": 0.017574306577444077} +{"epoch": 16, "step": 23760, "loss": 0.02688611112535, "nll_loss": 0.02688611112535} +{"epoch": 16, "step": 23761, "loss": 0.018763355910778046, "nll_loss": 0.018763355910778046} +{"epoch": 16, "step": 23762, "loss": 0.029139172285795212, "nll_loss": 0.029139172285795212} +{"epoch": 16, "step": 23763, "loss": 0.01663164608180523, "nll_loss": 0.01663164608180523} +{"epoch": 16, "step": 23764, "loss": 0.03620545193552971, "nll_loss": 0.03620545193552971} +{"epoch": 16, "step": 23765, "loss": 0.02102804370224476, "nll_loss": 0.02102804370224476} +{"epoch": 16, "step": 23766, "loss": 0.014717805199325085, "nll_loss": 0.014717805199325085} +{"epoch": 16, "step": 23767, "loss": 0.02093885838985443, "nll_loss": 0.02093885838985443} +{"epoch": 16, "step": 23768, "loss": 0.0183844156563282, "nll_loss": 0.0183844156563282} +{"epoch": 16, "step": 23769, "loss": 0.02014070376753807, "nll_loss": 0.02014070376753807} +{"epoch": 16, "step": 23770, "loss": 0.030065909028053284, "nll_loss": 0.030065909028053284} +{"epoch": 16, "step": 23771, "loss": 0.022695327177643776, "nll_loss": 0.022695327177643776} +{"epoch": 16, "step": 23772, "loss": 0.025869768112897873, "nll_loss": 0.025869768112897873} +{"epoch": 16, "step": 23773, "loss": 0.022221900522708893, "nll_loss": 0.022221900522708893} +{"epoch": 16, "step": 23774, "loss": 0.020620206370949745, "nll_loss": 0.020620206370949745} +{"epoch": 16, "step": 23775, "loss": 0.029337113723158836, "nll_loss": 0.029337113723158836} +{"epoch": 16, "step": 23776, "loss": 0.02605840563774109, "nll_loss": 0.02605840563774109} +{"epoch": 16, "step": 23777, "loss": 0.03035544604063034, "nll_loss": 0.03035544604063034} +{"epoch": 16, "step": 23778, "loss": 0.02226961776614189, "nll_loss": 0.02226961776614189} +{"epoch": 16, "step": 23779, "loss": 0.03356892988085747, "nll_loss": 0.03356892988085747} +{"epoch": 16, "step": 23780, "loss": 0.03804420307278633, "nll_loss": 0.03804420307278633} +{"epoch": 16, "step": 23781, "loss": 0.03302682191133499, "nll_loss": 0.03302682191133499} +{"epoch": 16, "step": 23782, "loss": 0.010654496029019356, "nll_loss": 0.010654496029019356} +{"epoch": 16, "step": 23783, "loss": 0.031891338527202606, "nll_loss": 0.031891338527202606} +{"epoch": 16, "step": 23784, "loss": 0.03602834790945053, "nll_loss": 0.03602834790945053} +{"epoch": 16, "step": 23785, "loss": 0.01627257838845253, "nll_loss": 0.01627257838845253} +{"epoch": 16, "step": 23786, "loss": 0.024415958672761917, "nll_loss": 0.024415958672761917} +{"epoch": 16, "step": 23787, "loss": 0.03698412701487541, "nll_loss": 0.03698412701487541} +{"epoch": 16, "step": 23788, "loss": 0.025728654116392136, "nll_loss": 0.025728654116392136} +{"epoch": 16, "step": 23789, "loss": 0.021318113431334496, "nll_loss": 0.021318113431334496} +{"epoch": 16, "step": 23790, "loss": 0.01815212331712246, "nll_loss": 0.01815212331712246} +{"epoch": 16, "step": 23791, "loss": 0.024816572666168213, "nll_loss": 0.024816572666168213} +{"epoch": 16, "step": 23792, "loss": 0.03849596157670021, "nll_loss": 0.03849596157670021} +{"epoch": 16, "step": 23793, "loss": 0.015041843056678772, "nll_loss": 0.015041843056678772} +{"epoch": 16, "step": 23794, "loss": 0.028447067365050316, "nll_loss": 0.028447067365050316} +{"epoch": 16, "step": 23795, "loss": 0.02287677675485611, "nll_loss": 0.02287677675485611} +{"epoch": 16, "step": 23796, "loss": 0.022285910323262215, "nll_loss": 0.022285910323262215} +{"epoch": 16, "step": 23797, "loss": 0.025641420856118202, "nll_loss": 0.025641420856118202} +{"epoch": 16, "step": 23798, "loss": 0.03119400329887867, "nll_loss": 0.03119400329887867} +{"epoch": 16, "step": 23799, "loss": 0.018854757770895958, "nll_loss": 0.018854757770895958} +{"epoch": 16, "step": 23800, "loss": 0.0202492568641901, "nll_loss": 0.0202492568641901} +{"epoch": 16, "step": 23801, "loss": 0.02943563647568226, "nll_loss": 0.02943563647568226} +{"epoch": 16, "step": 23802, "loss": 0.027830321341753006, "nll_loss": 0.027830321341753006} +{"epoch": 16, "step": 23803, "loss": 0.016621621325612068, "nll_loss": 0.016621621325612068} +{"epoch": 16, "step": 23804, "loss": 0.018097057938575745, "nll_loss": 0.018097057938575745} +{"epoch": 16, "step": 23805, "loss": 0.011644257232546806, "nll_loss": 0.011644257232546806} +{"epoch": 16, "step": 23806, "loss": 0.03178783878684044, "nll_loss": 0.03178783878684044} +{"epoch": 16, "step": 23807, "loss": 0.024356916546821594, "nll_loss": 0.024356916546821594} +{"epoch": 16, "step": 23808, "loss": 0.007645273581147194, "nll_loss": 0.007645273581147194} +{"epoch": 16, "step": 23809, "loss": 0.015300415456295013, "nll_loss": 0.015300415456295013} +{"epoch": 16, "step": 23810, "loss": 0.017980340868234634, "nll_loss": 0.017980340868234634} +{"epoch": 16, "step": 23811, "loss": 0.024141909554600716, "nll_loss": 0.024141909554600716} +{"epoch": 16, "step": 23812, "loss": 0.019027672708034515, "nll_loss": 0.019027672708034515} +{"epoch": 16, "step": 23813, "loss": 0.03471682220697403, "nll_loss": 0.03471682220697403} +{"epoch": 16, "step": 23814, "loss": 0.06699781119823456, "nll_loss": 0.06699781119823456} +{"epoch": 16, "step": 23815, "loss": 0.026669945567846298, "nll_loss": 0.026669945567846298} +{"epoch": 16, "step": 23816, "loss": 0.01911313645541668, "nll_loss": 0.01911313645541668} +{"epoch": 16, "step": 23817, "loss": 0.014886184595525265, "nll_loss": 0.014886184595525265} +{"epoch": 16, "step": 23818, "loss": 0.021991275250911713, "nll_loss": 0.021991275250911713} +{"epoch": 16, "step": 23819, "loss": 0.03259356692433357, "nll_loss": 0.03259356692433357} +{"epoch": 16, "step": 23820, "loss": 0.03205137327313423, "nll_loss": 0.03205137327313423} +{"epoch": 16, "step": 23821, "loss": 0.03213127329945564, "nll_loss": 0.03213127329945564} +{"epoch": 16, "step": 23822, "loss": 0.02264704741537571, "nll_loss": 0.02264704741537571} +{"epoch": 16, "step": 23823, "loss": 0.04264885187149048, "nll_loss": 0.04264885187149048} +{"epoch": 16, "step": 23824, "loss": 0.027147280052304268, "nll_loss": 0.027147280052304268} +{"epoch": 16, "step": 23825, "loss": 0.019758831709623337, "nll_loss": 0.019758831709623337} +{"epoch": 16, "step": 23826, "loss": 0.035292018204927444, "nll_loss": 0.035292018204927444} +{"epoch": 16, "step": 23827, "loss": 0.0262680072337389, "nll_loss": 0.0262680072337389} +{"epoch": 16, "step": 23828, "loss": 0.035433314740657806, "nll_loss": 0.035433314740657806} +{"epoch": 16, "step": 23829, "loss": 0.02086230367422104, "nll_loss": 0.02086230367422104} +{"epoch": 16, "step": 23830, "loss": 0.016529470682144165, "nll_loss": 0.016529470682144165} +{"epoch": 16, "step": 23831, "loss": 0.029054967686533928, "nll_loss": 0.029054967686533928} +{"epoch": 16, "step": 23832, "loss": 0.01129230111837387, "nll_loss": 0.01129230111837387} +{"epoch": 16, "step": 23833, "loss": 0.019863206893205643, "nll_loss": 0.019863206893205643} +{"epoch": 16, "step": 23834, "loss": 0.01939460076391697, "nll_loss": 0.01939460076391697} +{"epoch": 16, "step": 23835, "loss": 0.035746585577726364, "nll_loss": 0.035746585577726364} +{"epoch": 16, "step": 23836, "loss": 0.025172077119350433, "nll_loss": 0.025172077119350433} +{"epoch": 16, "step": 23837, "loss": 0.02884887158870697, "nll_loss": 0.02884887158870697} +{"epoch": 16, "step": 23838, "loss": 0.023873237892985344, "nll_loss": 0.023873237892985344} +{"epoch": 16, "step": 23839, "loss": 0.026747357100248337, "nll_loss": 0.026747357100248337} +{"epoch": 16, "step": 23840, "loss": 0.027231959626078606, "nll_loss": 0.027231959626078606} +{"epoch": 16, "step": 23841, "loss": 0.026538534089922905, "nll_loss": 0.026538534089922905} +{"epoch": 16, "step": 23842, "loss": 0.03634004667401314, "nll_loss": 0.03634004667401314} +{"epoch": 16, "step": 23843, "loss": 0.013390183448791504, "nll_loss": 0.013390183448791504} +{"epoch": 16, "step": 23844, "loss": 0.015948934480547905, "nll_loss": 0.015948934480547905} +{"epoch": 16, "step": 23845, "loss": 0.025869261473417282, "nll_loss": 0.025869261473417282} +{"epoch": 16, "step": 23846, "loss": 0.011324015446007252, "nll_loss": 0.011324015446007252} +{"epoch": 16, "step": 23847, "loss": 0.03254789486527443, "nll_loss": 0.03254789486527443} +{"epoch": 16, "step": 23848, "loss": 0.015101845376193523, "nll_loss": 0.015101845376193523} +{"epoch": 16, "step": 23849, "loss": 0.02445184253156185, "nll_loss": 0.02445184253156185} +{"epoch": 16, "step": 23850, "loss": 0.02368968166410923, "nll_loss": 0.02368968166410923} +{"epoch": 16, "step": 23851, "loss": 0.026957910507917404, "nll_loss": 0.026957910507917404} +{"epoch": 16, "step": 23852, "loss": 0.029136892408132553, "nll_loss": 0.029136892408132553} +{"epoch": 16, "step": 23853, "loss": 0.017000112682580948, "nll_loss": 0.017000112682580948} +{"epoch": 16, "step": 23854, "loss": 0.012932397425174713, "nll_loss": 0.012932397425174713} +{"epoch": 16, "step": 23855, "loss": 0.027311142534017563, "nll_loss": 0.027311142534017563} +{"epoch": 16, "step": 23856, "loss": 0.031072132289409637, "nll_loss": 0.031072132289409637} +{"epoch": 16, "step": 23857, "loss": 0.010404513217508793, "nll_loss": 0.010404513217508793} +{"epoch": 16, "step": 23858, "loss": 0.013043477199971676, "nll_loss": 0.013043477199971676} +{"epoch": 16, "step": 23859, "loss": 0.027464941143989563, "nll_loss": 0.027464941143989563} +{"epoch": 16, "step": 23860, "loss": 0.0177923534065485, "nll_loss": 0.0177923534065485} +{"epoch": 16, "step": 23861, "loss": 0.024211889132857323, "nll_loss": 0.024211889132857323} +{"epoch": 16, "step": 23862, "loss": 0.03552117198705673, "nll_loss": 0.03552117198705673} +{"epoch": 16, "step": 23863, "loss": 0.023353993892669678, "nll_loss": 0.023353993892669678} +{"epoch": 16, "step": 23864, "loss": 0.01902594231069088, "nll_loss": 0.01902594231069088} +{"epoch": 16, "step": 23865, "loss": 0.027753544971346855, "nll_loss": 0.027753544971346855} +{"epoch": 16, "step": 23866, "loss": 0.019028756767511368, "nll_loss": 0.019028756767511368} +{"epoch": 16, "step": 23867, "loss": 0.029844868928194046, "nll_loss": 0.029844868928194046} +{"epoch": 16, "step": 23868, "loss": 0.018007494509220123, "nll_loss": 0.018007494509220123} +{"epoch": 16, "step": 23869, "loss": 0.03961191326379776, "nll_loss": 0.03961191326379776} +{"epoch": 16, "step": 23870, "loss": 0.02824079804122448, "nll_loss": 0.02824079804122448} +{"epoch": 16, "step": 23871, "loss": 0.02232147380709648, "nll_loss": 0.02232147380709648} +{"epoch": 16, "step": 23872, "loss": 0.01509509701281786, "nll_loss": 0.01509509701281786} +{"epoch": 16, "step": 23873, "loss": 0.017221158370375633, "nll_loss": 0.017221158370375633} +{"epoch": 16, "step": 23874, "loss": 0.02300378866493702, "nll_loss": 0.02300378866493702} +{"epoch": 16, "step": 23875, "loss": 0.02943606860935688, "nll_loss": 0.02943606860935688} +{"epoch": 16, "step": 23876, "loss": 0.024209750816226006, "nll_loss": 0.024209750816226006} +{"epoch": 16, "step": 23877, "loss": 0.026957273483276367, "nll_loss": 0.026957273483276367} +{"epoch": 16, "step": 23878, "loss": 0.03562774509191513, "nll_loss": 0.03562774509191513} +{"epoch": 16, "step": 23879, "loss": 0.015367806889116764, "nll_loss": 0.015367806889116764} +{"epoch": 16, "step": 23880, "loss": 0.026902180165052414, "nll_loss": 0.026902180165052414} +{"epoch": 16, "step": 23881, "loss": 0.03945838660001755, "nll_loss": 0.03945838660001755} +{"epoch": 16, "step": 23882, "loss": 0.018877722322940826, "nll_loss": 0.018877722322940826} +{"epoch": 16, "step": 23883, "loss": 0.012131468392908573, "nll_loss": 0.012131468392908573} +{"epoch": 16, "step": 23884, "loss": 0.029849203303456306, "nll_loss": 0.029849203303456306} +{"epoch": 16, "step": 23885, "loss": 0.01830226182937622, "nll_loss": 0.01830226182937622} +{"epoch": 16, "step": 23886, "loss": 0.03471866250038147, "nll_loss": 0.03471866250038147} +{"epoch": 16, "step": 23887, "loss": 0.02709774486720562, "nll_loss": 0.02709774486720562} +{"epoch": 16, "step": 23888, "loss": 0.03954530879855156, "nll_loss": 0.03954530879855156} +{"epoch": 16, "step": 23889, "loss": 0.026972059160470963, "nll_loss": 0.026972059160470963} +{"epoch": 16, "step": 23890, "loss": 0.023518778383731842, "nll_loss": 0.023518778383731842} +{"epoch": 16, "step": 23891, "loss": 0.014580062590539455, "nll_loss": 0.014580062590539455} +{"epoch": 16, "step": 23892, "loss": 0.031090131029486656, "nll_loss": 0.031090131029486656} +{"epoch": 16, "step": 23893, "loss": 0.020814115181565285, "nll_loss": 0.020814115181565285} +{"epoch": 16, "step": 23894, "loss": 0.012886331416666508, "nll_loss": 0.012886331416666508} +{"epoch": 16, "step": 23895, "loss": 0.02026127278804779, "nll_loss": 0.02026127278804779} +{"epoch": 16, "step": 23896, "loss": 0.02789776585996151, "nll_loss": 0.02789776585996151} +{"epoch": 16, "step": 23897, "loss": 0.021229347214102745, "nll_loss": 0.021229347214102745} +{"epoch": 16, "step": 23898, "loss": 0.022268814966082573, "nll_loss": 0.022268814966082573} +{"epoch": 16, "step": 23899, "loss": 0.019001752138137817, "nll_loss": 0.019001752138137817} +{"epoch": 16, "step": 23900, "loss": 0.02491091564297676, "nll_loss": 0.02491091564297676} +{"epoch": 16, "step": 23901, "loss": 0.037660151720047, "nll_loss": 0.037660151720047} +{"epoch": 16, "step": 23902, "loss": 0.03274409472942352, "nll_loss": 0.03274409472942352} +{"epoch": 16, "step": 23903, "loss": 0.030714593827724457, "nll_loss": 0.030714593827724457} +{"epoch": 16, "step": 23904, "loss": 0.03599727898836136, "nll_loss": 0.03599727898836136} +{"epoch": 16, "step": 23905, "loss": 0.009048668667674065, "nll_loss": 0.009048668667674065} +{"epoch": 16, "step": 23906, "loss": 0.02490878291428089, "nll_loss": 0.02490878291428089} +{"epoch": 16, "step": 23907, "loss": 0.021218249574303627, "nll_loss": 0.021218249574303627} +{"epoch": 16, "step": 23908, "loss": 0.017870759591460228, "nll_loss": 0.017870759591460228} +{"epoch": 16, "step": 23909, "loss": 0.0438048355281353, "nll_loss": 0.0438048355281353} +{"epoch": 16, "step": 23910, "loss": 0.024962104856967926, "nll_loss": 0.024962104856967926} +{"epoch": 16, "step": 23911, "loss": 0.03372586891055107, "nll_loss": 0.03372586891055107} +{"epoch": 16, "step": 23912, "loss": 0.022893767803907394, "nll_loss": 0.022893767803907394} +{"epoch": 16, "step": 23913, "loss": 0.008624621666967869, "nll_loss": 0.008624621666967869} +{"epoch": 16, "step": 23914, "loss": 0.028234628960490227, "nll_loss": 0.028234628960490227} +{"epoch": 16, "step": 23915, "loss": 0.021892894059419632, "nll_loss": 0.021892894059419632} +{"epoch": 16, "step": 23916, "loss": 0.023074092343449593, "nll_loss": 0.023074092343449593} +{"epoch": 16, "step": 23917, "loss": 0.021471969783306122, "nll_loss": 0.021471969783306122} +{"epoch": 16, "step": 23918, "loss": 0.02924525737762451, "nll_loss": 0.02924525737762451} +{"epoch": 16, "step": 23919, "loss": 0.03697685897350311, "nll_loss": 0.03697685897350311} +{"epoch": 16, "step": 23920, "loss": 0.021009912714362144, "nll_loss": 0.021009912714362144} +{"epoch": 16, "step": 23921, "loss": 0.017190944403409958, "nll_loss": 0.017190944403409958} +{"epoch": 16, "step": 23922, "loss": 0.03732827678322792, "nll_loss": 0.03732827678322792} +{"epoch": 16, "step": 23923, "loss": 0.050485435873270035, "nll_loss": 0.050485435873270035} +{"epoch": 16, "step": 23924, "loss": 0.021428994834423065, "nll_loss": 0.021428994834423065} +{"epoch": 16, "step": 23925, "loss": 0.010772035457193851, "nll_loss": 0.010772035457193851} +{"epoch": 16, "step": 23926, "loss": 0.030544757843017578, "nll_loss": 0.030544757843017578} +{"epoch": 16, "step": 23927, "loss": 0.03301702439785004, "nll_loss": 0.03301702439785004} +{"epoch": 16, "step": 23928, "loss": 0.01614159531891346, "nll_loss": 0.01614159531891346} +{"epoch": 16, "step": 23929, "loss": 0.016459152102470398, "nll_loss": 0.016459152102470398} +{"epoch": 16, "step": 23930, "loss": 0.014503124170005322, "nll_loss": 0.014503124170005322} +{"epoch": 16, "step": 23931, "loss": 0.012393608689308167, "nll_loss": 0.012393608689308167} +{"epoch": 16, "step": 23932, "loss": 0.025018716230988503, "nll_loss": 0.025018716230988503} +{"epoch": 16, "step": 23933, "loss": 0.03206290677189827, "nll_loss": 0.03206290677189827} +{"epoch": 16, "step": 23934, "loss": 0.018503304570913315, "nll_loss": 0.018503304570913315} +{"epoch": 16, "step": 23935, "loss": 0.026741882786154747, "nll_loss": 0.026741882786154747} +{"epoch": 16, "step": 23936, "loss": 0.021661849692463875, "nll_loss": 0.021661849692463875} +{"epoch": 16, "step": 23937, "loss": 0.031505946069955826, "nll_loss": 0.031505946069955826} +{"epoch": 16, "step": 23938, "loss": 0.02943313494324684, "nll_loss": 0.02943313494324684} +{"epoch": 16, "step": 23939, "loss": 0.016546906903386116, "nll_loss": 0.016546906903386116} +{"epoch": 16, "step": 23940, "loss": 0.022294923663139343, "nll_loss": 0.022294923663139343} +{"epoch": 16, "step": 23941, "loss": 0.01751737855374813, "nll_loss": 0.01751737855374813} +{"epoch": 16, "step": 23942, "loss": 0.030977025628089905, "nll_loss": 0.030977025628089905} +{"epoch": 16, "step": 23943, "loss": 0.019598688930273056, "nll_loss": 0.019598688930273056} +{"epoch": 16, "step": 23944, "loss": 0.021643714979290962, "nll_loss": 0.021643714979290962} +{"epoch": 16, "step": 23945, "loss": 0.0313209593296051, "nll_loss": 0.0313209593296051} +{"epoch": 16, "step": 23946, "loss": 0.02591228485107422, "nll_loss": 0.02591228485107422} +{"epoch": 16, "step": 23947, "loss": 0.03724367544054985, "nll_loss": 0.03724367544054985} +{"epoch": 16, "step": 23948, "loss": 0.03240997716784477, "nll_loss": 0.03240997716784477} +{"epoch": 16, "step": 23949, "loss": 0.040488243103027344, "nll_loss": 0.040488243103027344} +{"epoch": 16, "step": 23950, "loss": 0.03996960073709488, "nll_loss": 0.03996960073709488} +{"epoch": 16, "step": 23951, "loss": 0.01315859891474247, "nll_loss": 0.01315859891474247} +{"epoch": 16, "step": 23952, "loss": 0.01197738479822874, "nll_loss": 0.01197738479822874} +{"epoch": 16, "step": 23953, "loss": 0.02931150794029236, "nll_loss": 0.02931150794029236} +{"epoch": 16, "step": 23954, "loss": 0.02334275096654892, "nll_loss": 0.02334275096654892} +{"epoch": 16, "step": 23955, "loss": 0.022764671593904495, "nll_loss": 0.022764671593904495} +{"epoch": 16, "step": 23956, "loss": 0.026289818808436394, "nll_loss": 0.026289818808436394} +{"epoch": 16, "step": 23957, "loss": 0.03832444176077843, "nll_loss": 0.03832444176077843} +{"epoch": 16, "step": 23958, "loss": 0.029111580923199654, "nll_loss": 0.029111580923199654} +{"epoch": 16, "step": 23959, "loss": 0.016170864924788475, "nll_loss": 0.016170864924788475} +{"epoch": 16, "step": 23960, "loss": 0.029610786586999893, "nll_loss": 0.029610786586999893} +{"epoch": 16, "step": 23961, "loss": 0.03234298527240753, "nll_loss": 0.03234298527240753} +{"epoch": 16, "step": 23962, "loss": 0.020232899114489555, "nll_loss": 0.020232899114489555} +{"epoch": 16, "step": 23963, "loss": 0.015886183828115463, "nll_loss": 0.015886183828115463} +{"epoch": 16, "step": 23964, "loss": 0.043933212757110596, "nll_loss": 0.043933212757110596} +{"epoch": 16, "step": 23965, "loss": 0.01531314104795456, "nll_loss": 0.01531314104795456} +{"epoch": 16, "step": 23966, "loss": 0.038712918758392334, "nll_loss": 0.038712918758392334} +{"epoch": 16, "step": 23967, "loss": 0.025510890409350395, "nll_loss": 0.025510890409350395} +{"epoch": 16, "step": 23968, "loss": 0.04892944172024727, "nll_loss": 0.04892944172024727} +{"epoch": 16, "step": 23969, "loss": 0.026702342554926872, "nll_loss": 0.026702342554926872} +{"epoch": 16, "step": 23970, "loss": 0.06333985924720764, "nll_loss": 0.06333985924720764} +{"epoch": 16, "step": 23971, "loss": 0.02461402676999569, "nll_loss": 0.02461402676999569} +{"epoch": 16, "step": 23972, "loss": 0.024284275248646736, "nll_loss": 0.024284275248646736} +{"epoch": 16, "step": 23973, "loss": 0.01761208474636078, "nll_loss": 0.01761208474636078} +{"epoch": 16, "step": 23974, "loss": 0.02042129822075367, "nll_loss": 0.02042129822075367} +{"epoch": 16, "step": 23975, "loss": 0.026031671091914177, "nll_loss": 0.026031671091914177} +{"epoch": 16, "step": 23976, "loss": 0.01402698177844286, "nll_loss": 0.01402698177844286} +{"epoch": 16, "step": 23977, "loss": 0.04690494015812874, "nll_loss": 0.04690494015812874} +{"epoch": 16, "step": 23978, "loss": 0.01661776192486286, "nll_loss": 0.01661776192486286} +{"epoch": 16, "step": 23979, "loss": 0.012789367698132992, "nll_loss": 0.012789367698132992} +{"epoch": 16, "step": 23980, "loss": 0.028957800939679146, "nll_loss": 0.028957800939679146} +{"epoch": 16, "step": 23981, "loss": 0.01865486055612564, "nll_loss": 0.01865486055612564} +{"epoch": 16, "step": 23982, "loss": 0.01556476578116417, "nll_loss": 0.01556476578116417} +{"epoch": 16, "step": 23983, "loss": 0.04222962260246277, "nll_loss": 0.04222962260246277} +{"epoch": 16, "step": 23984, "loss": 0.02979305200278759, "nll_loss": 0.02979305200278759} +{"epoch": 16, "step": 23985, "loss": 0.013983692042529583, "nll_loss": 0.013983692042529583} +{"epoch": 16, "step": 23986, "loss": 0.03452237695455551, "nll_loss": 0.03452237695455551} +{"epoch": 16, "step": 23987, "loss": 0.03181888535618782, "nll_loss": 0.03181888535618782} +{"epoch": 16, "step": 23988, "loss": 0.01531308889389038, "nll_loss": 0.01531308889389038} +{"epoch": 16, "step": 23989, "loss": 0.01671074517071247, "nll_loss": 0.01671074517071247} +{"epoch": 16, "step": 23990, "loss": 0.026980236172676086, "nll_loss": 0.026980236172676086} +{"epoch": 16, "step": 23991, "loss": 0.0368104949593544, "nll_loss": 0.0368104949593544} +{"epoch": 16, "step": 23992, "loss": 0.01978272944688797, "nll_loss": 0.01978272944688797} +{"epoch": 16, "step": 23993, "loss": 0.019532911479473114, "nll_loss": 0.019532911479473114} +{"epoch": 16, "step": 23994, "loss": 0.030310364440083504, "nll_loss": 0.030310364440083504} +{"epoch": 16, "step": 23995, "loss": 0.021016938611865044, "nll_loss": 0.021016938611865044} +{"epoch": 16, "step": 23996, "loss": 0.02185613289475441, "nll_loss": 0.02185613289475441} +{"epoch": 16, "step": 23997, "loss": 0.020426888018846512, "nll_loss": 0.020426888018846512} +{"epoch": 16, "step": 23998, "loss": 0.024537649005651474, "nll_loss": 0.024537649005651474} +{"epoch": 16, "step": 23999, "loss": 0.012264147400856018, "nll_loss": 0.012264147400856018} +{"epoch": 16, "step": 24000, "loss": 0.027661843225359917, "nll_loss": 0.027661843225359917} +{"epoch": 16, "step": 24001, "loss": 0.022298747673630714, "nll_loss": 0.022298747673630714} +{"epoch": 16, "step": 24002, "loss": 0.01460221316665411, "nll_loss": 0.01460221316665411} +{"epoch": 16, "step": 24003, "loss": 0.025352494791150093, "nll_loss": 0.025352494791150093} +{"epoch": 16, "step": 24004, "loss": 0.02127443440258503, "nll_loss": 0.02127443440258503} +{"epoch": 16, "step": 24005, "loss": 0.01398930512368679, "nll_loss": 0.01398930512368679} +{"epoch": 16, "step": 24006, "loss": 0.02088753879070282, "nll_loss": 0.02088753879070282} +{"epoch": 16, "step": 24007, "loss": 0.029078733175992966, "nll_loss": 0.029078733175992966} +{"epoch": 16, "step": 24008, "loss": 0.015677381306886673, "nll_loss": 0.015677381306886673} +{"epoch": 16, "step": 24009, "loss": 0.01630415953695774, "nll_loss": 0.01630415953695774} +{"epoch": 16, "step": 24010, "loss": 0.027154644951224327, "nll_loss": 0.027154644951224327} +{"epoch": 16, "step": 24011, "loss": 0.014638223685324192, "nll_loss": 0.014638223685324192} +{"epoch": 16, "step": 24012, "loss": 0.010343166999518871, "nll_loss": 0.010343166999518871} +{"epoch": 16, "step": 24013, "loss": 0.025864500552415848, "nll_loss": 0.025864500552415848} +{"epoch": 16, "step": 24014, "loss": 0.019521035254001617, "nll_loss": 0.019521035254001617} +{"epoch": 16, "step": 24015, "loss": 0.01749810203909874, "nll_loss": 0.01749810203909874} +{"epoch": 16, "step": 24016, "loss": 0.052404146641492844, "nll_loss": 0.052404146641492844} +{"epoch": 16, "step": 24017, "loss": 0.022758202627301216, "nll_loss": 0.022758202627301216} +{"epoch": 16, "step": 24018, "loss": 0.03081320971250534, "nll_loss": 0.03081320971250534} +{"epoch": 16, "step": 24019, "loss": 0.027080174535512924, "nll_loss": 0.027080174535512924} +{"epoch": 16, "step": 24020, "loss": 0.036555059254169464, "nll_loss": 0.036555059254169464} +{"epoch": 16, "step": 24021, "loss": 0.028614649549126625, "nll_loss": 0.028614649549126625} +{"epoch": 16, "step": 24022, "loss": 0.025159038603305817, "nll_loss": 0.025159038603305817} +{"epoch": 16, "step": 24023, "loss": 0.014264429919421673, "nll_loss": 0.014264429919421673} +{"epoch": 16, "step": 24024, "loss": 0.026214683428406715, "nll_loss": 0.026214683428406715} +{"epoch": 16, "step": 24025, "loss": 0.02057180367410183, "nll_loss": 0.02057180367410183} +{"epoch": 16, "step": 24026, "loss": 0.022766131907701492, "nll_loss": 0.022766131907701492} +{"epoch": 16, "step": 24027, "loss": 0.009950622916221619, "nll_loss": 0.009950622916221619} +{"epoch": 16, "step": 24028, "loss": 0.02569776400923729, "nll_loss": 0.02569776400923729} +{"epoch": 16, "step": 24029, "loss": 0.03209630772471428, "nll_loss": 0.03209630772471428} +{"epoch": 16, "step": 24030, "loss": 0.027401918545365334, "nll_loss": 0.027401918545365334} +{"epoch": 16, "step": 24031, "loss": 0.031194128096103668, "nll_loss": 0.031194128096103668} +{"epoch": 16, "step": 24032, "loss": 0.010932615958154202, "nll_loss": 0.010932615958154202} +{"epoch": 16, "step": 24033, "loss": 0.007587665691971779, "nll_loss": 0.007587665691971779} +{"epoch": 16, "step": 24034, "loss": 0.03739481046795845, "nll_loss": 0.03739481046795845} +{"epoch": 16, "step": 24035, "loss": 0.022966094315052032, "nll_loss": 0.022966094315052032} +{"epoch": 16, "step": 24036, "loss": 0.02571532130241394, "nll_loss": 0.02571532130241394} +{"epoch": 16, "step": 24037, "loss": 0.04770275205373764, "nll_loss": 0.04770275205373764} +{"epoch": 16, "step": 24038, "loss": 0.0393838956952095, "nll_loss": 0.0393838956952095} +{"epoch": 16, "step": 24039, "loss": 0.021116087213158607, "nll_loss": 0.021116087213158607} +{"epoch": 16, "step": 24040, "loss": 0.02094382233917713, "nll_loss": 0.02094382233917713} +{"epoch": 16, "step": 24041, "loss": 0.03085683286190033, "nll_loss": 0.03085683286190033} +{"epoch": 16, "step": 24042, "loss": 0.03871241211891174, "nll_loss": 0.03871241211891174} +{"epoch": 16, "step": 24043, "loss": 0.02030569314956665, "nll_loss": 0.02030569314956665} +{"epoch": 16, "step": 24044, "loss": 0.06281081587076187, "nll_loss": 0.06281081587076187} +{"epoch": 16, "step": 24045, "loss": 0.030639324337244034, "nll_loss": 0.030639324337244034} +{"epoch": 16, "step": 24046, "loss": 0.034217458218336105, "nll_loss": 0.034217458218336105} +{"epoch": 16, "step": 24047, "loss": 0.02263812907040119, "nll_loss": 0.02263812907040119} +{"epoch": 16, "step": 24048, "loss": 0.04221707955002785, "nll_loss": 0.04221707955002785} +{"epoch": 16, "step": 24049, "loss": 0.034803763031959534, "nll_loss": 0.034803763031959534} +{"epoch": 16, "step": 24050, "loss": 0.03299642354249954, "nll_loss": 0.03299642354249954} +{"epoch": 16, "step": 24051, "loss": 0.023186571896076202, "nll_loss": 0.023186571896076202} +{"epoch": 16, "step": 24052, "loss": 0.04087546840310097, "nll_loss": 0.04087546840310097} +{"epoch": 16, "step": 24053, "loss": 0.03725382313132286, "nll_loss": 0.03725382313132286} +{"epoch": 16, "step": 24054, "loss": 0.0195530503988266, "nll_loss": 0.0195530503988266} +{"epoch": 16, "step": 24055, "loss": 0.052526090294122696, "nll_loss": 0.052526090294122696} +{"epoch": 16, "step": 24056, "loss": 0.03447060286998749, "nll_loss": 0.03447060286998749} +{"epoch": 16, "step": 24057, "loss": 0.025713179260492325, "nll_loss": 0.025713179260492325} +{"epoch": 16, "step": 24058, "loss": 0.0450548492372036, "nll_loss": 0.0450548492372036} +{"epoch": 16, "step": 24059, "loss": 0.020269639790058136, "nll_loss": 0.020269639790058136} +{"epoch": 16, "step": 24060, "loss": 0.010025857016444206, "nll_loss": 0.010025857016444206} +{"epoch": 16, "step": 24061, "loss": 0.02758301980793476, "nll_loss": 0.02758301980793476} +{"epoch": 16, "step": 24062, "loss": 0.017109081149101257, "nll_loss": 0.017109081149101257} +{"epoch": 16, "step": 24063, "loss": 0.013733003288507462, "nll_loss": 0.013733003288507462} +{"epoch": 16, "step": 24064, "loss": 0.022607143968343735, "nll_loss": 0.022607143968343735} +{"epoch": 16, "step": 24065, "loss": 0.00870576687157154, "nll_loss": 0.00870576687157154} +{"epoch": 16, "step": 24066, "loss": 0.033473461866378784, "nll_loss": 0.033473461866378784} +{"epoch": 16, "step": 24067, "loss": 0.02590092457830906, "nll_loss": 0.02590092457830906} +{"epoch": 16, "step": 24068, "loss": 0.04631371051073074, "nll_loss": 0.04631371051073074} +{"epoch": 16, "step": 24069, "loss": 0.026587458327412605, "nll_loss": 0.026587458327412605} +{"epoch": 16, "step": 24070, "loss": 0.023021159693598747, "nll_loss": 0.023021159693598747} +{"epoch": 16, "step": 24071, "loss": 0.03537965565919876, "nll_loss": 0.03537965565919876} +{"epoch": 16, "step": 24072, "loss": 0.05906693637371063, "nll_loss": 0.05906693637371063} +{"epoch": 16, "step": 24073, "loss": 0.012668280862271786, "nll_loss": 0.012668280862271786} +{"epoch": 16, "step": 24074, "loss": 0.01424580067396164, "nll_loss": 0.01424580067396164} +{"epoch": 16, "step": 24075, "loss": 0.019495321437716484, "nll_loss": 0.019495321437716484} +{"epoch": 16, "step": 24076, "loss": 0.01801292411983013, "nll_loss": 0.01801292411983013} +{"epoch": 16, "step": 24077, "loss": 0.01694517582654953, "nll_loss": 0.01694517582654953} +{"epoch": 16, "step": 24078, "loss": 0.01587512716650963, "nll_loss": 0.01587512716650963} +{"epoch": 16, "step": 24079, "loss": 0.02855907939374447, "nll_loss": 0.02855907939374447} +{"epoch": 16, "step": 24080, "loss": 0.021429413929581642, "nll_loss": 0.021429413929581642} +{"epoch": 16, "step": 24081, "loss": 0.022480757907032967, "nll_loss": 0.022480757907032967} +{"epoch": 16, "step": 24082, "loss": 0.027532508596777916, "nll_loss": 0.027532508596777916} +{"epoch": 16, "step": 24083, "loss": 0.01569061167538166, "nll_loss": 0.01569061167538166} +{"epoch": 16, "step": 24084, "loss": 0.02481660060584545, "nll_loss": 0.02481660060584545} +{"epoch": 16, "step": 24085, "loss": 0.05855419859290123, "nll_loss": 0.05855419859290123} +{"epoch": 16, "step": 24086, "loss": 0.029040683060884476, "nll_loss": 0.029040683060884476} +{"epoch": 16, "step": 24087, "loss": 0.015410277061164379, "nll_loss": 0.015410277061164379} +{"epoch": 16, "step": 24088, "loss": 0.019015273079276085, "nll_loss": 0.019015273079276085} +{"epoch": 16, "step": 24089, "loss": 0.01630510203540325, "nll_loss": 0.01630510203540325} +{"epoch": 16, "step": 24090, "loss": 0.030262574553489685, "nll_loss": 0.030262574553489685} +{"epoch": 16, "step": 24091, "loss": 0.02844519354403019, "nll_loss": 0.02844519354403019} +{"epoch": 16, "step": 24092, "loss": 0.03221588954329491, "nll_loss": 0.03221588954329491} +{"epoch": 16, "step": 24093, "loss": 0.04533768445253372, "nll_loss": 0.04533768445253372} +{"epoch": 16, "step": 24094, "loss": 0.02184232696890831, "nll_loss": 0.02184232696890831} +{"epoch": 16, "step": 24095, "loss": 0.054363593459129333, "nll_loss": 0.054363593459129333} +{"epoch": 16, "step": 24096, "loss": 0.04338300600647926, "nll_loss": 0.04338300600647926} +{"epoch": 16, "step": 24097, "loss": 0.024527790024876595, "nll_loss": 0.024527790024876595} +{"epoch": 16, "step": 24098, "loss": 0.02864942140877247, "nll_loss": 0.02864942140877247} +{"epoch": 16, "step": 24099, "loss": 0.022697048261761665, "nll_loss": 0.022697048261761665} +{"epoch": 16, "step": 24100, "loss": 0.044578418135643005, "nll_loss": 0.044578418135643005} +{"epoch": 16, "step": 24101, "loss": 0.022328916937112808, "nll_loss": 0.022328916937112808} +{"epoch": 16, "step": 24102, "loss": 0.03646654635667801, "nll_loss": 0.03646654635667801} +{"epoch": 16, "step": 24103, "loss": 0.0340508334338665, "nll_loss": 0.0340508334338665} +{"epoch": 16, "step": 24104, "loss": 0.012407777830958366, "nll_loss": 0.012407777830958366} +{"epoch": 16, "step": 24105, "loss": 0.015052474103868008, "nll_loss": 0.015052474103868008} +{"epoch": 16, "step": 24106, "loss": 0.02309807389974594, "nll_loss": 0.02309807389974594} +{"epoch": 16, "step": 24107, "loss": 0.058774229139089584, "nll_loss": 0.058774229139089584} +{"epoch": 16, "step": 24108, "loss": 0.02611190639436245, "nll_loss": 0.02611190639436245} +{"epoch": 16, "step": 24109, "loss": 0.020844966173171997, "nll_loss": 0.020844966173171997} +{"epoch": 16, "step": 24110, "loss": 0.016090352088212967, "nll_loss": 0.016090352088212967} +{"epoch": 16, "step": 24111, "loss": 0.025781644508242607, "nll_loss": 0.025781644508242607} +{"epoch": 16, "step": 24112, "loss": 0.017050419002771378, "nll_loss": 0.017050419002771378} +{"epoch": 16, "step": 24113, "loss": 0.008311508223414421, "nll_loss": 0.008311508223414421} +{"epoch": 16, "step": 24114, "loss": 0.02627888321876526, "nll_loss": 0.02627888321876526} +{"epoch": 16, "step": 24115, "loss": 0.028176993131637573, "nll_loss": 0.028176993131637573} +{"epoch": 16, "step": 24116, "loss": 0.03495484218001366, "nll_loss": 0.03495484218001366} +{"epoch": 16, "step": 24117, "loss": 0.024169694632291794, "nll_loss": 0.024169694632291794} +{"epoch": 16, "step": 24118, "loss": 0.014253850094974041, "nll_loss": 0.014253850094974041} +{"epoch": 16, "step": 24119, "loss": 0.043543923646211624, "nll_loss": 0.043543923646211624} +{"epoch": 16, "step": 24120, "loss": 0.017017418518662453, "nll_loss": 0.017017418518662453} +{"epoch": 16, "step": 24121, "loss": 0.028315145522356033, "nll_loss": 0.028315145522356033} +{"epoch": 16, "step": 24122, "loss": 0.026499006897211075, "nll_loss": 0.026499006897211075} +{"epoch": 16, "step": 24123, "loss": 0.02520609460771084, "nll_loss": 0.02520609460771084} +{"epoch": 16, "step": 24124, "loss": 0.029571905732154846, "nll_loss": 0.029571905732154846} +{"epoch": 16, "step": 24125, "loss": 0.016128843650221825, "nll_loss": 0.016128843650221825} +{"epoch": 16, "step": 24126, "loss": 0.021064795553684235, "nll_loss": 0.021064795553684235} +{"epoch": 16, "step": 24127, "loss": 0.03676587715744972, "nll_loss": 0.03676587715744972} +{"epoch": 16, "step": 24128, "loss": 0.03501179814338684, "nll_loss": 0.03501179814338684} +{"epoch": 16, "step": 24129, "loss": 0.026893725618720055, "nll_loss": 0.026893725618720055} +{"epoch": 16, "step": 24130, "loss": 0.019884033128619194, "nll_loss": 0.019884033128619194} +{"epoch": 16, "step": 24131, "loss": 0.03135930374264717, "nll_loss": 0.03135930374264717} +{"epoch": 16, "step": 24132, "loss": 0.01882448047399521, "nll_loss": 0.01882448047399521} +{"epoch": 16, "step": 24133, "loss": 0.015059830620884895, "nll_loss": 0.015059830620884895} +{"epoch": 16, "step": 24134, "loss": 0.01703442819416523, "nll_loss": 0.01703442819416523} +{"epoch": 16, "step": 24135, "loss": 0.03488951548933983, "nll_loss": 0.03488951548933983} +{"epoch": 16, "step": 24136, "loss": 0.01409084815531969, "nll_loss": 0.01409084815531969} +{"epoch": 16, "step": 24137, "loss": 0.02757105603814125, "nll_loss": 0.02757105603814125} +{"epoch": 16, "step": 24138, "loss": 0.023880502209067345, "nll_loss": 0.023880502209067345} +{"epoch": 16, "step": 24139, "loss": 0.031162220984697342, "nll_loss": 0.031162220984697342} +{"epoch": 16, "step": 24140, "loss": 0.03612218052148819, "nll_loss": 0.03612218052148819} +{"epoch": 16, "step": 24141, "loss": 0.03181925415992737, "nll_loss": 0.03181925415992737} +{"epoch": 16, "step": 24142, "loss": 0.022979862987995148, "nll_loss": 0.022979862987995148} +{"epoch": 16, "step": 24143, "loss": 0.016237344592809677, "nll_loss": 0.016237344592809677} +{"epoch": 16, "step": 24144, "loss": 0.028506580740213394, "nll_loss": 0.028506580740213394} +{"epoch": 16, "step": 24145, "loss": 0.02364111691713333, "nll_loss": 0.02364111691713333} +{"epoch": 16, "step": 24146, "loss": 0.035684190690517426, "nll_loss": 0.035684190690517426} +{"epoch": 16, "step": 24147, "loss": 0.024494284763932228, "nll_loss": 0.024494284763932228} +{"epoch": 16, "step": 24148, "loss": 0.024096712470054626, "nll_loss": 0.024096712470054626} +{"epoch": 16, "step": 24149, "loss": 0.020507529377937317, "nll_loss": 0.020507529377937317} +{"epoch": 16, "step": 24150, "loss": 0.01907806098461151, "nll_loss": 0.01907806098461151} +{"epoch": 16, "step": 24151, "loss": 0.018454162403941154, "nll_loss": 0.018454162403941154} +{"epoch": 16, "step": 24152, "loss": 0.025192255154252052, "nll_loss": 0.025192255154252052} +{"epoch": 16, "step": 24153, "loss": 0.023504482582211494, "nll_loss": 0.023504482582211494} +{"epoch": 16, "step": 24154, "loss": 0.023456335067749023, "nll_loss": 0.023456335067749023} +{"epoch": 16, "step": 24155, "loss": 0.01774412952363491, "nll_loss": 0.01774412952363491} +{"epoch": 16, "step": 24156, "loss": 0.03175384923815727, "nll_loss": 0.03175384923815727} +{"epoch": 16, "step": 24157, "loss": 0.019616615027189255, "nll_loss": 0.019616615027189255} +{"epoch": 16, "step": 24158, "loss": 0.009198767133057117, "nll_loss": 0.009198767133057117} +{"epoch": 16, "step": 24159, "loss": 0.023298026993870735, "nll_loss": 0.023298026993870735} +{"epoch": 16, "step": 24160, "loss": 0.021774252876639366, "nll_loss": 0.021774252876639366} +{"epoch": 16, "step": 24161, "loss": 0.03369544446468353, "nll_loss": 0.03369544446468353} +{"epoch": 16, "step": 24162, "loss": 0.02299482189118862, "nll_loss": 0.02299482189118862} +{"epoch": 16, "step": 24163, "loss": 0.022064613178372383, "nll_loss": 0.022064613178372383} +{"epoch": 16, "step": 24164, "loss": 0.030928052961826324, "nll_loss": 0.030928052961826324} +{"epoch": 16, "step": 24165, "loss": 0.026868075132369995, "nll_loss": 0.026868075132369995} +{"epoch": 16, "step": 24166, "loss": 0.05573475733399391, "nll_loss": 0.05573475733399391} +{"epoch": 16, "step": 24167, "loss": 0.029006391763687134, "nll_loss": 0.029006391763687134} +{"epoch": 16, "step": 24168, "loss": 0.033671677112579346, "nll_loss": 0.033671677112579346} +{"epoch": 16, "step": 24169, "loss": 0.009923300705850124, "nll_loss": 0.009923300705850124} +{"epoch": 16, "step": 24170, "loss": 0.03490627557039261, "nll_loss": 0.03490627557039261} +{"epoch": 16, "step": 24171, "loss": 0.0064830477349460125, "nll_loss": 0.0064830477349460125} +{"epoch": 16, "step": 24172, "loss": 0.05480705946683884, "nll_loss": 0.05480705946683884} +{"epoch": 16, "step": 24173, "loss": 0.021676158532500267, "nll_loss": 0.021676158532500267} +{"epoch": 16, "step": 24174, "loss": 0.028283195570111275, "nll_loss": 0.028283195570111275} +{"epoch": 16, "step": 24175, "loss": 0.05379463732242584, "nll_loss": 0.05379463732242584} +{"epoch": 16, "step": 24176, "loss": 0.020232491195201874, "nll_loss": 0.020232491195201874} +{"epoch": 16, "step": 24177, "loss": 0.016642728820443153, "nll_loss": 0.016642728820443153} +{"epoch": 16, "step": 24178, "loss": 0.017694056034088135, "nll_loss": 0.017694056034088135} +{"epoch": 16, "step": 24179, "loss": 0.026699254289269447, "nll_loss": 0.026699254289269447} +{"epoch": 16, "step": 24180, "loss": 0.04617684334516525, "nll_loss": 0.04617684334516525} +{"epoch": 16, "step": 24181, "loss": 0.020300915464758873, "nll_loss": 0.020300915464758873} +{"epoch": 16, "step": 24182, "loss": 0.015708724036812782, "nll_loss": 0.015708724036812782} +{"epoch": 16, "step": 24183, "loss": 0.023689143359661102, "nll_loss": 0.023689143359661102} +{"epoch": 16, "step": 24184, "loss": 0.02777932584285736, "nll_loss": 0.02777932584285736} +{"epoch": 16, "step": 24185, "loss": 0.026621714234352112, "nll_loss": 0.026621714234352112} +{"epoch": 16, "step": 24186, "loss": 0.019607778638601303, "nll_loss": 0.019607778638601303} +{"epoch": 16, "step": 24187, "loss": 0.020343849435448647, "nll_loss": 0.020343849435448647} +{"epoch": 16, "step": 24188, "loss": 0.0170073751360178, "nll_loss": 0.0170073751360178} +{"epoch": 16, "step": 24189, "loss": 0.0575186051428318, "nll_loss": 0.0575186051428318} +{"epoch": 16, "step": 24190, "loss": 0.04117323085665703, "nll_loss": 0.04117323085665703} +{"epoch": 16, "step": 24191, "loss": 0.02467104233801365, "nll_loss": 0.02467104233801365} +{"epoch": 16, "step": 24192, "loss": 0.03091508336365223, "nll_loss": 0.03091508336365223} +{"epoch": 16, "step": 24193, "loss": 0.022681748494505882, "nll_loss": 0.022681748494505882} +{"epoch": 16, "step": 24194, "loss": 0.011349961161613464, "nll_loss": 0.011349961161613464} +{"epoch": 16, "step": 24195, "loss": 0.021389884874224663, "nll_loss": 0.021389884874224663} +{"epoch": 16, "step": 24196, "loss": 0.053855374455451965, "nll_loss": 0.053855374455451965} +{"epoch": 16, "step": 24197, "loss": 0.05710531398653984, "nll_loss": 0.05710531398653984} +{"epoch": 16, "step": 24198, "loss": 0.025227509438991547, "nll_loss": 0.025227509438991547} +{"epoch": 16, "step": 24199, "loss": 0.020983034744858742, "nll_loss": 0.020983034744858742} +{"epoch": 16, "step": 24200, "loss": 0.02523871697485447, "nll_loss": 0.02523871697485447} +{"epoch": 16, "step": 24201, "loss": 0.04507948085665703, "nll_loss": 0.04507948085665703} +{"epoch": 16, "step": 24202, "loss": 0.023144859820604324, "nll_loss": 0.023144859820604324} +{"epoch": 16, "step": 24203, "loss": 0.03233868628740311, "nll_loss": 0.03233868628740311} +{"epoch": 16, "step": 24204, "loss": 0.03830074518918991, "nll_loss": 0.03830074518918991} +{"epoch": 16, "step": 24205, "loss": 0.027800781652331352, "nll_loss": 0.027800781652331352} +{"epoch": 16, "step": 24206, "loss": 0.040670718997716904, "nll_loss": 0.040670718997716904} +{"epoch": 16, "step": 24207, "loss": 0.03014158457517624, "nll_loss": 0.03014158457517624} +{"epoch": 16, "step": 24208, "loss": 0.012628709897398949, "nll_loss": 0.012628709897398949} +{"epoch": 16, "step": 24209, "loss": 0.028322942554950714, "nll_loss": 0.028322942554950714} +{"epoch": 16, "step": 24210, "loss": 0.018621928989887238, "nll_loss": 0.018621928989887238} +{"epoch": 16, "step": 24211, "loss": 0.026586631312966347, "nll_loss": 0.026586631312966347} +{"epoch": 16, "step": 24212, "loss": 0.029809221625328064, "nll_loss": 0.029809221625328064} +{"epoch": 16, "step": 24213, "loss": 0.01372281089425087, "nll_loss": 0.01372281089425087} +{"epoch": 16, "step": 24214, "loss": 0.028145039454102516, "nll_loss": 0.028145039454102516} +{"epoch": 16, "step": 24215, "loss": 0.031026726588606834, "nll_loss": 0.031026726588606834} +{"epoch": 16, "step": 24216, "loss": 0.017514625564217567, "nll_loss": 0.017514625564217567} +{"epoch": 16, "step": 24217, "loss": 0.04122474417090416, "nll_loss": 0.04122474417090416} +{"epoch": 16, "step": 24218, "loss": 0.020033404231071472, "nll_loss": 0.020033404231071472} +{"epoch": 16, "step": 24219, "loss": 0.04859242960810661, "nll_loss": 0.04859242960810661} +{"epoch": 16, "step": 24220, "loss": 0.013319442979991436, "nll_loss": 0.013319442979991436} +{"epoch": 16, "step": 24221, "loss": 0.02298917807638645, "nll_loss": 0.02298917807638645} +{"epoch": 16, "step": 24222, "loss": 0.028095796704292297, "nll_loss": 0.028095796704292297} +{"epoch": 16, "step": 24223, "loss": 0.011810990050435066, "nll_loss": 0.011810990050435066} +{"epoch": 16, "step": 24224, "loss": 0.028227873146533966, "nll_loss": 0.028227873146533966} +{"epoch": 16, "step": 24225, "loss": 0.030965041369199753, "nll_loss": 0.030965041369199753} +{"epoch": 16, "step": 24226, "loss": 0.016284164041280746, "nll_loss": 0.016284164041280746} +{"epoch": 16, "step": 24227, "loss": 0.024720661342144012, "nll_loss": 0.024720661342144012} +{"epoch": 16, "step": 24228, "loss": 0.029235757887363434, "nll_loss": 0.029235757887363434} +{"epoch": 16, "step": 24229, "loss": 0.025470880791544914, "nll_loss": 0.025470880791544914} +{"epoch": 16, "step": 24230, "loss": 0.012263712473213673, "nll_loss": 0.012263712473213673} +{"epoch": 16, "step": 24231, "loss": 0.07293185591697693, "nll_loss": 0.07293185591697693} +{"epoch": 16, "step": 24232, "loss": 0.027058009058237076, "nll_loss": 0.027058009058237076} +{"epoch": 16, "step": 24233, "loss": 0.02397676184773445, "nll_loss": 0.02397676184773445} +{"epoch": 16, "step": 24234, "loss": 0.03949735313653946, "nll_loss": 0.03949735313653946} +{"epoch": 16, "step": 24235, "loss": 0.1094725951552391, "nll_loss": 0.1094725951552391} +{"epoch": 16, "step": 24236, "loss": 0.029828377068042755, "nll_loss": 0.029828377068042755} +{"epoch": 16, "step": 24237, "loss": 0.030720612034201622, "nll_loss": 0.030720612034201622} +{"epoch": 16, "step": 24238, "loss": 0.015087239444255829, "nll_loss": 0.015087239444255829} +{"epoch": 16, "step": 24239, "loss": 0.045759037137031555, "nll_loss": 0.045759037137031555} +{"epoch": 16, "step": 24240, "loss": 0.025543212890625, "nll_loss": 0.025543212890625} +{"epoch": 16, "step": 24241, "loss": 0.0183855053037405, "nll_loss": 0.0183855053037405} +{"epoch": 16, "step": 24242, "loss": 0.04149661213159561, "nll_loss": 0.04149661213159561} +{"epoch": 16, "step": 24243, "loss": 0.008350984193384647, "nll_loss": 0.008350984193384647} +{"epoch": 16, "step": 24244, "loss": 0.02207614853978157, "nll_loss": 0.02207614853978157} +{"epoch": 16, "step": 24245, "loss": 0.031023431569337845, "nll_loss": 0.031023431569337845} +{"epoch": 16, "step": 24246, "loss": 0.02979767508804798, "nll_loss": 0.02979767508804798} +{"epoch": 16, "step": 24247, "loss": 0.03865235671401024, "nll_loss": 0.03865235671401024} +{"epoch": 16, "step": 24248, "loss": 0.03914659842848778, "nll_loss": 0.03914659842848778} +{"epoch": 16, "step": 24249, "loss": 0.02414872497320175, "nll_loss": 0.02414872497320175} +{"epoch": 16, "step": 24250, "loss": 0.029180213809013367, "nll_loss": 0.029180213809013367} +{"epoch": 16, "step": 24251, "loss": 0.022188162431120872, "nll_loss": 0.022188162431120872} +{"epoch": 16, "step": 24252, "loss": 0.02043449878692627, "nll_loss": 0.02043449878692627} +{"epoch": 16, "step": 24253, "loss": 0.015351200476288795, "nll_loss": 0.015351200476288795} +{"epoch": 16, "step": 24254, "loss": 0.029058560729026794, "nll_loss": 0.029058560729026794} +{"epoch": 16, "step": 24255, "loss": 0.02540092170238495, "nll_loss": 0.02540092170238495} +{"epoch": 16, "step": 24256, "loss": 0.022833440452814102, "nll_loss": 0.022833440452814102} +{"epoch": 16, "step": 24257, "loss": 0.0367979034781456, "nll_loss": 0.0367979034781456} +{"epoch": 16, "step": 24258, "loss": 0.01724950596690178, "nll_loss": 0.01724950596690178} +{"epoch": 16, "step": 24259, "loss": 0.02702655829489231, "nll_loss": 0.02702655829489231} +{"epoch": 16, "step": 24260, "loss": 0.020154723897576332, "nll_loss": 0.020154723897576332} +{"epoch": 16, "step": 24261, "loss": 0.03167097270488739, "nll_loss": 0.03167097270488739} +{"epoch": 16, "step": 24262, "loss": 0.032586365938186646, "nll_loss": 0.032586365938186646} +{"epoch": 16, "step": 24263, "loss": 0.020242171362042427, "nll_loss": 0.020242171362042427} +{"epoch": 16, "step": 24264, "loss": 0.017808111384510994, "nll_loss": 0.017808111384510994} +{"epoch": 16, "step": 24265, "loss": 0.04085944592952728, "nll_loss": 0.04085944592952728} +{"epoch": 16, "step": 24266, "loss": 0.018748246133327484, "nll_loss": 0.018748246133327484} +{"epoch": 16, "step": 24267, "loss": 0.02386024035513401, "nll_loss": 0.02386024035513401} +{"epoch": 16, "step": 24268, "loss": 0.038548972457647324, "nll_loss": 0.038548972457647324} +{"epoch": 16, "step": 24269, "loss": 0.019483711570501328, "nll_loss": 0.019483711570501328} +{"epoch": 16, "step": 24270, "loss": 0.013232767581939697, "nll_loss": 0.013232767581939697} +{"epoch": 16, "step": 24271, "loss": 0.014551831409335136, "nll_loss": 0.014551831409335136} +{"epoch": 16, "step": 24272, "loss": 0.03069581836462021, "nll_loss": 0.03069581836462021} +{"epoch": 16, "step": 24273, "loss": 0.02957041934132576, "nll_loss": 0.02957041934132576} +{"epoch": 16, "step": 24274, "loss": 0.013315999880433083, "nll_loss": 0.013315999880433083} +{"epoch": 16, "step": 24275, "loss": 0.03686327114701271, "nll_loss": 0.03686327114701271} +{"epoch": 16, "step": 24276, "loss": 0.01787630096077919, "nll_loss": 0.01787630096077919} +{"epoch": 16, "step": 24277, "loss": 0.019619105383753777, "nll_loss": 0.019619105383753777} +{"epoch": 16, "step": 24278, "loss": 0.020144924521446228, "nll_loss": 0.020144924521446228} +{"epoch": 16, "step": 24279, "loss": 0.021649088710546494, "nll_loss": 0.021649088710546494} +{"epoch": 16, "step": 24280, "loss": 0.017478154972195625, "nll_loss": 0.017478154972195625} +{"epoch": 16, "step": 24281, "loss": 0.02908920682966709, "nll_loss": 0.02908920682966709} +{"epoch": 16, "step": 24282, "loss": 0.026195460930466652, "nll_loss": 0.026195460930466652} +{"epoch": 16, "step": 24283, "loss": 0.018482226878404617, "nll_loss": 0.018482226878404617} +{"epoch": 16, "step": 24284, "loss": 0.042061518877744675, "nll_loss": 0.042061518877744675} +{"epoch": 16, "step": 24285, "loss": 0.03954295441508293, "nll_loss": 0.03954295441508293} +{"epoch": 16, "step": 24286, "loss": 0.0441942922770977, "nll_loss": 0.0441942922770977} +{"epoch": 16, "step": 24287, "loss": 0.03234349191188812, "nll_loss": 0.03234349191188812} +{"epoch": 16, "step": 24288, "loss": 0.014627709053456783, "nll_loss": 0.014627709053456783} +{"epoch": 16, "step": 24289, "loss": 0.016239572316408157, "nll_loss": 0.016239572316408157} +{"epoch": 16, "step": 24290, "loss": 0.03700865060091019, "nll_loss": 0.03700865060091019} +{"epoch": 16, "step": 24291, "loss": 0.02770294062793255, "nll_loss": 0.02770294062793255} +{"epoch": 16, "step": 24292, "loss": 0.028627904132008553, "nll_loss": 0.028627904132008553} +{"epoch": 16, "step": 24293, "loss": 0.02662690542638302, "nll_loss": 0.02662690542638302} +{"epoch": 16, "step": 24294, "loss": 0.013388395309448242, "nll_loss": 0.013388395309448242} +{"epoch": 16, "step": 24295, "loss": 0.030157340690493584, "nll_loss": 0.030157340690493584} +{"epoch": 16, "step": 24296, "loss": 0.018460942432284355, "nll_loss": 0.018460942432284355} +{"epoch": 16, "step": 24297, "loss": 0.024016888812184334, "nll_loss": 0.024016888812184334} +{"epoch": 16, "step": 24298, "loss": 0.02434419095516205, "nll_loss": 0.02434419095516205} +{"epoch": 16, "step": 24299, "loss": 0.0255360696464777, "nll_loss": 0.0255360696464777} +{"epoch": 16, "step": 24300, "loss": 0.0315590426325798, "nll_loss": 0.0315590426325798} +{"epoch": 16, "step": 24301, "loss": 0.017659181728959084, "nll_loss": 0.017659181728959084} +{"epoch": 16, "step": 24302, "loss": 0.03209049627184868, "nll_loss": 0.03209049627184868} +{"epoch": 16, "step": 24303, "loss": 0.025197036564350128, "nll_loss": 0.025197036564350128} +{"epoch": 16, "step": 24304, "loss": 0.014623505063354969, "nll_loss": 0.014623505063354969} +{"epoch": 16, "step": 24305, "loss": 0.021211469545960426, "nll_loss": 0.021211469545960426} +{"epoch": 16, "step": 24306, "loss": 0.028172671794891357, "nll_loss": 0.028172671794891357} +{"epoch": 16, "step": 24307, "loss": 0.019341034814715385, "nll_loss": 0.019341034814715385} +{"epoch": 16, "step": 24308, "loss": 0.025691917166113853, "nll_loss": 0.025691917166113853} +{"epoch": 16, "step": 24309, "loss": 0.02732778526842594, "nll_loss": 0.02732778526842594} +{"epoch": 16, "step": 24310, "eval_rougeL": 0.23964140298317876}