sdar_4b_trace_sft-final / trainer_log.jsonl
autoprogrammer's picture
Upload sdar_4b_trace_sft-final
e682cfb verified
{"current_steps": 5, "total_steps": 1404, "loss": 0.3054, "lr": 9.30232558139535e-07, "epoch": 0.0106951871657754, "percentage": 0.36, "elapsed_time": "0:02:02", "remaining_time": "9:29:48"}
{"current_steps": 10, "total_steps": 1404, "loss": 0.2661, "lr": 2.0930232558139536e-06, "epoch": 0.0213903743315508, "percentage": 0.71, "elapsed_time": "0:02:05", "remaining_time": "4:51:48"}
{"current_steps": 15, "total_steps": 1404, "loss": 0.2409, "lr": 3.2558139534883724e-06, "epoch": 0.03208556149732621, "percentage": 1.07, "elapsed_time": "0:02:09", "remaining_time": "3:19:34"}
{"current_steps": 20, "total_steps": 1404, "loss": 0.2228, "lr": 4.418604651162791e-06, "epoch": 0.0427807486631016, "percentage": 1.42, "elapsed_time": "0:02:12", "remaining_time": "2:32:52"}
{"current_steps": 25, "total_steps": 1404, "loss": 0.2258, "lr": 5.58139534883721e-06, "epoch": 0.053475935828877004, "percentage": 1.78, "elapsed_time": "0:02:16", "remaining_time": "2:05:08"}
{"current_steps": 30, "total_steps": 1404, "loss": 0.2103, "lr": 6.744186046511628e-06, "epoch": 0.06417112299465241, "percentage": 2.14, "elapsed_time": "0:02:19", "remaining_time": "1:46:22"}
{"current_steps": 35, "total_steps": 1404, "loss": 0.2122, "lr": 7.906976744186048e-06, "epoch": 0.0748663101604278, "percentage": 2.49, "elapsed_time": "0:02:22", "remaining_time": "1:32:57"}
{"current_steps": 40, "total_steps": 1404, "loss": 0.1996, "lr": 9.069767441860465e-06, "epoch": 0.0855614973262032, "percentage": 2.85, "elapsed_time": "0:02:25", "remaining_time": "1:22:52"}
{"current_steps": 45, "total_steps": 1404, "loss": 0.2311, "lr": 9.999986679414613e-06, "epoch": 0.0962566844919786, "percentage": 3.21, "elapsed_time": "0:02:29", "remaining_time": "1:15:04"}
{"current_steps": 50, "total_steps": 1404, "loss": 0.2319, "lr": 9.999520466378376e-06, "epoch": 0.10695187165775401, "percentage": 3.56, "elapsed_time": "0:02:32", "remaining_time": "1:08:51"}
{"current_steps": 55, "total_steps": 1404, "loss": 0.2368, "lr": 9.998388295046227e-06, "epoch": 0.11764705882352941, "percentage": 3.92, "elapsed_time": "0:02:35", "remaining_time": "1:03:39"}
{"current_steps": 60, "total_steps": 1404, "loss": 0.2354, "lr": 9.996590316228402e-06, "epoch": 0.12834224598930483, "percentage": 4.27, "elapsed_time": "0:02:39", "remaining_time": "0:59:28"}
{"current_steps": 65, "total_steps": 1404, "loss": 0.234, "lr": 9.994126769423656e-06, "epoch": 0.13903743315508021, "percentage": 4.63, "elapsed_time": "0:02:42", "remaining_time": "0:55:47"}
{"current_steps": 70, "total_steps": 1404, "loss": 0.2541, "lr": 9.990997982787348e-06, "epoch": 0.1497326203208556, "percentage": 4.99, "elapsed_time": "0:02:46", "remaining_time": "0:52:44"}
{"current_steps": 75, "total_steps": 1404, "loss": 0.2496, "lr": 9.98720437308773e-06, "epoch": 0.16042780748663102, "percentage": 5.34, "elapsed_time": "0:02:49", "remaining_time": "0:49:59"}
{"current_steps": 80, "total_steps": 1404, "loss": 0.2797, "lr": 9.982746445650437e-06, "epoch": 0.1711229946524064, "percentage": 5.7, "elapsed_time": "0:02:52", "remaining_time": "0:47:33"}
{"current_steps": 85, "total_steps": 1404, "loss": 0.2518, "lr": 9.977624794291172e-06, "epoch": 0.18181818181818182, "percentage": 6.05, "elapsed_time": "0:02:55", "remaining_time": "0:45:25"}
{"current_steps": 90, "total_steps": 1404, "loss": 0.261, "lr": 9.97184010123661e-06, "epoch": 0.1925133689839572, "percentage": 6.41, "elapsed_time": "0:02:58", "remaining_time": "0:43:32"}
{"current_steps": 95, "total_steps": 1404, "loss": 0.2564, "lr": 9.965393137033512e-06, "epoch": 0.20320855614973263, "percentage": 6.77, "elapsed_time": "0:03:02", "remaining_time": "0:41:52"}
{"current_steps": 100, "total_steps": 1404, "loss": 0.2501, "lr": 9.958284760446104e-06, "epoch": 0.21390374331550802, "percentage": 7.12, "elapsed_time": "0:03:05", "remaining_time": "0:40:19"}
{"current_steps": 105, "total_steps": 1404, "loss": 0.2504, "lr": 9.950515918341666e-06, "epoch": 0.22459893048128343, "percentage": 7.48, "elapsed_time": "0:03:08", "remaining_time": "0:38:54"}
{"current_steps": 110, "total_steps": 1404, "loss": 0.2706, "lr": 9.942087645564415e-06, "epoch": 0.23529411764705882, "percentage": 7.83, "elapsed_time": "0:03:11", "remaining_time": "0:37:38"}
{"current_steps": 115, "total_steps": 1404, "loss": 0.2499, "lr": 9.93300106479766e-06, "epoch": 0.24598930481283424, "percentage": 8.19, "elapsed_time": "0:03:15", "remaining_time": "0:36:31"}
{"current_steps": 120, "total_steps": 1404, "loss": 0.2628, "lr": 9.923257386414253e-06, "epoch": 0.25668449197860965, "percentage": 8.55, "elapsed_time": "0:03:19", "remaining_time": "0:35:31"}
{"current_steps": 125, "total_steps": 1404, "loss": 0.2642, "lr": 9.912857908315363e-06, "epoch": 0.26737967914438504, "percentage": 8.9, "elapsed_time": "0:03:22", "remaining_time": "0:34:31"}
{"current_steps": 130, "total_steps": 1404, "loss": 0.2669, "lr": 9.901804015757588e-06, "epoch": 0.27807486631016043, "percentage": 9.26, "elapsed_time": "0:03:25", "remaining_time": "0:33:34"}
{"current_steps": 135, "total_steps": 1404, "loss": 0.2809, "lr": 9.89009718116843e-06, "epoch": 0.2887700534759358, "percentage": 9.62, "elapsed_time": "0:03:28", "remaining_time": "0:32:43"}
{"current_steps": 140, "total_steps": 1404, "loss": 0.2705, "lr": 9.877738963950175e-06, "epoch": 0.2994652406417112, "percentage": 9.97, "elapsed_time": "0:03:32", "remaining_time": "0:31:57"}
{"current_steps": 145, "total_steps": 1404, "loss": 0.2548, "lr": 9.864731010272152e-06, "epoch": 0.31016042780748665, "percentage": 10.33, "elapsed_time": "0:03:35", "remaining_time": "0:31:11"}
{"current_steps": 150, "total_steps": 1404, "loss": 0.2534, "lr": 9.851075052851476e-06, "epoch": 0.32085561497326204, "percentage": 10.68, "elapsed_time": "0:03:38", "remaining_time": "0:30:28"}
{"current_steps": 155, "total_steps": 1404, "loss": 0.2438, "lr": 9.83677291072223e-06, "epoch": 0.3315508021390374, "percentage": 11.04, "elapsed_time": "0:03:41", "remaining_time": "0:29:48"}
{"current_steps": 160, "total_steps": 1404, "loss": 0.2791, "lr": 9.821826488993168e-06, "epoch": 0.3422459893048128, "percentage": 11.4, "elapsed_time": "0:03:45", "remaining_time": "0:29:12"}
{"current_steps": 165, "total_steps": 1404, "loss": 0.2734, "lr": 9.806237778593941e-06, "epoch": 0.35294117647058826, "percentage": 11.75, "elapsed_time": "0:03:48", "remaining_time": "0:28:37"}
{"current_steps": 170, "total_steps": 1404, "loss": 0.2463, "lr": 9.790008856009902e-06, "epoch": 0.36363636363636365, "percentage": 12.11, "elapsed_time": "0:03:51", "remaining_time": "0:28:02"}
{"current_steps": 175, "total_steps": 1404, "loss": 0.2813, "lr": 9.773141883005507e-06, "epoch": 0.37433155080213903, "percentage": 12.46, "elapsed_time": "0:03:54", "remaining_time": "0:27:30"}
{"current_steps": 180, "total_steps": 1404, "loss": 0.2724, "lr": 9.755639106336347e-06, "epoch": 0.3850267379679144, "percentage": 12.82, "elapsed_time": "0:03:58", "remaining_time": "0:26:59"}
{"current_steps": 185, "total_steps": 1404, "loss": 0.271, "lr": 9.737502857449894e-06, "epoch": 0.39572192513368987, "percentage": 13.18, "elapsed_time": "0:04:01", "remaining_time": "0:26:32"}
{"current_steps": 190, "total_steps": 1404, "loss": 0.2467, "lr": 9.718735552174923e-06, "epoch": 0.40641711229946526, "percentage": 13.53, "elapsed_time": "0:04:04", "remaining_time": "0:26:04"}
{"current_steps": 195, "total_steps": 1404, "loss": 0.2621, "lr": 9.699339690399717e-06, "epoch": 0.41711229946524064, "percentage": 13.89, "elapsed_time": "0:04:08", "remaining_time": "0:25:38"}
{"current_steps": 200, "total_steps": 1404, "loss": 0.2791, "lr": 9.679317855739073e-06, "epoch": 0.42780748663101603, "percentage": 14.25, "elapsed_time": "0:04:11", "remaining_time": "0:25:13"}
{"current_steps": 205, "total_steps": 1404, "loss": 0.2829, "lr": 9.658672715190151e-06, "epoch": 0.4385026737967914, "percentage": 14.6, "elapsed_time": "0:04:14", "remaining_time": "0:24:49"}
{"current_steps": 210, "total_steps": 1404, "loss": 0.2866, "lr": 9.637407018777224e-06, "epoch": 0.44919786096256686, "percentage": 14.96, "elapsed_time": "0:04:18", "remaining_time": "0:24:27"}
{"current_steps": 215, "total_steps": 1404, "loss": 0.2422, "lr": 9.615523599185353e-06, "epoch": 0.45989304812834225, "percentage": 15.31, "elapsed_time": "0:04:21", "remaining_time": "0:24:04"}
{"current_steps": 220, "total_steps": 1404, "loss": 0.269, "lr": 9.593025371383064e-06, "epoch": 0.47058823529411764, "percentage": 15.67, "elapsed_time": "0:04:24", "remaining_time": "0:23:42"}
{"current_steps": 225, "total_steps": 1404, "loss": 0.2686, "lr": 9.569915332234068e-06, "epoch": 0.48128342245989303, "percentage": 16.03, "elapsed_time": "0:04:27", "remaining_time": "0:23:21"}
{"current_steps": 230, "total_steps": 1404, "loss": 0.273, "lr": 9.546196560098062e-06, "epoch": 0.4919786096256685, "percentage": 16.38, "elapsed_time": "0:04:30", "remaining_time": "0:23:03"}
{"current_steps": 235, "total_steps": 1404, "loss": 0.2395, "lr": 9.521872214420668e-06, "epoch": 0.5026737967914439, "percentage": 16.74, "elapsed_time": "0:04:34", "remaining_time": "0:22:43"}
{"current_steps": 240, "total_steps": 1404, "loss": 0.2682, "lr": 9.496945535312597e-06, "epoch": 0.5133689839572193, "percentage": 17.09, "elapsed_time": "0:04:37", "remaining_time": "0:22:25"}
{"current_steps": 245, "total_steps": 1404, "loss": 0.2557, "lr": 9.471419843118036e-06, "epoch": 0.5240641711229946, "percentage": 17.45, "elapsed_time": "0:04:40", "remaining_time": "0:22:06"}
{"current_steps": 250, "total_steps": 1404, "loss": 0.266, "lr": 9.44529853797238e-06, "epoch": 0.5347593582887701, "percentage": 17.81, "elapsed_time": "0:04:43", "remaining_time": "0:21:49"}
{"current_steps": 255, "total_steps": 1404, "loss": 0.2779, "lr": 9.418585099349306e-06, "epoch": 0.5454545454545454, "percentage": 18.16, "elapsed_time": "0:04:47", "remaining_time": "0:21:34"}
{"current_steps": 260, "total_steps": 1404, "loss": 0.2508, "lr": 9.391283085597299e-06, "epoch": 0.5561497326203209, "percentage": 18.52, "elapsed_time": "0:04:50", "remaining_time": "0:21:17"}
{"current_steps": 265, "total_steps": 1404, "loss": 0.2727, "lr": 9.36339613346565e-06, "epoch": 0.5668449197860963, "percentage": 18.87, "elapsed_time": "0:04:53", "remaining_time": "0:21:02"}
{"current_steps": 270, "total_steps": 1404, "loss": 0.2714, "lr": 9.33492795762005e-06, "epoch": 0.5775401069518716, "percentage": 19.23, "elapsed_time": "0:04:56", "remaining_time": "0:20:46"}
{"current_steps": 275, "total_steps": 1404, "loss": 0.2585, "lr": 9.305882350147763e-06, "epoch": 0.5882352941176471, "percentage": 19.59, "elapsed_time": "0:05:00", "remaining_time": "0:20:32"}
{"current_steps": 280, "total_steps": 1404, "loss": 0.2584, "lr": 9.276263180052498e-06, "epoch": 0.5989304812834224, "percentage": 19.94, "elapsed_time": "0:05:03", "remaining_time": "0:20:18"}
{"current_steps": 285, "total_steps": 1404, "loss": 0.2771, "lr": 9.246074392739057e-06, "epoch": 0.6096256684491979, "percentage": 20.3, "elapsed_time": "0:05:06", "remaining_time": "0:20:03"}
{"current_steps": 290, "total_steps": 1404, "loss": 0.265, "lr": 9.21532000948778e-06, "epoch": 0.6203208556149733, "percentage": 20.66, "elapsed_time": "0:05:09", "remaining_time": "0:19:50"}
{"current_steps": 295, "total_steps": 1404, "loss": 0.2653, "lr": 9.184004126918891e-06, "epoch": 0.6310160427807486, "percentage": 21.01, "elapsed_time": "0:05:12", "remaining_time": "0:19:36"}
{"current_steps": 300, "total_steps": 1404, "loss": 0.2373, "lr": 9.152130916446817e-06, "epoch": 0.6417112299465241, "percentage": 21.37, "elapsed_time": "0:05:16", "remaining_time": "0:19:24"}
{"current_steps": 305, "total_steps": 1404, "loss": 0.2779, "lr": 9.119704623724528e-06, "epoch": 0.6524064171122995, "percentage": 21.72, "elapsed_time": "0:05:19", "remaining_time": "0:19:12"}
{"current_steps": 310, "total_steps": 1404, "loss": 0.2813, "lr": 9.086729568078006e-06, "epoch": 0.6631016042780749, "percentage": 22.08, "elapsed_time": "0:05:22", "remaining_time": "0:18:59"}
{"current_steps": 315, "total_steps": 1404, "loss": 0.284, "lr": 9.05321014193089e-06, "epoch": 0.6737967914438503, "percentage": 22.44, "elapsed_time": "0:05:26", "remaining_time": "0:18:47"}
{"current_steps": 320, "total_steps": 1404, "loss": 0.2646, "lr": 9.019150810219376e-06, "epoch": 0.6844919786096256, "percentage": 22.79, "elapsed_time": "0:05:29", "remaining_time": "0:18:35"}
{"current_steps": 325, "total_steps": 1404, "loss": 0.2693, "lr": 8.984556109797484e-06, "epoch": 0.6951871657754011, "percentage": 23.15, "elapsed_time": "0:05:32", "remaining_time": "0:18:24"}
{"current_steps": 330, "total_steps": 1404, "loss": 0.2662, "lr": 8.949430648832716e-06, "epoch": 0.7058823529411765, "percentage": 23.5, "elapsed_time": "0:05:35", "remaining_time": "0:18:13"}
{"current_steps": 335, "total_steps": 1404, "loss": 0.2745, "lr": 8.91377910619223e-06, "epoch": 0.7165775401069518, "percentage": 23.86, "elapsed_time": "0:05:39", "remaining_time": "0:18:02"}
{"current_steps": 340, "total_steps": 1404, "loss": 0.2462, "lr": 8.8776062308196e-06, "epoch": 0.7272727272727273, "percentage": 24.22, "elapsed_time": "0:05:42", "remaining_time": "0:17:51"}
{"current_steps": 345, "total_steps": 1404, "loss": 0.2663, "lr": 8.84091684110223e-06, "epoch": 0.7379679144385026, "percentage": 24.57, "elapsed_time": "0:05:45", "remaining_time": "0:17:41"}
{"current_steps": 350, "total_steps": 1404, "loss": 0.2595, "lr": 8.803715824229525e-06, "epoch": 0.7486631016042781, "percentage": 24.93, "elapsed_time": "0:05:48", "remaining_time": "0:17:30"}
{"current_steps": 355, "total_steps": 1404, "loss": 0.2476, "lr": 8.766008135541896e-06, "epoch": 0.7593582887700535, "percentage": 25.28, "elapsed_time": "0:05:52", "remaining_time": "0:17:20"}
{"current_steps": 360, "total_steps": 1404, "loss": 0.2399, "lr": 8.727798797870688e-06, "epoch": 0.7700534759358288, "percentage": 25.64, "elapsed_time": "0:05:55", "remaining_time": "0:17:10"}
{"current_steps": 365, "total_steps": 1404, "loss": 0.2568, "lr": 8.689092900869112e-06, "epoch": 0.7807486631016043, "percentage": 26.0, "elapsed_time": "0:05:58", "remaining_time": "0:17:00"}
{"current_steps": 370, "total_steps": 1404, "loss": 0.2779, "lr": 8.649895600334284e-06, "epoch": 0.7914438502673797, "percentage": 26.35, "elapsed_time": "0:06:01", "remaining_time": "0:16:51"}
{"current_steps": 375, "total_steps": 1404, "loss": 0.2738, "lr": 8.610212117520453e-06, "epoch": 0.8021390374331551, "percentage": 26.71, "elapsed_time": "0:06:05", "remaining_time": "0:16:41"}
{"current_steps": 380, "total_steps": 1404, "loss": 0.2564, "lr": 8.570047738443502e-06, "epoch": 0.8128342245989305, "percentage": 27.07, "elapsed_time": "0:06:08", "remaining_time": "0:16:32"}
{"current_steps": 385, "total_steps": 1404, "loss": 0.2459, "lr": 8.52940781317683e-06, "epoch": 0.8235294117647058, "percentage": 27.42, "elapsed_time": "0:06:11", "remaining_time": "0:16:23"}
{"current_steps": 390, "total_steps": 1404, "loss": 0.2639, "lr": 8.48829775513869e-06, "epoch": 0.8342245989304813, "percentage": 27.78, "elapsed_time": "0:06:14", "remaining_time": "0:16:14"}
{"current_steps": 395, "total_steps": 1404, "loss": 0.2545, "lr": 8.446723040371114e-06, "epoch": 0.8449197860962567, "percentage": 28.13, "elapsed_time": "0:06:18", "remaining_time": "0:16:06"}
{"current_steps": 400, "total_steps": 1404, "loss": 0.2712, "lr": 8.40468920681047e-06, "epoch": 0.8556149732620321, "percentage": 28.49, "elapsed_time": "0:06:21", "remaining_time": "0:15:57"}
{"current_steps": 405, "total_steps": 1404, "loss": 0.27, "lr": 8.362201853549777e-06, "epoch": 0.8663101604278075, "percentage": 28.85, "elapsed_time": "0:06:24", "remaining_time": "0:15:48"}
{"current_steps": 410, "total_steps": 1404, "loss": 0.2823, "lr": 8.319266640092899e-06, "epoch": 0.8770053475935828, "percentage": 29.2, "elapsed_time": "0:06:27", "remaining_time": "0:15:39"}
{"current_steps": 415, "total_steps": 1404, "loss": 0.2555, "lr": 8.275889285600656e-06, "epoch": 0.8877005347593583, "percentage": 29.56, "elapsed_time": "0:06:31", "remaining_time": "0:15:32"}
{"current_steps": 420, "total_steps": 1404, "loss": 0.2615, "lr": 8.23207556812902e-06, "epoch": 0.8983957219251337, "percentage": 29.91, "elapsed_time": "0:06:34", "remaining_time": "0:15:23"}
{"current_steps": 425, "total_steps": 1404, "loss": 0.2512, "lr": 8.187831323859445e-06, "epoch": 0.9090909090909091, "percentage": 30.27, "elapsed_time": "0:06:37", "remaining_time": "0:15:15"}
{"current_steps": 430, "total_steps": 1404, "loss": 0.2568, "lr": 8.143162446321465e-06, "epoch": 0.9197860962566845, "percentage": 30.63, "elapsed_time": "0:06:40", "remaining_time": "0:15:07"}
{"current_steps": 435, "total_steps": 1404, "loss": 0.2506, "lr": 8.098074885607646e-06, "epoch": 0.93048128342246, "percentage": 30.98, "elapsed_time": "0:06:44", "remaining_time": "0:14:59"}
{"current_steps": 440, "total_steps": 1404, "loss": 0.2586, "lr": 8.052574647581009e-06, "epoch": 0.9411764705882353, "percentage": 31.34, "elapsed_time": "0:06:47", "remaining_time": "0:14:52"}
{"current_steps": 445, "total_steps": 1404, "loss": 0.2576, "lr": 8.006667793075026e-06, "epoch": 0.9518716577540107, "percentage": 31.7, "elapsed_time": "0:06:50", "remaining_time": "0:14:44"}
{"current_steps": 450, "total_steps": 1404, "loss": 0.2363, "lr": 7.960360437086287e-06, "epoch": 0.9625668449197861, "percentage": 32.05, "elapsed_time": "0:06:53", "remaining_time": "0:14:37"}
{"current_steps": 455, "total_steps": 1404, "loss": 0.2677, "lr": 7.91365874795995e-06, "epoch": 0.9732620320855615, "percentage": 32.41, "elapsed_time": "0:06:56", "remaining_time": "0:14:29"}
{"current_steps": 460, "total_steps": 1404, "loss": 0.2702, "lr": 7.866568946568107e-06, "epoch": 0.983957219251337, "percentage": 32.76, "elapsed_time": "0:07:00", "remaining_time": "0:14:22"}
{"current_steps": 465, "total_steps": 1404, "loss": 0.2487, "lr": 7.819097305481112e-06, "epoch": 0.9946524064171123, "percentage": 33.12, "elapsed_time": "0:07:03", "remaining_time": "0:14:15"}
{"current_steps": 470, "total_steps": 1404, "loss": 0.1638, "lr": 7.771250148132067e-06, "epoch": 1.0042780748663103, "percentage": 33.48, "elapsed_time": "0:08:13", "remaining_time": "0:16:20"}
{"current_steps": 475, "total_steps": 1404, "loss": 0.1013, "lr": 7.723033847974503e-06, "epoch": 1.0149732620320855, "percentage": 33.83, "elapsed_time": "0:08:16", "remaining_time": "0:16:11"}
{"current_steps": 480, "total_steps": 1404, "loss": 0.0924, "lr": 7.674454827633413e-06, "epoch": 1.025668449197861, "percentage": 34.19, "elapsed_time": "0:08:19", "remaining_time": "0:16:02"}
{"current_steps": 485, "total_steps": 1404, "loss": 0.1075, "lr": 7.625519558049722e-06, "epoch": 1.0363636363636364, "percentage": 34.54, "elapsed_time": "0:08:23", "remaining_time": "0:15:53"}
{"current_steps": 490, "total_steps": 1404, "loss": 0.0926, "lr": 7.576234557618336e-06, "epoch": 1.0470588235294118, "percentage": 34.9, "elapsed_time": "0:08:26", "remaining_time": "0:15:44"}
{"current_steps": 495, "total_steps": 1404, "loss": 0.1054, "lr": 7.526606391319862e-06, "epoch": 1.0577540106951873, "percentage": 35.26, "elapsed_time": "0:08:29", "remaining_time": "0:15:35"}
{"current_steps": 500, "total_steps": 1404, "loss": 0.0999, "lr": 7.476641669846121e-06, "epoch": 1.0684491978609625, "percentage": 35.61, "elapsed_time": "0:08:33", "remaining_time": "0:15:27"}
{"current_steps": 505, "total_steps": 1404, "loss": 0.1082, "lr": 7.426347048719577e-06, "epoch": 1.079144385026738, "percentage": 35.97, "elapsed_time": "0:08:36", "remaining_time": "0:15:18"}
{"current_steps": 510, "total_steps": 1404, "loss": 0.1227, "lr": 7.375729227406789e-06, "epoch": 1.0898395721925134, "percentage": 36.32, "elapsed_time": "0:08:39", "remaining_time": "0:15:10"}
{"current_steps": 515, "total_steps": 1404, "loss": 0.0943, "lr": 7.324794948426015e-06, "epoch": 1.1005347593582888, "percentage": 36.68, "elapsed_time": "0:08:42", "remaining_time": "0:15:01"}
{"current_steps": 520, "total_steps": 1404, "loss": 0.1038, "lr": 7.273550996449077e-06, "epoch": 1.1112299465240643, "percentage": 37.04, "elapsed_time": "0:08:45", "remaining_time": "0:14:54"}
{"current_steps": 525, "total_steps": 1404, "loss": 0.0956, "lr": 7.222004197397613e-06, "epoch": 1.1219251336898395, "percentage": 37.39, "elapsed_time": "0:08:49", "remaining_time": "0:14:45"}
{"current_steps": 530, "total_steps": 1404, "loss": 0.0946, "lr": 7.170161417533836e-06, "epoch": 1.132620320855615, "percentage": 37.75, "elapsed_time": "0:08:52", "remaining_time": "0:14:37"}
{"current_steps": 535, "total_steps": 1404, "loss": 0.0868, "lr": 7.118029562545915e-06, "epoch": 1.1433155080213904, "percentage": 38.11, "elapsed_time": "0:08:55", "remaining_time": "0:14:29"}
{"current_steps": 540, "total_steps": 1404, "loss": 0.1009, "lr": 7.065615576628107e-06, "epoch": 1.1540106951871658, "percentage": 38.46, "elapsed_time": "0:08:58", "remaining_time": "0:14:21"}
{"current_steps": 545, "total_steps": 1404, "loss": 0.1067, "lr": 7.0129264415557585e-06, "epoch": 1.1647058823529413, "percentage": 38.82, "elapsed_time": "0:09:01", "remaining_time": "0:14:14"}
{"current_steps": 550, "total_steps": 1404, "loss": 0.1009, "lr": 6.959969175755306e-06, "epoch": 1.1754010695187165, "percentage": 39.17, "elapsed_time": "0:09:05", "remaining_time": "0:14:06"}
{"current_steps": 555, "total_steps": 1404, "loss": 0.0912, "lr": 6.906750833369386e-06, "epoch": 1.186096256684492, "percentage": 39.53, "elapsed_time": "0:09:08", "remaining_time": "0:13:58"}
{"current_steps": 560, "total_steps": 1404, "loss": 0.1026, "lr": 6.8532785033171975e-06, "epoch": 1.1967914438502674, "percentage": 39.89, "elapsed_time": "0:09:11", "remaining_time": "0:13:51"}
{"current_steps": 565, "total_steps": 1404, "loss": 0.0985, "lr": 6.799559308350219e-06, "epoch": 1.2074866310160428, "percentage": 40.24, "elapsed_time": "0:09:14", "remaining_time": "0:13:44"}
{"current_steps": 570, "total_steps": 1404, "loss": 0.0982, "lr": 6.745600404103431e-06, "epoch": 1.2181818181818183, "percentage": 40.6, "elapsed_time": "0:09:18", "remaining_time": "0:13:36"}
{"current_steps": 575, "total_steps": 1404, "loss": 0.1084, "lr": 6.6914089781421535e-06, "epoch": 1.2288770053475937, "percentage": 40.95, "elapsed_time": "0:09:21", "remaining_time": "0:13:29"}
{"current_steps": 580, "total_steps": 1404, "loss": 0.1054, "lr": 6.636992249004629e-06, "epoch": 1.239572192513369, "percentage": 41.31, "elapsed_time": "0:09:24", "remaining_time": "0:13:21"}
{"current_steps": 585, "total_steps": 1404, "loss": 0.1045, "lr": 6.582357465240488e-06, "epoch": 1.2502673796791444, "percentage": 41.67, "elapsed_time": "0:09:27", "remaining_time": "0:13:14"}
{"current_steps": 590, "total_steps": 1404, "loss": 0.0883, "lr": 6.527511904445194e-06, "epoch": 1.2609625668449198, "percentage": 42.02, "elapsed_time": "0:09:31", "remaining_time": "0:13:07"}
{"current_steps": 595, "total_steps": 1404, "loss": 0.0946, "lr": 6.472462872290654e-06, "epoch": 1.2716577540106953, "percentage": 42.38, "elapsed_time": "0:09:34", "remaining_time": "0:13:00"}
{"current_steps": 600, "total_steps": 1404, "loss": 0.0996, "lr": 6.417217701552059e-06, "epoch": 1.2823529411764705, "percentage": 42.74, "elapsed_time": "0:09:37", "remaining_time": "0:12:53"}
{"current_steps": 605, "total_steps": 1404, "loss": 0.0963, "lr": 6.36178375113113e-06, "epoch": 1.293048128342246, "percentage": 43.09, "elapsed_time": "0:09:40", "remaining_time": "0:12:46"}
{"current_steps": 610, "total_steps": 1404, "loss": 0.0986, "lr": 6.3061684050758776e-06, "epoch": 1.3037433155080214, "percentage": 43.45, "elapsed_time": "0:09:43", "remaining_time": "0:12:39"}
{"current_steps": 615, "total_steps": 1404, "loss": 0.0925, "lr": 6.250379071597018e-06, "epoch": 1.3144385026737968, "percentage": 43.8, "elapsed_time": "0:09:47", "remaining_time": "0:12:33"}
{"current_steps": 620, "total_steps": 1404, "loss": 0.1125, "lr": 6.194423182081161e-06, "epoch": 1.3251336898395722, "percentage": 44.16, "elapsed_time": "0:09:50", "remaining_time": "0:12:26"}
{"current_steps": 625, "total_steps": 1404, "loss": 0.1038, "lr": 6.138308190100918e-06, "epoch": 1.3358288770053477, "percentage": 44.52, "elapsed_time": "0:09:53", "remaining_time": "0:12:19"}
{"current_steps": 630, "total_steps": 1404, "loss": 0.1097, "lr": 6.082041570422059e-06, "epoch": 1.346524064171123, "percentage": 44.87, "elapsed_time": "0:09:56", "remaining_time": "0:12:12"}
{"current_steps": 635, "total_steps": 1404, "loss": 0.1001, "lr": 6.025630818007833e-06, "epoch": 1.3572192513368984, "percentage": 45.23, "elapsed_time": "0:09:59", "remaining_time": "0:12:06"}
{"current_steps": 640, "total_steps": 1404, "loss": 0.1018, "lr": 5.969083447020606e-06, "epoch": 1.3679144385026738, "percentage": 45.58, "elapsed_time": "0:10:03", "remaining_time": "0:12:00"}
{"current_steps": 645, "total_steps": 1404, "loss": 0.1043, "lr": 5.912406989820948e-06, "epoch": 1.3786096256684492, "percentage": 45.94, "elapsed_time": "0:10:06", "remaining_time": "0:11:53"}
{"current_steps": 650, "total_steps": 1404, "loss": 0.0961, "lr": 5.855608995964283e-06, "epoch": 1.3893048128342245, "percentage": 46.3, "elapsed_time": "0:10:09", "remaining_time": "0:11:47"}
{"current_steps": 655, "total_steps": 1404, "loss": 0.1025, "lr": 5.798697031195257e-06, "epoch": 1.4, "percentage": 46.65, "elapsed_time": "0:10:12", "remaining_time": "0:11:40"}
{"current_steps": 660, "total_steps": 1404, "loss": 0.0993, "lr": 5.741678676439946e-06, "epoch": 1.4106951871657754, "percentage": 47.01, "elapsed_time": "0:10:16", "remaining_time": "0:11:34"}
{"current_steps": 665, "total_steps": 1404, "loss": 0.0968, "lr": 5.684561526796045e-06, "epoch": 1.4213903743315508, "percentage": 47.36, "elapsed_time": "0:10:19", "remaining_time": "0:11:28"}
{"current_steps": 670, "total_steps": 1404, "loss": 0.0824, "lr": 5.627353190521168e-06, "epoch": 1.4320855614973262, "percentage": 47.72, "elapsed_time": "0:10:22", "remaining_time": "0:11:22"}
{"current_steps": 675, "total_steps": 1404, "loss": 0.0994, "lr": 5.570061288019385e-06, "epoch": 1.4427807486631017, "percentage": 48.08, "elapsed_time": "0:10:25", "remaining_time": "0:11:15"}
{"current_steps": 680, "total_steps": 1404, "loss": 0.1007, "lr": 5.51269345082617e-06, "epoch": 1.4534759358288771, "percentage": 48.43, "elapsed_time": "0:10:29", "remaining_time": "0:11:09"}
{"current_steps": 685, "total_steps": 1404, "loss": 0.1021, "lr": 5.455257320591825e-06, "epoch": 1.4641711229946524, "percentage": 48.79, "elapsed_time": "0:10:32", "remaining_time": "0:11:03"}
{"current_steps": 690, "total_steps": 1404, "loss": 0.0918, "lr": 5.397760548063591e-06, "epoch": 1.4748663101604278, "percentage": 49.15, "elapsed_time": "0:10:35", "remaining_time": "0:10:57"}
{"current_steps": 695, "total_steps": 1404, "loss": 0.0967, "lr": 5.340210792066531e-06, "epoch": 1.4855614973262032, "percentage": 49.5, "elapsed_time": "0:10:38", "remaining_time": "0:10:51"}
{"current_steps": 700, "total_steps": 1404, "loss": 0.0859, "lr": 5.282615718483344e-06, "epoch": 1.4962566844919787, "percentage": 49.86, "elapsed_time": "0:10:41", "remaining_time": "0:10:45"}
{"current_steps": 705, "total_steps": 1404, "loss": 0.0858, "lr": 5.224982999233228e-06, "epoch": 1.506951871657754, "percentage": 50.21, "elapsed_time": "0:10:45", "remaining_time": "0:10:39"}
{"current_steps": 710, "total_steps": 1404, "loss": 0.1037, "lr": 5.167320311249951e-06, "epoch": 1.5176470588235293, "percentage": 50.57, "elapsed_time": "0:10:48", "remaining_time": "0:10:33"}
{"current_steps": 715, "total_steps": 1404, "loss": 0.0845, "lr": 5.109635335459256e-06, "epoch": 1.5283422459893048, "percentage": 50.93, "elapsed_time": "0:10:51", "remaining_time": "0:10:28"}
{"current_steps": 720, "total_steps": 1404, "loss": 0.0875, "lr": 5.051935755755713e-06, "epoch": 1.5390374331550802, "percentage": 51.28, "elapsed_time": "0:10:54", "remaining_time": "0:10:22"}
{"current_steps": 725, "total_steps": 1404, "loss": 0.0957, "lr": 4.9942292579791965e-06, "epoch": 1.5497326203208557, "percentage": 51.64, "elapsed_time": "0:10:58", "remaining_time": "0:10:16"}
{"current_steps": 730, "total_steps": 1404, "loss": 0.08, "lr": 4.936523528891111e-06, "epoch": 1.5604278074866311, "percentage": 51.99, "elapsed_time": "0:11:01", "remaining_time": "0:10:10"}
{"current_steps": 735, "total_steps": 1404, "loss": 0.1025, "lr": 4.878826255150453e-06, "epoch": 1.5711229946524066, "percentage": 52.35, "elapsed_time": "0:11:04", "remaining_time": "0:10:04"}
{"current_steps": 740, "total_steps": 1404, "loss": 0.0905, "lr": 4.821145122289941e-06, "epoch": 1.5818181818181818, "percentage": 52.71, "elapsed_time": "0:11:07", "remaining_time": "0:09:59"}
{"current_steps": 745, "total_steps": 1404, "loss": 0.0863, "lr": 4.763487813692252e-06, "epoch": 1.5925133689839572, "percentage": 53.06, "elapsed_time": "0:11:10", "remaining_time": "0:09:53"}
{"current_steps": 750, "total_steps": 1404, "loss": 0.0884, "lr": 4.705862009566564e-06, "epoch": 1.6032085561497325, "percentage": 53.42, "elapsed_time": "0:11:14", "remaining_time": "0:09:47"}
{"current_steps": 755, "total_steps": 1404, "loss": 0.0919, "lr": 4.648275385925522e-06, "epoch": 1.613903743315508, "percentage": 53.77, "elapsed_time": "0:11:18", "remaining_time": "0:09:42"}
{"current_steps": 760, "total_steps": 1404, "loss": 0.0956, "lr": 4.5907356135627605e-06, "epoch": 1.6245989304812833, "percentage": 54.13, "elapsed_time": "0:11:21", "remaining_time": "0:09:37"}
{"current_steps": 765, "total_steps": 1404, "loss": 0.1017, "lr": 4.533250357031104e-06, "epoch": 1.6352941176470588, "percentage": 54.49, "elapsed_time": "0:11:24", "remaining_time": "0:09:31"}
{"current_steps": 770, "total_steps": 1404, "loss": 0.0968, "lr": 4.475827273621639e-06, "epoch": 1.6459893048128342, "percentage": 54.84, "elapsed_time": "0:11:27", "remaining_time": "0:09:26"}
{"current_steps": 775, "total_steps": 1404, "loss": 0.0973, "lr": 4.418474012343711e-06, "epoch": 1.6566844919786097, "percentage": 55.2, "elapsed_time": "0:11:30", "remaining_time": "0:09:20"}
{"current_steps": 780, "total_steps": 1404, "loss": 0.0884, "lr": 4.361198212906048e-06, "epoch": 1.6673796791443851, "percentage": 55.56, "elapsed_time": "0:11:34", "remaining_time": "0:09:15"}
{"current_steps": 785, "total_steps": 1404, "loss": 0.087, "lr": 4.304007504699118e-06, "epoch": 1.6780748663101606, "percentage": 55.91, "elapsed_time": "0:11:37", "remaining_time": "0:09:09"}
{"current_steps": 790, "total_steps": 1404, "loss": 0.0772, "lr": 4.246909505778862e-06, "epoch": 1.6887700534759358, "percentage": 56.27, "elapsed_time": "0:11:40", "remaining_time": "0:09:04"}
{"current_steps": 795, "total_steps": 1404, "loss": 0.0973, "lr": 4.189911821851928e-06, "epoch": 1.6994652406417112, "percentage": 56.62, "elapsed_time": "0:11:44", "remaining_time": "0:08:59"}
{"current_steps": 800, "total_steps": 1404, "loss": 0.0869, "lr": 4.1330220452625644e-06, "epoch": 1.7101604278074867, "percentage": 56.98, "elapsed_time": "0:11:47", "remaining_time": "0:08:54"}
{"current_steps": 805, "total_steps": 1404, "loss": 0.0985, "lr": 4.076247753981285e-06, "epoch": 1.720855614973262, "percentage": 57.34, "elapsed_time": "0:11:50", "remaining_time": "0:08:48"}
{"current_steps": 810, "total_steps": 1404, "loss": 0.0862, "lr": 4.019596510595447e-06, "epoch": 1.7315508021390373, "percentage": 57.69, "elapsed_time": "0:11:53", "remaining_time": "0:08:43"}
{"current_steps": 815, "total_steps": 1404, "loss": 0.0933, "lr": 3.963075861301886e-06, "epoch": 1.7422459893048128, "percentage": 58.05, "elapsed_time": "0:11:57", "remaining_time": "0:08:38"}
{"current_steps": 820, "total_steps": 1404, "loss": 0.0883, "lr": 3.9066933349017165e-06, "epoch": 1.7529411764705882, "percentage": 58.4, "elapsed_time": "0:12:00", "remaining_time": "0:08:33"}
{"current_steps": 825, "total_steps": 1404, "loss": 0.0988, "lr": 3.8504564417974795e-06, "epoch": 1.7636363636363637, "percentage": 58.76, "elapsed_time": "0:12:03", "remaining_time": "0:08:28"}
{"current_steps": 830, "total_steps": 1404, "loss": 0.0922, "lr": 3.7943726729927154e-06, "epoch": 1.7743315508021391, "percentage": 59.12, "elapsed_time": "0:12:06", "remaining_time": "0:08:22"}
{"current_steps": 835, "total_steps": 1404, "loss": 0.0807, "lr": 3.738449499094121e-06, "epoch": 1.7850267379679146, "percentage": 59.47, "elapsed_time": "0:12:10", "remaining_time": "0:08:17"}
{"current_steps": 840, "total_steps": 1404, "loss": 0.0741, "lr": 3.682694369316446e-06, "epoch": 1.79572192513369, "percentage": 59.83, "elapsed_time": "0:12:13", "remaining_time": "0:08:12"}
{"current_steps": 845, "total_steps": 1404, "loss": 0.0836, "lr": 3.6271147104902192e-06, "epoch": 1.8064171122994652, "percentage": 60.19, "elapsed_time": "0:12:16", "remaining_time": "0:08:07"}
{"current_steps": 850, "total_steps": 1404, "loss": 0.0911, "lr": 3.5717179260724544e-06, "epoch": 1.8171122994652407, "percentage": 60.54, "elapsed_time": "0:12:19", "remaining_time": "0:08:02"}
{"current_steps": 855, "total_steps": 1404, "loss": 0.094, "lr": 3.5165113951604874e-06, "epoch": 1.8278074866310159, "percentage": 60.9, "elapsed_time": "0:12:23", "remaining_time": "0:07:57"}
{"current_steps": 860, "total_steps": 1404, "loss": 0.0818, "lr": 3.461502471509045e-06, "epoch": 1.8385026737967913, "percentage": 61.25, "elapsed_time": "0:12:26", "remaining_time": "0:07:52"}
{"current_steps": 865, "total_steps": 1404, "loss": 0.0891, "lr": 3.4066984825506855e-06, "epoch": 1.8491978609625668, "percentage": 61.61, "elapsed_time": "0:12:29", "remaining_time": "0:07:47"}
{"current_steps": 870, "total_steps": 1404, "loss": 0.0906, "lr": 3.35210672841976e-06, "epoch": 1.8598930481283422, "percentage": 61.97, "elapsed_time": "0:12:32", "remaining_time": "0:07:42"}
{"current_steps": 875, "total_steps": 1404, "loss": 0.0856, "lr": 3.297734480980002e-06, "epoch": 1.8705882352941177, "percentage": 62.32, "elapsed_time": "0:12:36", "remaining_time": "0:07:37"}
{"current_steps": 880, "total_steps": 1404, "loss": 0.0845, "lr": 3.2435889828558753e-06, "epoch": 1.881283422459893, "percentage": 62.68, "elapsed_time": "0:12:39", "remaining_time": "0:07:32"}
{"current_steps": 885, "total_steps": 1404, "loss": 0.0956, "lr": 3.1896774464678327e-06, "epoch": 1.8919786096256686, "percentage": 63.03, "elapsed_time": "0:12:42", "remaining_time": "0:07:27"}
{"current_steps": 890, "total_steps": 1404, "loss": 0.0824, "lr": 3.1360070530715885e-06, "epoch": 1.902673796791444, "percentage": 63.39, "elapsed_time": "0:12:45", "remaining_time": "0:07:22"}
{"current_steps": 895, "total_steps": 1404, "loss": 0.0873, "lr": 3.0825849518015334e-06, "epoch": 1.9133689839572192, "percentage": 63.75, "elapsed_time": "0:12:49", "remaining_time": "0:07:17"}
{"current_steps": 900, "total_steps": 1404, "loss": 0.0836, "lr": 3.029418258718454e-06, "epoch": 1.9240641711229947, "percentage": 64.1, "elapsed_time": "0:12:52", "remaining_time": "0:07:12"}
{"current_steps": 905, "total_steps": 1404, "loss": 0.0875, "lr": 2.9765140558616287e-06, "epoch": 1.93475935828877, "percentage": 64.46, "elapsed_time": "0:12:55", "remaining_time": "0:07:07"}
{"current_steps": 910, "total_steps": 1404, "loss": 0.0791, "lr": 2.9238793903054757e-06, "epoch": 1.9454545454545453, "percentage": 64.81, "elapsed_time": "0:12:59", "remaining_time": "0:07:03"}
{"current_steps": 915, "total_steps": 1404, "loss": 0.0777, "lr": 2.8715212732208523e-06, "epoch": 1.9561497326203208, "percentage": 65.17, "elapsed_time": "0:13:02", "remaining_time": "0:06:58"}
{"current_steps": 920, "total_steps": 1404, "loss": 0.0853, "lr": 2.819446678941126e-06, "epoch": 1.9668449197860962, "percentage": 65.53, "elapsed_time": "0:13:06", "remaining_time": "0:06:53"}
{"current_steps": 925, "total_steps": 1404, "loss": 0.08, "lr": 2.7676625440331756e-06, "epoch": 1.9775401069518717, "percentage": 65.88, "elapsed_time": "0:13:09", "remaining_time": "0:06:48"}
{"current_steps": 930, "total_steps": 1404, "loss": 0.0876, "lr": 2.7161757663734012e-06, "epoch": 1.988235294117647, "percentage": 66.24, "elapsed_time": "0:13:12", "remaining_time": "0:06:44"}
{"current_steps": 935, "total_steps": 1404, "loss": 0.0874, "lr": 2.6649932042288994e-06, "epoch": 1.9989304812834225, "percentage": 66.6, "elapsed_time": "0:13:16", "remaining_time": "0:06:39"}
{"current_steps": 940, "total_steps": 1404, "loss": 0.0265, "lr": 2.6141216753439115e-06, "epoch": 2.0085561497326205, "percentage": 66.95, "elapsed_time": "0:14:22", "remaining_time": "0:07:05"}
{"current_steps": 945, "total_steps": 1404, "loss": 0.026, "lr": 2.5635679560316703e-06, "epoch": 2.0192513368983955, "percentage": 67.31, "elapsed_time": "0:14:25", "remaining_time": "0:07:00"}
{"current_steps": 950, "total_steps": 1404, "loss": 0.0245, "lr": 2.5133387802717585e-06, "epoch": 2.029946524064171, "percentage": 67.66, "elapsed_time": "0:14:29", "remaining_time": "0:06:55"}
{"current_steps": 955, "total_steps": 1404, "loss": 0.0213, "lr": 2.4634408388131255e-06, "epoch": 2.0406417112299464, "percentage": 68.02, "elapsed_time": "0:14:32", "remaining_time": "0:06:50"}
{"current_steps": 960, "total_steps": 1404, "loss": 0.0217, "lr": 2.4138807782828423e-06, "epoch": 2.051336898395722, "percentage": 68.38, "elapsed_time": "0:14:35", "remaining_time": "0:06:45"}
{"current_steps": 965, "total_steps": 1404, "loss": 0.0213, "lr": 2.3646652003007348e-06, "epoch": 2.0620320855614973, "percentage": 68.73, "elapsed_time": "0:14:38", "remaining_time": "0:06:39"}
{"current_steps": 970, "total_steps": 1404, "loss": 0.0278, "lr": 2.3158006606000345e-06, "epoch": 2.0727272727272728, "percentage": 69.09, "elapsed_time": "0:14:41", "remaining_time": "0:06:34"}
{"current_steps": 975, "total_steps": 1404, "loss": 0.0239, "lr": 2.267293668154114e-06, "epoch": 2.083422459893048, "percentage": 69.44, "elapsed_time": "0:14:45", "remaining_time": "0:06:29"}
{"current_steps": 980, "total_steps": 1404, "loss": 0.0254, "lr": 2.2191506843094628e-06, "epoch": 2.0941176470588236, "percentage": 69.8, "elapsed_time": "0:14:48", "remaining_time": "0:06:24"}
{"current_steps": 985, "total_steps": 1404, "loss": 0.022, "lr": 2.1713781219250157e-06, "epoch": 2.104812834224599, "percentage": 70.16, "elapsed_time": "0:14:51", "remaining_time": "0:06:19"}
{"current_steps": 990, "total_steps": 1404, "loss": 0.0216, "lr": 2.1239823445179236e-06, "epoch": 2.1155080213903745, "percentage": 70.51, "elapsed_time": "0:14:55", "remaining_time": "0:06:14"}
{"current_steps": 995, "total_steps": 1404, "loss": 0.0211, "lr": 2.076969665415908e-06, "epoch": 2.1262032085561495, "percentage": 70.87, "elapsed_time": "0:14:58", "remaining_time": "0:06:09"}
{"current_steps": 1000, "total_steps": 1404, "loss": 0.0246, "lr": 2.0303463469163004e-06, "epoch": 2.136898395721925, "percentage": 71.23, "elapsed_time": "0:15:01", "remaining_time": "0:06:04"}
{"current_steps": 1005, "total_steps": 1404, "loss": 0.024, "lr": 1.984118599451866e-06, "epoch": 2.1475935828877004, "percentage": 71.58, "elapsed_time": "0:15:04", "remaining_time": "0:05:59"}
{"current_steps": 1010, "total_steps": 1404, "loss": 0.025, "lr": 1.938292580763561e-06, "epoch": 2.158288770053476, "percentage": 71.94, "elapsed_time": "0:15:08", "remaining_time": "0:05:54"}
{"current_steps": 1015, "total_steps": 1404, "loss": 0.0295, "lr": 1.8928743950802863e-06, "epoch": 2.1689839572192513, "percentage": 72.29, "elapsed_time": "0:15:11", "remaining_time": "0:05:49"}
{"current_steps": 1020, "total_steps": 1404, "loss": 0.0158, "lr": 1.847870092305773e-06, "epoch": 2.1796791443850267, "percentage": 72.65, "elapsed_time": "0:15:14", "remaining_time": "0:05:44"}
{"current_steps": 1025, "total_steps": 1404, "loss": 0.0211, "lr": 1.8032856672127191e-06, "epoch": 2.190374331550802, "percentage": 73.01, "elapsed_time": "0:15:18", "remaining_time": "0:05:39"}
{"current_steps": 1030, "total_steps": 1404, "loss": 0.0189, "lr": 1.7591270586442517e-06, "epoch": 2.2010695187165776, "percentage": 73.36, "elapsed_time": "0:15:21", "remaining_time": "0:05:34"}
{"current_steps": 1035, "total_steps": 1404, "loss": 0.0175, "lr": 1.7154001487228478e-06, "epoch": 2.211764705882353, "percentage": 73.72, "elapsed_time": "0:15:25", "remaining_time": "0:05:29"}
{"current_steps": 1040, "total_steps": 1404, "loss": 0.0215, "lr": 1.672110762066811e-06, "epoch": 2.2224598930481285, "percentage": 74.07, "elapsed_time": "0:15:28", "remaining_time": "0:05:25"}
{"current_steps": 1045, "total_steps": 1404, "loss": 0.0182, "lr": 1.6292646650144072e-06, "epoch": 2.233155080213904, "percentage": 74.43, "elapsed_time": "0:15:32", "remaining_time": "0:05:20"}
{"current_steps": 1050, "total_steps": 1404, "loss": 0.0176, "lr": 1.5868675648557568e-06, "epoch": 2.243850267379679, "percentage": 74.79, "elapsed_time": "0:15:35", "remaining_time": "0:05:15"}
{"current_steps": 1055, "total_steps": 1404, "loss": 0.02, "lr": 1.544925109072607e-06, "epoch": 2.2545454545454544, "percentage": 75.14, "elapsed_time": "0:15:39", "remaining_time": "0:05:10"}
{"current_steps": 1060, "total_steps": 1404, "loss": 0.0185, "lr": 1.50344288458606e-06, "epoch": 2.26524064171123, "percentage": 75.5, "elapsed_time": "0:15:42", "remaining_time": "0:05:05"}
{"current_steps": 1065, "total_steps": 1404, "loss": 0.0165, "lr": 1.462426417012361e-06, "epoch": 2.2759358288770053, "percentage": 75.85, "elapsed_time": "0:15:46", "remaining_time": "0:05:01"}
{"current_steps": 1070, "total_steps": 1404, "loss": 0.019, "lr": 1.4218811699268752e-06, "epoch": 2.2866310160427807, "percentage": 76.21, "elapsed_time": "0:15:49", "remaining_time": "0:04:56"}
{"current_steps": 1075, "total_steps": 1404, "loss": 0.0179, "lr": 1.38181254413631e-06, "epoch": 2.297326203208556, "percentage": 76.57, "elapsed_time": "0:15:52", "remaining_time": "0:04:51"}
{"current_steps": 1080, "total_steps": 1404, "loss": 0.0199, "lr": 1.3422258769592967e-06, "epoch": 2.3080213903743316, "percentage": 76.92, "elapsed_time": "0:15:55", "remaining_time": "0:04:46"}
{"current_steps": 1085, "total_steps": 1404, "loss": 0.0194, "lr": 1.3031264415154477e-06, "epoch": 2.318716577540107, "percentage": 77.28, "elapsed_time": "0:15:58", "remaining_time": "0:04:41"}
{"current_steps": 1090, "total_steps": 1404, "loss": 0.0213, "lr": 1.2645194460229454e-06, "epoch": 2.3294117647058825, "percentage": 77.64, "elapsed_time": "0:16:02", "remaining_time": "0:04:37"}
{"current_steps": 1095, "total_steps": 1404, "loss": 0.0216, "lr": 1.2264100331047878e-06, "epoch": 2.3401069518716575, "percentage": 77.99, "elapsed_time": "0:16:05", "remaining_time": "0:04:32"}
{"current_steps": 1100, "total_steps": 1404, "loss": 0.0198, "lr": 1.1888032791037697e-06, "epoch": 2.350802139037433, "percentage": 78.35, "elapsed_time": "0:16:09", "remaining_time": "0:04:27"}
{"current_steps": 1105, "total_steps": 1404, "loss": 0.019, "lr": 1.1517041934062834e-06, "epoch": 2.3614973262032084, "percentage": 78.7, "elapsed_time": "0:16:12", "remaining_time": "0:04:23"}
{"current_steps": 1110, "total_steps": 1404, "loss": 0.0169, "lr": 1.115117717775056e-06, "epoch": 2.372192513368984, "percentage": 79.06, "elapsed_time": "0:16:15", "remaining_time": "0:04:18"}
{"current_steps": 1115, "total_steps": 1404, "loss": 0.0219, "lr": 1.0790487256908826e-06, "epoch": 2.3828877005347593, "percentage": 79.42, "elapsed_time": "0:16:18", "remaining_time": "0:04:13"}
{"current_steps": 1120, "total_steps": 1404, "loss": 0.0273, "lr": 1.043502021703449e-06, "epoch": 2.3935828877005347, "percentage": 79.77, "elapsed_time": "0:16:22", "remaining_time": "0:04:09"}
{"current_steps": 1125, "total_steps": 1404, "loss": 0.0242, "lr": 1.0084823407913563e-06, "epoch": 2.40427807486631, "percentage": 80.13, "elapsed_time": "0:16:25", "remaining_time": "0:04:04"}
{"current_steps": 1130, "total_steps": 1404, "loss": 0.0171, "lr": 9.739943477313918e-07, "epoch": 2.4149732620320856, "percentage": 80.48, "elapsed_time": "0:16:28", "remaining_time": "0:03:59"}
{"current_steps": 1135, "total_steps": 1404, "loss": 0.0207, "lr": 9.400426364771648e-07, "epoch": 2.425668449197861, "percentage": 80.84, "elapsed_time": "0:16:31", "remaining_time": "0:03:55"}
{"current_steps": 1140, "total_steps": 1404, "loss": 0.0154, "lr": 9.066317295471688e-07, "epoch": 2.4363636363636365, "percentage": 81.2, "elapsed_time": "0:16:35", "remaining_time": "0:03:50"}
{"current_steps": 1145, "total_steps": 1404, "loss": 0.017, "lr": 8.737660774223655e-07, "epoch": 2.447058823529412, "percentage": 81.55, "elapsed_time": "0:16:38", "remaining_time": "0:03:45"}
{"current_steps": 1150, "total_steps": 1404, "loss": 0.0174, "lr": 8.414500579533536e-07, "epoch": 2.4577540106951874, "percentage": 81.91, "elapsed_time": "0:16:41", "remaining_time": "0:03:41"}
{"current_steps": 1155, "total_steps": 1404, "loss": 0.0268, "lr": 8.096879757772297e-07, "epoch": 2.4684491978609624, "percentage": 82.26, "elapsed_time": "0:16:44", "remaining_time": "0:03:36"}
{"current_steps": 1160, "total_steps": 1404, "loss": 0.0192, "lr": 7.784840617441858e-07, "epoch": 2.479144385026738, "percentage": 82.62, "elapsed_time": "0:16:48", "remaining_time": "0:03:32"}
{"current_steps": 1165, "total_steps": 1404, "loss": 0.0163, "lr": 7.47842472353939e-07, "epoch": 2.4898395721925133, "percentage": 82.98, "elapsed_time": "0:16:51", "remaining_time": "0:03:27"}
{"current_steps": 1170, "total_steps": 1404, "loss": 0.0195, "lr": 7.177672892020743e-07, "epoch": 2.5005347593582887, "percentage": 83.33, "elapsed_time": "0:16:54", "remaining_time": "0:03:22"}
{"current_steps": 1175, "total_steps": 1404, "loss": 0.0182, "lr": 6.882625184363534e-07, "epoch": 2.511229946524064, "percentage": 83.69, "elapsed_time": "0:16:57", "remaining_time": "0:03:18"}
{"current_steps": 1180, "total_steps": 1404, "loss": 0.0232, "lr": 6.593320902230748e-07, "epoch": 2.5219251336898396, "percentage": 84.05, "elapsed_time": "0:17:01", "remaining_time": "0:03:13"}
{"current_steps": 1185, "total_steps": 1404, "loss": 0.0178, "lr": 6.309798582235671e-07, "epoch": 2.532620320855615, "percentage": 84.4, "elapsed_time": "0:17:04", "remaining_time": "0:03:09"}
{"current_steps": 1190, "total_steps": 1404, "loss": 0.0193, "lr": 6.032095990808567e-07, "epoch": 2.5433155080213905, "percentage": 84.76, "elapsed_time": "0:17:07", "remaining_time": "0:03:04"}
{"current_steps": 1195, "total_steps": 1404, "loss": 0.0203, "lr": 5.760250119166061e-07, "epoch": 2.5540106951871655, "percentage": 85.11, "elapsed_time": "0:17:11", "remaining_time": "0:03:00"}
{"current_steps": 1200, "total_steps": 1404, "loss": 0.0194, "lr": 5.494297178383729e-07, "epoch": 2.564705882352941, "percentage": 85.47, "elapsed_time": "0:17:14", "remaining_time": "0:02:55"}
{"current_steps": 1205, "total_steps": 1404, "loss": 0.0172, "lr": 5.234272594572604e-07, "epoch": 2.5754010695187164, "percentage": 85.83, "elapsed_time": "0:17:17", "remaining_time": "0:02:51"}
{"current_steps": 1210, "total_steps": 1404, "loss": 0.0222, "lr": 4.980211004160306e-07, "epoch": 2.586096256684492, "percentage": 86.18, "elapsed_time": "0:17:20", "remaining_time": "0:02:46"}
{"current_steps": 1215, "total_steps": 1404, "loss": 0.0168, "lr": 4.7321462492772975e-07, "epoch": 2.5967914438502673, "percentage": 86.54, "elapsed_time": "0:17:24", "remaining_time": "0:02:42"}
{"current_steps": 1220, "total_steps": 1404, "loss": 0.0188, "lr": 4.490111373248918e-07, "epoch": 2.6074866310160427, "percentage": 86.89, "elapsed_time": "0:17:27", "remaining_time": "0:02:37"}
{"current_steps": 1225, "total_steps": 1404, "loss": 0.024, "lr": 4.2541386161939424e-07, "epoch": 2.618181818181818, "percentage": 87.25, "elapsed_time": "0:17:30", "remaining_time": "0:02:33"}
{"current_steps": 1230, "total_steps": 1404, "loss": 0.0204, "lr": 4.024259410730008e-07, "epoch": 2.6288770053475936, "percentage": 87.61, "elapsed_time": "0:17:33", "remaining_time": "0:02:29"}
{"current_steps": 1235, "total_steps": 1404, "loss": 0.0207, "lr": 3.800504377786651e-07, "epoch": 2.639572192513369, "percentage": 87.96, "elapsed_time": "0:17:37", "remaining_time": "0:02:24"}
{"current_steps": 1240, "total_steps": 1404, "loss": 0.0199, "lr": 3.582903322526482e-07, "epoch": 2.6502673796791445, "percentage": 88.32, "elapsed_time": "0:17:40", "remaining_time": "0:02:20"}
{"current_steps": 1245, "total_steps": 1404, "loss": 0.0226, "lr": 3.371485230374988e-07, "epoch": 2.66096256684492, "percentage": 88.68, "elapsed_time": "0:17:43", "remaining_time": "0:02:15"}
{"current_steps": 1250, "total_steps": 1404, "loss": 0.0166, "lr": 3.166278263159539e-07, "epoch": 2.6716577540106954, "percentage": 89.03, "elapsed_time": "0:17:47", "remaining_time": "0:02:11"}
{"current_steps": 1255, "total_steps": 1404, "loss": 0.0226, "lr": 2.9673097553581385e-07, "epoch": 2.682352941176471, "percentage": 89.39, "elapsed_time": "0:17:50", "remaining_time": "0:02:07"}
{"current_steps": 1260, "total_steps": 1404, "loss": 0.0164, "lr": 2.7746062104583473e-07, "epoch": 2.693048128342246, "percentage": 89.74, "elapsed_time": "0:17:53", "remaining_time": "0:02:02"}
{"current_steps": 1265, "total_steps": 1404, "loss": 0.0222, "lr": 2.588193297426844e-07, "epoch": 2.7037433155080213, "percentage": 90.1, "elapsed_time": "0:17:56", "remaining_time": "0:01:58"}
{"current_steps": 1270, "total_steps": 1404, "loss": 0.0226, "lr": 2.4080958472902873e-07, "epoch": 2.7144385026737967, "percentage": 90.46, "elapsed_time": "0:18:00", "remaining_time": "0:01:53"}
{"current_steps": 1275, "total_steps": 1404, "loss": 0.0145, "lr": 2.2343378498276391e-07, "epoch": 2.725133689839572, "percentage": 90.81, "elapsed_time": "0:18:03", "remaining_time": "0:01:49"}
{"current_steps": 1280, "total_steps": 1404, "loss": 0.0173, "lr": 2.0669424503746871e-07, "epoch": 2.7358288770053476, "percentage": 91.17, "elapsed_time": "0:18:06", "remaining_time": "0:01:45"}
{"current_steps": 1285, "total_steps": 1404, "loss": 0.0185, "lr": 1.9059319467409244e-07, "epoch": 2.746524064171123, "percentage": 91.52, "elapsed_time": "0:18:09", "remaining_time": "0:01:40"}
{"current_steps": 1290, "total_steps": 1404, "loss": 0.0143, "lr": 1.7513277862394263e-07, "epoch": 2.7572192513368985, "percentage": 91.88, "elapsed_time": "0:18:13", "remaining_time": "0:01:36"}
{"current_steps": 1295, "total_steps": 1404, "loss": 0.0212, "lr": 1.603150562829936e-07, "epoch": 2.767914438502674, "percentage": 92.24, "elapsed_time": "0:18:16", "remaining_time": "0:01:32"}
{"current_steps": 1300, "total_steps": 1404, "loss": 0.0156, "lr": 1.4614200143756975e-07, "epoch": 2.778609625668449, "percentage": 92.59, "elapsed_time": "0:18:19", "remaining_time": "0:01:27"}
{"current_steps": 1305, "total_steps": 1404, "loss": 0.0163, "lr": 1.3261550200142415e-07, "epoch": 2.7893048128342244, "percentage": 92.95, "elapsed_time": "0:18:22", "remaining_time": "0:01:23"}
{"current_steps": 1310, "total_steps": 1404, "loss": 0.0176, "lr": 1.197373597642637e-07, "epoch": 2.8, "percentage": 93.3, "elapsed_time": "0:18:25", "remaining_time": "0:01:19"}
{"current_steps": 1315, "total_steps": 1404, "loss": 0.0127, "lr": 1.0750929015174216e-07, "epoch": 2.8106951871657753, "percentage": 93.66, "elapsed_time": "0:18:29", "remaining_time": "0:01:15"}
{"current_steps": 1320, "total_steps": 1404, "loss": 0.0166, "lr": 9.593292199695403e-08, "epoch": 2.8213903743315507, "percentage": 94.02, "elapsed_time": "0:18:32", "remaining_time": "0:01:10"}
{"current_steps": 1325, "total_steps": 1404, "loss": 0.0189, "lr": 8.500979732347259e-08, "epoch": 2.832085561497326, "percentage": 94.37, "elapsed_time": "0:18:35", "remaining_time": "0:01:06"}
{"current_steps": 1330, "total_steps": 1404, "loss": 0.0178, "lr": 7.47413711399414e-08, "epoch": 2.8427807486631016, "percentage": 94.73, "elapsed_time": "0:18:38", "remaining_time": "0:01:02"}
{"current_steps": 1335, "total_steps": 1404, "loss": 0.0139, "lr": 6.51290112462627e-08, "epoch": 2.853475935828877, "percentage": 95.09, "elapsed_time": "0:18:42", "remaining_time": "0:00:57"}
{"current_steps": 1340, "total_steps": 1404, "loss": 0.0144, "lr": 5.617399805139867e-08, "epoch": 2.8641711229946525, "percentage": 95.44, "elapsed_time": "0:18:45", "remaining_time": "0:00:53"}
{"current_steps": 1345, "total_steps": 1404, "loss": 0.0129, "lr": 4.7877524402817345e-08, "epoch": 2.874866310160428, "percentage": 95.8, "elapsed_time": "0:18:48", "remaining_time": "0:00:49"}
{"current_steps": 1350, "total_steps": 1404, "loss": 0.0191, "lr": 4.024069542759801e-08, "epoch": 2.8855614973262034, "percentage": 96.15, "elapsed_time": "0:18:51", "remaining_time": "0:00:45"}
{"current_steps": 1355, "total_steps": 1404, "loss": 0.0169, "lr": 3.3264528385225094e-08, "epoch": 2.896256684491979, "percentage": 96.51, "elapsed_time": "0:18:55", "remaining_time": "0:00:41"}
{"current_steps": 1360, "total_steps": 1404, "loss": 0.0157, "lr": 2.6949952532083768e-08, "epoch": 2.9069518716577543, "percentage": 96.87, "elapsed_time": "0:18:58", "remaining_time": "0:00:36"}
{"current_steps": 1365, "total_steps": 1404, "loss": 0.0194, "lr": 2.1297808997678417e-08, "epoch": 2.9176470588235293, "percentage": 97.22, "elapsed_time": "0:19:01", "remaining_time": "0:00:32"}
{"current_steps": 1370, "total_steps": 1404, "loss": 0.0148, "lr": 1.6308850672591692e-08, "epoch": 2.9283422459893047, "percentage": 97.58, "elapsed_time": "0:19:05", "remaining_time": "0:00:28"}
{"current_steps": 1375, "total_steps": 1404, "loss": 0.0168, "lr": 1.1983742108195862e-08, "epoch": 2.93903743315508, "percentage": 97.93, "elapsed_time": "0:19:09", "remaining_time": "0:00:24"}
{"current_steps": 1380, "total_steps": 1404, "loss": 0.0153, "lr": 8.323059428130831e-09, "epoch": 2.9497326203208556, "percentage": 98.29, "elapsed_time": "0:19:12", "remaining_time": "0:00:20"}
{"current_steps": 1385, "total_steps": 1404, "loss": 0.0208, "lr": 5.3272902515622e-09, "epoch": 2.960427807486631, "percentage": 98.65, "elapsed_time": "0:19:15", "remaining_time": "0:00:15"}
{"current_steps": 1390, "total_steps": 1404, "loss": 0.017, "lr": 2.996833628228779e-09, "epoch": 2.9711229946524065, "percentage": 99.0, "elapsed_time": "0:19:19", "remaining_time": "0:00:11"}
{"current_steps": 1395, "total_steps": 1404, "loss": 0.0144, "lr": 1.3319999852867692e-09, "epoch": 2.981818181818182, "percentage": 99.36, "elapsed_time": "0:19:22", "remaining_time": "0:00:07"}
{"current_steps": 1400, "total_steps": 1404, "loss": 0.02, "lr": 3.330110859600666e-10, "epoch": 2.9925133689839574, "percentage": 99.72, "elapsed_time": "0:19:25", "remaining_time": "0:00:03"}
{"current_steps": 1404, "total_steps": 1404, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:20:33", "remaining_time": "0:00:00"}