Training in progress, step 7500
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0bea2294954e12f121f7e94d85fda7c7245728ed5984316f4a55409084ca9e74
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:497ecf0d286f382b71e3c3094ba2b0aaddb606ebe3997d1ecbec8d6e79399e42
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a3a924de21f7e5f5ddf8de1a2d51e3e0de5d6a737f0d622b85cfda689ba679c
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c54be22b3807c8db115c8f46225d471a06fed0d353a0cf3fbdfd5a81ecab371
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -1236,3 +1236,314 @@
|
|
| 1236 |
{"current_steps": 6180, "total_steps": 12698, "loss": 0.2407, "lr": 2.4389903512294115e-05, "epoch": 3.40683572216097, "percentage": 48.67, "elapsed_time": "11:10:54", "remaining_time": "11:47:36"}
|
| 1237 |
{"current_steps": 6185, "total_steps": 12698, "loss": 0.2503, "lr": 2.4363079453703467e-05, "epoch": 3.4095920617420066, "percentage": 48.71, "elapsed_time": "11:11:43", "remaining_time": "11:47:21"}
|
| 1238 |
{"current_steps": 6190, "total_steps": 12698, "loss": 0.2466, "lr": 2.4336247151979128e-05, "epoch": 3.412348401323043, "percentage": 48.75, "elapsed_time": "11:12:33", "remaining_time": "11:47:06"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1236 |
{"current_steps": 6180, "total_steps": 12698, "loss": 0.2407, "lr": 2.4389903512294115e-05, "epoch": 3.40683572216097, "percentage": 48.67, "elapsed_time": "11:10:54", "remaining_time": "11:47:36"}
|
| 1237 |
{"current_steps": 6185, "total_steps": 12698, "loss": 0.2503, "lr": 2.4363079453703467e-05, "epoch": 3.4095920617420066, "percentage": 48.71, "elapsed_time": "11:11:43", "remaining_time": "11:47:21"}
|
| 1238 |
{"current_steps": 6190, "total_steps": 12698, "loss": 0.2466, "lr": 2.4336247151979128e-05, "epoch": 3.412348401323043, "percentage": 48.75, "elapsed_time": "11:12:33", "remaining_time": "11:47:06"}
|
| 1239 |
+
{"current_steps": 6195, "total_steps": 12698, "loss": 0.2416, "lr": 2.4309406657815146e-05, "epoch": 3.4151047409040793, "percentage": 48.79, "elapsed_time": "11:13:25", "remaining_time": "11:46:54"}
|
| 1240 |
+
{"current_steps": 6200, "total_steps": 12698, "loss": 0.2435, "lr": 2.4282558021921086e-05, "epoch": 3.4178610804851157, "percentage": 48.83, "elapsed_time": "11:14:15", "remaining_time": "11:46:39"}
|
| 1241 |
+
{"current_steps": 6205, "total_steps": 12698, "loss": 0.2529, "lr": 2.425570129502187e-05, "epoch": 3.420617420066152, "percentage": 48.87, "elapsed_time": "11:15:10", "remaining_time": "11:46:30"}
|
| 1242 |
+
{"current_steps": 6210, "total_steps": 12698, "loss": 0.2461, "lr": 2.4228836527857705e-05, "epoch": 3.4233737596471885, "percentage": 48.91, "elapsed_time": "11:15:58", "remaining_time": "11:46:14"}
|
| 1243 |
+
{"current_steps": 6215, "total_steps": 12698, "loss": 0.2419, "lr": 2.4201963771184008e-05, "epoch": 3.426130099228225, "percentage": 48.94, "elapsed_time": "11:16:56", "remaining_time": "11:46:08"}
|
| 1244 |
+
{"current_steps": 6220, "total_steps": 12698, "loss": 0.2391, "lr": 2.4175083075771283e-05, "epoch": 3.4288864388092613, "percentage": 48.98, "elapsed_time": "11:17:49", "remaining_time": "11:45:55"}
|
| 1245 |
+
{"current_steps": 6225, "total_steps": 12698, "loss": 0.248, "lr": 2.4148194492405013e-05, "epoch": 3.4316427783902976, "percentage": 49.02, "elapsed_time": "11:18:35", "remaining_time": "11:45:37"}
|
| 1246 |
+
{"current_steps": 6230, "total_steps": 12698, "loss": 0.2393, "lr": 2.4121298071885613e-05, "epoch": 3.434399117971334, "percentage": 49.06, "elapsed_time": "11:19:08", "remaining_time": "11:45:05"}
|
| 1247 |
+
{"current_steps": 6235, "total_steps": 12698, "loss": 0.2495, "lr": 2.409439386502828e-05, "epoch": 3.4371554575523704, "percentage": 49.1, "elapsed_time": "11:19:35", "remaining_time": "11:44:26"}
|
| 1248 |
+
{"current_steps": 6240, "total_steps": 12698, "loss": 0.2301, "lr": 2.4067481922662945e-05, "epoch": 3.439911797133407, "percentage": 49.14, "elapsed_time": "11:20:02", "remaining_time": "11:43:47"}
|
| 1249 |
+
{"current_steps": 6245, "total_steps": 12698, "loss": 0.2391, "lr": 2.4040562295634137e-05, "epoch": 3.442668136714443, "percentage": 49.18, "elapsed_time": "11:20:28", "remaining_time": "11:43:08"}
|
| 1250 |
+
{"current_steps": 6250, "total_steps": 12698, "loss": 0.2489, "lr": 2.4013635034800897e-05, "epoch": 3.4454244762954795, "percentage": 49.22, "elapsed_time": "11:20:54", "remaining_time": "11:42:28"}
|
| 1251 |
+
{"current_steps": 6255, "total_steps": 12698, "loss": 0.2473, "lr": 2.398670019103672e-05, "epoch": 3.448180815876516, "percentage": 49.26, "elapsed_time": "11:21:18", "remaining_time": "11:41:47"}
|
| 1252 |
+
{"current_steps": 6260, "total_steps": 12698, "loss": 0.2453, "lr": 2.395975781522938e-05, "epoch": 3.4509371554575523, "percentage": 49.3, "elapsed_time": "11:21:49", "remaining_time": "11:41:13"}
|
| 1253 |
+
{"current_steps": 6265, "total_steps": 12698, "loss": 0.2295, "lr": 2.3932807958280938e-05, "epoch": 3.4536934950385887, "percentage": 49.34, "elapsed_time": "11:22:14", "remaining_time": "11:40:31"}
|
| 1254 |
+
{"current_steps": 6270, "total_steps": 12698, "loss": 0.2394, "lr": 2.390585067110754e-05, "epoch": 3.456449834619625, "percentage": 49.38, "elapsed_time": "11:22:43", "remaining_time": "11:39:56"}
|
| 1255 |
+
{"current_steps": 6275, "total_steps": 12698, "loss": 0.2173, "lr": 2.38788860046394e-05, "epoch": 3.4592061742006615, "percentage": 49.42, "elapsed_time": "11:23:08", "remaining_time": "11:39:15"}
|
| 1256 |
+
{"current_steps": 6280, "total_steps": 12698, "loss": 0.2413, "lr": 2.3851914009820645e-05, "epoch": 3.461962513781698, "percentage": 49.46, "elapsed_time": "11:23:34", "remaining_time": "11:38:36"}
|
| 1257 |
+
{"current_steps": 6285, "total_steps": 12698, "loss": 0.2342, "lr": 2.3824934737609283e-05, "epoch": 3.464718853362734, "percentage": 49.5, "elapsed_time": "11:23:59", "remaining_time": "11:37:55"}
|
| 1258 |
+
{"current_steps": 6290, "total_steps": 12698, "loss": 0.2335, "lr": 2.3797948238977044e-05, "epoch": 3.4674751929437706, "percentage": 49.54, "elapsed_time": "11:24:27", "remaining_time": "11:37:17"}
|
| 1259 |
+
{"current_steps": 6295, "total_steps": 12698, "loss": 0.239, "lr": 2.3770954564909326e-05, "epoch": 3.470231532524807, "percentage": 49.57, "elapsed_time": "11:24:53", "remaining_time": "11:36:38"}
|
| 1260 |
+
{"current_steps": 6300, "total_steps": 12698, "loss": 0.2216, "lr": 2.3743953766405067e-05, "epoch": 3.4729878721058434, "percentage": 49.61, "elapsed_time": "11:25:20", "remaining_time": "11:35:59"}
|
| 1261 |
+
{"current_steps": 6305, "total_steps": 12698, "loss": 0.2406, "lr": 2.3716945894476692e-05, "epoch": 3.4757442116868797, "percentage": 49.65, "elapsed_time": "11:25:46", "remaining_time": "11:35:20"}
|
| 1262 |
+
{"current_steps": 6310, "total_steps": 12698, "loss": 0.2293, "lr": 2.3689931000149962e-05, "epoch": 3.478500551267916, "percentage": 49.69, "elapsed_time": "11:26:12", "remaining_time": "11:34:41"}
|
| 1263 |
+
{"current_steps": 6315, "total_steps": 12698, "loss": 0.2286, "lr": 2.3662909134463917e-05, "epoch": 3.4812568908489525, "percentage": 49.73, "elapsed_time": "11:26:38", "remaining_time": "11:34:02"}
|
| 1264 |
+
{"current_steps": 6320, "total_steps": 12698, "loss": 0.2264, "lr": 2.363588034847077e-05, "epoch": 3.484013230429989, "percentage": 49.77, "elapsed_time": "11:27:03", "remaining_time": "11:33:21"}
|
| 1265 |
+
{"current_steps": 6325, "total_steps": 12698, "loss": 0.2324, "lr": 2.3608844693235807e-05, "epoch": 3.4867695700110253, "percentage": 49.81, "elapsed_time": "11:27:33", "remaining_time": "11:32:46"}
|
| 1266 |
+
{"current_steps": 6330, "total_steps": 12698, "loss": 0.2239, "lr": 2.358180221983729e-05, "epoch": 3.4895259095920617, "percentage": 49.85, "elapsed_time": "11:27:56", "remaining_time": "11:32:04"}
|
| 1267 |
+
{"current_steps": 6335, "total_steps": 12698, "loss": 0.2339, "lr": 2.3554752979366367e-05, "epoch": 3.492282249173098, "percentage": 49.89, "elapsed_time": "11:28:23", "remaining_time": "11:31:25"}
|
| 1268 |
+
{"current_steps": 6340, "total_steps": 12698, "loss": 0.2403, "lr": 2.352769702292696e-05, "epoch": 3.4950385887541344, "percentage": 49.93, "elapsed_time": "11:28:45", "remaining_time": "11:30:43"}
|
| 1269 |
+
{"current_steps": 6345, "total_steps": 12698, "loss": 0.2253, "lr": 2.3500634401635695e-05, "epoch": 3.497794928335171, "percentage": 49.97, "elapsed_time": "11:29:16", "remaining_time": "11:30:08"}
|
| 1270 |
+
{"current_steps": 6350, "total_steps": 12698, "loss": 0.2262, "lr": 2.3473565166621778e-05, "epoch": 3.500551267916207, "percentage": 50.01, "elapsed_time": "11:29:41", "remaining_time": "11:29:28"}
|
| 1271 |
+
{"current_steps": 6355, "total_steps": 12698, "loss": 0.2318, "lr": 2.3446489369026912e-05, "epoch": 3.5033076074972436, "percentage": 50.05, "elapsed_time": "11:30:13", "remaining_time": "11:28:55"}
|
| 1272 |
+
{"current_steps": 6360, "total_steps": 12698, "loss": 0.2366, "lr": 2.3419407060005207e-05, "epoch": 3.50606394707828, "percentage": 50.09, "elapsed_time": "11:30:38", "remaining_time": "11:28:15"}
|
| 1273 |
+
{"current_steps": 6365, "total_steps": 12698, "loss": 0.2259, "lr": 2.339231829072307e-05, "epoch": 3.5088202866593163, "percentage": 50.13, "elapsed_time": "11:31:03", "remaining_time": "11:27:34"}
|
| 1274 |
+
{"current_steps": 6370, "total_steps": 12698, "loss": 0.2333, "lr": 2.33652231123591e-05, "epoch": 3.5115766262403527, "percentage": 50.17, "elapsed_time": "11:31:30", "remaining_time": "11:26:56"}
|
| 1275 |
+
{"current_steps": 6375, "total_steps": 12698, "loss": 0.2284, "lr": 2.3338121576104028e-05, "epoch": 3.514332965821389, "percentage": 50.2, "elapsed_time": "11:31:58", "remaining_time": "11:26:19"}
|
| 1276 |
+
{"current_steps": 6380, "total_steps": 12698, "loss": 0.2168, "lr": 2.3311013733160585e-05, "epoch": 3.5170893054024255, "percentage": 50.24, "elapsed_time": "11:32:28", "remaining_time": "11:25:44"}
|
| 1277 |
+
{"current_steps": 6385, "total_steps": 12698, "loss": 0.2242, "lr": 2.3283899634743414e-05, "epoch": 3.519845644983462, "percentage": 50.28, "elapsed_time": "11:32:52", "remaining_time": "11:25:03"}
|
| 1278 |
+
{"current_steps": 6390, "total_steps": 12698, "loss": 0.2392, "lr": 2.3256779332078986e-05, "epoch": 3.5226019845644982, "percentage": 50.32, "elapsed_time": "11:33:20", "remaining_time": "11:24:26"}
|
| 1279 |
+
{"current_steps": 6395, "total_steps": 12698, "loss": 0.2263, "lr": 2.322965287640548e-05, "epoch": 3.5253583241455346, "percentage": 50.36, "elapsed_time": "11:33:48", "remaining_time": "11:23:49"}
|
| 1280 |
+
{"current_steps": 6400, "total_steps": 12698, "loss": 0.2393, "lr": 2.3202520318972708e-05, "epoch": 3.528114663726571, "percentage": 50.4, "elapsed_time": "11:34:13", "remaining_time": "11:23:09"}
|
| 1281 |
+
{"current_steps": 6405, "total_steps": 12698, "loss": 0.227, "lr": 2.317538171104202e-05, "epoch": 3.5308710033076074, "percentage": 50.44, "elapsed_time": "11:34:39", "remaining_time": "11:22:30"}
|
| 1282 |
+
{"current_steps": 6410, "total_steps": 12698, "loss": 0.2329, "lr": 2.314823710388618e-05, "epoch": 3.5336273428886438, "percentage": 50.48, "elapsed_time": "11:35:09", "remaining_time": "11:21:55"}
|
| 1283 |
+
{"current_steps": 6415, "total_steps": 12698, "loss": 0.2228, "lr": 2.312108654878929e-05, "epoch": 3.53638368246968, "percentage": 50.52, "elapsed_time": "11:35:34", "remaining_time": "11:21:15"}
|
| 1284 |
+
{"current_steps": 6420, "total_steps": 12698, "loss": 0.2357, "lr": 2.3093930097046697e-05, "epoch": 3.5391400220507165, "percentage": 50.56, "elapsed_time": "11:36:02", "remaining_time": "11:20:38"}
|
| 1285 |
+
{"current_steps": 6425, "total_steps": 12698, "loss": 0.2191, "lr": 2.3066767799964885e-05, "epoch": 3.541896361631753, "percentage": 50.6, "elapsed_time": "11:36:29", "remaining_time": "11:20:01"}
|
| 1286 |
+
{"current_steps": 6430, "total_steps": 12698, "loss": 0.2175, "lr": 2.303959970886138e-05, "epoch": 3.5446527012127893, "percentage": 50.64, "elapsed_time": "11:36:55", "remaining_time": "11:19:22"}
|
| 1287 |
+
{"current_steps": 6435, "total_steps": 12698, "loss": 0.2188, "lr": 2.3012425875064657e-05, "epoch": 3.5474090407938257, "percentage": 50.68, "elapsed_time": "11:37:21", "remaining_time": "11:18:42"}
|
| 1288 |
+
{"current_steps": 6440, "total_steps": 12698, "loss": 0.237, "lr": 2.298524634991403e-05, "epoch": 3.550165380374862, "percentage": 50.72, "elapsed_time": "11:37:49", "remaining_time": "11:18:06"}
|
| 1289 |
+
{"current_steps": 6445, "total_steps": 12698, "loss": 0.2288, "lr": 2.2958061184759586e-05, "epoch": 3.5529217199558984, "percentage": 50.76, "elapsed_time": "11:38:19", "remaining_time": "11:17:30"}
|
| 1290 |
+
{"current_steps": 6450, "total_steps": 12698, "loss": 0.2339, "lr": 2.2930870430962055e-05, "epoch": 3.555678059536935, "percentage": 50.8, "elapsed_time": "11:38:53", "remaining_time": "11:17:00"}
|
| 1291 |
+
{"current_steps": 6455, "total_steps": 12698, "loss": 0.2249, "lr": 2.2903674139892717e-05, "epoch": 3.558434399117971, "percentage": 50.83, "elapsed_time": "11:39:20", "remaining_time": "11:16:22"}
|
| 1292 |
+
{"current_steps": 6460, "total_steps": 12698, "loss": 0.2368, "lr": 2.2876472362933333e-05, "epoch": 3.5611907386990076, "percentage": 50.87, "elapsed_time": "11:39:49", "remaining_time": "11:15:46"}
|
| 1293 |
+
{"current_steps": 6465, "total_steps": 12698, "loss": 0.2324, "lr": 2.2849265151476016e-05, "epoch": 3.563947078280044, "percentage": 50.91, "elapsed_time": "11:40:17", "remaining_time": "11:15:09"}
|
| 1294 |
+
{"current_steps": 6470, "total_steps": 12698, "loss": 0.2176, "lr": 2.2822052556923145e-05, "epoch": 3.5667034178610804, "percentage": 50.95, "elapsed_time": "11:40:42", "remaining_time": "11:14:29"}
|
| 1295 |
+
{"current_steps": 6475, "total_steps": 12698, "loss": 0.2209, "lr": 2.279483463068728e-05, "epoch": 3.5694597574421167, "percentage": 50.99, "elapsed_time": "11:41:10", "remaining_time": "11:13:53"}
|
| 1296 |
+
{"current_steps": 6480, "total_steps": 12698, "loss": 0.2155, "lr": 2.2767611424191043e-05, "epoch": 3.572216097023153, "percentage": 51.03, "elapsed_time": "11:41:34", "remaining_time": "11:13:12"}
|
| 1297 |
+
{"current_steps": 6485, "total_steps": 12698, "loss": 0.2169, "lr": 2.274038298886704e-05, "epoch": 3.5749724366041895, "percentage": 51.07, "elapsed_time": "11:42:01", "remaining_time": "11:12:34"}
|
| 1298 |
+
{"current_steps": 6490, "total_steps": 12698, "loss": 0.2111, "lr": 2.271314937615775e-05, "epoch": 3.577728776185226, "percentage": 51.11, "elapsed_time": "11:42:28", "remaining_time": "11:11:57"}
|
| 1299 |
+
{"current_steps": 6495, "total_steps": 12698, "loss": 0.2136, "lr": 2.2685910637515427e-05, "epoch": 3.5804851157662623, "percentage": 51.15, "elapsed_time": "11:42:54", "remaining_time": "11:11:18"}
|
| 1300 |
+
{"current_steps": 6500, "total_steps": 12698, "loss": 0.2155, "lr": 2.2658666824402037e-05, "epoch": 3.5832414553472987, "percentage": 51.19, "elapsed_time": "11:43:21", "remaining_time": "11:10:40"}
|
| 1301 |
+
{"current_steps": 6505, "total_steps": 12698, "loss": 0.2459, "lr": 2.26314179882891e-05, "epoch": 3.585997794928335, "percentage": 51.23, "elapsed_time": "11:43:45", "remaining_time": "11:09:59"}
|
| 1302 |
+
{"current_steps": 6510, "total_steps": 12698, "loss": 0.2179, "lr": 2.2604164180657648e-05, "epoch": 3.5887541345093714, "percentage": 51.27, "elapsed_time": "11:44:11", "remaining_time": "11:09:21"}
|
| 1303 |
+
{"current_steps": 6515, "total_steps": 12698, "loss": 0.2284, "lr": 2.2576905452998093e-05, "epoch": 3.591510474090408, "percentage": 51.31, "elapsed_time": "11:44:37", "remaining_time": "11:08:43"}
|
| 1304 |
+
{"current_steps": 6520, "total_steps": 12698, "loss": 0.2136, "lr": 2.2549641856810144e-05, "epoch": 3.594266813671444, "percentage": 51.35, "elapsed_time": "11:45:03", "remaining_time": "11:08:04"}
|
| 1305 |
+
{"current_steps": 6525, "total_steps": 12698, "loss": 0.2175, "lr": 2.252237344360272e-05, "epoch": 3.5970231532524806, "percentage": 51.39, "elapsed_time": "11:45:32", "remaining_time": "11:07:29"}
|
| 1306 |
+
{"current_steps": 6530, "total_steps": 12698, "loss": 0.2169, "lr": 2.249510026489383e-05, "epoch": 3.599779492833517, "percentage": 51.43, "elapsed_time": "11:46:02", "remaining_time": "11:06:54"}
|
| 1307 |
+
{"current_steps": 6535, "total_steps": 12698, "loss": 0.2172, "lr": 2.2467822372210487e-05, "epoch": 3.6025358324145533, "percentage": 51.46, "elapsed_time": "11:46:31", "remaining_time": "11:06:18"}
|
| 1308 |
+
{"current_steps": 6540, "total_steps": 12698, "loss": 0.2231, "lr": 2.244053981708861e-05, "epoch": 3.6052921719955897, "percentage": 51.5, "elapsed_time": "11:46:58", "remaining_time": "11:05:40"}
|
| 1309 |
+
{"current_steps": 6545, "total_steps": 12698, "loss": 0.2203, "lr": 2.241325265107293e-05, "epoch": 3.608048511576626, "percentage": 51.54, "elapsed_time": "11:47:26", "remaining_time": "11:05:04"}
|
| 1310 |
+
{"current_steps": 6550, "total_steps": 12698, "loss": 0.2115, "lr": 2.238596092571689e-05, "epoch": 3.6108048511576625, "percentage": 51.58, "elapsed_time": "11:47:50", "remaining_time": "11:04:23"}
|
| 1311 |
+
{"current_steps": 6555, "total_steps": 12698, "loss": 0.2322, "lr": 2.2358664692582542e-05, "epoch": 3.613561190738699, "percentage": 51.62, "elapsed_time": "11:48:20", "remaining_time": "11:03:49"}
|
| 1312 |
+
{"current_steps": 6560, "total_steps": 12698, "loss": 0.2272, "lr": 2.2331364003240456e-05, "epoch": 3.6163175303197352, "percentage": 51.66, "elapsed_time": "11:48:45", "remaining_time": "11:03:09"}
|
| 1313 |
+
{"current_steps": 6565, "total_steps": 12698, "loss": 0.233, "lr": 2.230405890926962e-05, "epoch": 3.6190738699007716, "percentage": 51.7, "elapsed_time": "11:49:13", "remaining_time": "11:02:32"}
|
| 1314 |
+
{"current_steps": 6570, "total_steps": 12698, "loss": 0.2318, "lr": 2.2276749462257355e-05, "epoch": 3.621830209481808, "percentage": 51.74, "elapsed_time": "11:49:37", "remaining_time": "11:01:52"}
|
| 1315 |
+
{"current_steps": 6575, "total_steps": 12698, "loss": 0.2304, "lr": 2.2249435713799188e-05, "epoch": 3.6245865490628444, "percentage": 51.78, "elapsed_time": "11:50:04", "remaining_time": "11:01:15"}
|
| 1316 |
+
{"current_steps": 6580, "total_steps": 12698, "loss": 0.2296, "lr": 2.2222117715498788e-05, "epoch": 3.6273428886438808, "percentage": 51.82, "elapsed_time": "11:50:32", "remaining_time": "11:00:39"}
|
| 1317 |
+
{"current_steps": 6585, "total_steps": 12698, "loss": 0.2334, "lr": 2.2194795518967847e-05, "epoch": 3.630099228224917, "percentage": 51.86, "elapsed_time": "11:50:58", "remaining_time": "11:00:00"}
|
| 1318 |
+
{"current_steps": 6590, "total_steps": 12698, "loss": 0.2166, "lr": 2.2167469175825974e-05, "epoch": 3.6328555678059535, "percentage": 51.9, "elapsed_time": "11:51:30", "remaining_time": "10:59:27"}
|
| 1319 |
+
{"current_steps": 6595, "total_steps": 12698, "loss": 0.2238, "lr": 2.214013873770065e-05, "epoch": 3.63561190738699, "percentage": 51.94, "elapsed_time": "11:51:55", "remaining_time": "10:58:49"}
|
| 1320 |
+
{"current_steps": 6600, "total_steps": 12698, "loss": 0.2304, "lr": 2.211280425622705e-05, "epoch": 3.6383682469680263, "percentage": 51.98, "elapsed_time": "11:52:20", "remaining_time": "10:58:09"}
|
| 1321 |
+
{"current_steps": 6605, "total_steps": 12698, "loss": 0.2228, "lr": 2.2085465783048022e-05, "epoch": 3.6411245865490627, "percentage": 52.02, "elapsed_time": "11:52:44", "remaining_time": "10:57:29"}
|
| 1322 |
+
{"current_steps": 6610, "total_steps": 12698, "loss": 0.2212, "lr": 2.2058123369813932e-05, "epoch": 3.643880926130099, "percentage": 52.06, "elapsed_time": "11:53:11", "remaining_time": "10:56:52"}
|
| 1323 |
+
{"current_steps": 6615, "total_steps": 12698, "loss": 0.2115, "lr": 2.203077706818259e-05, "epoch": 3.646637265711136, "percentage": 52.09, "elapsed_time": "11:53:42", "remaining_time": "10:56:18"}
|
| 1324 |
+
{"current_steps": 6620, "total_steps": 12698, "loss": 0.2259, "lr": 2.2003426929819184e-05, "epoch": 3.649393605292172, "percentage": 52.13, "elapsed_time": "11:54:11", "remaining_time": "10:55:43"}
|
| 1325 |
+
{"current_steps": 6625, "total_steps": 12698, "loss": 0.2026, "lr": 2.1976073006396113e-05, "epoch": 3.6521499448732087, "percentage": 52.17, "elapsed_time": "11:54:38", "remaining_time": "10:55:06"}
|
| 1326 |
+
{"current_steps": 6630, "total_steps": 12698, "loss": 0.2224, "lr": 2.1948715349592944e-05, "epoch": 3.6549062844542446, "percentage": 52.21, "elapsed_time": "11:55:04", "remaining_time": "10:54:27"}
|
| 1327 |
+
{"current_steps": 6635, "total_steps": 12698, "loss": 0.2187, "lr": 2.1921354011096302e-05, "epoch": 3.6576626240352814, "percentage": 52.25, "elapsed_time": "11:55:32", "remaining_time": "10:53:51"}
|
| 1328 |
+
{"current_steps": 6640, "total_steps": 12698, "loss": 0.2272, "lr": 2.1893989042599744e-05, "epoch": 3.6604189636163174, "percentage": 52.29, "elapsed_time": "11:55:57", "remaining_time": "10:53:12"}
|
| 1329 |
+
{"current_steps": 6645, "total_steps": 12698, "loss": 0.209, "lr": 2.1866620495803722e-05, "epoch": 3.663175303197354, "percentage": 52.33, "elapsed_time": "11:56:22", "remaining_time": "10:52:33"}
|
| 1330 |
+
{"current_steps": 6650, "total_steps": 12698, "loss": 0.2326, "lr": 2.183924842241542e-05, "epoch": 3.66593164277839, "percentage": 52.37, "elapsed_time": "11:56:49", "remaining_time": "10:51:56"}
|
| 1331 |
+
{"current_steps": 6655, "total_steps": 12698, "loss": 0.2188, "lr": 2.1811872874148688e-05, "epoch": 3.668687982359427, "percentage": 52.41, "elapsed_time": "11:57:20", "remaining_time": "10:51:22"}
|
| 1332 |
+
{"current_steps": 6660, "total_steps": 12698, "loss": 0.2141, "lr": 2.178449390272396e-05, "epoch": 3.671444321940463, "percentage": 52.45, "elapsed_time": "11:57:52", "remaining_time": "10:50:49"}
|
| 1333 |
+
{"current_steps": 6665, "total_steps": 12698, "loss": 0.2088, "lr": 2.175711155986811e-05, "epoch": 3.6742006615214997, "percentage": 52.49, "elapsed_time": "11:58:21", "remaining_time": "10:50:14"}
|
| 1334 |
+
{"current_steps": 6670, "total_steps": 12698, "loss": 0.2127, "lr": 2.172972589731441e-05, "epoch": 3.6769570011025356, "percentage": 52.53, "elapsed_time": "11:58:50", "remaining_time": "10:49:39"}
|
| 1335 |
+
{"current_steps": 6675, "total_steps": 12698, "loss": 0.2081, "lr": 2.170233696680238e-05, "epoch": 3.6797133406835725, "percentage": 52.57, "elapsed_time": "11:59:17", "remaining_time": "10:49:01"}
|
| 1336 |
+
{"current_steps": 6680, "total_steps": 12698, "loss": 0.2039, "lr": 2.167494482007772e-05, "epoch": 3.6824696802646084, "percentage": 52.61, "elapsed_time": "11:59:46", "remaining_time": "10:48:26"}
|
| 1337 |
+
{"current_steps": 6685, "total_steps": 12698, "loss": 0.2071, "lr": 2.164754950889221e-05, "epoch": 3.6852260198456452, "percentage": 52.65, "elapsed_time": "12:00:09", "remaining_time": "10:47:46"}
|
| 1338 |
+
{"current_steps": 6690, "total_steps": 12698, "loss": 0.2059, "lr": 2.1620151085003625e-05, "epoch": 3.687982359426681, "percentage": 52.69, "elapsed_time": "12:00:36", "remaining_time": "10:47:09"}
|
| 1339 |
+
{"current_steps": 6695, "total_steps": 12698, "loss": 0.2225, "lr": 2.1592749600175594e-05, "epoch": 3.690738699007718, "percentage": 52.72, "elapsed_time": "12:01:06", "remaining_time": "10:46:34"}
|
| 1340 |
+
{"current_steps": 6700, "total_steps": 12698, "loss": 0.2315, "lr": 2.1565345106177533e-05, "epoch": 3.693495038588754, "percentage": 52.76, "elapsed_time": "12:01:28", "remaining_time": "10:45:53"}
|
| 1341 |
+
{"current_steps": 6705, "total_steps": 12698, "loss": 0.2066, "lr": 2.1537937654784556e-05, "epoch": 3.6962513781697908, "percentage": 52.8, "elapsed_time": "12:01:53", "remaining_time": "10:45:14"}
|
| 1342 |
+
{"current_steps": 6710, "total_steps": 12698, "loss": 0.2128, "lr": 2.1510527297777357e-05, "epoch": 3.6990077177508267, "percentage": 52.84, "elapsed_time": "12:02:21", "remaining_time": "10:44:37"}
|
| 1343 |
+
{"current_steps": 6715, "total_steps": 12698, "loss": 0.2135, "lr": 2.148311408694212e-05, "epoch": 3.7017640573318635, "percentage": 52.88, "elapsed_time": "12:02:47", "remaining_time": "10:43:59"}
|
| 1344 |
+
{"current_steps": 6720, "total_steps": 12698, "loss": 0.2149, "lr": 2.1455698074070422e-05, "epoch": 3.7045203969128995, "percentage": 52.92, "elapsed_time": "12:03:13", "remaining_time": "10:43:22"}
|
| 1345 |
+
{"current_steps": 6725, "total_steps": 12698, "loss": 0.2263, "lr": 2.1428279310959136e-05, "epoch": 3.7072767364939363, "percentage": 52.96, "elapsed_time": "12:03:37", "remaining_time": "10:42:42"}
|
| 1346 |
+
{"current_steps": 6730, "total_steps": 12698, "loss": 0.2183, "lr": 2.1400857849410324e-05, "epoch": 3.7100330760749722, "percentage": 53.0, "elapsed_time": "12:04:05", "remaining_time": "10:42:06"}
|
| 1347 |
+
{"current_steps": 6735, "total_steps": 12698, "loss": 0.212, "lr": 2.1373433741231144e-05, "epoch": 3.712789415656009, "percentage": 53.04, "elapsed_time": "12:04:31", "remaining_time": "10:41:29"}
|
| 1348 |
+
{"current_steps": 6740, "total_steps": 12698, "loss": 0.2219, "lr": 2.1346007038233774e-05, "epoch": 3.715545755237045, "percentage": 53.08, "elapsed_time": "12:04:58", "remaining_time": "10:40:51"}
|
| 1349 |
+
{"current_steps": 6745, "total_steps": 12698, "loss": 0.2214, "lr": 2.131857779223528e-05, "epoch": 3.718302094818082, "percentage": 53.12, "elapsed_time": "12:05:28", "remaining_time": "10:40:16"}
|
| 1350 |
+
{"current_steps": 6750, "total_steps": 12698, "loss": 0.125, "lr": 2.129114605505752e-05, "epoch": 3.7210584343991178, "percentage": 53.16, "elapsed_time": "12:05:58", "remaining_time": "10:39:42"}
|
| 1351 |
+
{"current_steps": 6755, "total_steps": 12698, "loss": 0.0889, "lr": 2.126371187852708e-05, "epoch": 3.7238147739801546, "percentage": 53.2, "elapsed_time": "12:06:23", "remaining_time": "10:39:04"}
|
| 1352 |
+
{"current_steps": 6760, "total_steps": 12698, "loss": 0.0849, "lr": 2.1236275314475144e-05, "epoch": 3.7265711135611905, "percentage": 53.24, "elapsed_time": "12:06:48", "remaining_time": "10:38:26"}
|
| 1353 |
+
{"current_steps": 6765, "total_steps": 12698, "loss": 0.1026, "lr": 2.120883641473742e-05, "epoch": 3.7293274531422274, "percentage": 53.28, "elapsed_time": "12:07:12", "remaining_time": "10:37:46"}
|
| 1354 |
+
{"current_steps": 6770, "total_steps": 12698, "loss": 0.0848, "lr": 2.1181395231154004e-05, "epoch": 3.7320837927232633, "percentage": 53.32, "elapsed_time": "12:07:42", "remaining_time": "10:37:12"}
|
| 1355 |
+
{"current_steps": 6775, "total_steps": 12698, "loss": 0.0995, "lr": 2.1153951815569326e-05, "epoch": 3.7348401323043, "percentage": 53.35, "elapsed_time": "12:08:05", "remaining_time": "10:36:32"}
|
| 1356 |
+
{"current_steps": 6780, "total_steps": 12698, "loss": 0.1405, "lr": 2.112650621983203e-05, "epoch": 3.737596471885336, "percentage": 53.39, "elapsed_time": "12:08:33", "remaining_time": "10:35:55"}
|
| 1357 |
+
{"current_steps": 6785, "total_steps": 12698, "loss": 0.0927, "lr": 2.1099058495794874e-05, "epoch": 3.740352811466373, "percentage": 53.43, "elapsed_time": "12:08:58", "remaining_time": "10:35:17"}
|
| 1358 |
+
{"current_steps": 6790, "total_steps": 12698, "loss": 0.106, "lr": 2.1071608695314644e-05, "epoch": 3.743109151047409, "percentage": 53.47, "elapsed_time": "12:09:30", "remaining_time": "10:34:44"}
|
| 1359 |
+
{"current_steps": 6795, "total_steps": 12698, "loss": 0.1073, "lr": 2.104415687025204e-05, "epoch": 3.7458654906284456, "percentage": 53.51, "elapsed_time": "12:10:22", "remaining_time": "10:34:30"}
|
| 1360 |
+
{"current_steps": 6800, "total_steps": 12698, "loss": 0.0829, "lr": 2.1016703072471593e-05, "epoch": 3.7486218302094816, "percentage": 53.55, "elapsed_time": "12:10:55", "remaining_time": "10:33:58"}
|
| 1361 |
+
{"current_steps": 6805, "total_steps": 12698, "loss": 0.091, "lr": 2.0989247353841557e-05, "epoch": 3.7513781697905184, "percentage": 53.59, "elapsed_time": "12:11:30", "remaining_time": "10:33:28"}
|
| 1362 |
+
{"current_steps": 6810, "total_steps": 12698, "loss": 0.0922, "lr": 2.0961789766233824e-05, "epoch": 3.7541345093715544, "percentage": 53.63, "elapsed_time": "12:12:04", "remaining_time": "10:32:57"}
|
| 1363 |
+
{"current_steps": 6815, "total_steps": 12698, "loss": 0.1226, "lr": 2.0934330361523812e-05, "epoch": 3.756890848952591, "percentage": 53.67, "elapsed_time": "12:12:37", "remaining_time": "10:32:26"}
|
| 1364 |
+
{"current_steps": 6820, "total_steps": 12698, "loss": 0.0871, "lr": 2.0906869191590365e-05, "epoch": 3.759647188533627, "percentage": 53.71, "elapsed_time": "12:13:05", "remaining_time": "10:31:49"}
|
| 1365 |
+
{"current_steps": 6825, "total_steps": 12698, "loss": 0.0834, "lr": 2.0879406308315668e-05, "epoch": 3.762403528114664, "percentage": 53.75, "elapsed_time": "12:13:29", "remaining_time": "10:31:10"}
|
| 1366 |
+
{"current_steps": 6830, "total_steps": 12698, "loss": 0.0755, "lr": 2.0851941763585147e-05, "epoch": 3.7651598676957, "percentage": 53.79, "elapsed_time": "12:13:52", "remaining_time": "10:30:30"}
|
| 1367 |
+
{"current_steps": 6835, "total_steps": 12698, "loss": 0.0985, "lr": 2.082447560928736e-05, "epoch": 3.7679162072767367, "percentage": 53.83, "elapsed_time": "12:14:13", "remaining_time": "10:29:49"}
|
| 1368 |
+
{"current_steps": 6840, "total_steps": 12698, "loss": 0.0976, "lr": 2.079700789731391e-05, "epoch": 3.7706725468577726, "percentage": 53.87, "elapsed_time": "12:14:46", "remaining_time": "10:29:16"}
|
| 1369 |
+
{"current_steps": 6845, "total_steps": 12698, "loss": 0.1013, "lr": 2.0769538679559343e-05, "epoch": 3.7734288864388095, "percentage": 53.91, "elapsed_time": "12:15:13", "remaining_time": "10:28:40"}
|
| 1370 |
+
{"current_steps": 6850, "total_steps": 12698, "loss": 0.0994, "lr": 2.074206800792105e-05, "epoch": 3.7761852260198454, "percentage": 53.95, "elapsed_time": "12:15:39", "remaining_time": "10:28:03"}
|
| 1371 |
+
{"current_steps": 6855, "total_steps": 12698, "loss": 0.1236, "lr": 2.071459593429916e-05, "epoch": 3.7789415656008822, "percentage": 53.98, "elapsed_time": "12:16:14", "remaining_time": "10:27:33"}
|
| 1372 |
+
{"current_steps": 6860, "total_steps": 12698, "loss": 0.0848, "lr": 2.0687122510596462e-05, "epoch": 3.781697905181918, "percentage": 54.02, "elapsed_time": "12:16:36", "remaining_time": "10:26:52"}
|
| 1373 |
+
{"current_steps": 6865, "total_steps": 12698, "loss": 0.1167, "lr": 2.06596477887183e-05, "epoch": 3.784454244762955, "percentage": 54.06, "elapsed_time": "12:16:59", "remaining_time": "10:26:11"}
|
| 1374 |
+
{"current_steps": 6870, "total_steps": 12698, "loss": 0.12, "lr": 2.0632171820572454e-05, "epoch": 3.787210584343991, "percentage": 54.1, "elapsed_time": "12:17:32", "remaining_time": "10:25:40"}
|
| 1375 |
+
{"current_steps": 6875, "total_steps": 12698, "loss": 0.0894, "lr": 2.0604694658069065e-05, "epoch": 3.7899669239250278, "percentage": 54.14, "elapsed_time": "12:18:00", "remaining_time": "10:25:04"}
|
| 1376 |
+
{"current_steps": 6880, "total_steps": 12698, "loss": 0.194, "lr": 2.057721635312054e-05, "epoch": 3.7927232635060637, "percentage": 54.18, "elapsed_time": "12:18:43", "remaining_time": "10:24:41"}
|
| 1377 |
+
{"current_steps": 6885, "total_steps": 12698, "loss": 0.1867, "lr": 2.054973695764143e-05, "epoch": 3.7954796030871005, "percentage": 54.22, "elapsed_time": "12:19:20", "remaining_time": "10:24:13"}
|
| 1378 |
+
{"current_steps": 6890, "total_steps": 12698, "loss": 0.1045, "lr": 2.0522256523548362e-05, "epoch": 3.7982359426681365, "percentage": 54.26, "elapsed_time": "12:19:53", "remaining_time": "10:23:42"}
|
| 1379 |
+
{"current_steps": 6895, "total_steps": 12698, "loss": 0.1638, "lr": 2.049477510275991e-05, "epoch": 3.8009922822491733, "percentage": 54.3, "elapsed_time": "12:20:35", "remaining_time": "10:23:18"}
|
| 1380 |
+
{"current_steps": 6900, "total_steps": 12698, "loss": 0.1163, "lr": 2.0467292747196516e-05, "epoch": 3.8037486218302092, "percentage": 54.34, "elapsed_time": "12:21:14", "remaining_time": "10:22:51"}
|
| 1381 |
+
{"current_steps": 6905, "total_steps": 12698, "loss": 0.0895, "lr": 2.04398095087804e-05, "epoch": 3.806504961411246, "percentage": 54.38, "elapsed_time": "12:21:49", "remaining_time": "10:22:21"}
|
| 1382 |
+
{"current_steps": 6910, "total_steps": 12698, "loss": 0.0984, "lr": 2.041232543943543e-05, "epoch": 3.809261300992282, "percentage": 54.42, "elapsed_time": "12:22:14", "remaining_time": "10:21:43"}
|
| 1383 |
+
{"current_steps": 6915, "total_steps": 12698, "loss": 0.087, "lr": 2.038484059108707e-05, "epoch": 3.812017640573319, "percentage": 54.46, "elapsed_time": "12:22:42", "remaining_time": "10:21:07"}
|
| 1384 |
+
{"current_steps": 6920, "total_steps": 12698, "loss": 0.0885, "lr": 2.0357355015662228e-05, "epoch": 3.8147739801543548, "percentage": 54.5, "elapsed_time": "12:23:14", "remaining_time": "10:20:34"}
|
| 1385 |
+
{"current_steps": 6925, "total_steps": 12698, "loss": 0.0846, "lr": 2.0329868765089197e-05, "epoch": 3.8175303197353916, "percentage": 54.54, "elapsed_time": "12:23:35", "remaining_time": "10:19:53"}
|
| 1386 |
+
{"current_steps": 6930, "total_steps": 12698, "loss": 0.0861, "lr": 2.0302381891297553e-05, "epoch": 3.8202866593164275, "percentage": 54.58, "elapsed_time": "12:23:55", "remaining_time": "10:19:11"}
|
| 1387 |
+
{"current_steps": 6935, "total_steps": 12698, "loss": 0.0771, "lr": 2.0274894446218042e-05, "epoch": 3.8230429988974644, "percentage": 54.61, "elapsed_time": "12:24:18", "remaining_time": "10:18:31"}
|
| 1388 |
+
{"current_steps": 6940, "total_steps": 12698, "loss": 0.1338, "lr": 2.024740648178249e-05, "epoch": 3.8257993384785003, "percentage": 54.65, "elapsed_time": "12:25:01", "remaining_time": "10:18:08"}
|
| 1389 |
+
{"current_steps": 6945, "total_steps": 12698, "loss": 0.0679, "lr": 2.0219918049923707e-05, "epoch": 3.828555678059537, "percentage": 54.69, "elapsed_time": "12:25:21", "remaining_time": "10:17:25"}
|
| 1390 |
+
{"current_steps": 6950, "total_steps": 12698, "loss": 0.0785, "lr": 2.0192429202575372e-05, "epoch": 3.831312017640573, "percentage": 54.73, "elapsed_time": "12:25:45", "remaining_time": "10:16:46"}
|
| 1391 |
+
{"current_steps": 6955, "total_steps": 12698, "loss": 0.0812, "lr": 2.0164939991671976e-05, "epoch": 3.83406835722161, "percentage": 54.77, "elapsed_time": "12:26:08", "remaining_time": "10:16:07"}
|
| 1392 |
+
{"current_steps": 6960, "total_steps": 12698, "loss": 0.0947, "lr": 2.0137450469148674e-05, "epoch": 3.836824696802646, "percentage": 54.81, "elapsed_time": "12:26:49", "remaining_time": "10:15:42"}
|
| 1393 |
+
{"current_steps": 6965, "total_steps": 12698, "loss": 0.1086, "lr": 2.0109960686941223e-05, "epoch": 3.8395810363836826, "percentage": 54.85, "elapsed_time": "12:27:22", "remaining_time": "10:15:10"}
|
| 1394 |
+
{"current_steps": 6970, "total_steps": 12698, "loss": 0.1228, "lr": 2.0082470696985856e-05, "epoch": 3.8423373759647186, "percentage": 54.89, "elapsed_time": "12:27:55", "remaining_time": "10:14:39"}
|
| 1395 |
+
{"current_steps": 6975, "total_steps": 12698, "loss": 0.0948, "lr": 2.005498055121921e-05, "epoch": 3.8450937155457554, "percentage": 54.93, "elapsed_time": "12:28:20", "remaining_time": "10:14:00"}
|
| 1396 |
+
{"current_steps": 6980, "total_steps": 12698, "loss": 0.111, "lr": 2.0027490301578217e-05, "epoch": 3.8478500551267913, "percentage": 54.97, "elapsed_time": "12:28:50", "remaining_time": "10:13:26"}
|
| 1397 |
+
{"current_steps": 6985, "total_steps": 12698, "loss": 0.1237, "lr": 2e-05, "epoch": 3.850606394707828, "percentage": 55.01, "elapsed_time": "12:29:21", "remaining_time": "10:12:54"}
|
| 1398 |
+
{"current_steps": 6990, "total_steps": 12698, "loss": 0.0945, "lr": 1.997250969842179e-05, "epoch": 3.853362734288864, "percentage": 55.05, "elapsed_time": "12:29:47", "remaining_time": "10:12:16"}
|
| 1399 |
+
{"current_steps": 6995, "total_steps": 12698, "loss": 0.1124, "lr": 1.9945019448780798e-05, "epoch": 3.856119073869901, "percentage": 55.09, "elapsed_time": "12:30:09", "remaining_time": "10:11:36"}
|
| 1400 |
+
{"current_steps": 7000, "total_steps": 12698, "loss": 0.0978, "lr": 1.9917529303014148e-05, "epoch": 3.8588754134509373, "percentage": 55.13, "elapsed_time": "12:30:38", "remaining_time": "10:11:01"}
|
| 1401 |
+
{"current_steps": 7005, "total_steps": 12698, "loss": 0.0898, "lr": 1.9890039313058784e-05, "epoch": 3.8616317530319737, "percentage": 55.17, "elapsed_time": "12:31:20", "remaining_time": "10:10:37"}
|
| 1402 |
+
{"current_steps": 7010, "total_steps": 12698, "loss": 0.0824, "lr": 1.986254953085133e-05, "epoch": 3.86438809261301, "percentage": 55.21, "elapsed_time": "12:31:48", "remaining_time": "10:10:01"}
|
| 1403 |
+
{"current_steps": 7015, "total_steps": 12698, "loss": 0.0773, "lr": 1.9835060008328028e-05, "epoch": 3.8671444321940465, "percentage": 55.24, "elapsed_time": "12:32:26", "remaining_time": "10:09:33"}
|
| 1404 |
+
{"current_steps": 7020, "total_steps": 12698, "loss": 0.0854, "lr": 1.9807570797424634e-05, "epoch": 3.869900771775083, "percentage": 55.28, "elapsed_time": "12:32:50", "remaining_time": "10:08:55"}
|
| 1405 |
+
{"current_steps": 7025, "total_steps": 12698, "loss": 0.1002, "lr": 1.97800819500763e-05, "epoch": 3.8726571113561192, "percentage": 55.32, "elapsed_time": "12:33:46", "remaining_time": "10:08:42"}
|
| 1406 |
+
{"current_steps": 7030, "total_steps": 12698, "loss": 0.0887, "lr": 1.9752593518217514e-05, "epoch": 3.8754134509371556, "percentage": 55.36, "elapsed_time": "12:34:08", "remaining_time": "10:08:02"}
|
| 1407 |
+
{"current_steps": 7035, "total_steps": 12698, "loss": 0.1068, "lr": 1.972510555378196e-05, "epoch": 3.878169790518192, "percentage": 55.4, "elapsed_time": "12:34:32", "remaining_time": "10:07:22"}
|
| 1408 |
+
{"current_steps": 7040, "total_steps": 12698, "loss": 0.0718, "lr": 1.969761810870245e-05, "epoch": 3.8809261300992284, "percentage": 55.44, "elapsed_time": "12:34:57", "remaining_time": "10:06:45"}
|
| 1409 |
+
{"current_steps": 7045, "total_steps": 12698, "loss": 0.0916, "lr": 1.967013123491081e-05, "epoch": 3.8836824696802648, "percentage": 55.48, "elapsed_time": "12:35:27", "remaining_time": "10:06:11"}
|
| 1410 |
+
{"current_steps": 7050, "total_steps": 12698, "loss": 0.0909, "lr": 1.964264498433778e-05, "epoch": 3.886438809261301, "percentage": 55.52, "elapsed_time": "12:35:53", "remaining_time": "10:05:34"}
|
| 1411 |
+
{"current_steps": 7055, "total_steps": 12698, "loss": 0.0788, "lr": 1.9615159408912937e-05, "epoch": 3.8891951488423375, "percentage": 55.56, "elapsed_time": "12:36:19", "remaining_time": "10:04:56"}
|
| 1412 |
+
{"current_steps": 7060, "total_steps": 12698, "loss": 0.0901, "lr": 1.9587674560564573e-05, "epoch": 3.891951488423374, "percentage": 55.6, "elapsed_time": "12:36:45", "remaining_time": "10:04:20"}
|
| 1413 |
+
{"current_steps": 7065, "total_steps": 12698, "loss": 0.0894, "lr": 1.956019049121961e-05, "epoch": 3.8947078280044103, "percentage": 55.64, "elapsed_time": "12:37:08", "remaining_time": "10:03:40"}
|
| 1414 |
+
{"current_steps": 7070, "total_steps": 12698, "loss": 0.1058, "lr": 1.9532707252803488e-05, "epoch": 3.8974641675854467, "percentage": 55.68, "elapsed_time": "12:37:43", "remaining_time": "10:03:10"}
|
| 1415 |
+
{"current_steps": 7075, "total_steps": 12698, "loss": 0.0872, "lr": 1.9505224897240097e-05, "epoch": 3.900220507166483, "percentage": 55.72, "elapsed_time": "12:38:12", "remaining_time": "10:02:35"}
|
| 1416 |
+
{"current_steps": 7080, "total_steps": 12698, "loss": 0.1088, "lr": 1.9477743476451644e-05, "epoch": 3.9029768467475194, "percentage": 55.76, "elapsed_time": "12:38:32", "remaining_time": "10:01:54"}
|
| 1417 |
+
{"current_steps": 7085, "total_steps": 12698, "loss": 0.1029, "lr": 1.9450263042358574e-05, "epoch": 3.905733186328556, "percentage": 55.8, "elapsed_time": "12:39:11", "remaining_time": "10:01:27"}
|
| 1418 |
+
{"current_steps": 7090, "total_steps": 12698, "loss": 0.0914, "lr": 1.942278364687947e-05, "epoch": 3.908489525909592, "percentage": 55.84, "elapsed_time": "12:39:36", "remaining_time": "10:00:49"}
|
| 1419 |
+
{"current_steps": 7095, "total_steps": 12698, "loss": 0.0768, "lr": 1.939530534193094e-05, "epoch": 3.9112458654906286, "percentage": 55.87, "elapsed_time": "12:39:59", "remaining_time": "10:00:10"}
|
| 1420 |
+
{"current_steps": 7100, "total_steps": 12698, "loss": 0.0858, "lr": 1.9367828179427553e-05, "epoch": 3.914002205071665, "percentage": 55.91, "elapsed_time": "12:40:21", "remaining_time": "9:59:30"}
|
| 1421 |
+
{"current_steps": 7105, "total_steps": 12698, "loss": 0.1154, "lr": 1.9340352211281707e-05, "epoch": 3.9167585446527013, "percentage": 55.95, "elapsed_time": "12:41:05", "remaining_time": "9:59:07"}
|
| 1422 |
+
{"current_steps": 7110, "total_steps": 12698, "loss": 0.0721, "lr": 1.931287748940354e-05, "epoch": 3.9195148842337377, "percentage": 55.99, "elapsed_time": "12:41:25", "remaining_time": "9:58:26"}
|
| 1423 |
+
{"current_steps": 7115, "total_steps": 12698, "loss": 0.0886, "lr": 1.9285404065700847e-05, "epoch": 3.922271223814774, "percentage": 56.03, "elapsed_time": "12:42:07", "remaining_time": "9:58:01"}
|
| 1424 |
+
{"current_steps": 7120, "total_steps": 12698, "loss": 0.0844, "lr": 1.9257931992078956e-05, "epoch": 3.9250275633958105, "percentage": 56.07, "elapsed_time": "12:42:35", "remaining_time": "9:57:25"}
|
| 1425 |
+
{"current_steps": 7125, "total_steps": 12698, "loss": 0.0714, "lr": 1.923046132044066e-05, "epoch": 3.927783902976847, "percentage": 56.11, "elapsed_time": "12:43:00", "remaining_time": "9:56:48"}
|
| 1426 |
+
{"current_steps": 7130, "total_steps": 12698, "loss": 0.0947, "lr": 1.9202992102686096e-05, "epoch": 3.9305402425578833, "percentage": 56.15, "elapsed_time": "12:43:26", "remaining_time": "9:56:11"}
|
| 1427 |
+
{"current_steps": 7135, "total_steps": 12698, "loss": 0.0795, "lr": 1.9175524390712645e-05, "epoch": 3.9332965821389196, "percentage": 56.19, "elapsed_time": "12:43:55", "remaining_time": "9:55:37"}
|
| 1428 |
+
{"current_steps": 7140, "total_steps": 12698, "loss": 0.1094, "lr": 1.914805823641486e-05, "epoch": 3.936052921719956, "percentage": 56.23, "elapsed_time": "12:44:26", "remaining_time": "9:55:03"}
|
| 1429 |
+
{"current_steps": 7145, "total_steps": 12698, "loss": 0.1083, "lr": 1.9120593691684335e-05, "epoch": 3.9388092613009924, "percentage": 56.27, "elapsed_time": "12:44:54", "remaining_time": "9:54:28"}
|
| 1430 |
+
{"current_steps": 7150, "total_steps": 12698, "loss": 0.0681, "lr": 1.909313080840964e-05, "epoch": 3.941565600882029, "percentage": 56.31, "elapsed_time": "12:45:15", "remaining_time": "9:53:48"}
|
| 1431 |
+
{"current_steps": 7155, "total_steps": 12698, "loss": 0.1102, "lr": 1.9065669638476195e-05, "epoch": 3.944321940463065, "percentage": 56.35, "elapsed_time": "12:45:38", "remaining_time": "9:53:08"}
|
| 1432 |
+
{"current_steps": 7160, "total_steps": 12698, "loss": 0.0839, "lr": 1.903821023376618e-05, "epoch": 3.9470782800441016, "percentage": 56.39, "elapsed_time": "12:46:01", "remaining_time": "9:52:29"}
|
| 1433 |
+
{"current_steps": 7165, "total_steps": 12698, "loss": 0.0926, "lr": 1.9010752646158447e-05, "epoch": 3.949834619625138, "percentage": 56.43, "elapsed_time": "12:46:21", "remaining_time": "9:51:47"}
|
| 1434 |
+
{"current_steps": 7170, "total_steps": 12698, "loss": 0.1038, "lr": 1.8983296927528413e-05, "epoch": 3.9525909592061743, "percentage": 56.47, "elapsed_time": "12:46:53", "remaining_time": "9:51:16"}
|
| 1435 |
+
{"current_steps": 7175, "total_steps": 12698, "loss": 0.1148, "lr": 1.8955843129747965e-05, "epoch": 3.9553472987872107, "percentage": 56.5, "elapsed_time": "12:47:31", "remaining_time": "9:50:48"}
|
| 1436 |
+
{"current_steps": 7180, "total_steps": 12698, "loss": 0.09, "lr": 1.8928391304685363e-05, "epoch": 3.958103638368247, "percentage": 56.54, "elapsed_time": "12:48:02", "remaining_time": "9:50:15"}
|
| 1437 |
+
{"current_steps": 7185, "total_steps": 12698, "loss": 0.0915, "lr": 1.8900941504205133e-05, "epoch": 3.9608599779492835, "percentage": 56.58, "elapsed_time": "12:48:29", "remaining_time": "9:49:39"}
|
| 1438 |
+
{"current_steps": 7190, "total_steps": 12698, "loss": 0.086, "lr": 1.8873493780167972e-05, "epoch": 3.96361631753032, "percentage": 56.62, "elapsed_time": "12:48:50", "remaining_time": "9:48:59"}
|
| 1439 |
+
{"current_steps": 7195, "total_steps": 12698, "loss": 0.0842, "lr": 1.8846048184430677e-05, "epoch": 3.9663726571113562, "percentage": 56.66, "elapsed_time": "12:49:11", "remaining_time": "9:48:18"}
|
| 1440 |
+
{"current_steps": 7200, "total_steps": 12698, "loss": 0.0795, "lr": 1.8818604768846003e-05, "epoch": 3.9691289966923926, "percentage": 56.7, "elapsed_time": "12:49:32", "remaining_time": "9:47:37"}
|
| 1441 |
+
{"current_steps": 7205, "total_steps": 12698, "loss": 0.0974, "lr": 1.8791163585262588e-05, "epoch": 3.971885336273429, "percentage": 56.74, "elapsed_time": "12:49:53", "remaining_time": "9:46:57"}
|
| 1442 |
+
{"current_steps": 7210, "total_steps": 12698, "loss": 0.079, "lr": 1.876372468552486e-05, "epoch": 3.9746416758544654, "percentage": 56.78, "elapsed_time": "12:50:17", "remaining_time": "9:46:18"}
|
| 1443 |
+
{"current_steps": 7215, "total_steps": 12698, "loss": 0.0819, "lr": 1.8736288121472927e-05, "epoch": 3.9773980154355018, "percentage": 56.82, "elapsed_time": "12:50:40", "remaining_time": "9:45:40"}
|
| 1444 |
+
{"current_steps": 7220, "total_steps": 12698, "loss": 0.0952, "lr": 1.8708853944942486e-05, "epoch": 3.980154355016538, "percentage": 56.86, "elapsed_time": "12:51:04", "remaining_time": "9:45:01"}
|
| 1445 |
+
{"current_steps": 7225, "total_steps": 12698, "loss": 0.0753, "lr": 1.868142220776473e-05, "epoch": 3.9829106945975745, "percentage": 56.9, "elapsed_time": "12:51:43", "remaining_time": "9:44:35"}
|
| 1446 |
+
{"current_steps": 7230, "total_steps": 12698, "loss": 0.0805, "lr": 1.865399296176623e-05, "epoch": 3.985667034178611, "percentage": 56.94, "elapsed_time": "12:52:12", "remaining_time": "9:44:01"}
|
| 1447 |
+
{"current_steps": 7235, "total_steps": 12698, "loss": 0.0779, "lr": 1.862656625876886e-05, "epoch": 3.9884233737596473, "percentage": 56.98, "elapsed_time": "12:52:49", "remaining_time": "9:43:32"}
|
| 1448 |
+
{"current_steps": 7240, "total_steps": 12698, "loss": 0.1778, "lr": 1.8599142150589682e-05, "epoch": 3.9911797133406837, "percentage": 57.02, "elapsed_time": "12:53:58", "remaining_time": "9:43:28"}
|
| 1449 |
+
{"current_steps": 7245, "total_steps": 12698, "loss": 0.0785, "lr": 1.8571720689040867e-05, "epoch": 3.99393605292172, "percentage": 57.06, "elapsed_time": "12:54:21", "remaining_time": "9:42:49"}
|
| 1450 |
+
{"current_steps": 7250, "total_steps": 12698, "loss": 0.0906, "lr": 1.854430192592958e-05, "epoch": 3.9966923925027564, "percentage": 57.1, "elapsed_time": "12:54:55", "remaining_time": "9:42:19"}
|
| 1451 |
+
{"current_steps": 7255, "total_steps": 12698, "loss": 0.1084, "lr": 1.8516885913057886e-05, "epoch": 3.999448732083793, "percentage": 57.13, "elapsed_time": "12:55:31", "remaining_time": "9:41:49"}
|
| 1452 |
+
{"current_steps": 7260, "total_steps": 12698, "loss": 0.1779, "lr": 1.848947270222265e-05, "epoch": 4.002205071664829, "percentage": 57.17, "elapsed_time": "12:56:39", "remaining_time": "9:41:44"}
|
| 1453 |
+
{"current_steps": 7265, "total_steps": 12698, "loss": 0.1933, "lr": 1.8462062345215447e-05, "epoch": 4.004961411245866, "percentage": 57.21, "elapsed_time": "12:57:58", "remaining_time": "9:41:47"}
|
| 1454 |
+
{"current_steps": 7270, "total_steps": 12698, "loss": 0.183, "lr": 1.8434654893822474e-05, "epoch": 4.0077177508269015, "percentage": 57.25, "elapsed_time": "12:59:04", "remaining_time": "9:41:40"}
|
| 1455 |
+
{"current_steps": 7275, "total_steps": 12698, "loss": 0.1774, "lr": 1.8407250399824416e-05, "epoch": 4.010474090407938, "percentage": 57.29, "elapsed_time": "13:00:22", "remaining_time": "9:41:42"}
|
| 1456 |
+
{"current_steps": 7280, "total_steps": 12698, "loss": 0.1816, "lr": 1.837984891499638e-05, "epoch": 4.013230429988974, "percentage": 57.33, "elapsed_time": "13:01:40", "remaining_time": "9:41:45"}
|
| 1457 |
+
{"current_steps": 7285, "total_steps": 12698, "loss": 0.1854, "lr": 1.8352450491107793e-05, "epoch": 4.015986769570011, "percentage": 57.37, "elapsed_time": "13:03:00", "remaining_time": "9:41:47"}
|
| 1458 |
+
{"current_steps": 7290, "total_steps": 12698, "loss": 0.1931, "lr": 1.8325055179922285e-05, "epoch": 4.018743109151047, "percentage": 57.41, "elapsed_time": "13:04:15", "remaining_time": "9:41:47"}
|
| 1459 |
+
{"current_steps": 7295, "total_steps": 12698, "loss": 0.1815, "lr": 1.829766303319763e-05, "epoch": 4.021499448732084, "percentage": 57.45, "elapsed_time": "13:05:30", "remaining_time": "9:41:46"}
|
| 1460 |
+
{"current_steps": 7300, "total_steps": 12698, "loss": 0.1768, "lr": 1.82702741026856e-05, "epoch": 4.02425578831312, "percentage": 57.49, "elapsed_time": "13:06:36", "remaining_time": "9:41:39"}
|
| 1461 |
+
{"current_steps": 7305, "total_steps": 12698, "loss": 0.1642, "lr": 1.8242888440131894e-05, "epoch": 4.027012127894157, "percentage": 57.53, "elapsed_time": "13:07:39", "remaining_time": "9:41:29"}
|
| 1462 |
+
{"current_steps": 7310, "total_steps": 12698, "loss": 0.1824, "lr": 1.8215506097276047e-05, "epoch": 4.029768467475193, "percentage": 57.57, "elapsed_time": "13:08:50", "remaining_time": "9:41:26"}
|
| 1463 |
+
{"current_steps": 7315, "total_steps": 12698, "loss": 0.1707, "lr": 1.8188127125851315e-05, "epoch": 4.032524807056229, "percentage": 57.61, "elapsed_time": "13:10:00", "remaining_time": "9:41:20"}
|
| 1464 |
+
{"current_steps": 7320, "total_steps": 12698, "loss": 0.1776, "lr": 1.8160751577584587e-05, "epoch": 4.035281146637265, "percentage": 57.65, "elapsed_time": "13:11:11", "remaining_time": "9:41:17"}
|
| 1465 |
+
{"current_steps": 7325, "total_steps": 12698, "loss": 0.1697, "lr": 1.8133379504196288e-05, "epoch": 4.038037486218302, "percentage": 57.69, "elapsed_time": "13:12:22", "remaining_time": "9:41:13"}
|
| 1466 |
+
{"current_steps": 7330, "total_steps": 12698, "loss": 0.1737, "lr": 1.8106010957400263e-05, "epoch": 4.040793825799338, "percentage": 57.73, "elapsed_time": "13:13:26", "remaining_time": "9:41:03"}
|
| 1467 |
+
{"current_steps": 7335, "total_steps": 12698, "loss": 0.178, "lr": 1.807864598890371e-05, "epoch": 4.043550165380375, "percentage": 57.77, "elapsed_time": "13:14:35", "remaining_time": "9:40:57"}
|
| 1468 |
+
{"current_steps": 7340, "total_steps": 12698, "loss": 0.1705, "lr": 1.805128465040706e-05, "epoch": 4.046306504961411, "percentage": 57.8, "elapsed_time": "13:15:45", "remaining_time": "9:40:53"}
|
| 1469 |
+
{"current_steps": 7345, "total_steps": 12698, "loss": 0.178, "lr": 1.8023926993603894e-05, "epoch": 4.049062844542448, "percentage": 57.84, "elapsed_time": "13:17:00", "remaining_time": "9:40:51"}
|
| 1470 |
+
{"current_steps": 7350, "total_steps": 12698, "loss": 0.1911, "lr": 1.7996573070180823e-05, "epoch": 4.051819184123484, "percentage": 57.88, "elapsed_time": "13:18:11", "remaining_time": "9:40:46"}
|
| 1471 |
+
{"current_steps": 7355, "total_steps": 12698, "loss": 0.1716, "lr": 1.7969222931817412e-05, "epoch": 4.0545755237045205, "percentage": 57.92, "elapsed_time": "13:19:07", "remaining_time": "9:40:30"}
|
| 1472 |
+
{"current_steps": 7360, "total_steps": 12698, "loss": 0.1612, "lr": 1.7941876630186078e-05, "epoch": 4.057331863285556, "percentage": 57.96, "elapsed_time": "13:20:18", "remaining_time": "9:40:26"}
|
| 1473 |
+
{"current_steps": 7365, "total_steps": 12698, "loss": 0.1746, "lr": 1.7914534216951988e-05, "epoch": 4.060088202866593, "percentage": 58.0, "elapsed_time": "13:21:32", "remaining_time": "9:40:23"}
|
| 1474 |
+
{"current_steps": 7370, "total_steps": 12698, "loss": 0.1712, "lr": 1.7887195743772953e-05, "epoch": 4.062844542447629, "percentage": 58.04, "elapsed_time": "13:22:40", "remaining_time": "9:40:16"}
|
| 1475 |
+
{"current_steps": 7375, "total_steps": 12698, "loss": 0.179, "lr": 1.785986126229936e-05, "epoch": 4.065600882028666, "percentage": 58.08, "elapsed_time": "13:23:53", "remaining_time": "9:40:13"}
|
| 1476 |
+
{"current_steps": 7380, "total_steps": 12698, "loss": 0.1699, "lr": 1.783253082417403e-05, "epoch": 4.068357221609702, "percentage": 58.12, "elapsed_time": "13:25:09", "remaining_time": "9:40:11"}
|
| 1477 |
+
{"current_steps": 7385, "total_steps": 12698, "loss": 0.1642, "lr": 1.780520448103216e-05, "epoch": 4.071113561190739, "percentage": 58.16, "elapsed_time": "13:26:27", "remaining_time": "9:40:11"}
|
| 1478 |
+
{"current_steps": 7390, "total_steps": 12698, "loss": 0.1505, "lr": 1.7777882284501215e-05, "epoch": 4.073869900771775, "percentage": 58.2, "elapsed_time": "13:27:44", "remaining_time": "9:40:10"}
|
| 1479 |
+
{"current_steps": 7395, "total_steps": 12698, "loss": 0.1545, "lr": 1.7750564286200816e-05, "epoch": 4.0766262403528115, "percentage": 58.24, "elapsed_time": "13:28:57", "remaining_time": "9:40:06"}
|
| 1480 |
+
{"current_steps": 7400, "total_steps": 12698, "loss": 0.1782, "lr": 1.772325053774265e-05, "epoch": 4.0793825799338475, "percentage": 58.28, "elapsed_time": "13:30:06", "remaining_time": "9:39:59"}
|
| 1481 |
+
{"current_steps": 7405, "total_steps": 12698, "loss": 0.1603, "lr": 1.7695941090730385e-05, "epoch": 4.082138919514884, "percentage": 58.32, "elapsed_time": "13:30:57", "remaining_time": "9:39:39"}
|
| 1482 |
+
{"current_steps": 7410, "total_steps": 12698, "loss": 0.1816, "lr": 1.7668635996759547e-05, "epoch": 4.08489525909592, "percentage": 58.36, "elapsed_time": "13:32:06", "remaining_time": "9:39:32"}
|
| 1483 |
+
{"current_steps": 7415, "total_steps": 12698, "loss": 0.1866, "lr": 1.7641335307417465e-05, "epoch": 4.087651598676957, "percentage": 58.4, "elapsed_time": "13:33:20", "remaining_time": "9:39:28"}
|
| 1484 |
+
{"current_steps": 7420, "total_steps": 12698, "loss": 0.1803, "lr": 1.7614039074283117e-05, "epoch": 4.090407938257993, "percentage": 58.43, "elapsed_time": "13:34:31", "remaining_time": "9:39:23"}
|
| 1485 |
+
{"current_steps": 7425, "total_steps": 12698, "loss": 0.1735, "lr": 1.7586747348927075e-05, "epoch": 4.09316427783903, "percentage": 58.47, "elapsed_time": "13:35:43", "remaining_time": "9:39:18"}
|
| 1486 |
+
{"current_steps": 7430, "total_steps": 12698, "loss": 0.1827, "lr": 1.7559460182911396e-05, "epoch": 4.095920617420066, "percentage": 58.51, "elapsed_time": "13:37:00", "remaining_time": "9:39:16"}
|
| 1487 |
+
{"current_steps": 7435, "total_steps": 12698, "loss": 0.1734, "lr": 1.7532177627789516e-05, "epoch": 4.098676957001103, "percentage": 58.55, "elapsed_time": "13:38:17", "remaining_time": "9:39:14"}
|
| 1488 |
+
{"current_steps": 7440, "total_steps": 12698, "loss": 0.1774, "lr": 1.7504899735106173e-05, "epoch": 4.1014332965821385, "percentage": 58.59, "elapsed_time": "13:39:33", "remaining_time": "9:39:11"}
|
| 1489 |
+
{"current_steps": 7445, "total_steps": 12698, "loss": 0.18, "lr": 1.7477626556397283e-05, "epoch": 4.104189636163175, "percentage": 58.63, "elapsed_time": "13:40:52", "remaining_time": "9:39:11"}
|
| 1490 |
+
{"current_steps": 7450, "total_steps": 12698, "loss": 0.1805, "lr": 1.745035814318986e-05, "epoch": 4.106945975744211, "percentage": 58.67, "elapsed_time": "13:42:05", "remaining_time": "9:39:06"}
|
| 1491 |
+
{"current_steps": 7455, "total_steps": 12698, "loss": 0.1785, "lr": 1.7423094547001913e-05, "epoch": 4.109702315325248, "percentage": 58.71, "elapsed_time": "13:43:12", "remaining_time": "9:38:57"}
|
| 1492 |
+
{"current_steps": 7460, "total_steps": 12698, "loss": 0.1755, "lr": 1.7395835819342355e-05, "epoch": 4.112458654906284, "percentage": 58.75, "elapsed_time": "13:44:24", "remaining_time": "9:38:51"}
|
| 1493 |
+
{"current_steps": 7465, "total_steps": 12698, "loss": 0.1433, "lr": 1.7368582011710904e-05, "epoch": 4.115214994487321, "percentage": 58.79, "elapsed_time": "13:45:04", "remaining_time": "9:38:22"}
|
| 1494 |
+
{"current_steps": 7470, "total_steps": 12698, "loss": 0.178, "lr": 1.734133317559797e-05, "epoch": 4.117971334068357, "percentage": 58.83, "elapsed_time": "13:46:18", "remaining_time": "9:38:18"}
|
| 1495 |
+
{"current_steps": 7475, "total_steps": 12698, "loss": 0.172, "lr": 1.731408936248458e-05, "epoch": 4.120727673649394, "percentage": 58.87, "elapsed_time": "13:47:27", "remaining_time": "9:38:09"}
|
| 1496 |
+
{"current_steps": 7480, "total_steps": 12698, "loss": 0.1764, "lr": 1.7286850623842258e-05, "epoch": 4.12348401323043, "percentage": 58.91, "elapsed_time": "13:48:40", "remaining_time": "9:38:04"}
|
| 1497 |
+
{"current_steps": 7485, "total_steps": 12698, "loss": 0.1719, "lr": 1.7259617011132967e-05, "epoch": 4.126240352811466, "percentage": 58.95, "elapsed_time": "13:49:56", "remaining_time": "9:38:01"}
|
| 1498 |
+
{"current_steps": 7490, "total_steps": 12698, "loss": 0.1709, "lr": 1.7232388575808964e-05, "epoch": 4.128996692392502, "percentage": 58.99, "elapsed_time": "13:51:13", "remaining_time": "9:37:58"}
|
| 1499 |
+
{"current_steps": 7495, "total_steps": 12698, "loss": 0.1789, "lr": 1.7205165369312728e-05, "epoch": 4.131753031973539, "percentage": 59.03, "elapsed_time": "13:52:29", "remaining_time": "9:37:54"}
|
| 1500 |
+
{"current_steps": 7500, "total_steps": 12698, "loss": 0.1743, "lr": 1.7177947443076862e-05, "epoch": 4.134509371554575, "percentage": 59.06, "elapsed_time": "13:53:28", "remaining_time": "9:37:39"}
|
| 1501 |
+
{"current_steps": 7505, "total_steps": 12698, "loss": 0.1448, "lr": 1.715073484852399e-05, "epoch": 4.137265711135612, "percentage": 59.1, "elapsed_time": "13:55:01", "remaining_time": "9:37:47"}
|
| 1502 |
+
{"current_steps": 7510, "total_steps": 12698, "loss": 0.1705, "lr": 1.7123527637066673e-05, "epoch": 4.140022050716648, "percentage": 59.14, "elapsed_time": "13:56:13", "remaining_time": "9:37:40"}
|
| 1503 |
+
{"current_steps": 7515, "total_steps": 12698, "loss": 0.176, "lr": 1.7096325860107286e-05, "epoch": 4.142778390297685, "percentage": 59.18, "elapsed_time": "13:57:25", "remaining_time": "9:37:33"}
|
| 1504 |
+
{"current_steps": 7520, "total_steps": 12698, "loss": 0.1717, "lr": 1.7069129569037955e-05, "epoch": 4.145534729878721, "percentage": 59.22, "elapsed_time": "13:58:31", "remaining_time": "9:37:22"}
|
| 1505 |
+
{"current_steps": 7525, "total_steps": 12698, "loss": 0.1671, "lr": 1.704193881524042e-05, "epoch": 4.1482910694597575, "percentage": 59.26, "elapsed_time": "13:59:39", "remaining_time": "9:37:13"}
|
| 1506 |
+
{"current_steps": 7530, "total_steps": 12698, "loss": 0.1724, "lr": 1.7014753650085972e-05, "epoch": 4.151047409040794, "percentage": 59.3, "elapsed_time": "14:00:54", "remaining_time": "9:37:08"}
|
| 1507 |
+
{"current_steps": 7535, "total_steps": 12698, "loss": 0.1704, "lr": 1.6987574124935353e-05, "epoch": 4.15380374862183, "percentage": 59.34, "elapsed_time": "14:01:56", "remaining_time": "9:36:53"}
|
| 1508 |
+
{"current_steps": 7540, "total_steps": 12698, "loss": 0.1621, "lr": 1.6960400291138625e-05, "epoch": 4.156560088202866, "percentage": 59.38, "elapsed_time": "14:02:08", "remaining_time": "9:36:05"}
|
| 1509 |
+
{"current_steps": 7545, "total_steps": 12698, "loss": 0.1516, "lr": 1.693323220003512e-05, "epoch": 4.159316427783903, "percentage": 59.42, "elapsed_time": "14:02:21", "remaining_time": "9:35:17"}
|
| 1510 |
+
{"current_steps": 7550, "total_steps": 12698, "loss": 0.1489, "lr": 1.690606990295331e-05, "epoch": 4.16207276736494, "percentage": 59.46, "elapsed_time": "14:02:33", "remaining_time": "9:34:30"}
|
| 1511 |
+
{"current_steps": 7555, "total_steps": 12698, "loss": 0.139, "lr": 1.6878913451210715e-05, "epoch": 4.164829106945976, "percentage": 59.5, "elapsed_time": "14:02:46", "remaining_time": "9:33:42"}
|
| 1512 |
+
{"current_steps": 7560, "total_steps": 12698, "loss": 0.1431, "lr": 1.6851762896113827e-05, "epoch": 4.167585446527012, "percentage": 59.54, "elapsed_time": "14:02:59", "remaining_time": "9:32:55"}
|
| 1513 |
+
{"current_steps": 7565, "total_steps": 12698, "loss": 0.1508, "lr": 1.682461828895799e-05, "epoch": 4.1703417861080485, "percentage": 59.58, "elapsed_time": "14:03:11", "remaining_time": "9:32:07"}
|
| 1514 |
+
{"current_steps": 7570, "total_steps": 12698, "loss": 0.1344, "lr": 1.67974796810273e-05, "epoch": 4.173098125689085, "percentage": 59.62, "elapsed_time": "14:03:23", "remaining_time": "9:31:19"}
|
| 1515 |
+
{"current_steps": 7575, "total_steps": 12698, "loss": 0.1607, "lr": 1.6770347123594527e-05, "epoch": 4.175854465270121, "percentage": 59.66, "elapsed_time": "14:03:35", "remaining_time": "9:30:31"}
|
| 1516 |
+
{"current_steps": 7580, "total_steps": 12698, "loss": 0.1366, "lr": 1.674322066792102e-05, "epoch": 4.178610804851157, "percentage": 59.69, "elapsed_time": "14:03:47", "remaining_time": "9:29:43"}
|
| 1517 |
+
{"current_steps": 7585, "total_steps": 12698, "loss": 0.1458, "lr": 1.6716100365256593e-05, "epoch": 4.181367144432194, "percentage": 59.73, "elapsed_time": "14:04:00", "remaining_time": "9:28:56"}
|
| 1518 |
+
{"current_steps": 7590, "total_steps": 12698, "loss": 0.1421, "lr": 1.668898626683942e-05, "epoch": 4.184123484013231, "percentage": 59.77, "elapsed_time": "14:04:13", "remaining_time": "9:28:09"}
|
| 1519 |
+
{"current_steps": 7595, "total_steps": 12698, "loss": 0.1421, "lr": 1.6661878423895975e-05, "epoch": 4.186879823594267, "percentage": 59.81, "elapsed_time": "14:04:26", "remaining_time": "9:27:22"}
|
| 1520 |
+
{"current_steps": 7600, "total_steps": 12698, "loss": 0.1319, "lr": 1.6634776887640902e-05, "epoch": 4.189636163175303, "percentage": 59.85, "elapsed_time": "14:04:38", "remaining_time": "9:26:34"}
|
| 1521 |
+
{"current_steps": 7605, "total_steps": 12698, "loss": 0.1277, "lr": 1.6607681709276938e-05, "epoch": 4.19239250275634, "percentage": 59.89, "elapsed_time": "14:04:50", "remaining_time": "9:25:46"}
|
| 1522 |
+
{"current_steps": 7610, "total_steps": 12698, "loss": 0.1345, "lr": 1.6580592939994796e-05, "epoch": 4.195148842337376, "percentage": 59.93, "elapsed_time": "14:05:03", "remaining_time": "9:24:59"}
|
| 1523 |
+
{"current_steps": 7615, "total_steps": 12698, "loss": 0.1336, "lr": 1.655351063097309e-05, "epoch": 4.197905181918412, "percentage": 59.97, "elapsed_time": "14:05:15", "remaining_time": "9:24:12"}
|
| 1524 |
+
{"current_steps": 7620, "total_steps": 12698, "loss": 0.1409, "lr": 1.6526434833378232e-05, "epoch": 4.200661521499449, "percentage": 60.01, "elapsed_time": "14:05:30", "remaining_time": "9:23:26"}
|
| 1525 |
+
{"current_steps": 7625, "total_steps": 12698, "loss": 0.1389, "lr": 1.649936559836431e-05, "epoch": 4.203417861080485, "percentage": 60.05, "elapsed_time": "14:05:42", "remaining_time": "9:22:39"}
|
| 1526 |
+
{"current_steps": 7630, "total_steps": 12698, "loss": 0.1367, "lr": 1.6472302977073044e-05, "epoch": 4.206174200661522, "percentage": 60.09, "elapsed_time": "14:05:55", "remaining_time": "9:21:53"}
|
| 1527 |
+
{"current_steps": 7635, "total_steps": 12698, "loss": 0.1437, "lr": 1.644524702063364e-05, "epoch": 4.208930540242558, "percentage": 60.13, "elapsed_time": "14:06:10", "remaining_time": "9:21:07"}
|
| 1528 |
+
{"current_steps": 7640, "total_steps": 12698, "loss": 0.1427, "lr": 1.6418197780162718e-05, "epoch": 4.211686879823595, "percentage": 60.17, "elapsed_time": "14:06:26", "remaining_time": "9:20:22"}
|
| 1529 |
+
{"current_steps": 7645, "total_steps": 12698, "loss": 0.1367, "lr": 1.63911553067642e-05, "epoch": 4.214443219404631, "percentage": 60.21, "elapsed_time": "14:06:38", "remaining_time": "9:19:35"}
|
| 1530 |
+
{"current_steps": 7650, "total_steps": 12698, "loss": 0.1313, "lr": 1.6364119651529232e-05, "epoch": 4.2171995589856675, "percentage": 60.25, "elapsed_time": "14:06:50", "remaining_time": "9:18:48"}
|
| 1531 |
+
{"current_steps": 7655, "total_steps": 12698, "loss": 0.1341, "lr": 1.633709086553609e-05, "epoch": 4.219955898566703, "percentage": 60.29, "elapsed_time": "14:07:02", "remaining_time": "9:18:00"}
|
| 1532 |
+
{"current_steps": 7660, "total_steps": 12698, "loss": 0.1385, "lr": 1.6310068999850045e-05, "epoch": 4.22271223814774, "percentage": 60.32, "elapsed_time": "14:07:14", "remaining_time": "9:17:14"}
|
| 1533 |
+
{"current_steps": 7665, "total_steps": 12698, "loss": 0.1424, "lr": 1.6283054105523315e-05, "epoch": 4.225468577728776, "percentage": 60.36, "elapsed_time": "14:07:27", "remaining_time": "9:16:27"}
|
| 1534 |
+
{"current_steps": 7670, "total_steps": 12698, "loss": 0.1399, "lr": 1.6256046233594937e-05, "epoch": 4.228224917309813, "percentage": 60.4, "elapsed_time": "14:07:42", "remaining_time": "9:15:42"}
|
| 1535 |
+
{"current_steps": 7675, "total_steps": 12698, "loss": 0.135, "lr": 1.622904543509068e-05, "epoch": 4.230981256890849, "percentage": 60.44, "elapsed_time": "14:07:54", "remaining_time": "9:14:55"}
|
| 1536 |
+
{"current_steps": 7680, "total_steps": 12698, "loss": 0.1344, "lr": 1.620205176102296e-05, "epoch": 4.233737596471886, "percentage": 60.48, "elapsed_time": "14:08:06", "remaining_time": "9:14:08"}
|
| 1537 |
+
{"current_steps": 7685, "total_steps": 12698, "loss": 0.13, "lr": 1.6175065262390724e-05, "epoch": 4.236493936052922, "percentage": 60.52, "elapsed_time": "14:08:18", "remaining_time": "9:13:21"}
|
| 1538 |
+
{"current_steps": 7690, "total_steps": 12698, "loss": 0.1402, "lr": 1.614808599017936e-05, "epoch": 4.2392502756339585, "percentage": 60.56, "elapsed_time": "14:08:31", "remaining_time": "9:12:35"}
|
| 1539 |
+
{"current_steps": 7695, "total_steps": 12698, "loss": 0.1338, "lr": 1.612111399536061e-05, "epoch": 4.2420066152149944, "percentage": 60.6, "elapsed_time": "14:08:43", "remaining_time": "9:11:48"}
|
| 1540 |
+
{"current_steps": 7700, "total_steps": 12698, "loss": 0.1292, "lr": 1.609414932889246e-05, "epoch": 4.244762954796031, "percentage": 60.64, "elapsed_time": "14:08:55", "remaining_time": "9:11:01"}
|
| 1541 |
+
{"current_steps": 7705, "total_steps": 12698, "loss": 0.1204, "lr": 1.6067192041719065e-05, "epoch": 4.247519294377067, "percentage": 60.68, "elapsed_time": "14:09:06", "remaining_time": "9:10:14"}
|
| 1542 |
+
{"current_steps": 7710, "total_steps": 12698, "loss": 0.1379, "lr": 1.604024218477062e-05, "epoch": 4.250275633958104, "percentage": 60.72, "elapsed_time": "14:09:19", "remaining_time": "9:09:28"}
|
| 1543 |
+
{"current_steps": 7715, "total_steps": 12698, "loss": 0.1289, "lr": 1.601329980896329e-05, "epoch": 4.25303197353914, "percentage": 60.76, "elapsed_time": "14:09:31", "remaining_time": "9:08:41"}
|
| 1544 |
+
{"current_steps": 7720, "total_steps": 12698, "loss": 0.13, "lr": 1.59863649651991e-05, "epoch": 4.255788313120177, "percentage": 60.8, "elapsed_time": "14:09:43", "remaining_time": "9:07:54"}
|
| 1545 |
+
{"current_steps": 7725, "total_steps": 12698, "loss": 0.1277, "lr": 1.5959437704365866e-05, "epoch": 4.258544652701213, "percentage": 60.84, "elapsed_time": "14:09:56", "remaining_time": "9:07:09"}
|
| 1546 |
+
{"current_steps": 7730, "total_steps": 12698, "loss": 0.1364, "lr": 1.5932518077337055e-05, "epoch": 4.26130099228225, "percentage": 60.88, "elapsed_time": "14:10:08", "remaining_time": "9:06:22"}
|
| 1547 |
+
{"current_steps": 7735, "total_steps": 12698, "loss": 0.1309, "lr": 1.590560613497172e-05, "epoch": 4.2640573318632855, "percentage": 60.92, "elapsed_time": "14:10:20", "remaining_time": "9:05:36"}
|
| 1548 |
+
{"current_steps": 7740, "total_steps": 12698, "loss": 0.1322, "lr": 1.587870192811439e-05, "epoch": 4.266813671444322, "percentage": 60.95, "elapsed_time": "14:10:33", "remaining_time": "9:04:50"}
|
| 1549 |
+
{"current_steps": 7745, "total_steps": 12698, "loss": 0.1396, "lr": 1.5851805507594987e-05, "epoch": 4.269570011025358, "percentage": 60.99, "elapsed_time": "14:10:48", "remaining_time": "9:04:05"}
|