penfever commited on
Commit
32155db
·
verified ·
1 Parent(s): a2324dc

Training in progress, step 12000

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51807f07c6ca1089af2765dd935b562326cf6ebe5b48bee30125c0407a16d3a1
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8a431f35c93cc45c5f0626f1ed8782b0cf3fad52044b60e5f67d52ae99bc342
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e084c862f6467cda9ab4675e851eca3c6830e4b495a50b014cb54fe36b8976b0
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bce38ef8ebbd02fe3e6301409b57f5c5319ad601a7c471afe4a12da35690f851
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea3d4c31fc9b8091275d5603e130314ac9a87a01c732f9a0628c2cd80a35002d
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62ca25b44abd5febd786205accf5229dfb958a5675223cc32c61e0987ef56e5d
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:264226dba1a0f1d326344bc2e130cef29f83874ddbf2890aa081dbd17f079416
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45d5b56bb5879c220019e6ec1f2ad00759a02d2ca8a1b33d32f54b3a0e9b741c
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -2130,3 +2130,302 @@
2130
  {"current_steps": 10650, "total_steps": 12698, "loss": 0.0721, "lr": 3.0897968432135105e-06, "epoch": 5.871003307607497, "percentage": 83.87, "elapsed_time": "18:59:54", "remaining_time": "3:39:12"}
2131
  {"current_steps": 10655, "total_steps": 12698, "loss": 0.0814, "lr": 3.0751341141845794e-06, "epoch": 5.873759647188534, "percentage": 83.91, "elapsed_time": "19:00:47", "remaining_time": "3:38:44"}
2132
  {"current_steps": 10660, "total_steps": 12698, "loss": 0.0848, "lr": 3.060503361179423e-06, "epoch": 5.87651598676957, "percentage": 83.95, "elapsed_time": "19:01:11", "remaining_time": "3:38:10"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2130
  {"current_steps": 10650, "total_steps": 12698, "loss": 0.0721, "lr": 3.0897968432135105e-06, "epoch": 5.871003307607497, "percentage": 83.87, "elapsed_time": "18:59:54", "remaining_time": "3:39:12"}
2131
  {"current_steps": 10655, "total_steps": 12698, "loss": 0.0814, "lr": 3.0751341141845794e-06, "epoch": 5.873759647188534, "percentage": 83.91, "elapsed_time": "19:00:47", "remaining_time": "3:38:44"}
2132
  {"current_steps": 10660, "total_steps": 12698, "loss": 0.0848, "lr": 3.060503361179423e-06, "epoch": 5.87651598676957, "percentage": 83.95, "elapsed_time": "19:01:11", "remaining_time": "3:38:10"}
2133
+ {"current_steps": 10665, "total_steps": 12698, "loss": 0.075, "lr": 3.045904611839827e-06, "epoch": 5.879272326350606, "percentage": 83.99, "elapsed_time": "19:01:33", "remaining_time": "3:37:36"}
2134
+ {"current_steps": 10670, "total_steps": 12698, "loss": 0.0682, "lr": 3.031337893747095e-06, "epoch": 5.882028665931642, "percentage": 84.03, "elapsed_time": "19:01:58", "remaining_time": "3:37:03"}
2135
+ {"current_steps": 10675, "total_steps": 12698, "loss": 0.0845, "lr": 3.0168032344220165e-06, "epoch": 5.884785005512679, "percentage": 84.07, "elapsed_time": "19:02:34", "remaining_time": "3:36:31"}
2136
+ {"current_steps": 10680, "total_steps": 12698, "loss": 0.0593, "lr": 3.0023006613248217e-06, "epoch": 5.887541345093716, "percentage": 84.11, "elapsed_time": "19:02:56", "remaining_time": "3:35:57"}
2137
+ {"current_steps": 10685, "total_steps": 12698, "loss": 0.076, "lr": 2.9878302018551087e-06, "epoch": 5.890297684674752, "percentage": 84.15, "elapsed_time": "19:03:20", "remaining_time": "3:35:24"}
2138
+ {"current_steps": 10690, "total_steps": 12698, "loss": 0.0738, "lr": 2.9733918833518127e-06, "epoch": 5.893054024255788, "percentage": 84.19, "elapsed_time": "19:03:46", "remaining_time": "3:34:50"}
2139
+ {"current_steps": 10695, "total_steps": 12698, "loss": 0.0816, "lr": 2.9589857330931404e-06, "epoch": 5.895810363836825, "percentage": 84.23, "elapsed_time": "19:04:18", "remaining_time": "3:34:18"}
2140
+ {"current_steps": 10700, "total_steps": 12698, "loss": 0.0783, "lr": 2.9446117782965266e-06, "epoch": 5.8985667034178615, "percentage": 84.27, "elapsed_time": "19:04:52", "remaining_time": "3:33:46"}
2141
+ {"current_steps": 10705, "total_steps": 12698, "loss": 0.0748, "lr": 2.9302700461185707e-06, "epoch": 5.901323042998897, "percentage": 84.3, "elapsed_time": "19:05:12", "remaining_time": "3:33:12"}
2142
+ {"current_steps": 10710, "total_steps": 12698, "loss": 0.0747, "lr": 2.915960563655014e-06, "epoch": 5.904079382579933, "percentage": 84.34, "elapsed_time": "19:05:34", "remaining_time": "3:32:38"}
2143
+ {"current_steps": 10715, "total_steps": 12698, "loss": 0.094, "lr": 2.9016833579406455e-06, "epoch": 5.90683572216097, "percentage": 84.38, "elapsed_time": "19:06:13", "remaining_time": "3:32:07"}
2144
+ {"current_steps": 10720, "total_steps": 12698, "loss": 0.0752, "lr": 2.8874384559492897e-06, "epoch": 5.909592061742007, "percentage": 84.42, "elapsed_time": "19:06:38", "remaining_time": "3:31:34"}
2145
+ {"current_steps": 10725, "total_steps": 12698, "loss": 0.0649, "lr": 2.8732258845937313e-06, "epoch": 5.912348401323043, "percentage": 84.46, "elapsed_time": "19:07:00", "remaining_time": "3:31:00"}
2146
+ {"current_steps": 10730, "total_steps": 12698, "loss": 0.0845, "lr": 2.8590456707256776e-06, "epoch": 5.915104740904079, "percentage": 84.5, "elapsed_time": "19:07:32", "remaining_time": "3:30:28"}
2147
+ {"current_steps": 10735, "total_steps": 12698, "loss": 0.0795, "lr": 2.8448978411356987e-06, "epoch": 5.917861080485116, "percentage": 84.54, "elapsed_time": "19:08:06", "remaining_time": "3:29:56"}
2148
+ {"current_steps": 10740, "total_steps": 12698, "loss": 0.0625, "lr": 2.830782422553189e-06, "epoch": 5.9206174200661525, "percentage": 84.58, "elapsed_time": "19:08:32", "remaining_time": "3:29:23"}
2149
+ {"current_steps": 10745, "total_steps": 12698, "loss": 0.0738, "lr": 2.8166994416463023e-06, "epoch": 5.9233737596471885, "percentage": 84.62, "elapsed_time": "19:09:10", "remaining_time": "3:28:52"}
2150
+ {"current_steps": 10750, "total_steps": 12698, "loss": 0.0645, "lr": 2.802648925021907e-06, "epoch": 5.926130099228224, "percentage": 84.66, "elapsed_time": "19:09:38", "remaining_time": "3:28:19"}
2151
+ {"current_steps": 10755, "total_steps": 12698, "loss": 0.0599, "lr": 2.788630899225542e-06, "epoch": 5.928886438809261, "percentage": 84.7, "elapsed_time": "19:10:02", "remaining_time": "3:27:46"}
2152
+ {"current_steps": 10760, "total_steps": 12698, "loss": 0.0819, "lr": 2.7746453907413616e-06, "epoch": 5.931642778390298, "percentage": 84.74, "elapsed_time": "19:10:29", "remaining_time": "3:27:12"}
2153
+ {"current_steps": 10765, "total_steps": 12698, "loss": 0.0729, "lr": 2.760692425992084e-06, "epoch": 5.934399117971334, "percentage": 84.78, "elapsed_time": "19:11:01", "remaining_time": "3:26:40"}
2154
+ {"current_steps": 10770, "total_steps": 12698, "loss": 0.0879, "lr": 2.7467720313389402e-06, "epoch": 5.93715545755237, "percentage": 84.82, "elapsed_time": "19:11:29", "remaining_time": "3:26:08"}
2155
+ {"current_steps": 10775, "total_steps": 12698, "loss": 0.0809, "lr": 2.73288423308163e-06, "epoch": 5.939911797133407, "percentage": 84.86, "elapsed_time": "19:11:55", "remaining_time": "3:25:34"}
2156
+ {"current_steps": 10780, "total_steps": 12698, "loss": 0.0939, "lr": 2.7190290574582647e-06, "epoch": 5.942668136714444, "percentage": 84.9, "elapsed_time": "19:12:19", "remaining_time": "3:25:01"}
2157
+ {"current_steps": 10785, "total_steps": 12698, "loss": 0.0631, "lr": 2.705206530645328e-06, "epoch": 5.9454244762954795, "percentage": 84.93, "elapsed_time": "19:12:39", "remaining_time": "3:24:27"}
2158
+ {"current_steps": 10790, "total_steps": 12698, "loss": 0.0787, "lr": 2.6914166787576167e-06, "epoch": 5.948180815876516, "percentage": 84.97, "elapsed_time": "19:13:02", "remaining_time": "3:23:53"}
2159
+ {"current_steps": 10795, "total_steps": 12698, "loss": 0.0665, "lr": 2.6776595278481955e-06, "epoch": 5.950937155457552, "percentage": 85.01, "elapsed_time": "19:13:23", "remaining_time": "3:23:19"}
2160
+ {"current_steps": 10800, "total_steps": 12698, "loss": 0.097, "lr": 2.6639351039083437e-06, "epoch": 5.953693495038589, "percentage": 85.05, "elapsed_time": "19:13:56", "remaining_time": "3:22:47"}
2161
+ {"current_steps": 10805, "total_steps": 12698, "loss": 0.0918, "lr": 2.650243432867521e-06, "epoch": 5.956449834619625, "percentage": 85.09, "elapsed_time": "19:14:43", "remaining_time": "3:22:18"}
2162
+ {"current_steps": 10810, "total_steps": 12698, "loss": 0.0719, "lr": 2.636584540593299e-06, "epoch": 5.959206174200662, "percentage": 85.13, "elapsed_time": "19:15:07", "remaining_time": "3:21:44"}
2163
+ {"current_steps": 10815, "total_steps": 12698, "loss": 0.0703, "lr": 2.62295845289132e-06, "epoch": 5.961962513781698, "percentage": 85.17, "elapsed_time": "19:15:30", "remaining_time": "3:21:11"}
2164
+ {"current_steps": 10820, "total_steps": 12698, "loss": 0.0696, "lr": 2.6093651955052492e-06, "epoch": 5.964718853362735, "percentage": 85.21, "elapsed_time": "19:15:53", "remaining_time": "3:20:37"}
2165
+ {"current_steps": 10825, "total_steps": 12698, "loss": 0.0637, "lr": 2.5958047941167296e-06, "epoch": 5.967475192943771, "percentage": 85.25, "elapsed_time": "19:16:13", "remaining_time": "3:20:03"}
2166
+ {"current_steps": 10830, "total_steps": 12698, "loss": 0.0826, "lr": 2.582277274345324e-06, "epoch": 5.970231532524807, "percentage": 85.29, "elapsed_time": "19:16:34", "remaining_time": "3:19:29"}
2167
+ {"current_steps": 10835, "total_steps": 12698, "loss": 0.0629, "lr": 2.568782661748479e-06, "epoch": 5.972987872105843, "percentage": 85.33, "elapsed_time": "19:16:57", "remaining_time": "3:18:55"}
2168
+ {"current_steps": 10840, "total_steps": 12698, "loss": 0.0667, "lr": 2.5553209818214632e-06, "epoch": 5.97574421168688, "percentage": 85.37, "elapsed_time": "19:17:18", "remaining_time": "3:18:21"}
2169
+ {"current_steps": 10845, "total_steps": 12698, "loss": 0.0664, "lr": 2.541892259997332e-06, "epoch": 5.978500551267916, "percentage": 85.41, "elapsed_time": "19:17:44", "remaining_time": "3:17:48"}
2170
+ {"current_steps": 10850, "total_steps": 12698, "loss": 0.0764, "lr": 2.5284965216468617e-06, "epoch": 5.981256890848953, "percentage": 85.45, "elapsed_time": "19:18:18", "remaining_time": "3:17:17"}
2171
+ {"current_steps": 10855, "total_steps": 12698, "loss": 0.0624, "lr": 2.5151337920785323e-06, "epoch": 5.984013230429989, "percentage": 85.49, "elapsed_time": "19:18:48", "remaining_time": "3:16:44"}
2172
+ {"current_steps": 10860, "total_steps": 12698, "loss": 0.0676, "lr": 2.501804096538447e-06, "epoch": 5.986769570011026, "percentage": 85.53, "elapsed_time": "19:19:17", "remaining_time": "3:16:12"}
2173
+ {"current_steps": 10865, "total_steps": 12698, "loss": 0.0838, "lr": 2.4885074602102987e-06, "epoch": 5.989525909592062, "percentage": 85.56, "elapsed_time": "19:20:09", "remaining_time": "3:15:43"}
2174
+ {"current_steps": 10870, "total_steps": 12698, "loss": 0.1384, "lr": 2.4752439082153235e-06, "epoch": 5.9922822491730985, "percentage": 85.6, "elapsed_time": "19:21:03", "remaining_time": "3:15:15"}
2175
+ {"current_steps": 10875, "total_steps": 12698, "loss": 0.0683, "lr": 2.462013465612254e-06, "epoch": 5.995038588754134, "percentage": 85.64, "elapsed_time": "19:21:33", "remaining_time": "3:14:42"}
2176
+ {"current_steps": 10880, "total_steps": 12698, "loss": 0.0668, "lr": 2.4488161573972667e-06, "epoch": 5.997794928335171, "percentage": 85.68, "elapsed_time": "19:21:57", "remaining_time": "3:14:09"}
2177
+ {"current_steps": 10885, "total_steps": 12698, "loss": 0.121, "lr": 2.435652008503939e-06, "epoch": 6.000551267916207, "percentage": 85.72, "elapsed_time": "19:22:52", "remaining_time": "3:13:41"}
2178
+ {"current_steps": 10890, "total_steps": 12698, "loss": 0.1894, "lr": 2.422521043803199e-06, "epoch": 6.003307607497244, "percentage": 85.76, "elapsed_time": "19:24:06", "remaining_time": "3:13:16"}
2179
+ {"current_steps": 10895, "total_steps": 12698, "loss": 0.1723, "lr": 2.4094232881032787e-06, "epoch": 6.00606394707828, "percentage": 85.8, "elapsed_time": "19:25:15", "remaining_time": "3:12:50"}
2180
+ {"current_steps": 10900, "total_steps": 12698, "loss": 0.174, "lr": 2.3963587661496713e-06, "epoch": 6.008820286659317, "percentage": 85.84, "elapsed_time": "19:26:31", "remaining_time": "3:12:25"}
2181
+ {"current_steps": 10905, "total_steps": 12698, "loss": 0.1641, "lr": 2.383327502625088e-06, "epoch": 6.011576626240353, "percentage": 85.88, "elapsed_time": "19:27:49", "remaining_time": "3:12:00"}
2182
+ {"current_steps": 10910, "total_steps": 12698, "loss": 0.1673, "lr": 2.3703295221493926e-06, "epoch": 6.0143329658213895, "percentage": 85.92, "elapsed_time": "19:29:08", "remaining_time": "3:11:36"}
2183
+ {"current_steps": 10915, "total_steps": 12698, "loss": 0.1808, "lr": 2.3573648492795754e-06, "epoch": 6.0170893054024255, "percentage": 85.96, "elapsed_time": "19:30:24", "remaining_time": "3:11:11"}
2184
+ {"current_steps": 10920, "total_steps": 12698, "loss": 0.1752, "lr": 2.3444335085096957e-06, "epoch": 6.019845644983462, "percentage": 86.0, "elapsed_time": "19:31:40", "remaining_time": "3:10:46"}
2185
+ {"current_steps": 10925, "total_steps": 12698, "loss": 0.1643, "lr": 2.33153552427084e-06, "epoch": 6.022601984564498, "percentage": 86.04, "elapsed_time": "19:32:52", "remaining_time": "3:10:20"}
2186
+ {"current_steps": 10930, "total_steps": 12698, "loss": 0.1525, "lr": 2.318670920931074e-06, "epoch": 6.025358324145535, "percentage": 86.08, "elapsed_time": "19:33:50", "remaining_time": "3:09:52"}
2187
+ {"current_steps": 10935, "total_steps": 12698, "loss": 0.1569, "lr": 2.3058397227954e-06, "epoch": 6.028114663726571, "percentage": 86.12, "elapsed_time": "19:35:03", "remaining_time": "3:09:27"}
2188
+ {"current_steps": 10940, "total_steps": 12698, "loss": 0.1653, "lr": 2.2930419541057015e-06, "epoch": 6.030871003307608, "percentage": 86.16, "elapsed_time": "19:36:15", "remaining_time": "3:09:01"}
2189
+ {"current_steps": 10945, "total_steps": 12698, "loss": 0.1617, "lr": 2.2802776390407087e-06, "epoch": 6.033627342888644, "percentage": 86.19, "elapsed_time": "19:37:24", "remaining_time": "3:08:34"}
2190
+ {"current_steps": 10950, "total_steps": 12698, "loss": 0.1616, "lr": 2.2675468017159518e-06, "epoch": 6.036383682469681, "percentage": 86.23, "elapsed_time": "19:38:32", "remaining_time": "3:08:08"}
2191
+ {"current_steps": 10955, "total_steps": 12698, "loss": 0.1544, "lr": 2.2548494661837063e-06, "epoch": 6.0391400220507165, "percentage": 86.27, "elapsed_time": "19:39:42", "remaining_time": "3:07:41"}
2192
+ {"current_steps": 10960, "total_steps": 12698, "loss": 0.16, "lr": 2.2421856564329515e-06, "epoch": 6.041896361631753, "percentage": 86.31, "elapsed_time": "19:40:49", "remaining_time": "3:07:15"}
2193
+ {"current_steps": 10965, "total_steps": 12698, "loss": 0.1616, "lr": 2.2295553963893313e-06, "epoch": 6.044652701212789, "percentage": 86.35, "elapsed_time": "19:41:57", "remaining_time": "3:06:48"}
2194
+ {"current_steps": 10970, "total_steps": 12698, "loss": 0.157, "lr": 2.2169587099151002e-06, "epoch": 6.047409040793826, "percentage": 86.39, "elapsed_time": "19:43:11", "remaining_time": "3:06:22"}
2195
+ {"current_steps": 10975, "total_steps": 12698, "loss": 0.1676, "lr": 2.204395620809088e-06, "epoch": 6.050165380374862, "percentage": 86.43, "elapsed_time": "19:44:23", "remaining_time": "3:05:56"}
2196
+ {"current_steps": 10980, "total_steps": 12698, "loss": 0.1854, "lr": 2.191866152806643e-06, "epoch": 6.052921719955899, "percentage": 86.47, "elapsed_time": "19:45:32", "remaining_time": "3:05:29"}
2197
+ {"current_steps": 10985, "total_steps": 12698, "loss": 0.1291, "lr": 2.1793703295795998e-06, "epoch": 6.055678059536935, "percentage": 86.51, "elapsed_time": "19:46:32", "remaining_time": "3:05:01"}
2198
+ {"current_steps": 10990, "total_steps": 12698, "loss": 0.1532, "lr": 2.1669081747362196e-06, "epoch": 6.058434399117972, "percentage": 86.55, "elapsed_time": "19:47:44", "remaining_time": "3:04:35"}
2199
+ {"current_steps": 10995, "total_steps": 12698, "loss": 0.1581, "lr": 2.1544797118211604e-06, "epoch": 6.061190738699008, "percentage": 86.59, "elapsed_time": "19:48:56", "remaining_time": "3:04:09"}
2200
+ {"current_steps": 11000, "total_steps": 12698, "loss": 0.1646, "lr": 2.1420849643154294e-06, "epoch": 6.063947078280044, "percentage": 86.63, "elapsed_time": "19:50:03", "remaining_time": "3:03:42"}
2201
+ {"current_steps": 11005, "total_steps": 12698, "loss": 0.1597, "lr": 2.129723955636329e-06, "epoch": 6.06670341786108, "percentage": 86.67, "elapsed_time": "19:51:19", "remaining_time": "3:03:16"}
2202
+ {"current_steps": 11010, "total_steps": 12698, "loss": 0.1593, "lr": 2.1173967091374227e-06, "epoch": 6.069459757442117, "percentage": 86.71, "elapsed_time": "19:52:36", "remaining_time": "3:02:50"}
2203
+ {"current_steps": 11015, "total_steps": 12698, "loss": 0.1397, "lr": 2.105103248108482e-06, "epoch": 6.072216097023153, "percentage": 86.75, "elapsed_time": "19:53:52", "remaining_time": "3:02:24"}
2204
+ {"current_steps": 11020, "total_steps": 12698, "loss": 0.1413, "lr": 2.0928435957754557e-06, "epoch": 6.07497243660419, "percentage": 86.79, "elapsed_time": "19:55:07", "remaining_time": "3:01:58"}
2205
+ {"current_steps": 11025, "total_steps": 12698, "loss": 0.1469, "lr": 2.080617775300413e-06, "epoch": 6.077728776185226, "percentage": 86.82, "elapsed_time": "19:56:22", "remaining_time": "3:01:32"}
2206
+ {"current_steps": 11030, "total_steps": 12698, "loss": 0.1426, "lr": 2.0684258097815047e-06, "epoch": 6.080485115766263, "percentage": 86.86, "elapsed_time": "19:57:11", "remaining_time": "3:01:02"}
2207
+ {"current_steps": 11035, "total_steps": 12698, "loss": 0.1636, "lr": 2.0562677222529204e-06, "epoch": 6.083241455347299, "percentage": 86.9, "elapsed_time": "19:58:19", "remaining_time": "3:00:35"}
2208
+ {"current_steps": 11040, "total_steps": 12698, "loss": 0.1704, "lr": 2.0441435356848436e-06, "epoch": 6.0859977949283355, "percentage": 86.94, "elapsed_time": "19:59:30", "remaining_time": "3:00:08"}
2209
+ {"current_steps": 11045, "total_steps": 12698, "loss": 0.1668, "lr": 2.0320532729834187e-06, "epoch": 6.088754134509371, "percentage": 86.98, "elapsed_time": "20:00:41", "remaining_time": "2:59:41"}
2210
+ {"current_steps": 11050, "total_steps": 12698, "loss": 0.165, "lr": 2.019996956990682e-06, "epoch": 6.091510474090408, "percentage": 87.02, "elapsed_time": "20:01:53", "remaining_time": "2:59:14"}
2211
+ {"current_steps": 11055, "total_steps": 12698, "loss": 0.1589, "lr": 2.0079746104845445e-06, "epoch": 6.094266813671444, "percentage": 87.06, "elapsed_time": "20:03:11", "remaining_time": "2:58:49"}
2212
+ {"current_steps": 11060, "total_steps": 12698, "loss": 0.1647, "lr": 1.9959862561787347e-06, "epoch": 6.097023153252481, "percentage": 87.1, "elapsed_time": "20:04:26", "remaining_time": "2:58:22"}
2213
+ {"current_steps": 11065, "total_steps": 12698, "loss": 0.1596, "lr": 1.984031916722762e-06, "epoch": 6.099779492833517, "percentage": 87.14, "elapsed_time": "20:05:42", "remaining_time": "2:57:56"}
2214
+ {"current_steps": 11070, "total_steps": 12698, "loss": 0.1685, "lr": 1.972111614701873e-06, "epoch": 6.102535832414554, "percentage": 87.18, "elapsed_time": "20:06:59", "remaining_time": "2:57:30"}
2215
+ {"current_steps": 11075, "total_steps": 12698, "loss": 0.1629, "lr": 1.9602253726370056e-06, "epoch": 6.10529217199559, "percentage": 87.22, "elapsed_time": "20:08:16", "remaining_time": "2:57:04"}
2216
+ {"current_steps": 11080, "total_steps": 12698, "loss": 0.1634, "lr": 1.9483732129847466e-06, "epoch": 6.1080485115766265, "percentage": 87.26, "elapsed_time": "20:09:29", "remaining_time": "2:56:37"}
2217
+ {"current_steps": 11085, "total_steps": 12698, "loss": 0.1615, "lr": 1.9365551581372964e-06, "epoch": 6.1108048511576625, "percentage": 87.3, "elapsed_time": "20:10:36", "remaining_time": "2:56:09"}
2218
+ {"current_steps": 11090, "total_steps": 12698, "loss": 0.1537, "lr": 1.924771230422413e-06, "epoch": 6.113561190738699, "percentage": 87.34, "elapsed_time": "20:11:42", "remaining_time": "2:55:41"}
2219
+ {"current_steps": 11095, "total_steps": 12698, "loss": 0.1315, "lr": 1.913021452103392e-06, "epoch": 6.116317530319735, "percentage": 87.38, "elapsed_time": "20:12:29", "remaining_time": "2:55:10"}
2220
+ {"current_steps": 11100, "total_steps": 12698, "loss": 0.1579, "lr": 1.901305845378998e-06, "epoch": 6.119073869900772, "percentage": 87.42, "elapsed_time": "20:13:42", "remaining_time": "2:54:43"}
2221
+ {"current_steps": 11105, "total_steps": 12698, "loss": 0.1578, "lr": 1.8896244323834412e-06, "epoch": 6.121830209481808, "percentage": 87.45, "elapsed_time": "20:14:51", "remaining_time": "2:54:16"}
2222
+ {"current_steps": 11110, "total_steps": 12698, "loss": 0.1602, "lr": 1.877977235186328e-06, "epoch": 6.124586549062845, "percentage": 87.49, "elapsed_time": "20:16:07", "remaining_time": "2:53:49"}
2223
+ {"current_steps": 11115, "total_steps": 12698, "loss": 0.1576, "lr": 1.8663642757926227e-06, "epoch": 6.127342888643881, "percentage": 87.53, "elapsed_time": "20:17:21", "remaining_time": "2:53:22"}
2224
+ {"current_steps": 11120, "total_steps": 12698, "loss": 0.1613, "lr": 1.8547855761426014e-06, "epoch": 6.130099228224918, "percentage": 87.57, "elapsed_time": "20:18:40", "remaining_time": "2:52:56"}
2225
+ {"current_steps": 11125, "total_steps": 12698, "loss": 0.1614, "lr": 1.843241158111817e-06, "epoch": 6.1328555678059535, "percentage": 87.61, "elapsed_time": "20:19:51", "remaining_time": "2:52:28"}
2226
+ {"current_steps": 11130, "total_steps": 12698, "loss": 0.1222, "lr": 1.8317310435110535e-06, "epoch": 6.13561190738699, "percentage": 87.65, "elapsed_time": "20:20:39", "remaining_time": "2:51:58"}
2227
+ {"current_steps": 11135, "total_steps": 12698, "loss": 0.1545, "lr": 1.820255254086285e-06, "epoch": 6.138368246968026, "percentage": 87.69, "elapsed_time": "20:21:40", "remaining_time": "2:51:29"}
2228
+ {"current_steps": 11140, "total_steps": 12698, "loss": 0.1561, "lr": 1.8088138115186304e-06, "epoch": 6.141124586549063, "percentage": 87.73, "elapsed_time": "20:22:52", "remaining_time": "2:51:01"}
2229
+ {"current_steps": 11145, "total_steps": 12698, "loss": 0.161, "lr": 1.7974067374243298e-06, "epoch": 6.143880926130099, "percentage": 87.77, "elapsed_time": "20:24:04", "remaining_time": "2:50:34"}
2230
+ {"current_steps": 11150, "total_steps": 12698, "loss": 0.1534, "lr": 1.786034053354684e-06, "epoch": 6.146637265711136, "percentage": 87.81, "elapsed_time": "20:25:10", "remaining_time": "2:50:05"}
2231
+ {"current_steps": 11155, "total_steps": 12698, "loss": 0.1503, "lr": 1.7746957807960141e-06, "epoch": 6.149393605292172, "percentage": 87.85, "elapsed_time": "20:26:19", "remaining_time": "2:49:37"}
2232
+ {"current_steps": 11160, "total_steps": 12698, "loss": 0.1579, "lr": 1.763391941169641e-06, "epoch": 6.152149944873209, "percentage": 87.89, "elapsed_time": "20:27:37", "remaining_time": "2:49:11"}
2233
+ {"current_steps": 11165, "total_steps": 12698, "loss": 0.1463, "lr": 1.7521225558318212e-06, "epoch": 6.154906284454245, "percentage": 87.93, "elapsed_time": "20:28:13", "remaining_time": "2:48:38"}
2234
+ {"current_steps": 11170, "total_steps": 12698, "loss": 0.1334, "lr": 1.7408876460737234e-06, "epoch": 6.157662624035281, "percentage": 87.97, "elapsed_time": "20:28:25", "remaining_time": "2:48:02"}
2235
+ {"current_steps": 11175, "total_steps": 12698, "loss": 0.1262, "lr": 1.7296872331213776e-06, "epoch": 6.160418963616317, "percentage": 88.01, "elapsed_time": "20:28:38", "remaining_time": "2:47:26"}
2236
+ {"current_steps": 11180, "total_steps": 12698, "loss": 0.1205, "lr": 1.7185213381356414e-06, "epoch": 6.163175303197354, "percentage": 88.05, "elapsed_time": "20:28:50", "remaining_time": "2:46:50"}
2237
+ {"current_steps": 11185, "total_steps": 12698, "loss": 0.1225, "lr": 1.7073899822121532e-06, "epoch": 6.16593164277839, "percentage": 88.08, "elapsed_time": "20:29:04", "remaining_time": "2:46:15"}
2238
+ {"current_steps": 11190, "total_steps": 12698, "loss": 0.1168, "lr": 1.6962931863813103e-06, "epoch": 6.168687982359427, "percentage": 88.12, "elapsed_time": "20:29:15", "remaining_time": "2:45:39"}
2239
+ {"current_steps": 11195, "total_steps": 12698, "loss": 0.1228, "lr": 1.6852309716082027e-06, "epoch": 6.171444321940463, "percentage": 88.16, "elapsed_time": "20:29:28", "remaining_time": "2:45:03"}
2240
+ {"current_steps": 11200, "total_steps": 12698, "loss": 0.1097, "lr": 1.6742033587925921e-06, "epoch": 6.1742006615215, "percentage": 88.2, "elapsed_time": "20:29:40", "remaining_time": "2:44:28"}
2241
+ {"current_steps": 11205, "total_steps": 12698, "loss": 0.1331, "lr": 1.6632103687688617e-06, "epoch": 6.176957001102536, "percentage": 88.24, "elapsed_time": "20:29:51", "remaining_time": "2:43:52"}
2242
+ {"current_steps": 11210, "total_steps": 12698, "loss": 0.124, "lr": 1.652252022305989e-06, "epoch": 6.1797133406835725, "percentage": 88.28, "elapsed_time": "20:30:04", "remaining_time": "2:43:16"}
2243
+ {"current_steps": 11215, "total_steps": 12698, "loss": 0.1114, "lr": 1.6413283401074975e-06, "epoch": 6.182469680264608, "percentage": 88.32, "elapsed_time": "20:30:17", "remaining_time": "2:42:41"}
2244
+ {"current_steps": 11220, "total_steps": 12698, "loss": 0.1145, "lr": 1.6304393428114185e-06, "epoch": 6.185226019845645, "percentage": 88.36, "elapsed_time": "20:30:30", "remaining_time": "2:42:05"}
2245
+ {"current_steps": 11225, "total_steps": 12698, "loss": 0.1162, "lr": 1.6195850509902534e-06, "epoch": 6.187982359426681, "percentage": 88.4, "elapsed_time": "20:30:42", "remaining_time": "2:41:30"}
2246
+ {"current_steps": 11230, "total_steps": 12698, "loss": 0.1017, "lr": 1.6087654851509339e-06, "epoch": 6.190738699007718, "percentage": 88.44, "elapsed_time": "20:30:54", "remaining_time": "2:40:54"}
2247
+ {"current_steps": 11235, "total_steps": 12698, "loss": 0.1026, "lr": 1.597980665734784e-06, "epoch": 6.193495038588754, "percentage": 88.48, "elapsed_time": "20:31:06", "remaining_time": "2:40:18"}
2248
+ {"current_steps": 11240, "total_steps": 12698, "loss": 0.106, "lr": 1.5872306131174896e-06, "epoch": 6.196251378169791, "percentage": 88.52, "elapsed_time": "20:31:19", "remaining_time": "2:39:43"}
2249
+ {"current_steps": 11245, "total_steps": 12698, "loss": 0.1143, "lr": 1.5765153476090444e-06, "epoch": 6.199007717750827, "percentage": 88.56, "elapsed_time": "20:31:32", "remaining_time": "2:39:07"}
2250
+ {"current_steps": 11250, "total_steps": 12698, "loss": 0.1179, "lr": 1.5658348894537167e-06, "epoch": 6.2017640573318635, "percentage": 88.6, "elapsed_time": "20:31:46", "remaining_time": "2:38:32"}
2251
+ {"current_steps": 11255, "total_steps": 12698, "loss": 0.1043, "lr": 1.5551892588300188e-06, "epoch": 6.2045203969128995, "percentage": 88.64, "elapsed_time": "20:31:58", "remaining_time": "2:37:57"}
2252
+ {"current_steps": 11260, "total_steps": 12698, "loss": 0.1159, "lr": 1.5445784758506599e-06, "epoch": 6.207276736493936, "percentage": 88.68, "elapsed_time": "20:32:12", "remaining_time": "2:37:21"}
2253
+ {"current_steps": 11265, "total_steps": 12698, "loss": 0.115, "lr": 1.5340025605625152e-06, "epoch": 6.210033076074972, "percentage": 88.71, "elapsed_time": "20:32:26", "remaining_time": "2:36:46"}
2254
+ {"current_steps": 11270, "total_steps": 12698, "loss": 0.1136, "lr": 1.523461532946584e-06, "epoch": 6.212789415656009, "percentage": 88.75, "elapsed_time": "20:32:42", "remaining_time": "2:36:11"}
2255
+ {"current_steps": 11275, "total_steps": 12698, "loss": 0.1084, "lr": 1.5129554129179514e-06, "epoch": 6.215545755237045, "percentage": 88.79, "elapsed_time": "20:32:54", "remaining_time": "2:35:36"}
2256
+ {"current_steps": 11280, "total_steps": 12698, "loss": 0.1056, "lr": 1.5024842203257506e-06, "epoch": 6.218302094818082, "percentage": 88.83, "elapsed_time": "20:33:06", "remaining_time": "2:35:00"}
2257
+ {"current_steps": 11285, "total_steps": 12698, "loss": 0.1076, "lr": 1.4920479749531302e-06, "epoch": 6.221058434399118, "percentage": 88.87, "elapsed_time": "20:33:18", "remaining_time": "2:34:25"}
2258
+ {"current_steps": 11290, "total_steps": 12698, "loss": 0.1142, "lr": 1.4816466965172094e-06, "epoch": 6.223814773980155, "percentage": 88.91, "elapsed_time": "20:33:31", "remaining_time": "2:33:50"}
2259
+ {"current_steps": 11295, "total_steps": 12698, "loss": 0.1145, "lr": 1.4712804046690466e-06, "epoch": 6.2265711135611905, "percentage": 88.95, "elapsed_time": "20:33:43", "remaining_time": "2:33:14"}
2260
+ {"current_steps": 11300, "total_steps": 12698, "loss": 0.1152, "lr": 1.460949118993602e-06, "epoch": 6.229327453142227, "percentage": 88.99, "elapsed_time": "20:33:58", "remaining_time": "2:32:39"}
2261
+ {"current_steps": 11305, "total_steps": 12698, "loss": 0.1061, "lr": 1.4506528590096957e-06, "epoch": 6.232083792723263, "percentage": 89.03, "elapsed_time": "20:34:11", "remaining_time": "2:32:04"}
2262
+ {"current_steps": 11310, "total_steps": 12698, "loss": 0.1098, "lr": 1.4403916441699762e-06, "epoch": 6.2348401323043, "percentage": 89.07, "elapsed_time": "20:34:23", "remaining_time": "2:31:29"}
2263
+ {"current_steps": 11315, "total_steps": 12698, "loss": 0.1059, "lr": 1.43016549386088e-06, "epoch": 6.237596471885336, "percentage": 89.11, "elapsed_time": "20:34:35", "remaining_time": "2:30:54"}
2264
+ {"current_steps": 11320, "total_steps": 12698, "loss": 0.1106, "lr": 1.419974427402595e-06, "epoch": 6.240352811466373, "percentage": 89.15, "elapsed_time": "20:34:47", "remaining_time": "2:30:18"}
2265
+ {"current_steps": 11325, "total_steps": 12698, "loss": 0.1061, "lr": 1.4098184640490331e-06, "epoch": 6.243109151047409, "percentage": 89.19, "elapsed_time": "20:35:00", "remaining_time": "2:29:43"}
2266
+ {"current_steps": 11330, "total_steps": 12698, "loss": 0.1021, "lr": 1.3996976229877768e-06, "epoch": 6.245865490628446, "percentage": 89.23, "elapsed_time": "20:35:11", "remaining_time": "2:29:08"}
2267
+ {"current_steps": 11335, "total_steps": 12698, "loss": 0.0981, "lr": 1.3896119233400595e-06, "epoch": 6.248621830209482, "percentage": 89.27, "elapsed_time": "20:35:23", "remaining_time": "2:28:33"}
2268
+ {"current_steps": 11340, "total_steps": 12698, "loss": 0.1062, "lr": 1.3795613841607148e-06, "epoch": 6.251378169790518, "percentage": 89.31, "elapsed_time": "20:35:36", "remaining_time": "2:27:58"}
2269
+ {"current_steps": 11345, "total_steps": 12698, "loss": 0.1047, "lr": 1.369546024438153e-06, "epoch": 6.254134509371554, "percentage": 89.34, "elapsed_time": "20:35:48", "remaining_time": "2:27:22"}
2270
+ {"current_steps": 11350, "total_steps": 12698, "loss": 0.0986, "lr": 1.3595658630943186e-06, "epoch": 6.256890848952591, "percentage": 89.38, "elapsed_time": "20:36:00", "remaining_time": "2:26:47"}
2271
+ {"current_steps": 11355, "total_steps": 12698, "loss": 0.1064, "lr": 1.34962091898466e-06, "epoch": 6.259647188533627, "percentage": 89.42, "elapsed_time": "20:36:12", "remaining_time": "2:26:12"}
2272
+ {"current_steps": 11360, "total_steps": 12698, "loss": 0.1105, "lr": 1.3397112108980826e-06, "epoch": 6.262403528114664, "percentage": 89.46, "elapsed_time": "20:36:24", "remaining_time": "2:25:37"}
2273
+ {"current_steps": 11365, "total_steps": 12698, "loss": 0.1014, "lr": 1.329836757556926e-06, "epoch": 6.2651598676957, "percentage": 89.5, "elapsed_time": "20:36:36", "remaining_time": "2:25:02"}
2274
+ {"current_steps": 11370, "total_steps": 12698, "loss": 0.1089, "lr": 1.3199975776169183e-06, "epoch": 6.267916207276737, "percentage": 89.54, "elapsed_time": "20:36:50", "remaining_time": "2:24:27"}
2275
+ {"current_steps": 11375, "total_steps": 12698, "loss": 0.1127, "lr": 1.3101936896671562e-06, "epoch": 6.270672546857773, "percentage": 89.58, "elapsed_time": "20:37:05", "remaining_time": "2:23:52"}
2276
+ {"current_steps": 11380, "total_steps": 12698, "loss": 0.1146, "lr": 1.3004251122300481e-06, "epoch": 6.2734288864388095, "percentage": 89.62, "elapsed_time": "20:37:18", "remaining_time": "2:23:18"}
2277
+ {"current_steps": 11385, "total_steps": 12698, "loss": 0.101, "lr": 1.2906918637612975e-06, "epoch": 6.276185226019845, "percentage": 89.66, "elapsed_time": "20:37:31", "remaining_time": "2:22:43"}
2278
+ {"current_steps": 11390, "total_steps": 12698, "loss": 0.1068, "lr": 1.2809939626498547e-06, "epoch": 6.278941565600882, "percentage": 89.7, "elapsed_time": "20:37:43", "remaining_time": "2:22:08"}
2279
+ {"current_steps": 11395, "total_steps": 12698, "loss": 0.1053, "lr": 1.2713314272178967e-06, "epoch": 6.281697905181918, "percentage": 89.74, "elapsed_time": "20:37:55", "remaining_time": "2:21:33"}
2280
+ {"current_steps": 11400, "total_steps": 12698, "loss": 0.0962, "lr": 1.2617042757207787e-06, "epoch": 6.284454244762955, "percentage": 89.78, "elapsed_time": "20:38:07", "remaining_time": "2:20:58"}
2281
+ {"current_steps": 11405, "total_steps": 12698, "loss": 0.1037, "lr": 1.2521125263470046e-06, "epoch": 6.287210584343991, "percentage": 89.82, "elapsed_time": "20:38:19", "remaining_time": "2:20:23"}
2282
+ {"current_steps": 11410, "total_steps": 12698, "loss": 0.1061, "lr": 1.2425561972181987e-06, "epoch": 6.289966923925028, "percentage": 89.86, "elapsed_time": "20:38:32", "remaining_time": "2:19:48"}
2283
+ {"current_steps": 11415, "total_steps": 12698, "loss": 0.1027, "lr": 1.2330353063890588e-06, "epoch": 6.292723263506064, "percentage": 89.9, "elapsed_time": "20:38:44", "remaining_time": "2:19:13"}
2284
+ {"current_steps": 11420, "total_steps": 12698, "loss": 0.1086, "lr": 1.223549871847336e-06, "epoch": 6.2954796030871005, "percentage": 89.94, "elapsed_time": "20:38:57", "remaining_time": "2:18:38"}
2285
+ {"current_steps": 11425, "total_steps": 12698, "loss": 0.1006, "lr": 1.2140999115137953e-06, "epoch": 6.2982359426681365, "percentage": 89.97, "elapsed_time": "20:39:10", "remaining_time": "2:18:04"}
2286
+ {"current_steps": 11430, "total_steps": 12698, "loss": 0.1043, "lr": 1.2046854432421706e-06, "epoch": 6.300992282249173, "percentage": 90.01, "elapsed_time": "20:39:22", "remaining_time": "2:17:29"}
2287
+ {"current_steps": 11435, "total_steps": 12698, "loss": 0.1063, "lr": 1.1953064848191497e-06, "epoch": 6.303748621830209, "percentage": 90.05, "elapsed_time": "20:39:35", "remaining_time": "2:16:54"}
2288
+ {"current_steps": 11440, "total_steps": 12698, "loss": 0.1075, "lr": 1.1859630539643297e-06, "epoch": 6.306504961411246, "percentage": 90.09, "elapsed_time": "20:39:47", "remaining_time": "2:16:20"}
2289
+ {"current_steps": 11445, "total_steps": 12698, "loss": 0.1083, "lr": 1.176655168330183e-06, "epoch": 6.309261300992282, "percentage": 90.13, "elapsed_time": "20:40:00", "remaining_time": "2:15:45"}
2290
+ {"current_steps": 11450, "total_steps": 12698, "loss": 0.0985, "lr": 1.167382845502032e-06, "epoch": 6.312017640573319, "percentage": 90.17, "elapsed_time": "20:40:12", "remaining_time": "2:15:10"}
2291
+ {"current_steps": 11455, "total_steps": 12698, "loss": 0.108, "lr": 1.1581461029980078e-06, "epoch": 6.314773980154355, "percentage": 90.21, "elapsed_time": "20:40:25", "remaining_time": "2:14:36"}
2292
+ {"current_steps": 11460, "total_steps": 12698, "loss": 0.1128, "lr": 1.148944958269016e-06, "epoch": 6.317530319735392, "percentage": 90.25, "elapsed_time": "20:40:39", "remaining_time": "2:14:01"}
2293
+ {"current_steps": 11465, "total_steps": 12698, "loss": 0.1004, "lr": 1.1397794286987107e-06, "epoch": 6.3202866593164275, "percentage": 90.29, "elapsed_time": "20:40:51", "remaining_time": "2:13:26"}
2294
+ {"current_steps": 11470, "total_steps": 12698, "loss": 0.1028, "lr": 1.1306495316034648e-06, "epoch": 6.323042998897464, "percentage": 90.33, "elapsed_time": "20:41:02", "remaining_time": "2:12:52"}
2295
+ {"current_steps": 11475, "total_steps": 12698, "loss": 0.1073, "lr": 1.1215552842323208e-06, "epoch": 6.3257993384785, "percentage": 90.37, "elapsed_time": "20:41:15", "remaining_time": "2:12:17"}
2296
+ {"current_steps": 11480, "total_steps": 12698, "loss": 0.1095, "lr": 1.1124967037669764e-06, "epoch": 6.328555678059537, "percentage": 90.41, "elapsed_time": "20:41:27", "remaining_time": "2:11:42"}
2297
+ {"current_steps": 11485, "total_steps": 12698, "loss": 0.109, "lr": 1.1034738073217356e-06, "epoch": 6.331312017640573, "percentage": 90.45, "elapsed_time": "20:41:39", "remaining_time": "2:11:08"}
2298
+ {"current_steps": 11490, "total_steps": 12698, "loss": 0.1018, "lr": 1.0944866119434948e-06, "epoch": 6.33406835722161, "percentage": 90.49, "elapsed_time": "20:41:51", "remaining_time": "2:10:33"}
2299
+ {"current_steps": 11495, "total_steps": 12698, "loss": 0.1099, "lr": 1.0855351346116927e-06, "epoch": 6.336824696802646, "percentage": 90.53, "elapsed_time": "20:42:04", "remaining_time": "2:09:59"}
2300
+ {"current_steps": 11500, "total_steps": 12698, "loss": 0.1021, "lr": 1.0766193922382895e-06, "epoch": 6.339581036383683, "percentage": 90.57, "elapsed_time": "20:42:16", "remaining_time": "2:09:24"}
2301
+ {"current_steps": 11505, "total_steps": 12698, "loss": 0.1104, "lr": 1.0677394016677333e-06, "epoch": 6.342337375964719, "percentage": 90.6, "elapsed_time": "20:42:28", "remaining_time": "2:08:50"}
2302
+ {"current_steps": 11510, "total_steps": 12698, "loss": 0.1157, "lr": 1.058895179676922e-06, "epoch": 6.345093715545755, "percentage": 90.64, "elapsed_time": "20:42:44", "remaining_time": "2:08:16"}
2303
+ {"current_steps": 11515, "total_steps": 12698, "loss": 0.1087, "lr": 1.050086742975176e-06, "epoch": 6.347850055126791, "percentage": 90.68, "elapsed_time": "20:42:56", "remaining_time": "2:07:41"}
2304
+ {"current_steps": 11520, "total_steps": 12698, "loss": 0.1031, "lr": 1.0413141082042167e-06, "epoch": 6.350606394707828, "percentage": 90.72, "elapsed_time": "20:43:07", "remaining_time": "2:07:07"}
2305
+ {"current_steps": 11525, "total_steps": 12698, "loss": 0.1038, "lr": 1.0325772919381127e-06, "epoch": 6.353362734288864, "percentage": 90.76, "elapsed_time": "20:43:20", "remaining_time": "2:06:32"}
2306
+ {"current_steps": 11530, "total_steps": 12698, "loss": 0.1057, "lr": 1.0238763106832694e-06, "epoch": 6.356119073869901, "percentage": 90.8, "elapsed_time": "20:43:32", "remaining_time": "2:05:58"}
2307
+ {"current_steps": 11535, "total_steps": 12698, "loss": 0.103, "lr": 1.015211180878386e-06, "epoch": 6.358875413450937, "percentage": 90.84, "elapsed_time": "20:43:44", "remaining_time": "2:05:23"}
2308
+ {"current_steps": 11540, "total_steps": 12698, "loss": 0.0984, "lr": 1.0065819188944247e-06, "epoch": 6.361631753031974, "percentage": 90.88, "elapsed_time": "20:43:56", "remaining_time": "2:04:49"}
2309
+ {"current_steps": 11545, "total_steps": 12698, "loss": 0.1061, "lr": 9.97988541034589e-07, "epoch": 6.36438809261301, "percentage": 90.92, "elapsed_time": "20:44:09", "remaining_time": "2:04:15"}
2310
+ {"current_steps": 11550, "total_steps": 12698, "loss": 0.1145, "lr": 9.894310635342852e-07, "epoch": 6.3671444321940465, "percentage": 90.96, "elapsed_time": "20:44:21", "remaining_time": "2:03:40"}
2311
+ {"current_steps": 11555, "total_steps": 12698, "loss": 0.1081, "lr": 9.809095025610894e-07, "epoch": 6.369900771775082, "percentage": 91.0, "elapsed_time": "20:44:33", "remaining_time": "2:03:06"}
2312
+ {"current_steps": 11560, "total_steps": 12698, "loss": 0.1021, "lr": 9.724238742147207e-07, "epoch": 6.372657111356119, "percentage": 91.04, "elapsed_time": "20:44:47", "remaining_time": "2:02:32"}
2313
+ {"current_steps": 11565, "total_steps": 12698, "loss": 0.1027, "lr": 9.63974194527022e-07, "epoch": 6.375413450937155, "percentage": 91.08, "elapsed_time": "20:45:04", "remaining_time": "2:01:58"}
2314
+ {"current_steps": 11570, "total_steps": 12698, "loss": 0.094, "lr": 9.555604794619056e-07, "epoch": 6.378169790518192, "percentage": 91.12, "elapsed_time": "20:45:17", "remaining_time": "2:01:24"}
2315
+ {"current_steps": 11575, "total_steps": 12698, "loss": 0.1034, "lr": 9.471827449153425e-07, "epoch": 6.380926130099228, "percentage": 91.16, "elapsed_time": "20:45:29", "remaining_time": "2:00:50"}
2316
+ {"current_steps": 11580, "total_steps": 12698, "loss": 0.1023, "lr": 9.38841006715323e-07, "epoch": 6.383682469680265, "percentage": 91.2, "elapsed_time": "20:45:41", "remaining_time": "2:00:16"}
2317
+ {"current_steps": 11585, "total_steps": 12698, "loss": 0.1062, "lr": 9.305352806218338e-07, "epoch": 6.386438809261301, "percentage": 91.23, "elapsed_time": "20:45:55", "remaining_time": "1:59:41"}
2318
+ {"current_steps": 11590, "total_steps": 12698, "loss": 0.1067, "lr": 9.222655823268201e-07, "epoch": 6.3891951488423375, "percentage": 91.27, "elapsed_time": "20:46:07", "remaining_time": "1:59:07"}
2319
+ {"current_steps": 11595, "total_steps": 12698, "loss": 0.0993, "lr": 9.140319274541621e-07, "epoch": 6.3919514884233735, "percentage": 91.31, "elapsed_time": "20:46:20", "remaining_time": "1:58:33"}
2320
+ {"current_steps": 11600, "total_steps": 12698, "loss": 0.1044, "lr": 9.058343315596407e-07, "epoch": 6.39470782800441, "percentage": 91.35, "elapsed_time": "20:46:32", "remaining_time": "1:57:59"}
2321
+ {"current_steps": 11605, "total_steps": 12698, "loss": 0.1941, "lr": 8.976728101309162e-07, "epoch": 6.397464167585446, "percentage": 91.39, "elapsed_time": "20:47:13", "remaining_time": "1:57:28"}
2322
+ {"current_steps": 11610, "total_steps": 12698, "loss": 0.215, "lr": 8.895473785874875e-07, "epoch": 6.400220507166483, "percentage": 91.43, "elapsed_time": "20:47:52", "remaining_time": "1:56:56"}
2323
+ {"current_steps": 11615, "total_steps": 12698, "loss": 0.2138, "lr": 8.814580522806748e-07, "epoch": 6.402976846747519, "percentage": 91.47, "elapsed_time": "20:48:51", "remaining_time": "1:56:26"}
2324
+ {"current_steps": 11620, "total_steps": 12698, "loss": 0.2068, "lr": 8.734048464935841e-07, "epoch": 6.405733186328556, "percentage": 91.51, "elapsed_time": "20:49:44", "remaining_time": "1:55:56"}
2325
+ {"current_steps": 11625, "total_steps": 12698, "loss": 0.2061, "lr": 8.653877764410734e-07, "epoch": 6.408489525909592, "percentage": 91.55, "elapsed_time": "20:50:36", "remaining_time": "1:55:25"}
2326
+ {"current_steps": 11630, "total_steps": 12698, "loss": 0.2104, "lr": 8.574068572697359e-07, "epoch": 6.411245865490629, "percentage": 91.59, "elapsed_time": "20:51:28", "remaining_time": "1:54:55"}
2327
+ {"current_steps": 11635, "total_steps": 12698, "loss": 0.2, "lr": 8.494621040578632e-07, "epoch": 6.4140022050716645, "percentage": 91.63, "elapsed_time": "20:52:22", "remaining_time": "1:54:25"}
2328
+ {"current_steps": 11640, "total_steps": 12698, "loss": 0.2024, "lr": 8.415535318154178e-07, "epoch": 6.416758544652701, "percentage": 91.67, "elapsed_time": "20:53:09", "remaining_time": "1:53:54"}
2329
+ {"current_steps": 11645, "total_steps": 12698, "loss": 0.2083, "lr": 8.336811554840074e-07, "epoch": 6.419514884233737, "percentage": 91.71, "elapsed_time": "20:54:06", "remaining_time": "1:53:24"}
2330
+ {"current_steps": 11650, "total_steps": 12698, "loss": 0.2068, "lr": 8.258449899368526e-07, "epoch": 6.422271223814774, "percentage": 91.75, "elapsed_time": "20:54:52", "remaining_time": "1:52:53"}
2331
+ {"current_steps": 11655, "total_steps": 12698, "loss": 0.2026, "lr": 8.180450499787662e-07, "epoch": 6.42502756339581, "percentage": 91.79, "elapsed_time": "20:55:41", "remaining_time": "1:52:22"}
2332
+ {"current_steps": 11660, "total_steps": 12698, "loss": 0.202, "lr": 8.102813503461115e-07, "epoch": 6.427783902976847, "percentage": 91.83, "elapsed_time": "20:56:45", "remaining_time": "1:51:52"}
2333
+ {"current_steps": 11665, "total_steps": 12698, "loss": 0.2013, "lr": 8.025539057067954e-07, "epoch": 6.430540242557883, "percentage": 91.86, "elapsed_time": "20:57:26", "remaining_time": "1:51:21"}
2334
+ {"current_steps": 11670, "total_steps": 12698, "loss": 0.1942, "lr": 7.948627306602174e-07, "epoch": 6.43329658213892, "percentage": 91.9, "elapsed_time": "20:58:10", "remaining_time": "1:50:49"}
2335
+ {"current_steps": 11675, "total_steps": 12698, "loss": 0.1949, "lr": 7.872078397372607e-07, "epoch": 6.436052921719956, "percentage": 91.94, "elapsed_time": "20:58:38", "remaining_time": "1:50:17"}
2336
+ {"current_steps": 11680, "total_steps": 12698, "loss": 0.1902, "lr": 7.795892474002497e-07, "epoch": 6.438809261300992, "percentage": 91.98, "elapsed_time": "20:59:04", "remaining_time": "1:49:44"}
2337
+ {"current_steps": 11685, "total_steps": 12698, "loss": 0.1937, "lr": 7.720069680429399e-07, "epoch": 6.441565600882028, "percentage": 92.02, "elapsed_time": "20:59:32", "remaining_time": "1:49:11"}
2338
+ {"current_steps": 11690, "total_steps": 12698, "loss": 0.1961, "lr": 7.644610159904719e-07, "epoch": 6.444321940463065, "percentage": 92.06, "elapsed_time": "20:59:58", "remaining_time": "1:48:38"}
2339
+ {"current_steps": 11695, "total_steps": 12698, "loss": 0.1911, "lr": 7.569514054993576e-07, "epoch": 6.447078280044101, "percentage": 92.1, "elapsed_time": "21:00:21", "remaining_time": "1:48:05"}
2340
+ {"current_steps": 11700, "total_steps": 12698, "loss": 0.1964, "lr": 7.494781507574478e-07, "epoch": 6.449834619625138, "percentage": 92.14, "elapsed_time": "21:00:50", "remaining_time": "1:47:32"}
2341
+ {"current_steps": 11705, "total_steps": 12698, "loss": 0.1922, "lr": 7.42041265883906e-07, "epoch": 6.452590959206174, "percentage": 92.18, "elapsed_time": "21:01:16", "remaining_time": "1:47:00"}
2342
+ {"current_steps": 11710, "total_steps": 12698, "loss": 0.1859, "lr": 7.346407649291887e-07, "epoch": 6.455347298787211, "percentage": 92.22, "elapsed_time": "21:01:45", "remaining_time": "1:46:27"}
2343
+ {"current_steps": 11715, "total_steps": 12698, "loss": 0.171, "lr": 7.272766618750049e-07, "epoch": 6.458103638368247, "percentage": 92.26, "elapsed_time": "21:02:14", "remaining_time": "1:45:54"}
2344
+ {"current_steps": 11720, "total_steps": 12698, "loss": 0.185, "lr": 7.19948970634301e-07, "epoch": 6.4608599779492835, "percentage": 92.3, "elapsed_time": "21:02:38", "remaining_time": "1:45:21"}
2345
+ {"current_steps": 11725, "total_steps": 12698, "loss": 0.1936, "lr": 7.126577050512274e-07, "epoch": 6.463616317530319, "percentage": 92.34, "elapsed_time": "21:03:04", "remaining_time": "1:44:48"}
2346
+ {"current_steps": 11730, "total_steps": 12698, "loss": 0.1923, "lr": 7.05402878901118e-07, "epoch": 6.466372657111356, "percentage": 92.38, "elapsed_time": "21:03:29", "remaining_time": "1:44:16"}
2347
+ {"current_steps": 11735, "total_steps": 12698, "loss": 0.1768, "lr": 6.981845058904646e-07, "epoch": 6.469128996692392, "percentage": 92.42, "elapsed_time": "21:03:56", "remaining_time": "1:43:43"}
2348
+ {"current_steps": 11740, "total_steps": 12698, "loss": 0.1812, "lr": 6.91002599656887e-07, "epoch": 6.471885336273429, "percentage": 92.46, "elapsed_time": "21:04:22", "remaining_time": "1:43:10"}
2349
+ {"current_steps": 11745, "total_steps": 12698, "loss": 0.1902, "lr": 6.838571737691024e-07, "epoch": 6.474641675854465, "percentage": 92.49, "elapsed_time": "21:04:48", "remaining_time": "1:42:37"}
2350
+ {"current_steps": 11750, "total_steps": 12698, "loss": 0.182, "lr": 6.767482417269145e-07, "epoch": 6.477398015435502, "percentage": 92.53, "elapsed_time": "21:05:16", "remaining_time": "1:42:05"}
2351
+ {"current_steps": 11755, "total_steps": 12698, "loss": 0.1721, "lr": 6.69675816961175e-07, "epoch": 6.480154355016538, "percentage": 92.57, "elapsed_time": "21:05:42", "remaining_time": "1:41:32"}
2352
+ {"current_steps": 11760, "total_steps": 12698, "loss": 0.1877, "lr": 6.626399128337647e-07, "epoch": 6.4829106945975745, "percentage": 92.61, "elapsed_time": "21:06:09", "remaining_time": "1:40:59"}
2353
+ {"current_steps": 11765, "total_steps": 12698, "loss": 0.1811, "lr": 6.556405426375634e-07, "epoch": 6.4856670341786105, "percentage": 92.65, "elapsed_time": "21:06:34", "remaining_time": "1:40:26"}
2354
+ {"current_steps": 11770, "total_steps": 12698, "loss": 0.1756, "lr": 6.486777195964334e-07, "epoch": 6.488423373759647, "percentage": 92.69, "elapsed_time": "21:07:02", "remaining_time": "1:39:53"}
2355
+ {"current_steps": 11775, "total_steps": 12698, "loss": 0.1807, "lr": 6.417514568651783e-07, "epoch": 6.491179713340683, "percentage": 92.73, "elapsed_time": "21:07:25", "remaining_time": "1:39:20"}
2356
+ {"current_steps": 11780, "total_steps": 12698, "loss": 0.1817, "lr": 6.348617675295399e-07, "epoch": 6.49393605292172, "percentage": 92.77, "elapsed_time": "21:07:50", "remaining_time": "1:38:48"}
2357
+ {"current_steps": 11785, "total_steps": 12698, "loss": 0.1849, "lr": 6.280086646061567e-07, "epoch": 6.496692392502756, "percentage": 92.81, "elapsed_time": "21:08:18", "remaining_time": "1:38:15"}
2358
+ {"current_steps": 11790, "total_steps": 12698, "loss": 0.1747, "lr": 6.211921610425431e-07, "epoch": 6.499448732083793, "percentage": 92.85, "elapsed_time": "21:08:45", "remaining_time": "1:37:42"}
2359
+ {"current_steps": 11795, "total_steps": 12698, "loss": 0.1861, "lr": 6.144122697170707e-07, "epoch": 6.502205071664829, "percentage": 92.89, "elapsed_time": "21:09:12", "remaining_time": "1:37:10"}
2360
+ {"current_steps": 11800, "total_steps": 12698, "loss": 0.1883, "lr": 6.076690034389355e-07, "epoch": 6.504961411245866, "percentage": 92.93, "elapsed_time": "21:09:43", "remaining_time": "1:36:37"}
2361
+ {"current_steps": 11805, "total_steps": 12698, "loss": 0.1733, "lr": 6.009623749481442e-07, "epoch": 6.5077177508269015, "percentage": 92.97, "elapsed_time": "21:10:07", "remaining_time": "1:36:04"}
2362
+ {"current_steps": 11810, "total_steps": 12698, "loss": 0.1846, "lr": 5.94292396915479e-07, "epoch": 6.510474090407938, "percentage": 93.01, "elapsed_time": "21:10:33", "remaining_time": "1:35:32"}
2363
+ {"current_steps": 11815, "total_steps": 12698, "loss": 0.1867, "lr": 5.876590819424777e-07, "epoch": 6.513230429988974, "percentage": 93.05, "elapsed_time": "21:11:02", "remaining_time": "1:34:59"}
2364
+ {"current_steps": 11820, "total_steps": 12698, "loss": 0.173, "lr": 5.810624425614175e-07, "epoch": 6.515986769570011, "percentage": 93.09, "elapsed_time": "21:11:31", "remaining_time": "1:34:27"}
2365
+ {"current_steps": 11825, "total_steps": 12698, "loss": 0.1716, "lr": 5.745024912352759e-07, "epoch": 6.518743109151047, "percentage": 93.12, "elapsed_time": "21:11:56", "remaining_time": "1:33:54"}
2366
+ {"current_steps": 11830, "total_steps": 12698, "loss": 0.1918, "lr": 5.679792403577234e-07, "epoch": 6.521499448732084, "percentage": 93.16, "elapsed_time": "21:12:23", "remaining_time": "1:33:21"}
2367
+ {"current_steps": 11835, "total_steps": 12698, "loss": 0.1829, "lr": 5.614927022530881e-07, "epoch": 6.52425578831312, "percentage": 93.2, "elapsed_time": "21:12:52", "remaining_time": "1:32:49"}
2368
+ {"current_steps": 11840, "total_steps": 12698, "loss": 0.1779, "lr": 5.550428891763382e-07, "epoch": 6.527012127894157, "percentage": 93.24, "elapsed_time": "21:13:16", "remaining_time": "1:32:16"}
2369
+ {"current_steps": 11845, "total_steps": 12698, "loss": 0.1876, "lr": 5.486298133130574e-07, "epoch": 6.529768467475193, "percentage": 93.28, "elapsed_time": "21:13:44", "remaining_time": "1:31:43"}
2370
+ {"current_steps": 11850, "total_steps": 12698, "loss": 0.1828, "lr": 5.422534867794227e-07, "epoch": 6.532524807056229, "percentage": 93.32, "elapsed_time": "21:14:11", "remaining_time": "1:31:10"}
2371
+ {"current_steps": 11855, "total_steps": 12698, "loss": 0.1795, "lr": 5.359139216221843e-07, "epoch": 6.535281146637265, "percentage": 93.36, "elapsed_time": "21:14:40", "remaining_time": "1:30:38"}
2372
+ {"current_steps": 11860, "total_steps": 12698, "loss": 0.1893, "lr": 5.296111298186324e-07, "epoch": 6.538037486218302, "percentage": 93.4, "elapsed_time": "21:15:05", "remaining_time": "1:30:05"}
2373
+ {"current_steps": 11865, "total_steps": 12698, "loss": 0.1715, "lr": 5.23345123276584e-07, "epoch": 6.540793825799338, "percentage": 93.44, "elapsed_time": "21:15:33", "remaining_time": "1:29:33"}
2374
+ {"current_steps": 11870, "total_steps": 12698, "loss": 0.1739, "lr": 5.171159138343607e-07, "epoch": 6.543550165380375, "percentage": 93.48, "elapsed_time": "21:15:59", "remaining_time": "1:29:00"}
2375
+ {"current_steps": 11875, "total_steps": 12698, "loss": 0.1725, "lr": 5.109235132607593e-07, "epoch": 6.546306504961411, "percentage": 93.52, "elapsed_time": "21:16:24", "remaining_time": "1:28:27"}
2376
+ {"current_steps": 11880, "total_steps": 12698, "loss": 0.183, "lr": 5.047679332550392e-07, "epoch": 6.549062844542448, "percentage": 93.56, "elapsed_time": "21:16:53", "remaining_time": "1:27:55"}
2377
+ {"current_steps": 11885, "total_steps": 12698, "loss": 0.1838, "lr": 4.986491854468933e-07, "epoch": 6.551819184123484, "percentage": 93.6, "elapsed_time": "21:17:20", "remaining_time": "1:27:22"}
2378
+ {"current_steps": 11890, "total_steps": 12698, "loss": 0.1864, "lr": 4.925672813964211e-07, "epoch": 6.5545755237045205, "percentage": 93.64, "elapsed_time": "21:17:53", "remaining_time": "1:26:50"}
2379
+ {"current_steps": 11895, "total_steps": 12698, "loss": 0.1814, "lr": 4.865222325941244e-07, "epoch": 6.557331863285556, "percentage": 93.68, "elapsed_time": "21:18:24", "remaining_time": "1:26:18"}
2380
+ {"current_steps": 11900, "total_steps": 12698, "loss": 0.1836, "lr": 4.805140504608629e-07, "epoch": 6.560088202866593, "percentage": 93.72, "elapsed_time": "21:18:53", "remaining_time": "1:25:45"}
2381
+ {"current_steps": 11905, "total_steps": 12698, "loss": 0.1863, "lr": 4.7454274634785914e-07, "epoch": 6.56284454244763, "percentage": 93.75, "elapsed_time": "21:19:21", "remaining_time": "1:25:13"}
2382
+ {"current_steps": 11910, "total_steps": 12698, "loss": 0.18, "lr": 4.686083315366463e-07, "epoch": 6.565600882028666, "percentage": 93.79, "elapsed_time": "21:19:46", "remaining_time": "1:24:40"}
2383
+ {"current_steps": 11915, "total_steps": 12698, "loss": 0.1756, "lr": 4.627108172390737e-07, "epoch": 6.568357221609702, "percentage": 93.83, "elapsed_time": "21:20:15", "remaining_time": "1:24:07"}
2384
+ {"current_steps": 11920, "total_steps": 12698, "loss": 0.1659, "lr": 4.5685021459727305e-07, "epoch": 6.571113561190739, "percentage": 93.87, "elapsed_time": "21:20:40", "remaining_time": "1:23:35"}
2385
+ {"current_steps": 11925, "total_steps": 12698, "loss": 0.1675, "lr": 4.510265346836318e-07, "epoch": 6.573869900771776, "percentage": 93.91, "elapsed_time": "21:21:05", "remaining_time": "1:23:02"}
2386
+ {"current_steps": 11930, "total_steps": 12698, "loss": 0.1659, "lr": 4.4523978850079087e-07, "epoch": 6.5766262403528115, "percentage": 93.95, "elapsed_time": "21:21:33", "remaining_time": "1:22:30"}
2387
+ {"current_steps": 11935, "total_steps": 12698, "loss": 0.1689, "lr": 4.3948998698160496e-07, "epoch": 6.5793825799338475, "percentage": 93.99, "elapsed_time": "21:21:59", "remaining_time": "1:21:57"}
2388
+ {"current_steps": 11940, "total_steps": 12698, "loss": 0.1646, "lr": 4.3377714098913115e-07, "epoch": 6.582138919514884, "percentage": 94.03, "elapsed_time": "21:22:26", "remaining_time": "1:21:24"}
2389
+ {"current_steps": 11945, "total_steps": 12698, "loss": 0.1803, "lr": 4.281012613166069e-07, "epoch": 6.584895259095921, "percentage": 94.07, "elapsed_time": "21:22:51", "remaining_time": "1:20:52"}
2390
+ {"current_steps": 11950, "total_steps": 12698, "loss": 0.1881, "lr": 4.2246235868742993e-07, "epoch": 6.587651598676957, "percentage": 94.11, "elapsed_time": "21:23:18", "remaining_time": "1:20:19"}
2391
+ {"current_steps": 11955, "total_steps": 12698, "loss": 0.1701, "lr": 4.1686044375513824e-07, "epoch": 6.590407938257993, "percentage": 94.15, "elapsed_time": "21:23:42", "remaining_time": "1:19:46"}
2392
+ {"current_steps": 11960, "total_steps": 12698, "loss": 0.1786, "lr": 4.1129552710338806e-07, "epoch": 6.59316427783903, "percentage": 94.19, "elapsed_time": "21:24:10", "remaining_time": "1:19:14"}
2393
+ {"current_steps": 11965, "total_steps": 12698, "loss": 0.1711, "lr": 4.0576761924593364e-07, "epoch": 6.595920617420067, "percentage": 94.23, "elapsed_time": "21:24:38", "remaining_time": "1:18:41"}
2394
+ {"current_steps": 11970, "total_steps": 12698, "loss": 0.1712, "lr": 4.00276730626612e-07, "epoch": 6.598676957001103, "percentage": 94.27, "elapsed_time": "21:25:07", "remaining_time": "1:18:09"}
2395
+ {"current_steps": 11975, "total_steps": 12698, "loss": 0.1763, "lr": 3.948228716193181e-07, "epoch": 6.6014332965821385, "percentage": 94.31, "elapsed_time": "21:25:35", "remaining_time": "1:17:37"}
2396
+ {"current_steps": 11980, "total_steps": 12698, "loss": 0.1693, "lr": 3.8940605252798525e-07, "epoch": 6.604189636163175, "percentage": 94.35, "elapsed_time": "21:26:04", "remaining_time": "1:17:04"}
2397
+ {"current_steps": 11985, "total_steps": 12698, "loss": 0.1791, "lr": 3.840262835865716e-07, "epoch": 6.606945975744212, "percentage": 94.38, "elapsed_time": "21:26:27", "remaining_time": "1:16:31"}
2398
+ {"current_steps": 11990, "total_steps": 12698, "loss": 0.169, "lr": 3.7868357495903563e-07, "epoch": 6.609702315325248, "percentage": 94.42, "elapsed_time": "21:26:56", "remaining_time": "1:15:59"}
2399
+ {"current_steps": 11995, "total_steps": 12698, "loss": 0.1766, "lr": 3.7337793673931423e-07, "epoch": 6.612458654906284, "percentage": 94.46, "elapsed_time": "21:27:23", "remaining_time": "1:15:27"}
2400
+ {"current_steps": 12000, "total_steps": 12698, "loss": 0.1835, "lr": 3.681093789513135e-07, "epoch": 6.615214994487321, "percentage": 94.5, "elapsed_time": "21:27:50", "remaining_time": "1:14:54"}
2401
+ {"current_steps": 12005, "total_steps": 12698, "loss": 0.1768, "lr": 3.6287791154887785e-07, "epoch": 6.617971334068358, "percentage": 94.54, "elapsed_time": "21:29:09", "remaining_time": "1:14:25"}
2402
+ {"current_steps": 12010, "total_steps": 12698, "loss": 0.1897, "lr": 3.5768354441578333e-07, "epoch": 6.620727673649394, "percentage": 94.58, "elapsed_time": "21:29:35", "remaining_time": "1:13:52"}
2403
+ {"current_steps": 12015, "total_steps": 12698, "loss": 0.1716, "lr": 3.525262873657065e-07, "epoch": 6.62348401323043, "percentage": 94.62, "elapsed_time": "21:29:59", "remaining_time": "1:13:19"}
2404
+ {"current_steps": 12020, "total_steps": 12698, "loss": 0.1909, "lr": 3.474061501422155e-07, "epoch": 6.626240352811466, "percentage": 94.66, "elapsed_time": "21:30:29", "remaining_time": "1:12:47"}
2405
+ {"current_steps": 12025, "total_steps": 12698, "loss": 0.1851, "lr": 3.423231424187501e-07, "epoch": 6.628996692392503, "percentage": 94.7, "elapsed_time": "21:30:56", "remaining_time": "1:12:15"}
2406
+ {"current_steps": 12030, "total_steps": 12698, "loss": 0.1738, "lr": 3.3727727379859523e-07, "epoch": 6.631753031973539, "percentage": 94.74, "elapsed_time": "21:31:22", "remaining_time": "1:11:42"}
2407
+ {"current_steps": 12035, "total_steps": 12698, "loss": 0.1762, "lr": 3.32268553814874e-07, "epoch": 6.634509371554575, "percentage": 94.78, "elapsed_time": "21:31:53", "remaining_time": "1:11:10"}
2408
+ {"current_steps": 12040, "total_steps": 12698, "loss": 0.1768, "lr": 3.2729699193052357e-07, "epoch": 6.637265711135612, "percentage": 94.82, "elapsed_time": "21:32:19", "remaining_time": "1:10:37"}
2409
+ {"current_steps": 12045, "total_steps": 12698, "loss": 0.1788, "lr": 3.223625975382838e-07, "epoch": 6.640022050716649, "percentage": 94.86, "elapsed_time": "21:32:43", "remaining_time": "1:10:04"}
2410
+ {"current_steps": 12050, "total_steps": 12698, "loss": 0.1824, "lr": 3.174653799606642e-07, "epoch": 6.642778390297685, "percentage": 94.9, "elapsed_time": "21:33:09", "remaining_time": "1:09:32"}
2411
+ {"current_steps": 12055, "total_steps": 12698, "loss": 0.1634, "lr": 3.126053484499436e-07, "epoch": 6.645534729878721, "percentage": 94.94, "elapsed_time": "21:33:36", "remaining_time": "1:08:59"}
2412
+ {"current_steps": 12060, "total_steps": 12698, "loss": 0.1725, "lr": 3.0778251218814394e-07, "epoch": 6.6482910694597575, "percentage": 94.98, "elapsed_time": "21:34:07", "remaining_time": "1:08:27"}
2413
+ {"current_steps": 12065, "total_steps": 12698, "loss": 0.1709, "lr": 3.0299688028701204e-07, "epoch": 6.651047409040794, "percentage": 95.01, "elapsed_time": "21:34:36", "remaining_time": "1:07:55"}
2414
+ {"current_steps": 12070, "total_steps": 12698, "loss": 0.1696, "lr": 2.9824846178801105e-07, "epoch": 6.65380374862183, "percentage": 95.05, "elapsed_time": "21:35:03", "remaining_time": "1:07:22"}
2415
+ {"current_steps": 12075, "total_steps": 12698, "loss": 0.1738, "lr": 2.93537265662287e-07, "epoch": 6.656560088202866, "percentage": 95.09, "elapsed_time": "21:35:30", "remaining_time": "1:06:50"}
2416
+ {"current_steps": 12080, "total_steps": 12698, "loss": 0.1778, "lr": 2.888633008106734e-07, "epoch": 6.659316427783903, "percentage": 95.13, "elapsed_time": "21:35:54", "remaining_time": "1:06:17"}
2417
+ {"current_steps": 12085, "total_steps": 12698, "loss": 0.1729, "lr": 2.842265760636531e-07, "epoch": 6.66207276736494, "percentage": 95.17, "elapsed_time": "21:36:21", "remaining_time": "1:05:45"}
2418
+ {"current_steps": 12090, "total_steps": 12698, "loss": 0.1728, "lr": 2.796271001813566e-07, "epoch": 6.664829106945976, "percentage": 95.21, "elapsed_time": "21:36:44", "remaining_time": "1:05:12"}
2419
+ {"current_steps": 12095, "total_steps": 12698, "loss": 0.1818, "lr": 2.75064881853544e-07, "epoch": 6.667585446527012, "percentage": 95.25, "elapsed_time": "21:37:16", "remaining_time": "1:04:40"}
2420
+ {"current_steps": 12100, "total_steps": 12698, "loss": 0.1721, "lr": 2.705399296995759e-07, "epoch": 6.6703417861080485, "percentage": 95.29, "elapsed_time": "21:37:50", "remaining_time": "1:04:08"}
2421
+ {"current_steps": 12105, "total_steps": 12698, "loss": 0.1625, "lr": 2.660522522684117e-07, "epoch": 6.673098125689085, "percentage": 95.33, "elapsed_time": "21:38:19", "remaining_time": "1:03:36"}
2422
+ {"current_steps": 12110, "total_steps": 12698, "loss": 0.1705, "lr": 2.6160185803858926e-07, "epoch": 6.675854465270121, "percentage": 95.37, "elapsed_time": "21:38:46", "remaining_time": "1:03:03"}
2423
+ {"current_steps": 12115, "total_steps": 12698, "loss": 0.1676, "lr": 2.5718875541820285e-07, "epoch": 6.678610804851157, "percentage": 95.41, "elapsed_time": "21:39:14", "remaining_time": "1:02:31"}
2424
+ {"current_steps": 12120, "total_steps": 12698, "loss": 0.1678, "lr": 2.5281295274489413e-07, "epoch": 6.681367144432194, "percentage": 95.45, "elapsed_time": "21:39:42", "remaining_time": "1:01:58"}
2425
+ {"current_steps": 12125, "total_steps": 12698, "loss": 0.1593, "lr": 2.484744582858389e-07, "epoch": 6.684123484013231, "percentage": 95.49, "elapsed_time": "21:40:09", "remaining_time": "1:01:26"}
2426
+ {"current_steps": 12130, "total_steps": 12698, "loss": 0.1625, "lr": 2.4417328023771835e-07, "epoch": 6.686879823594267, "percentage": 95.53, "elapsed_time": "21:40:34", "remaining_time": "1:00:54"}
2427
+ {"current_steps": 12135, "total_steps": 12698, "loss": 0.1685, "lr": 2.399094267267188e-07, "epoch": 6.689636163175303, "percentage": 95.57, "elapsed_time": "21:41:02", "remaining_time": "1:00:21"}
2428
+ {"current_steps": 12140, "total_steps": 12698, "loss": 0.1817, "lr": 2.3568290580850307e-07, "epoch": 6.69239250275634, "percentage": 95.61, "elapsed_time": "21:41:28", "remaining_time": "0:59:49"}
2429
+ {"current_steps": 12145, "total_steps": 12698, "loss": 0.1629, "lr": 2.3149372546821258e-07, "epoch": 6.695148842337376, "percentage": 95.64, "elapsed_time": "21:41:50", "remaining_time": "0:59:16"}
2430
+ {"current_steps": 12150, "total_steps": 12698, "loss": 0.166, "lr": 2.273418936204297e-07, "epoch": 6.697905181918412, "percentage": 95.68, "elapsed_time": "21:42:20", "remaining_time": "0:58:44"}
2431
+ {"current_steps": 12155, "total_steps": 12698, "loss": 0.1622, "lr": 2.2322741810918202e-07, "epoch": 6.700661521499448, "percentage": 95.72, "elapsed_time": "21:42:45", "remaining_time": "0:58:11"}