penfever commited on
Commit
7410f3e
·
verified ·
1 Parent(s): dcdbb9c

Training in progress, step 6000

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dcbeae55e12d31142d58bbf3cad7e6aa3064922c8b634d0ed6e76ecac3d52d76
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c59a011d19c4d12049d837b1831a977cca777dc78cd46a1f1d1a771b2154699
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45e29dbfca521f0fb191fb64ed560cc5872176b662af6406a7d35bfb228c768f
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bad298c7af6203eddd22bbbb43e1406ccb38c8a42f5f3a984c69920a0f4826db
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:377a73758c3fb91f05bced440552c6f1306305cba4a7fb20b2090ae7ca3b2de1
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb54db642c42bbbc526c47daad15294c50ea098c4bd120f6cf1bccafdca925a6
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3c3868e255453f358e9bad3a0807092ac91effd0fba4bc57e6b7372329207c7
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a084e08c2fd15e8cedcf64b8df07af7f169dfc6c6782fae3b5e02dfbc39f2882
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -943,3 +943,296 @@
943
  {"current_steps": 4715, "total_steps": 12698, "loss": 0.2448, "lr": 3.168620795847994e-05, "epoch": 2.5992282249173098, "percentage": 37.13, "elapsed_time": "8:32:56", "remaining_time": "14:28:27"}
944
  {"current_steps": 4720, "total_steps": 12698, "loss": 0.2485, "lr": 3.1663887707627666e-05, "epoch": 2.601984564498346, "percentage": 37.17, "elapsed_time": "8:33:24", "remaining_time": "14:27:47"}
945
  {"current_steps": 4725, "total_steps": 12698, "loss": 0.2497, "lr": 3.164154542027872e-05, "epoch": 2.6047409040793825, "percentage": 37.21, "elapsed_time": "8:33:52", "remaining_time": "14:27:06"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
943
  {"current_steps": 4715, "total_steps": 12698, "loss": 0.2448, "lr": 3.168620795847994e-05, "epoch": 2.5992282249173098, "percentage": 37.13, "elapsed_time": "8:32:56", "remaining_time": "14:28:27"}
944
  {"current_steps": 4720, "total_steps": 12698, "loss": 0.2485, "lr": 3.1663887707627666e-05, "epoch": 2.601984564498346, "percentage": 37.17, "elapsed_time": "8:33:24", "remaining_time": "14:27:47"}
945
  {"current_steps": 4725, "total_steps": 12698, "loss": 0.2497, "lr": 3.164154542027872e-05, "epoch": 2.6047409040793825, "percentage": 37.21, "elapsed_time": "8:33:52", "remaining_time": "14:27:06"}
946
+ {"current_steps": 4730, "total_steps": 12698, "loss": 0.2516, "lr": 3.161918113864423e-05, "epoch": 2.607497243660419, "percentage": 37.25, "elapsed_time": "8:34:19", "remaining_time": "14:26:24"}
947
+ {"current_steps": 4735, "total_steps": 12698, "loss": 0.245, "lr": 3.159679490497686e-05, "epoch": 2.6102535832414553, "percentage": 37.29, "elapsed_time": "8:34:44", "remaining_time": "14:25:39"}
948
+ {"current_steps": 4740, "total_steps": 12698, "loss": 0.2668, "lr": 3.157438676157075e-05, "epoch": 2.6130099228224917, "percentage": 37.33, "elapsed_time": "8:35:13", "remaining_time": "14:25:01"}
949
+ {"current_steps": 4745, "total_steps": 12698, "loss": 0.2624, "lr": 3.1551956750761444e-05, "epoch": 2.615766262403528, "percentage": 37.37, "elapsed_time": "8:35:40", "remaining_time": "14:24:18"}
950
+ {"current_steps": 4750, "total_steps": 12698, "loss": 0.259, "lr": 3.15295049149258e-05, "epoch": 2.6185226019845644, "percentage": 37.41, "elapsed_time": "8:36:07", "remaining_time": "14:23:36"}
951
+ {"current_steps": 4755, "total_steps": 12698, "loss": 0.267, "lr": 3.15070312964819e-05, "epoch": 2.621278941565601, "percentage": 37.45, "elapsed_time": "8:36:31", "remaining_time": "14:22:50"}
952
+ {"current_steps": 4760, "total_steps": 12698, "loss": 0.2577, "lr": 3.148453593788899e-05, "epoch": 2.624035281146637, "percentage": 37.49, "elapsed_time": "8:36:56", "remaining_time": "14:22:04"}
953
+ {"current_steps": 4765, "total_steps": 12698, "loss": 0.2641, "lr": 3.146201888164738e-05, "epoch": 2.6267916207276736, "percentage": 37.53, "elapsed_time": "8:37:26", "remaining_time": "14:21:27"}
954
+ {"current_steps": 4770, "total_steps": 12698, "loss": 0.2648, "lr": 3.143948017029838e-05, "epoch": 2.62954796030871, "percentage": 37.56, "elapsed_time": "8:37:52", "remaining_time": "14:20:43"}
955
+ {"current_steps": 4775, "total_steps": 12698, "loss": 0.2525, "lr": 3.141691984642421e-05, "epoch": 2.6323042998897463, "percentage": 37.6, "elapsed_time": "8:38:23", "remaining_time": "14:20:08"}
956
+ {"current_steps": 4780, "total_steps": 12698, "loss": 0.2571, "lr": 3.139433795264791e-05, "epoch": 2.6350606394707827, "percentage": 37.64, "elapsed_time": "8:38:50", "remaining_time": "14:19:26"}
957
+ {"current_steps": 4785, "total_steps": 12698, "loss": 0.2564, "lr": 3.137173453163332e-05, "epoch": 2.637816979051819, "percentage": 37.68, "elapsed_time": "8:39:15", "remaining_time": "14:18:42"}
958
+ {"current_steps": 4790, "total_steps": 12698, "loss": 0.262, "lr": 3.134910962608487e-05, "epoch": 2.6405733186328555, "percentage": 37.72, "elapsed_time": "8:39:39", "remaining_time": "14:17:55"}
959
+ {"current_steps": 4795, "total_steps": 12698, "loss": 0.2575, "lr": 3.132646327874766e-05, "epoch": 2.643329658213892, "percentage": 37.76, "elapsed_time": "8:40:05", "remaining_time": "14:17:11"}
960
+ {"current_steps": 4800, "total_steps": 12698, "loss": 0.2376, "lr": 3.130379553240726e-05, "epoch": 2.6460859977949283, "percentage": 37.8, "elapsed_time": "8:40:36", "remaining_time": "14:16:36"}
961
+ {"current_steps": 4805, "total_steps": 12698, "loss": 0.2531, "lr": 3.1281106429889655e-05, "epoch": 2.6488423373759646, "percentage": 37.84, "elapsed_time": "8:41:04", "remaining_time": "14:15:57"}
962
+ {"current_steps": 4810, "total_steps": 12698, "loss": 0.2393, "lr": 3.125839601406123e-05, "epoch": 2.651598676957001, "percentage": 37.88, "elapsed_time": "8:41:32", "remaining_time": "14:15:17"}
963
+ {"current_steps": 4815, "total_steps": 12698, "loss": 0.2491, "lr": 3.123566432782858e-05, "epoch": 2.6543550165380374, "percentage": 37.92, "elapsed_time": "8:41:59", "remaining_time": "14:14:34"}
964
+ {"current_steps": 4820, "total_steps": 12698, "loss": 0.2523, "lr": 3.121291141413853e-05, "epoch": 2.657111356119074, "percentage": 37.96, "elapsed_time": "8:42:26", "remaining_time": "14:13:53"}
965
+ {"current_steps": 4825, "total_steps": 12698, "loss": 0.2582, "lr": 3.1190137315977976e-05, "epoch": 2.65986769570011, "percentage": 38.0, "elapsed_time": "8:42:52", "remaining_time": "14:13:10"}
966
+ {"current_steps": 4830, "total_steps": 12698, "loss": 0.2443, "lr": 3.116734207637386e-05, "epoch": 2.6626240352811466, "percentage": 38.04, "elapsed_time": "8:43:16", "remaining_time": "14:12:25"}
967
+ {"current_steps": 4835, "total_steps": 12698, "loss": 0.2548, "lr": 3.114452573839306e-05, "epoch": 2.665380374862183, "percentage": 38.08, "elapsed_time": "8:43:40", "remaining_time": "14:11:37"}
968
+ {"current_steps": 4840, "total_steps": 12698, "loss": 0.2536, "lr": 3.112168834514231e-05, "epoch": 2.6681367144432193, "percentage": 38.12, "elapsed_time": "8:44:12", "remaining_time": "14:11:05"}
969
+ {"current_steps": 4845, "total_steps": 12698, "loss": 0.2413, "lr": 3.1098829939768134e-05, "epoch": 2.6708930540242557, "percentage": 38.16, "elapsed_time": "8:44:47", "remaining_time": "14:10:35"}
970
+ {"current_steps": 4850, "total_steps": 12698, "loss": 0.2359, "lr": 3.107595056545675e-05, "epoch": 2.673649393605292, "percentage": 38.19, "elapsed_time": "8:45:15", "remaining_time": "14:09:56"}
971
+ {"current_steps": 4855, "total_steps": 12698, "loss": 0.2442, "lr": 3.1053050265433975e-05, "epoch": 2.6764057331863285, "percentage": 38.23, "elapsed_time": "8:45:43", "remaining_time": "14:09:17"}
972
+ {"current_steps": 4860, "total_steps": 12698, "loss": 0.2421, "lr": 3.103012908296519e-05, "epoch": 2.679162072767365, "percentage": 38.27, "elapsed_time": "8:46:10", "remaining_time": "14:08:35"}
973
+ {"current_steps": 4865, "total_steps": 12698, "loss": 0.2312, "lr": 3.100718706135521e-05, "epoch": 2.6819184123484012, "percentage": 38.31, "elapsed_time": "8:46:40", "remaining_time": "14:07:59"}
974
+ {"current_steps": 4870, "total_steps": 12698, "loss": 0.2365, "lr": 3.098422424394824e-05, "epoch": 2.6846747519294376, "percentage": 38.35, "elapsed_time": "8:47:05", "remaining_time": "14:07:14"}
975
+ {"current_steps": 4875, "total_steps": 12698, "loss": 0.2432, "lr": 3.096124067412774e-05, "epoch": 2.687431091510474, "percentage": 38.39, "elapsed_time": "8:47:31", "remaining_time": "14:06:31"}
976
+ {"current_steps": 4880, "total_steps": 12698, "loss": 0.2414, "lr": 3.093823639531641e-05, "epoch": 2.6901874310915104, "percentage": 38.43, "elapsed_time": "8:47:59", "remaining_time": "14:05:52"}
977
+ {"current_steps": 4885, "total_steps": 12698, "loss": 0.2714, "lr": 3.091521145097606e-05, "epoch": 2.6929437706725468, "percentage": 38.47, "elapsed_time": "8:48:25", "remaining_time": "14:05:08"}
978
+ {"current_steps": 4890, "total_steps": 12698, "loss": 0.2392, "lr": 3.0892165884607545e-05, "epoch": 2.695700110253583, "percentage": 38.51, "elapsed_time": "8:48:49", "remaining_time": "14:04:23"}
979
+ {"current_steps": 4895, "total_steps": 12698, "loss": 0.2437, "lr": 3.086909973975069e-05, "epoch": 2.6984564498346195, "percentage": 38.55, "elapsed_time": "8:49:17", "remaining_time": "14:03:43"}
980
+ {"current_steps": 4900, "total_steps": 12698, "loss": 0.2402, "lr": 3.084601305998419e-05, "epoch": 2.701212789415656, "percentage": 38.59, "elapsed_time": "8:49:42", "remaining_time": "14:02:59"}
981
+ {"current_steps": 4905, "total_steps": 12698, "loss": 0.2505, "lr": 3.082290588892553e-05, "epoch": 2.7039691289966923, "percentage": 38.63, "elapsed_time": "8:50:07", "remaining_time": "14:02:15"}
982
+ {"current_steps": 4910, "total_steps": 12698, "loss": 0.2529, "lr": 3.079977827023092e-05, "epoch": 2.7067254685777287, "percentage": 38.67, "elapsed_time": "8:50:33", "remaining_time": "14:01:32"}
983
+ {"current_steps": 4915, "total_steps": 12698, "loss": 0.2502, "lr": 3.077663024759521e-05, "epoch": 2.709481808158765, "percentage": 38.71, "elapsed_time": "8:51:01", "remaining_time": "14:00:53"}
984
+ {"current_steps": 4920, "total_steps": 12698, "loss": 0.2448, "lr": 3.075346186475178e-05, "epoch": 2.7122381477398014, "percentage": 38.75, "elapsed_time": "8:51:28", "remaining_time": "14:00:11"}
985
+ {"current_steps": 4925, "total_steps": 12698, "loss": 0.2463, "lr": 3.0730273165472486e-05, "epoch": 2.714994487320838, "percentage": 38.79, "elapsed_time": "8:51:53", "remaining_time": "13:59:28"}
986
+ {"current_steps": 4930, "total_steps": 12698, "loss": 0.2479, "lr": 3.070706419356756e-05, "epoch": 2.717750826901874, "percentage": 38.83, "elapsed_time": "8:52:20", "remaining_time": "13:58:47"}
987
+ {"current_steps": 4935, "total_steps": 12698, "loss": 0.1728, "lr": 3.0683834992885535e-05, "epoch": 2.7205071664829106, "percentage": 38.86, "elapsed_time": "8:52:53", "remaining_time": "13:58:15"}
988
+ {"current_steps": 4940, "total_steps": 12698, "loss": 0.1046, "lr": 3.066058560731319e-05, "epoch": 2.723263506063947, "percentage": 38.9, "elapsed_time": "8:53:19", "remaining_time": "13:57:32"}
989
+ {"current_steps": 4945, "total_steps": 12698, "loss": 0.099, "lr": 3.0637316080775396e-05, "epoch": 2.7260198456449833, "percentage": 38.94, "elapsed_time": "8:53:46", "remaining_time": "13:56:52"}
990
+ {"current_steps": 4950, "total_steps": 12698, "loss": 0.108, "lr": 3.0614026457235114e-05, "epoch": 2.7287761852260197, "percentage": 38.98, "elapsed_time": "8:54:08", "remaining_time": "13:56:04"}
991
+ {"current_steps": 4955, "total_steps": 12698, "loss": 0.0958, "lr": 3.059071678069324e-05, "epoch": 2.731532524807056, "percentage": 39.02, "elapsed_time": "8:54:38", "remaining_time": "13:55:27"}
992
+ {"current_steps": 4960, "total_steps": 12698, "loss": 0.1028, "lr": 3.0567387095188586e-05, "epoch": 2.7342888643880925, "percentage": 39.06, "elapsed_time": "8:55:01", "remaining_time": "13:54:41"}
993
+ {"current_steps": 4965, "total_steps": 12698, "loss": 0.163, "lr": 3.054403744479774e-05, "epoch": 2.737045203969129, "percentage": 39.1, "elapsed_time": "8:55:29", "remaining_time": "13:54:01"}
994
+ {"current_steps": 4970, "total_steps": 12698, "loss": 0.1009, "lr": 3.0520667873635044e-05, "epoch": 2.7398015435501653, "percentage": 39.14, "elapsed_time": "8:55:54", "remaining_time": "13:53:17"}
995
+ {"current_steps": 4975, "total_steps": 12698, "loss": 0.124, "lr": 3.0497278425852445e-05, "epoch": 2.7425578831312016, "percentage": 39.18, "elapsed_time": "8:56:24", "remaining_time": "13:52:41"}
996
+ {"current_steps": 4980, "total_steps": 12698, "loss": 0.1196, "lr": 3.0473869145639453e-05, "epoch": 2.745314222712238, "percentage": 39.22, "elapsed_time": "8:57:18", "remaining_time": "13:52:42"}
997
+ {"current_steps": 4985, "total_steps": 12698, "loss": 0.0924, "lr": 3.0450440077223037e-05, "epoch": 2.7480705622932744, "percentage": 39.26, "elapsed_time": "8:57:49", "remaining_time": "13:52:08"}
998
+ {"current_steps": 4990, "total_steps": 12698, "loss": 0.0985, "lr": 3.0426991264867586e-05, "epoch": 2.750826901874311, "percentage": 39.3, "elapsed_time": "8:58:26", "remaining_time": "13:51:43"}
999
+ {"current_steps": 4995, "total_steps": 12698, "loss": 0.0978, "lr": 3.0403522752874754e-05, "epoch": 2.753583241455347, "percentage": 39.34, "elapsed_time": "8:59:00", "remaining_time": "13:51:13"}
1000
+ {"current_steps": 5000, "total_steps": 12698, "loss": 0.1415, "lr": 3.0380034585583425e-05, "epoch": 2.7563395810363835, "percentage": 39.38, "elapsed_time": "8:59:33", "remaining_time": "13:50:42"}
1001
+ {"current_steps": 5005, "total_steps": 12698, "loss": 0.092, "lr": 3.0356526807369624e-05, "epoch": 2.75909592061742, "percentage": 39.42, "elapsed_time": "8:59:55", "remaining_time": "13:49:54"}
1002
+ {"current_steps": 5010, "total_steps": 12698, "loss": 0.1064, "lr": 3.0332999462646414e-05, "epoch": 2.7618522601984563, "percentage": 39.46, "elapsed_time": "9:00:25", "remaining_time": "13:49:17"}
1003
+ {"current_steps": 5015, "total_steps": 12698, "loss": 0.0834, "lr": 3.030945259586385e-05, "epoch": 2.7646085997794927, "percentage": 39.49, "elapsed_time": "9:00:48", "remaining_time": "13:48:31"}
1004
+ {"current_steps": 5020, "total_steps": 12698, "loss": 0.1064, "lr": 3.0285886251508842e-05, "epoch": 2.767364939360529, "percentage": 39.53, "elapsed_time": "9:01:10", "remaining_time": "13:47:43"}
1005
+ {"current_steps": 5025, "total_steps": 12698, "loss": 0.1101, "lr": 3.026230047410511e-05, "epoch": 2.7701212789415655, "percentage": 39.57, "elapsed_time": "9:01:38", "remaining_time": "13:47:03"}
1006
+ {"current_steps": 5030, "total_steps": 12698, "loss": 0.1131, "lr": 3.0238695308213086e-05, "epoch": 2.772877618522602, "percentage": 39.61, "elapsed_time": "9:02:10", "remaining_time": "13:46:30"}
1007
+ {"current_steps": 5035, "total_steps": 12698, "loss": 0.1158, "lr": 3.0215070798429837e-05, "epoch": 2.775633958103638, "percentage": 39.65, "elapsed_time": "9:02:35", "remaining_time": "13:45:48"}
1008
+ {"current_steps": 5040, "total_steps": 12698, "loss": 0.139, "lr": 3.0191426989388985e-05, "epoch": 2.7783902976846746, "percentage": 39.69, "elapsed_time": "9:03:10", "remaining_time": "13:45:20"}
1009
+ {"current_steps": 5045, "total_steps": 12698, "loss": 0.0943, "lr": 3.0167763925760592e-05, "epoch": 2.781146637265711, "percentage": 39.73, "elapsed_time": "9:03:32", "remaining_time": "13:44:32"}
1010
+ {"current_steps": 5050, "total_steps": 12698, "loss": 0.116, "lr": 3.0144081652251107e-05, "epoch": 2.7839029768467474, "percentage": 39.77, "elapsed_time": "9:03:53", "remaining_time": "13:43:42"}
1011
+ {"current_steps": 5055, "total_steps": 12698, "loss": 0.1363, "lr": 3.012038021360328e-05, "epoch": 2.7866593164277838, "percentage": 39.81, "elapsed_time": "9:04:25", "remaining_time": "13:43:08"}
1012
+ {"current_steps": 5060, "total_steps": 12698, "loss": 0.115, "lr": 3.0096659654596064e-05, "epoch": 2.78941565600882, "percentage": 39.85, "elapsed_time": "9:04:56", "remaining_time": "13:42:35"}
1013
+ {"current_steps": 5065, "total_steps": 12698, "loss": 0.1533, "lr": 3.0072920020044533e-05, "epoch": 2.7921719955898565, "percentage": 39.89, "elapsed_time": "9:05:33", "remaining_time": "13:42:09"}
1014
+ {"current_steps": 5070, "total_steps": 12698, "loss": 0.2536, "lr": 3.00491613547998e-05, "epoch": 2.794928335170893, "percentage": 39.93, "elapsed_time": "9:06:16", "remaining_time": "13:41:53"}
1015
+ {"current_steps": 5075, "total_steps": 12698, "loss": 0.1196, "lr": 3.002538370374894e-05, "epoch": 2.7976846747519293, "percentage": 39.97, "elapsed_time": "9:06:47", "remaining_time": "13:41:19"}
1016
+ {"current_steps": 5080, "total_steps": 12698, "loss": 0.1123, "lr": 3.000158711181489e-05, "epoch": 2.8004410143329657, "percentage": 40.01, "elapsed_time": "9:07:19", "remaining_time": "13:40:45"}
1017
+ {"current_steps": 5085, "total_steps": 12698, "loss": 0.1984, "lr": 2.997777162395638e-05, "epoch": 2.803197353914002, "percentage": 40.05, "elapsed_time": "9:08:09", "remaining_time": "13:40:40"}
1018
+ {"current_steps": 5090, "total_steps": 12698, "loss": 0.0956, "lr": 2.9953937285167827e-05, "epoch": 2.8059536934950384, "percentage": 40.09, "elapsed_time": "9:08:43", "remaining_time": "13:40:10"}
1019
+ {"current_steps": 5095, "total_steps": 12698, "loss": 0.1043, "lr": 2.993008414047928e-05, "epoch": 2.808710033076075, "percentage": 40.12, "elapsed_time": "9:09:09", "remaining_time": "13:39:29"}
1020
+ {"current_steps": 5100, "total_steps": 12698, "loss": 0.1062, "lr": 2.9906212234956302e-05, "epoch": 2.811466372657111, "percentage": 40.16, "elapsed_time": "9:09:37", "remaining_time": "13:38:50"}
1021
+ {"current_steps": 5105, "total_steps": 12698, "loss": 0.0951, "lr": 2.9882321613699905e-05, "epoch": 2.8142227122381476, "percentage": 40.2, "elapsed_time": "9:10:08", "remaining_time": "13:38:16"}
1022
+ {"current_steps": 5110, "total_steps": 12698, "loss": 0.0949, "lr": 2.9858412321846467e-05, "epoch": 2.8169790518191844, "percentage": 40.24, "elapsed_time": "9:10:30", "remaining_time": "13:37:27"}
1023
+ {"current_steps": 5115, "total_steps": 12698, "loss": 0.0996, "lr": 2.983448440456764e-05, "epoch": 2.8197353914002203, "percentage": 40.28, "elapsed_time": "9:10:51", "remaining_time": "13:36:38"}
1024
+ {"current_steps": 5120, "total_steps": 12698, "loss": 0.0851, "lr": 2.9810537907070256e-05, "epoch": 2.822491730981257, "percentage": 40.32, "elapsed_time": "9:11:13", "remaining_time": "13:35:51"}
1025
+ {"current_steps": 5125, "total_steps": 12698, "loss": 0.1525, "lr": 2.9786572874596254e-05, "epoch": 2.825248070562293, "percentage": 40.36, "elapsed_time": "9:11:51", "remaining_time": "13:35:28"}
1026
+ {"current_steps": 5130, "total_steps": 12698, "loss": 0.0767, "lr": 2.976258935242259e-05, "epoch": 2.82800441014333, "percentage": 40.4, "elapsed_time": "9:12:17", "remaining_time": "13:34:46"}
1027
+ {"current_steps": 5135, "total_steps": 12698, "loss": 0.0927, "lr": 2.9738587385861164e-05, "epoch": 2.830760749724366, "percentage": 40.44, "elapsed_time": "9:12:41", "remaining_time": "13:34:00"}
1028
+ {"current_steps": 5140, "total_steps": 12698, "loss": 0.0843, "lr": 2.9714567020258712e-05, "epoch": 2.8335170893054027, "percentage": 40.48, "elapsed_time": "9:13:02", "remaining_time": "13:33:13"}
1029
+ {"current_steps": 5145, "total_steps": 12698, "loss": 0.1042, "lr": 2.9690528300996725e-05, "epoch": 2.8362734288864386, "percentage": 40.52, "elapsed_time": "9:13:38", "remaining_time": "13:32:46"}
1030
+ {"current_steps": 5150, "total_steps": 12698, "loss": 0.126, "lr": 2.9666471273491382e-05, "epoch": 2.8390297684674755, "percentage": 40.56, "elapsed_time": "9:14:18", "remaining_time": "13:32:24"}
1031
+ {"current_steps": 5155, "total_steps": 12698, "loss": 0.1294, "lr": 2.9642395983193452e-05, "epoch": 2.8417861080485114, "percentage": 40.6, "elapsed_time": "9:14:51", "remaining_time": "13:31:53"}
1032
+ {"current_steps": 5160, "total_steps": 12698, "loss": 0.1127, "lr": 2.961830247558819e-05, "epoch": 2.844542447629548, "percentage": 40.64, "elapsed_time": "9:15:15", "remaining_time": "13:31:08"}
1033
+ {"current_steps": 5165, "total_steps": 12698, "loss": 0.1259, "lr": 2.9594190796195295e-05, "epoch": 2.847298787210584, "percentage": 40.68, "elapsed_time": "9:15:43", "remaining_time": "13:30:31"}
1034
+ {"current_steps": 5170, "total_steps": 12698, "loss": 0.1401, "lr": 2.957006099056878e-05, "epoch": 2.850055126791621, "percentage": 40.72, "elapsed_time": "9:16:17", "remaining_time": "13:30:00"}
1035
+ {"current_steps": 5175, "total_steps": 12698, "loss": 0.1053, "lr": 2.9545913104296898e-05, "epoch": 2.852811466372657, "percentage": 40.75, "elapsed_time": "9:16:40", "remaining_time": "13:29:15"}
1036
+ {"current_steps": 5180, "total_steps": 12698, "loss": 0.123, "lr": 2.9521747183002086e-05, "epoch": 2.8555678059536937, "percentage": 40.79, "elapsed_time": "9:17:05", "remaining_time": "13:28:31"}
1037
+ {"current_steps": 5185, "total_steps": 12698, "loss": 0.1081, "lr": 2.9497563272340834e-05, "epoch": 2.8583241455347297, "percentage": 40.83, "elapsed_time": "9:17:34", "remaining_time": "13:27:54"}
1038
+ {"current_steps": 5190, "total_steps": 12698, "loss": 0.0958, "lr": 2.947336141800363e-05, "epoch": 2.8610804851157665, "percentage": 40.87, "elapsed_time": "9:18:09", "remaining_time": "13:27:26"}
1039
+ {"current_steps": 5195, "total_steps": 12698, "loss": 0.0956, "lr": 2.9449141665714846e-05, "epoch": 2.8638368246968025, "percentage": 40.91, "elapsed_time": "9:18:42", "remaining_time": "13:26:55"}
1040
+ {"current_steps": 5200, "total_steps": 12698, "loss": 0.0959, "lr": 2.9424904061232687e-05, "epoch": 2.8665931642778393, "percentage": 40.95, "elapsed_time": "9:19:20", "remaining_time": "13:26:31"}
1041
+ {"current_steps": 5205, "total_steps": 12698, "loss": 0.0907, "lr": 2.9400648650349094e-05, "epoch": 2.869349503858875, "percentage": 40.99, "elapsed_time": "9:19:45", "remaining_time": "13:25:49"}
1042
+ {"current_steps": 5210, "total_steps": 12698, "loss": 0.1075, "lr": 2.9376375478889613e-05, "epoch": 2.872105843439912, "percentage": 41.03, "elapsed_time": "9:20:32", "remaining_time": "13:25:38"}
1043
+ {"current_steps": 5215, "total_steps": 12698, "loss": 0.1019, "lr": 2.9352084592713378e-05, "epoch": 2.874862183020948, "percentage": 41.07, "elapsed_time": "9:21:04", "remaining_time": "13:25:04"}
1044
+ {"current_steps": 5220, "total_steps": 12698, "loss": 0.1101, "lr": 2.9327776037712978e-05, "epoch": 2.877618522601985, "percentage": 41.11, "elapsed_time": "9:21:27", "remaining_time": "13:24:20"}
1045
+ {"current_steps": 5225, "total_steps": 12698, "loss": 0.0912, "lr": 2.9303449859814385e-05, "epoch": 2.8803748621830207, "percentage": 41.15, "elapsed_time": "9:21:52", "remaining_time": "13:23:37"}
1046
+ {"current_steps": 5230, "total_steps": 12698, "loss": 0.1003, "lr": 2.927910610497687e-05, "epoch": 2.8831312017640576, "percentage": 41.19, "elapsed_time": "9:22:20", "remaining_time": "13:22:58"}
1047
+ {"current_steps": 5235, "total_steps": 12698, "loss": 0.1049, "lr": 2.925474481919291e-05, "epoch": 2.8858875413450935, "percentage": 41.23, "elapsed_time": "9:22:48", "remaining_time": "13:22:20"}
1048
+ {"current_steps": 5240, "total_steps": 12698, "loss": 0.0824, "lr": 2.9230366048488097e-05, "epoch": 2.8886438809261303, "percentage": 41.27, "elapsed_time": "9:23:11", "remaining_time": "13:21:35"}
1049
+ {"current_steps": 5245, "total_steps": 12698, "loss": 0.1083, "lr": 2.9205969838921065e-05, "epoch": 2.8914002205071663, "percentage": 41.31, "elapsed_time": "9:23:40", "remaining_time": "13:20:57"}
1050
+ {"current_steps": 5250, "total_steps": 12698, "loss": 0.1, "lr": 2.9181556236583385e-05, "epoch": 2.894156560088203, "percentage": 41.35, "elapsed_time": "9:24:03", "remaining_time": "13:20:11"}
1051
+ {"current_steps": 5255, "total_steps": 12698, "loss": 0.1184, "lr": 2.9157125287599508e-05, "epoch": 2.896912899669239, "percentage": 41.38, "elapsed_time": "9:24:33", "remaining_time": "13:19:37"}
1052
+ {"current_steps": 5260, "total_steps": 12698, "loss": 0.1011, "lr": 2.9132677038126637e-05, "epoch": 2.899669239250276, "percentage": 41.42, "elapsed_time": "9:25:06", "remaining_time": "13:19:06"}
1053
+ {"current_steps": 5265, "total_steps": 12698, "loss": 0.1189, "lr": 2.9108211534354672e-05, "epoch": 2.902425578831312, "percentage": 41.46, "elapsed_time": "9:25:27", "remaining_time": "13:18:17"}
1054
+ {"current_steps": 5270, "total_steps": 12698, "loss": 0.1098, "lr": 2.9083728822506103e-05, "epoch": 2.9051819184123486, "percentage": 41.5, "elapsed_time": "9:26:04", "remaining_time": "13:17:52"}
1055
+ {"current_steps": 5275, "total_steps": 12698, "loss": 0.1043, "lr": 2.9059228948835934e-05, "epoch": 2.9079382579933846, "percentage": 41.54, "elapsed_time": "9:26:29", "remaining_time": "13:17:10"}
1056
+ {"current_steps": 5280, "total_steps": 12698, "loss": 0.0956, "lr": 2.9034711959631607e-05, "epoch": 2.9106945975744214, "percentage": 41.58, "elapsed_time": "9:26:54", "remaining_time": "13:16:27"}
1057
+ {"current_steps": 5285, "total_steps": 12698, "loss": 0.0947, "lr": 2.901017790121288e-05, "epoch": 2.9134509371554573, "percentage": 41.62, "elapsed_time": "9:27:13", "remaining_time": "13:15:37"}
1058
+ {"current_steps": 5290, "total_steps": 12698, "loss": 0.1243, "lr": 2.898562681993177e-05, "epoch": 2.916207276736494, "percentage": 41.66, "elapsed_time": "9:27:57", "remaining_time": "13:15:20"}
1059
+ {"current_steps": 5295, "total_steps": 12698, "loss": 0.0868, "lr": 2.8961058762172448e-05, "epoch": 2.91896361631753, "percentage": 41.7, "elapsed_time": "9:28:20", "remaining_time": "13:14:36"}
1060
+ {"current_steps": 5300, "total_steps": 12698, "loss": 0.0962, "lr": 2.8936473774351167e-05, "epoch": 2.921719955898567, "percentage": 41.74, "elapsed_time": "9:28:58", "remaining_time": "13:14:12"}
1061
+ {"current_steps": 5305, "total_steps": 12698, "loss": 0.0959, "lr": 2.891187190291617e-05, "epoch": 2.924476295479603, "percentage": 41.78, "elapsed_time": "9:29:28", "remaining_time": "13:13:36"}
1062
+ {"current_steps": 5310, "total_steps": 12698, "loss": 0.0832, "lr": 2.888725319434758e-05, "epoch": 2.9272326350606397, "percentage": 41.82, "elapsed_time": "9:29:54", "remaining_time": "13:12:55"}
1063
+ {"current_steps": 5315, "total_steps": 12698, "loss": 0.0916, "lr": 2.886261769515734e-05, "epoch": 2.9299889746416756, "percentage": 41.86, "elapsed_time": "9:30:19", "remaining_time": "13:12:13"}
1064
+ {"current_steps": 5320, "total_steps": 12698, "loss": 0.0989, "lr": 2.883796545188912e-05, "epoch": 2.9327453142227125, "percentage": 41.9, "elapsed_time": "9:30:44", "remaining_time": "13:11:32"}
1065
+ {"current_steps": 5325, "total_steps": 12698, "loss": 0.1205, "lr": 2.8813296511118234e-05, "epoch": 2.9355016538037484, "percentage": 41.94, "elapsed_time": "9:31:19", "remaining_time": "13:11:03"}
1066
+ {"current_steps": 5330, "total_steps": 12698, "loss": 0.1134, "lr": 2.8788610919451504e-05, "epoch": 2.938257993384785, "percentage": 41.98, "elapsed_time": "9:31:47", "remaining_time": "13:10:25"}
1067
+ {"current_steps": 5335, "total_steps": 12698, "loss": 0.0831, "lr": 2.8763908723527256e-05, "epoch": 2.941014332965821, "percentage": 42.01, "elapsed_time": "9:32:10", "remaining_time": "13:09:41"}
1068
+ {"current_steps": 5340, "total_steps": 12698, "loss": 0.1208, "lr": 2.8739189970015152e-05, "epoch": 2.943770672546858, "percentage": 42.05, "elapsed_time": "9:32:33", "remaining_time": "13:08:55"}
1069
+ {"current_steps": 5345, "total_steps": 12698, "loss": 0.0952, "lr": 2.8714454705616157e-05, "epoch": 2.946527012127894, "percentage": 42.09, "elapsed_time": "9:32:56", "remaining_time": "13:08:10"}
1070
+ {"current_steps": 5350, "total_steps": 12698, "loss": 0.1018, "lr": 2.868970297706242e-05, "epoch": 2.9492833517089307, "percentage": 42.13, "elapsed_time": "9:33:16", "remaining_time": "13:07:22"}
1071
+ {"current_steps": 5355, "total_steps": 12698, "loss": 0.1134, "lr": 2.8664934831117205e-05, "epoch": 2.9520396912899667, "percentage": 42.17, "elapsed_time": "9:33:44", "remaining_time": "13:06:44"}
1072
+ {"current_steps": 5360, "total_steps": 12698, "loss": 0.1349, "lr": 2.864015031457478e-05, "epoch": 2.9547960308710035, "percentage": 42.21, "elapsed_time": "9:34:24", "remaining_time": "13:06:23"}
1073
+ {"current_steps": 5365, "total_steps": 12698, "loss": 0.1046, "lr": 2.8615349474260345e-05, "epoch": 2.9575523704520394, "percentage": 42.25, "elapsed_time": "9:34:57", "remaining_time": "13:05:52"}
1074
+ {"current_steps": 5370, "total_steps": 12698, "loss": 0.099, "lr": 2.8590532357029955e-05, "epoch": 2.9603087100330763, "percentage": 42.29, "elapsed_time": "9:35:24", "remaining_time": "13:05:12"}
1075
+ {"current_steps": 5375, "total_steps": 12698, "loss": 0.0952, "lr": 2.8565699009770393e-05, "epoch": 2.963065049614112, "percentage": 42.33, "elapsed_time": "9:35:46", "remaining_time": "13:04:26"}
1076
+ {"current_steps": 5380, "total_steps": 12698, "loss": 0.0949, "lr": 2.8540849479399134e-05, "epoch": 2.965821389195149, "percentage": 42.37, "elapsed_time": "9:36:07", "remaining_time": "13:03:39"}
1077
+ {"current_steps": 5385, "total_steps": 12698, "loss": 0.0852, "lr": 2.8515983812864197e-05, "epoch": 2.968577728776185, "percentage": 42.41, "elapsed_time": "9:36:27", "remaining_time": "13:02:50"}
1078
+ {"current_steps": 5390, "total_steps": 12698, "loss": 0.1195, "lr": 2.849110205714411e-05, "epoch": 2.971334068357222, "percentage": 42.45, "elapsed_time": "9:36:47", "remaining_time": "13:02:02"}
1079
+ {"current_steps": 5395, "total_steps": 12698, "loss": 0.086, "lr": 2.8466204259247786e-05, "epoch": 2.9740904079382577, "percentage": 42.49, "elapsed_time": "9:37:12", "remaining_time": "13:01:20"}
1080
+ {"current_steps": 5400, "total_steps": 12698, "loss": 0.0964, "lr": 2.8441290466214453e-05, "epoch": 2.9768467475192946, "percentage": 42.53, "elapsed_time": "9:37:34", "remaining_time": "13:00:34"}
1081
+ {"current_steps": 5405, "total_steps": 12698, "loss": 0.1024, "lr": 2.841636072511355e-05, "epoch": 2.9796030871003305, "percentage": 42.57, "elapsed_time": "9:37:59", "remaining_time": "12:59:52"}
1082
+ {"current_steps": 5410, "total_steps": 12698, "loss": 0.0933, "lr": 2.839141508304466e-05, "epoch": 2.9823594266813673, "percentage": 42.61, "elapsed_time": "9:38:37", "remaining_time": "12:59:28"}
1083
+ {"current_steps": 5415, "total_steps": 12698, "loss": 0.0846, "lr": 2.8366453587137393e-05, "epoch": 2.9851157662624033, "percentage": 42.64, "elapsed_time": "9:39:05", "remaining_time": "12:58:51"}
1084
+ {"current_steps": 5420, "total_steps": 12698, "loss": 0.09, "lr": 2.8341476284551324e-05, "epoch": 2.98787210584344, "percentage": 42.68, "elapsed_time": "9:39:38", "remaining_time": "12:58:20"}
1085
+ {"current_steps": 5425, "total_steps": 12698, "loss": 0.1659, "lr": 2.8316483222475883e-05, "epoch": 2.990628445424476, "percentage": 42.72, "elapsed_time": "9:40:43", "remaining_time": "12:58:32"}
1086
+ {"current_steps": 5430, "total_steps": 12698, "loss": 0.1154, "lr": 2.829147444813028e-05, "epoch": 2.993384785005513, "percentage": 42.76, "elapsed_time": "9:41:16", "remaining_time": "12:58:02"}
1087
+ {"current_steps": 5435, "total_steps": 12698, "loss": 0.1016, "lr": 2.82664500087634e-05, "epoch": 2.996141124586549, "percentage": 42.8, "elapsed_time": "9:41:51", "remaining_time": "12:57:33"}
1088
+ {"current_steps": 5440, "total_steps": 12698, "loss": 0.0879, "lr": 2.8241409951653732e-05, "epoch": 2.9988974641675856, "percentage": 42.84, "elapsed_time": "9:42:14", "remaining_time": "12:56:49"}
1089
+ {"current_steps": 5445, "total_steps": 12698, "loss": 0.1983, "lr": 2.8216354324109284e-05, "epoch": 3.001653803748622, "percentage": 42.88, "elapsed_time": "9:43:27", "remaining_time": "12:57:11"}
1090
+ {"current_steps": 5450, "total_steps": 12698, "loss": 0.2096, "lr": 2.819128317346745e-05, "epoch": 3.0044101433296584, "percentage": 42.92, "elapsed_time": "9:44:41", "remaining_time": "12:57:35"}
1091
+ {"current_steps": 5455, "total_steps": 12698, "loss": 0.2004, "lr": 2.8166196547094986e-05, "epoch": 3.0071664829106948, "percentage": 42.96, "elapsed_time": "9:45:47", "remaining_time": "12:57:48"}
1092
+ {"current_steps": 5460, "total_steps": 12698, "loss": 0.1943, "lr": 2.8141094492387853e-05, "epoch": 3.009922822491731, "percentage": 43.0, "elapsed_time": "9:47:06", "remaining_time": "12:58:17"}
1093
+ {"current_steps": 5465, "total_steps": 12698, "loss": 0.1954, "lr": 2.811597705677118e-05, "epoch": 3.0126791620727675, "percentage": 43.04, "elapsed_time": "9:48:24", "remaining_time": "12:58:46"}
1094
+ {"current_steps": 5470, "total_steps": 12698, "loss": 0.1953, "lr": 2.8090844287699165e-05, "epoch": 3.015435501653804, "percentage": 43.08, "elapsed_time": "9:49:44", "remaining_time": "12:59:17"}
1095
+ {"current_steps": 5475, "total_steps": 12698, "loss": 0.2106, "lr": 2.806569623265495e-05, "epoch": 3.0181918412348403, "percentage": 43.12, "elapsed_time": "9:51:01", "remaining_time": "12:59:43"}
1096
+ {"current_steps": 5480, "total_steps": 12698, "loss": 0.1978, "lr": 2.8040532939150577e-05, "epoch": 3.0209481808158767, "percentage": 43.16, "elapsed_time": "9:52:14", "remaining_time": "13:00:04"}
1097
+ {"current_steps": 5485, "total_steps": 12698, "loss": 0.1925, "lr": 2.8015354454726863e-05, "epoch": 3.023704520396913, "percentage": 43.2, "elapsed_time": "9:53:24", "remaining_time": "13:00:21"}
1098
+ {"current_steps": 5490, "total_steps": 12698, "loss": 0.1828, "lr": 2.7990160826953336e-05, "epoch": 3.0264608599779494, "percentage": 43.24, "elapsed_time": "9:54:24", "remaining_time": "13:00:25"}
1099
+ {"current_steps": 5495, "total_steps": 12698, "loss": 0.1929, "lr": 2.796495210342813e-05, "epoch": 3.029217199558986, "percentage": 43.27, "elapsed_time": "9:55:39", "remaining_time": "13:00:47"}
1100
+ {"current_steps": 5500, "total_steps": 12698, "loss": 0.186, "lr": 2.7939728331777892e-05, "epoch": 3.031973539140022, "percentage": 43.31, "elapsed_time": "9:56:47", "remaining_time": "13:01:02"}
1101
+ {"current_steps": 5505, "total_steps": 12698, "loss": 0.1955, "lr": 2.7914489559657726e-05, "epoch": 3.0347298787210586, "percentage": 43.35, "elapsed_time": "9:57:57", "remaining_time": "13:01:18"}
1102
+ {"current_steps": 5510, "total_steps": 12698, "loss": 0.1808, "lr": 2.788923583475104e-05, "epoch": 3.037486218302095, "percentage": 43.39, "elapsed_time": "9:59:06", "remaining_time": "13:01:33"}
1103
+ {"current_steps": 5515, "total_steps": 12698, "loss": 0.1865, "lr": 2.786396720476951e-05, "epoch": 3.0402425578831314, "percentage": 43.43, "elapsed_time": "10:00:13", "remaining_time": "13:01:45"}
1104
+ {"current_steps": 5520, "total_steps": 12698, "loss": 0.1927, "lr": 2.7838683717452988e-05, "epoch": 3.0429988974641677, "percentage": 43.47, "elapsed_time": "10:01:22", "remaining_time": "13:02:00"}
1105
+ {"current_steps": 5525, "total_steps": 12698, "loss": 0.1838, "lr": 2.7813385420569364e-05, "epoch": 3.045755237045204, "percentage": 43.51, "elapsed_time": "10:02:33", "remaining_time": "13:02:17"}
1106
+ {"current_steps": 5530, "total_steps": 12698, "loss": 0.1898, "lr": 2.778807236191452e-05, "epoch": 3.0485115766262405, "percentage": 43.55, "elapsed_time": "10:03:47", "remaining_time": "13:02:38"}
1107
+ {"current_steps": 5535, "total_steps": 12698, "loss": 0.2051, "lr": 2.7762744589312238e-05, "epoch": 3.051267916207277, "percentage": 43.59, "elapsed_time": "10:04:57", "remaining_time": "13:02:53"}
1108
+ {"current_steps": 5540, "total_steps": 12698, "loss": 0.2005, "lr": 2.7737402150614098e-05, "epoch": 3.0540242557883133, "percentage": 43.63, "elapsed_time": "10:05:57", "remaining_time": "13:02:55"}
1109
+ {"current_steps": 5545, "total_steps": 12698, "loss": 0.1694, "lr": 2.7712045093699372e-05, "epoch": 3.0567805953693497, "percentage": 43.67, "elapsed_time": "10:07:03", "remaining_time": "13:03:05"}
1110
+ {"current_steps": 5550, "total_steps": 12698, "loss": 0.1829, "lr": 2.768667346647496e-05, "epoch": 3.059536934950386, "percentage": 43.71, "elapsed_time": "10:08:16", "remaining_time": "13:03:25"}
1111
+ {"current_steps": 5555, "total_steps": 12698, "loss": 0.1875, "lr": 2.766128731687529e-05, "epoch": 3.0622932745314224, "percentage": 43.75, "elapsed_time": "10:09:28", "remaining_time": "13:03:42"}
1112
+ {"current_steps": 5560, "total_steps": 12698, "loss": 0.1918, "lr": 2.763588669286223e-05, "epoch": 3.065049614112459, "percentage": 43.79, "elapsed_time": "10:10:37", "remaining_time": "13:03:56"}
1113
+ {"current_steps": 5565, "total_steps": 12698, "loss": 0.1867, "lr": 2.761047164242499e-05, "epoch": 3.067805953693495, "percentage": 43.83, "elapsed_time": "10:11:55", "remaining_time": "13:04:20"}
1114
+ {"current_steps": 5570, "total_steps": 12698, "loss": 0.1776, "lr": 2.758504221358003e-05, "epoch": 3.0705622932745316, "percentage": 43.87, "elapsed_time": "10:13:11", "remaining_time": "13:04:42"}
1115
+ {"current_steps": 5575, "total_steps": 12698, "loss": 0.1636, "lr": 2.7559598454370995e-05, "epoch": 3.073318632855568, "percentage": 43.9, "elapsed_time": "10:14:28", "remaining_time": "13:05:06"}
1116
+ {"current_steps": 5580, "total_steps": 12698, "loss": 0.1687, "lr": 2.753414041286858e-05, "epoch": 3.0760749724366043, "percentage": 43.94, "elapsed_time": "10:15:41", "remaining_time": "13:05:23"}
1117
+ {"current_steps": 5585, "total_steps": 12698, "loss": 0.1865, "lr": 2.7508668137170473e-05, "epoch": 3.0788313120176407, "percentage": 43.98, "elapsed_time": "10:16:54", "remaining_time": "13:05:41"}
1118
+ {"current_steps": 5590, "total_steps": 12698, "loss": 0.1768, "lr": 2.748318167540126e-05, "epoch": 3.081587651598677, "percentage": 44.02, "elapsed_time": "10:17:40", "remaining_time": "13:05:25"}
1119
+ {"current_steps": 5595, "total_steps": 12698, "loss": 0.1969, "lr": 2.7457681075712326e-05, "epoch": 3.0843439911797135, "percentage": 44.06, "elapsed_time": "10:18:50", "remaining_time": "13:05:37"}
1120
+ {"current_steps": 5600, "total_steps": 12698, "loss": 0.1997, "lr": 2.7432166386281768e-05, "epoch": 3.08710033076075, "percentage": 44.1, "elapsed_time": "10:20:06", "remaining_time": "13:05:59"}
1121
+ {"current_steps": 5605, "total_steps": 12698, "loss": 0.1995, "lr": 2.7406637655314288e-05, "epoch": 3.0898566703417862, "percentage": 44.14, "elapsed_time": "10:21:16", "remaining_time": "13:06:12"}
1122
+ {"current_steps": 5610, "total_steps": 12698, "loss": 0.1841, "lr": 2.7381094931041134e-05, "epoch": 3.0926130099228226, "percentage": 44.18, "elapsed_time": "10:22:28", "remaining_time": "13:06:27"}
1123
+ {"current_steps": 5615, "total_steps": 12698, "loss": 0.1919, "lr": 2.7355538261719994e-05, "epoch": 3.095369349503859, "percentage": 44.22, "elapsed_time": "10:23:45", "remaining_time": "13:06:50"}
1124
+ {"current_steps": 5620, "total_steps": 12698, "loss": 0.1912, "lr": 2.7329967695634885e-05, "epoch": 3.0981256890848954, "percentage": 44.26, "elapsed_time": "10:25:02", "remaining_time": "13:07:11"}
1125
+ {"current_steps": 5625, "total_steps": 12698, "loss": 0.1898, "lr": 2.7304383281096096e-05, "epoch": 3.1008820286659318, "percentage": 44.3, "elapsed_time": "10:26:17", "remaining_time": "13:07:30"}
1126
+ {"current_steps": 5630, "total_steps": 12698, "loss": 0.1924, "lr": 2.7278785066440058e-05, "epoch": 3.103638368246968, "percentage": 44.34, "elapsed_time": "10:27:35", "remaining_time": "13:07:53"}
1127
+ {"current_steps": 5635, "total_steps": 12698, "loss": 0.193, "lr": 2.7253173100029297e-05, "epoch": 3.1063947078280045, "percentage": 44.38, "elapsed_time": "10:28:51", "remaining_time": "13:08:12"}
1128
+ {"current_steps": 5640, "total_steps": 12698, "loss": 0.1932, "lr": 2.7227547430252315e-05, "epoch": 3.109151047409041, "percentage": 44.42, "elapsed_time": "10:29:58", "remaining_time": "13:08:21"}
1129
+ {"current_steps": 5645, "total_steps": 12698, "loss": 0.1899, "lr": 2.7201908105523496e-05, "epoch": 3.1119073869900773, "percentage": 44.46, "elapsed_time": "10:31:11", "remaining_time": "13:08:36"}
1130
+ {"current_steps": 5650, "total_steps": 12698, "loss": 0.1622, "lr": 2.717625517428303e-05, "epoch": 3.1146637265711137, "percentage": 44.5, "elapsed_time": "10:31:54", "remaining_time": "13:08:15"}
1131
+ {"current_steps": 5655, "total_steps": 12698, "loss": 0.1922, "lr": 2.7150588684996803e-05, "epoch": 3.11742006615215, "percentage": 44.53, "elapsed_time": "10:33:03", "remaining_time": "13:08:26"}
1132
+ {"current_steps": 5660, "total_steps": 12698, "loss": 0.1844, "lr": 2.712490868615633e-05, "epoch": 3.1201764057331864, "percentage": 44.57, "elapsed_time": "10:34:12", "remaining_time": "13:08:37"}
1133
+ {"current_steps": 5665, "total_steps": 12698, "loss": 0.191, "lr": 2.7099215226278635e-05, "epoch": 3.122932745314223, "percentage": 44.61, "elapsed_time": "10:35:26", "remaining_time": "13:08:53"}
1134
+ {"current_steps": 5670, "total_steps": 12698, "loss": 0.1838, "lr": 2.707350835390619e-05, "epoch": 3.125689084895259, "percentage": 44.65, "elapsed_time": "10:36:42", "remaining_time": "13:09:12"}
1135
+ {"current_steps": 5675, "total_steps": 12698, "loss": 0.1834, "lr": 2.7047788117606794e-05, "epoch": 3.1284454244762956, "percentage": 44.69, "elapsed_time": "10:37:56", "remaining_time": "13:09:28"}
1136
+ {"current_steps": 5680, "total_steps": 12698, "loss": 0.1924, "lr": 2.7022054565973498e-05, "epoch": 3.131201764057332, "percentage": 44.73, "elapsed_time": "10:39:15", "remaining_time": "13:09:50"}
1137
+ {"current_steps": 5685, "total_steps": 12698, "loss": 0.1927, "lr": 2.6996307747624514e-05, "epoch": 3.1339581036383684, "percentage": 44.77, "elapsed_time": "10:40:21", "remaining_time": "13:09:56"}
1138
+ {"current_steps": 5690, "total_steps": 12698, "loss": 0.1578, "lr": 2.6970547711203114e-05, "epoch": 3.1367144432194047, "percentage": 44.81, "elapsed_time": "10:41:06", "remaining_time": "13:09:36"}
1139
+ {"current_steps": 5695, "total_steps": 12698, "loss": 0.1841, "lr": 2.6944774505377545e-05, "epoch": 3.139470782800441, "percentage": 44.85, "elapsed_time": "10:42:13", "remaining_time": "13:09:43"}
1140
+ {"current_steps": 5700, "total_steps": 12698, "loss": 0.1866, "lr": 2.6918988178840932e-05, "epoch": 3.1422271223814775, "percentage": 44.89, "elapsed_time": "10:43:27", "remaining_time": "13:09:58"}
1141
+ {"current_steps": 5705, "total_steps": 12698, "loss": 0.1875, "lr": 2.6893188780311182e-05, "epoch": 3.144983461962514, "percentage": 44.93, "elapsed_time": "10:44:34", "remaining_time": "13:10:05"}
1142
+ {"current_steps": 5710, "total_steps": 12698, "loss": 0.179, "lr": 2.686737635853093e-05, "epoch": 3.1477398015435503, "percentage": 44.97, "elapsed_time": "10:45:41", "remaining_time": "13:10:12"}
1143
+ {"current_steps": 5715, "total_steps": 12698, "loss": 0.1854, "lr": 2.6841550962267376e-05, "epoch": 3.1504961411245866, "percentage": 45.01, "elapsed_time": "10:46:54", "remaining_time": "13:10:26"}
1144
+ {"current_steps": 5720, "total_steps": 12698, "loss": 0.1827, "lr": 2.681571264031225e-05, "epoch": 3.153252480705623, "percentage": 45.05, "elapsed_time": "10:48:09", "remaining_time": "13:10:42"}
1145
+ {"current_steps": 5725, "total_steps": 12698, "loss": 0.1895, "lr": 2.678986144148171e-05, "epoch": 3.1560088202866594, "percentage": 45.09, "elapsed_time": "10:48:22", "remaining_time": "13:09:42"}
1146
+ {"current_steps": 5730, "total_steps": 12698, "loss": 0.1704, "lr": 2.6763997414616226e-05, "epoch": 3.158765159867696, "percentage": 45.13, "elapsed_time": "10:48:34", "remaining_time": "13:08:41"}
1147
+ {"current_steps": 5735, "total_steps": 12698, "loss": 0.1668, "lr": 2.673812060858052e-05, "epoch": 3.161521499448732, "percentage": 45.16, "elapsed_time": "10:48:47", "remaining_time": "13:07:42"}
1148
+ {"current_steps": 5740, "total_steps": 12698, "loss": 0.1601, "lr": 2.6712231072263453e-05, "epoch": 3.1642778390297686, "percentage": 45.2, "elapsed_time": "10:48:59", "remaining_time": "13:06:41"}
1149
+ {"current_steps": 5745, "total_steps": 12698, "loss": 0.1694, "lr": 2.6686328854577923e-05, "epoch": 3.167034178610805, "percentage": 45.24, "elapsed_time": "10:49:13", "remaining_time": "13:05:43"}
1150
+ {"current_steps": 5750, "total_steps": 12698, "loss": 0.1666, "lr": 2.6660414004460806e-05, "epoch": 3.1697905181918413, "percentage": 45.28, "elapsed_time": "10:49:25", "remaining_time": "13:04:43"}
1151
+ {"current_steps": 5755, "total_steps": 12698, "loss": 0.1605, "lr": 2.663448657087283e-05, "epoch": 3.1725468577728777, "percentage": 45.32, "elapsed_time": "10:49:36", "remaining_time": "13:03:42"}
1152
+ {"current_steps": 5760, "total_steps": 12698, "loss": 0.1808, "lr": 2.6608546602798512e-05, "epoch": 3.175303197353914, "percentage": 45.36, "elapsed_time": "10:49:48", "remaining_time": "13:02:42"}
1153
+ {"current_steps": 5765, "total_steps": 12698, "loss": 0.1621, "lr": 2.6582594149246035e-05, "epoch": 3.1780595369349505, "percentage": 45.4, "elapsed_time": "10:50:00", "remaining_time": "13:01:41"}
1154
+ {"current_steps": 5770, "total_steps": 12698, "loss": 0.1672, "lr": 2.6556629259247175e-05, "epoch": 3.180815876515987, "percentage": 45.44, "elapsed_time": "10:50:13", "remaining_time": "13:00:43"}
1155
+ {"current_steps": 5775, "total_steps": 12698, "loss": 0.1632, "lr": 2.6530651981857217e-05, "epoch": 3.1835722160970232, "percentage": 45.48, "elapsed_time": "10:50:26", "remaining_time": "12:59:45"}
1156
+ {"current_steps": 5780, "total_steps": 12698, "loss": 0.1632, "lr": 2.6504662366154826e-05, "epoch": 3.1863285556780596, "percentage": 45.52, "elapsed_time": "10:50:39", "remaining_time": "12:58:46"}
1157
+ {"current_steps": 5785, "total_steps": 12698, "loss": 0.1563, "lr": 2.6478660461242e-05, "epoch": 3.189084895259096, "percentage": 45.56, "elapsed_time": "10:50:51", "remaining_time": "12:57:45"}
1158
+ {"current_steps": 5790, "total_steps": 12698, "loss": 0.1452, "lr": 2.6452646316243943e-05, "epoch": 3.1918412348401324, "percentage": 45.6, "elapsed_time": "10:51:03", "remaining_time": "12:56:46"}
1159
+ {"current_steps": 5795, "total_steps": 12698, "loss": 0.1537, "lr": 2.6426619980308988e-05, "epoch": 3.1945975744211688, "percentage": 45.64, "elapsed_time": "10:51:16", "remaining_time": "12:55:47"}
1160
+ {"current_steps": 5800, "total_steps": 12698, "loss": 0.16, "lr": 2.640058150260849e-05, "epoch": 3.197353914002205, "percentage": 45.68, "elapsed_time": "10:51:29", "remaining_time": "12:54:49"}
1161
+ {"current_steps": 5805, "total_steps": 12698, "loss": 0.1668, "lr": 2.6374530932336763e-05, "epoch": 3.2001102535832415, "percentage": 45.72, "elapsed_time": "10:51:43", "remaining_time": "12:53:53"}
1162
+ {"current_steps": 5810, "total_steps": 12698, "loss": 0.164, "lr": 2.6348468318710952e-05, "epoch": 3.202866593164278, "percentage": 45.76, "elapsed_time": "10:51:56", "remaining_time": "12:52:53"}
1163
+ {"current_steps": 5815, "total_steps": 12698, "loss": 0.1516, "lr": 2.6322393710970963e-05, "epoch": 3.2056229327453143, "percentage": 45.79, "elapsed_time": "10:52:09", "remaining_time": "12:51:55"}
1164
+ {"current_steps": 5820, "total_steps": 12698, "loss": 0.163, "lr": 2.6296307158379356e-05, "epoch": 3.2083792723263507, "percentage": 45.83, "elapsed_time": "10:52:23", "remaining_time": "12:50:59"}
1165
+ {"current_steps": 5825, "total_steps": 12698, "loss": 0.1707, "lr": 2.6270208710221253e-05, "epoch": 3.211135611907387, "percentage": 45.87, "elapsed_time": "10:52:38", "remaining_time": "12:50:04"}
1166
+ {"current_steps": 5830, "total_steps": 12698, "loss": 0.1618, "lr": 2.6244098415804272e-05, "epoch": 3.2138919514884234, "percentage": 45.91, "elapsed_time": "10:52:52", "remaining_time": "12:49:06"}
1167
+ {"current_steps": 5835, "total_steps": 12698, "loss": 0.1539, "lr": 2.62179763244584e-05, "epoch": 3.21664829106946, "percentage": 45.95, "elapsed_time": "10:53:04", "remaining_time": "12:48:07"}
1168
+ {"current_steps": 5840, "total_steps": 12698, "loss": 0.1549, "lr": 2.61918424855359e-05, "epoch": 3.219404630650496, "percentage": 45.99, "elapsed_time": "10:53:15", "remaining_time": "12:47:08"}
1169
+ {"current_steps": 5845, "total_steps": 12698, "loss": 0.1593, "lr": 2.616569694841125e-05, "epoch": 3.2221609702315326, "percentage": 46.03, "elapsed_time": "10:53:28", "remaining_time": "12:46:10"}
1170
+ {"current_steps": 5850, "total_steps": 12698, "loss": 0.1624, "lr": 2.6139539762481007e-05, "epoch": 3.224917309812569, "percentage": 46.07, "elapsed_time": "10:53:40", "remaining_time": "12:45:11"}
1171
+ {"current_steps": 5855, "total_steps": 12698, "loss": 0.1592, "lr": 2.6113370977163762e-05, "epoch": 3.2276736493936053, "percentage": 46.11, "elapsed_time": "10:53:55", "remaining_time": "12:44:16"}
1172
+ {"current_steps": 5860, "total_steps": 12698, "loss": 0.1601, "lr": 2.6087190641900005e-05, "epoch": 3.2304299889746417, "percentage": 46.15, "elapsed_time": "10:54:09", "remaining_time": "12:43:20"}
1173
+ {"current_steps": 5865, "total_steps": 12698, "loss": 0.1542, "lr": 2.6060998806152045e-05, "epoch": 3.233186328555678, "percentage": 46.19, "elapsed_time": "10:54:21", "remaining_time": "12:42:21"}
1174
+ {"current_steps": 5870, "total_steps": 12698, "loss": 0.1532, "lr": 2.6034795519403927e-05, "epoch": 3.2359426681367145, "percentage": 46.23, "elapsed_time": "10:54:34", "remaining_time": "12:41:23"}
1175
+ {"current_steps": 5875, "total_steps": 12698, "loss": 0.1636, "lr": 2.600858083116132e-05, "epoch": 3.238699007717751, "percentage": 46.27, "elapsed_time": "10:54:47", "remaining_time": "12:40:26"}
1176
+ {"current_steps": 5880, "total_steps": 12698, "loss": 0.1522, "lr": 2.598235479095145e-05, "epoch": 3.2414553472987873, "percentage": 46.31, "elapsed_time": "10:54:58", "remaining_time": "12:39:27"}
1177
+ {"current_steps": 5885, "total_steps": 12698, "loss": 0.1537, "lr": 2.5956117448322972e-05, "epoch": 3.2442116868798236, "percentage": 46.35, "elapsed_time": "10:55:10", "remaining_time": "12:38:29"}
1178
+ {"current_steps": 5890, "total_steps": 12698, "loss": 0.144, "lr": 2.592986885284591e-05, "epoch": 3.24696802646086, "percentage": 46.39, "elapsed_time": "10:55:22", "remaining_time": "12:37:31"}
1179
+ {"current_steps": 5895, "total_steps": 12698, "loss": 0.1593, "lr": 2.590360905411154e-05, "epoch": 3.2497243660418964, "percentage": 46.42, "elapsed_time": "10:55:34", "remaining_time": "12:36:33"}
1180
+ {"current_steps": 5900, "total_steps": 12698, "loss": 0.1501, "lr": 2.5877338101732293e-05, "epoch": 3.252480705622933, "percentage": 46.46, "elapsed_time": "10:55:46", "remaining_time": "12:35:35"}
1181
+ {"current_steps": 5905, "total_steps": 12698, "loss": 0.1536, "lr": 2.5851056045341704e-05, "epoch": 3.255237045203969, "percentage": 46.5, "elapsed_time": "10:55:58", "remaining_time": "12:34:37"}
1182
+ {"current_steps": 5910, "total_steps": 12698, "loss": 0.1503, "lr": 2.5824762934594256e-05, "epoch": 3.2579933847850056, "percentage": 46.54, "elapsed_time": "10:56:11", "remaining_time": "12:33:41"}
1183
+ {"current_steps": 5915, "total_steps": 12698, "loss": 0.1624, "lr": 2.5798458819165335e-05, "epoch": 3.260749724366042, "percentage": 46.58, "elapsed_time": "10:56:24", "remaining_time": "12:32:43"}
1184
+ {"current_steps": 5920, "total_steps": 12698, "loss": 0.1531, "lr": 2.57721437487511e-05, "epoch": 3.2635060639470783, "percentage": 46.62, "elapsed_time": "10:56:36", "remaining_time": "12:31:46"}
1185
+ {"current_steps": 5925, "total_steps": 12698, "loss": 0.1562, "lr": 2.5745817773068428e-05, "epoch": 3.2662624035281147, "percentage": 46.66, "elapsed_time": "10:56:49", "remaining_time": "12:30:50"}
1186
+ {"current_steps": 5930, "total_steps": 12698, "loss": 0.1602, "lr": 2.571948094185479e-05, "epoch": 3.269018743109151, "percentage": 46.7, "elapsed_time": "10:57:02", "remaining_time": "12:29:53"}
1187
+ {"current_steps": 5935, "total_steps": 12698, "loss": 0.1696, "lr": 2.5693133304868164e-05, "epoch": 3.2717750826901875, "percentage": 46.74, "elapsed_time": "10:57:17", "remaining_time": "12:29:00"}
1188
+ {"current_steps": 5940, "total_steps": 12698, "loss": 0.1531, "lr": 2.5666774911886948e-05, "epoch": 3.274531422271224, "percentage": 46.78, "elapsed_time": "10:57:29", "remaining_time": "12:28:02"}
1189
+ {"current_steps": 5945, "total_steps": 12698, "loss": 0.1542, "lr": 2.5640405812709847e-05, "epoch": 3.2772877618522602, "percentage": 46.82, "elapsed_time": "10:57:43", "remaining_time": "12:27:06"}
1190
+ {"current_steps": 5950, "total_steps": 12698, "loss": 0.1584, "lr": 2.5614026057155822e-05, "epoch": 3.2800441014332966, "percentage": 46.86, "elapsed_time": "10:57:55", "remaining_time": "12:26:09"}
1191
+ {"current_steps": 5955, "total_steps": 12698, "loss": 0.1501, "lr": 2.558763569506394e-05, "epoch": 3.282800441014333, "percentage": 46.9, "elapsed_time": "10:58:07", "remaining_time": "12:25:12"}
1192
+ {"current_steps": 5960, "total_steps": 12698, "loss": 0.1496, "lr": 2.556123477629332e-05, "epoch": 3.2855567805953694, "percentage": 46.94, "elapsed_time": "10:58:19", "remaining_time": "12:24:15"}
1193
+ {"current_steps": 5965, "total_steps": 12698, "loss": 0.146, "lr": 2.5534823350723022e-05, "epoch": 3.2883131201764058, "percentage": 46.98, "elapsed_time": "10:58:31", "remaining_time": "12:23:18"}
1194
+ {"current_steps": 5970, "total_steps": 12698, "loss": 0.1621, "lr": 2.550840146825195e-05, "epoch": 3.291069459757442, "percentage": 47.02, "elapsed_time": "10:58:44", "remaining_time": "12:22:22"}
1195
+ {"current_steps": 5975, "total_steps": 12698, "loss": 0.1564, "lr": 2.548196917879878e-05, "epoch": 3.2938257993384785, "percentage": 47.05, "elapsed_time": "10:58:56", "remaining_time": "12:21:26"}
1196
+ {"current_steps": 5980, "total_steps": 12698, "loss": 0.1525, "lr": 2.5455526532301838e-05, "epoch": 3.296582138919515, "percentage": 47.09, "elapsed_time": "10:59:09", "remaining_time": "12:20:29"}
1197
+ {"current_steps": 5985, "total_steps": 12698, "loss": 0.1514, "lr": 2.5429073578719018e-05, "epoch": 3.2993384785005513, "percentage": 47.13, "elapsed_time": "10:59:21", "remaining_time": "12:19:34"}
1198
+ {"current_steps": 5990, "total_steps": 12698, "loss": 0.1553, "lr": 2.540261036802769e-05, "epoch": 3.3020948180815877, "percentage": 47.17, "elapsed_time": "10:59:35", "remaining_time": "12:18:39"}
1199
+ {"current_steps": 5995, "total_steps": 12698, "loss": 0.158, "lr": 2.53761369502246e-05, "epoch": 3.304851157662624, "percentage": 47.21, "elapsed_time": "10:59:47", "remaining_time": "12:17:42"}
1200
+ {"current_steps": 6000, "total_steps": 12698, "loss": 0.1526, "lr": 2.5349653375325788e-05, "epoch": 3.3076074972436604, "percentage": 47.25, "elapsed_time": "10:59:59", "remaining_time": "12:16:46"}
1201
+ {"current_steps": 6005, "total_steps": 12698, "loss": 0.1533, "lr": 2.5323159693366472e-05, "epoch": 3.310363836824697, "percentage": 47.29, "elapsed_time": "11:00:50", "remaining_time": "12:16:33"}
1202
+ {"current_steps": 6010, "total_steps": 12698, "loss": 0.1511, "lr": 2.529665595440096e-05, "epoch": 3.313120176405733, "percentage": 47.33, "elapsed_time": "11:01:02", "remaining_time": "12:15:37"}
1203
+ {"current_steps": 6015, "total_steps": 12698, "loss": 0.1576, "lr": 2.5270142208502586e-05, "epoch": 3.3158765159867696, "percentage": 47.37, "elapsed_time": "11:01:16", "remaining_time": "12:14:42"}
1204
+ {"current_steps": 6020, "total_steps": 12698, "loss": 0.1619, "lr": 2.5243618505763562e-05, "epoch": 3.318632855567806, "percentage": 47.41, "elapsed_time": "11:01:30", "remaining_time": "12:13:48"}
1205
+ {"current_steps": 6025, "total_steps": 12698, "loss": 0.1474, "lr": 2.5217084896294926e-05, "epoch": 3.3213891951488423, "percentage": 47.45, "elapsed_time": "11:01:41", "remaining_time": "12:12:51"}
1206
+ {"current_steps": 6030, "total_steps": 12698, "loss": 0.1553, "lr": 2.5190541430226432e-05, "epoch": 3.3241455347298787, "percentage": 47.49, "elapsed_time": "11:01:53", "remaining_time": "12:11:54"}
1207
+ {"current_steps": 6035, "total_steps": 12698, "loss": 0.1571, "lr": 2.516398815770645e-05, "epoch": 3.326901874310915, "percentage": 47.53, "elapsed_time": "11:02:05", "remaining_time": "12:10:59"}
1208
+ {"current_steps": 6040, "total_steps": 12698, "loss": 0.1585, "lr": 2.513742512890189e-05, "epoch": 3.3296582138919515, "percentage": 47.57, "elapsed_time": "11:02:18", "remaining_time": "12:10:04"}
1209
+ {"current_steps": 6045, "total_steps": 12698, "loss": 0.1609, "lr": 2.511085239399807e-05, "epoch": 3.332414553472988, "percentage": 47.61, "elapsed_time": "11:02:29", "remaining_time": "12:09:08"}
1210
+ {"current_steps": 6050, "total_steps": 12698, "loss": 0.156, "lr": 2.5084270003198672e-05, "epoch": 3.3351708930540243, "percentage": 47.65, "elapsed_time": "11:02:42", "remaining_time": "12:08:12"}
1211
+ {"current_steps": 6055, "total_steps": 12698, "loss": 0.1586, "lr": 2.5057678006725613e-05, "epoch": 3.3379272326350606, "percentage": 47.68, "elapsed_time": "11:02:53", "remaining_time": "12:07:16"}
1212
+ {"current_steps": 6060, "total_steps": 12698, "loss": 0.1589, "lr": 2.503107645481895e-05, "epoch": 3.340683572216097, "percentage": 47.72, "elapsed_time": "11:03:06", "remaining_time": "12:06:21"}
1213
+ {"current_steps": 6065, "total_steps": 12698, "loss": 0.1639, "lr": 2.5004465397736794e-05, "epoch": 3.3434399117971334, "percentage": 47.76, "elapsed_time": "11:03:19", "remaining_time": "12:05:26"}
1214
+ {"current_steps": 6070, "total_steps": 12698, "loss": 0.1607, "lr": 2.4977844885755228e-05, "epoch": 3.34619625137817, "percentage": 47.8, "elapsed_time": "11:03:34", "remaining_time": "12:04:34"}
1215
+ {"current_steps": 6075, "total_steps": 12698, "loss": 0.1593, "lr": 2.4951214969168177e-05, "epoch": 3.348952590959206, "percentage": 47.84, "elapsed_time": "11:03:47", "remaining_time": "12:03:40"}
1216
+ {"current_steps": 6080, "total_steps": 12698, "loss": 0.1564, "lr": 2.492457569828736e-05, "epoch": 3.3517089305402425, "percentage": 47.88, "elapsed_time": "11:03:58", "remaining_time": "12:02:44"}
1217
+ {"current_steps": 6085, "total_steps": 12698, "loss": 0.1518, "lr": 2.4897927123442135e-05, "epoch": 3.354465270121279, "percentage": 47.92, "elapsed_time": "11:04:11", "remaining_time": "12:01:49"}
1218
+ {"current_steps": 6090, "total_steps": 12698, "loss": 0.1628, "lr": 2.4871269294979473e-05, "epoch": 3.3572216097023153, "percentage": 47.96, "elapsed_time": "11:04:23", "remaining_time": "12:00:54"}
1219
+ {"current_steps": 6095, "total_steps": 12698, "loss": 0.1515, "lr": 2.4844602263263805e-05, "epoch": 3.3599779492833517, "percentage": 48.0, "elapsed_time": "11:04:36", "remaining_time": "11:59:59"}
1220
+ {"current_steps": 6100, "total_steps": 12698, "loss": 0.1495, "lr": 2.481792607867696e-05, "epoch": 3.362734288864388, "percentage": 48.04, "elapsed_time": "11:04:48", "remaining_time": "11:59:04"}
1221
+ {"current_steps": 6105, "total_steps": 12698, "loss": 0.1529, "lr": 2.479124079161805e-05, "epoch": 3.3654906284454245, "percentage": 48.08, "elapsed_time": "11:05:00", "remaining_time": "11:58:09"}
1222
+ {"current_steps": 6110, "total_steps": 12698, "loss": 0.1677, "lr": 2.4764546452503394e-05, "epoch": 3.368246968026461, "percentage": 48.12, "elapsed_time": "11:05:12", "remaining_time": "11:57:15"}
1223
+ {"current_steps": 6115, "total_steps": 12698, "loss": 0.1554, "lr": 2.4737843111766407e-05, "epoch": 3.3710033076074972, "percentage": 48.16, "elapsed_time": "11:05:24", "remaining_time": "11:56:20"}
1224
+ {"current_steps": 6120, "total_steps": 12698, "loss": 0.156, "lr": 2.471113081985752e-05, "epoch": 3.3737596471885336, "percentage": 48.2, "elapsed_time": "11:05:41", "remaining_time": "11:55:30"}
1225
+ {"current_steps": 6125, "total_steps": 12698, "loss": 0.1403, "lr": 2.4684409627244064e-05, "epoch": 3.37651598676957, "percentage": 48.24, "elapsed_time": "11:05:56", "remaining_time": "11:54:38"}
1226
+ {"current_steps": 6130, "total_steps": 12698, "loss": 0.1454, "lr": 2.4657679584410187e-05, "epoch": 3.3792723263506064, "percentage": 48.28, "elapsed_time": "11:06:08", "remaining_time": "11:53:44"}
1227
+ {"current_steps": 6135, "total_steps": 12698, "loss": 0.1549, "lr": 2.4630940741856762e-05, "epoch": 3.3820286659316428, "percentage": 48.31, "elapsed_time": "11:06:20", "remaining_time": "11:52:49"}
1228
+ {"current_steps": 6140, "total_steps": 12698, "loss": 0.1525, "lr": 2.4604193150101287e-05, "epoch": 3.384785005512679, "percentage": 48.35, "elapsed_time": "11:06:34", "remaining_time": "11:51:56"}
1229
+ {"current_steps": 6145, "total_steps": 12698, "loss": 0.1534, "lr": 2.4577436859677795e-05, "epoch": 3.3875413450937155, "percentage": 48.39, "elapsed_time": "11:06:46", "remaining_time": "11:51:02"}
1230
+ {"current_steps": 6150, "total_steps": 12698, "loss": 0.1589, "lr": 2.455067192113674e-05, "epoch": 3.390297684674752, "percentage": 48.43, "elapsed_time": "11:06:59", "remaining_time": "11:50:09"}
1231
+ {"current_steps": 6155, "total_steps": 12698, "loss": 0.1552, "lr": 2.4523898385044924e-05, "epoch": 3.3930540242557883, "percentage": 48.47, "elapsed_time": "11:07:11", "remaining_time": "11:49:15"}
1232
+ {"current_steps": 6160, "total_steps": 12698, "loss": 0.1691, "lr": 2.449711630198539e-05, "epoch": 3.3958103638368247, "percentage": 48.51, "elapsed_time": "11:07:25", "remaining_time": "11:48:22"}
1233
+ {"current_steps": 6165, "total_steps": 12698, "loss": 0.267, "lr": 2.447032572255733e-05, "epoch": 3.398566703417861, "percentage": 48.55, "elapsed_time": "11:08:18", "remaining_time": "11:48:11"}
1234
+ {"current_steps": 6170, "total_steps": 12698, "loss": 0.2486, "lr": 2.4443526697375987e-05, "epoch": 3.4013230429988974, "percentage": 48.59, "elapsed_time": "11:09:03", "remaining_time": "11:47:52"}
1235
+ {"current_steps": 6175, "total_steps": 12698, "loss": 0.2399, "lr": 2.441671927707256e-05, "epoch": 3.404079382579934, "percentage": 48.63, "elapsed_time": "11:10:03", "remaining_time": "11:47:48"}
1236
+ {"current_steps": 6180, "total_steps": 12698, "loss": 0.2407, "lr": 2.4389903512294115e-05, "epoch": 3.40683572216097, "percentage": 48.67, "elapsed_time": "11:10:54", "remaining_time": "11:47:36"}
1237
+ {"current_steps": 6185, "total_steps": 12698, "loss": 0.2503, "lr": 2.4363079453703467e-05, "epoch": 3.4095920617420066, "percentage": 48.71, "elapsed_time": "11:11:43", "remaining_time": "11:47:21"}
1238
+ {"current_steps": 6190, "total_steps": 12698, "loss": 0.2466, "lr": 2.4336247151979128e-05, "epoch": 3.412348401323043, "percentage": 48.75, "elapsed_time": "11:12:33", "remaining_time": "11:47:06"}