Training in progress, epoch 20, checkpoint

Files changed (6) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b2ced86c9801e4026be1866776c08ce5492085a1175dafe22ada264e86f7429d
 size 437961700

 version https://git-lfs.github.com/spec/v1
+oid sha256:69b8a1fbb0b2ebabc7c5f8e8d5ec25388cfef2747f737797e282dcd01b2a50bc
 size 437961700

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e3dcddf7bb6f2e8c0e8f3643f658d18e7a5b96ecb3471c2d3a9d09d724bad43b
 size 4748067

 version https://git-lfs.github.com/spec/v1
+oid sha256:548e94dc2685e005b0d7e57dbcabd457777d3eaaa84ead92f32763cc36dfa36d
 size 4748067

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fb9e414eff58722d667823de371e35357986a30e64b45bc494d4828098d21f8a
 size 14645

 version https://git-lfs.github.com/spec/v1
+oid sha256:74236b95568a925beb79e7faf7870231eb1e38b3bfebea880411163d4b5261b1
 size 14645

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b37f55e0b7fd54d79a33d1831f931fecb2307d10ee17c884fd456e2c04818e63
 size 1383

 version https://git-lfs.github.com/spec/v1
+oid sha256:b0f37305dcafcb7d1b99695ee592b933dde91868bc75eb3897eb1e1cbce31146
 size 1383

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5326aad5a305cb353756fdbafb0841ec9b31231063515dd7ba118b57c91e3aac
 size 1465

 version https://git-lfs.github.com/spec/v1
+oid sha256:93868e507dd0a2ffbdee1d3242238179b3c04f412293c025930b9b63d57cd536
 size 1465

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -2,9 +2,9 @@
   "best_global_step": 2548,
   "best_metric": 2.07909893989563,
   "best_model_checkpoint": "./bert-resume/checkpoint-2548",
-  "epoch": 19.0,
   "eval_steps": 500,
-  "global_step": 3724,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -209,6 +209,14 @@
       "eval_samples_per_second": 58.519,
       "eval_steps_per_second": 1.83,
       "step": 3724
     }
   ],
   "logging_steps": 500,
@@ -223,12 +231,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 3.119972596076851e+16,
   "train_batch_size": 32,
   "trial_name": null,
   "trial_params": null

   "best_global_step": 2548,
   "best_metric": 2.07909893989563,
   "best_model_checkpoint": "./bert-resume/checkpoint-2548",
+  "epoch": 20.0,
   "eval_steps": 500,
+  "global_step": 3920,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 58.519,
       "eval_steps_per_second": 1.83,
       "step": 3724
+    },
+    {
+      "epoch": 20.0,
+      "eval_loss": 2.0794472694396973,
+      "eval_runtime": 30.0698,
+      "eval_samples_per_second": 58.497,
+      "eval_steps_per_second": 1.829,
+      "step": 3920
     }
   ],
   "logging_steps": 500,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 3.284181680080896e+16,
   "train_batch_size": 32,
   "trial_name": null,
   "trial_params": null