Training in progress, epoch 5, checkpoint

Files changed (6) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eb7b9ee5d5a289ecee12276ea139b3446e5d2b0749738e76ee12ab4e6815011a
 size 437958624

 version https://git-lfs.github.com/spec/v1
+oid sha256:210856a64940b579b6ac438055db28bb7947047d7b751c78767ac9a639d94c3e
 size 437958624

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f52c9c737c0616d379ccd0e217fd4da602c37c20f09befad90a3b45ec2414448
 size 4741923

 version https://git-lfs.github.com/spec/v1
+oid sha256:11bbc5b49b7537c8c7e5902cd575557135d769301c92827b5f9ddf71ab88e3d7
 size 4741923

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6fb370ab700093b2f074f90e23d7f00c5453a68d643bf15d029b1e8596742be3
 size 14645

 version https://git-lfs.github.com/spec/v1
+oid sha256:d44b4f35543873087c1cf6328742bd57e22ab2a916a6a3f007a76de03ee9cbab
 size 14645

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a9343bdb5d2121fead6995ccf81e3591c0ddf27b60c835e5527a4bd7a66af257
 size 1383

 version https://git-lfs.github.com/spec/v1
+oid sha256:8e1ac30298048a080369699ec7fa0a715c4c2d28ff44da425171525f8394b890
 size 1383

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b6e8e008c9fcdd6b519f5ca1b89689630a9e27532a04ab80fd57e825818c9a4a
 size 1465

 version https://git-lfs.github.com/spec/v1
+oid sha256:2909836fc184f92a445a91a7ebd6fe5b3c1c5b6a8f29fd49d1721b035d5f5860
 size 1465

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,10 +1,10 @@
 {
-  "best_global_step": 1868,
-  "best_metric": 0.5720958113670349,
-  "best_model_checkpoint": "./bert-email/checkpoint-1868",
-  "epoch": 4.0,
   "eval_steps": 500,
-  "global_step": 1868,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -61,6 +61,21 @@
       "eval_samples_per_second": 55.764,
       "eval_steps_per_second": 1.749,
       "step": 1868
     }
   ],
   "logging_steps": 500,
@@ -75,12 +90,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 1.57024677838848e+16,
   "train_batch_size": 32,
   "trial_name": null,
   "trial_params": null

 {
+  "best_global_step": 2335,
+  "best_metric": 0.5627617239952087,
+  "best_model_checkpoint": "./bert-email/checkpoint-2335",
+  "epoch": 5.0,
   "eval_steps": 500,
+  "global_step": 2335,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 55.764,
       "eval_steps_per_second": 1.749,
       "step": 1868
+    },
+    {
+      "epoch": 4.282655246252677,
+      "grad_norm": 1.6766972541809082,
+      "learning_rate": 1.4389721627408994e-06,
+      "loss": 0.6073400268554687,
+      "step": 2000
+    },
+    {
+      "epoch": 5.0,
+      "eval_loss": 0.5627617239952087,
+      "eval_runtime": 66.8913,
+      "eval_samples_per_second": 55.762,
+      "eval_steps_per_second": 1.749,
+      "step": 2335
     }
   ],
   "logging_steps": 500,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 1.9628084729856e+16,
   "train_batch_size": 32,
   "trial_name": null,
   "trial_params": null