Commit ·
8d3be93
1
Parent(s): 5f6916a
Training in progress, step 56800
Browse files
- {checkpoint-42600 → checkpoint-56800}/config.json +0 -0
- {checkpoint-42600 → checkpoint-56800}/optimizer.pt +1 -1
- {checkpoint-42600 → checkpoint-56800}/preprocessor_config.json +0 -0
- {checkpoint-42600 → checkpoint-56800}/pytorch_model.bin +1 -1
- {checkpoint-42600 → checkpoint-56800}/rng_state.pth +1 -1
- {checkpoint-42600 → checkpoint-56800}/scaler.pt +1 -1
- {checkpoint-42600 → checkpoint-56800}/scheduler.pt +1 -1
- {checkpoint-42600 → checkpoint-56800}/trainer_state.json +33 -3
- {checkpoint-42600 → checkpoint-56800}/training_args.bin +0 -0
- pytorch_model.bin +1 -1
- runs/Apr02_11-39-56_364af271dda7/events.out.tfevents.1775136463.364af271dda7.26706.0 +2 -2
{checkpoint-42600 → checkpoint-56800}/config.json
RENAMED
|
File without changes
|
{checkpoint-42600 → checkpoint-56800}/optimizer.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 721687098
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6d239faa9fff93ab890500865996a20c6609e11c84a8722536e9cf5caa02a5e4
|
| 3 |
size 721687098
|
{checkpoint-42600 → checkpoint-56800}/preprocessor_config.json
RENAMED
|
File without changes
|
{checkpoint-42600 → checkpoint-56800}/pytorch_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 377673950
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1667da094d4e850422b2a4351a457c341ba3faa9fe24afab30d76557b9cc7783
|
| 3 |
size 377673950
|
{checkpoint-42600 → checkpoint-56800}/rng_state.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14308
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69520be733ce3c62aac8e519ecfec10db86b8d268a18251b920f5538a794fe5a
|
| 3 |
size 14308
|
{checkpoint-42600 → checkpoint-56800}/scaler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c314e454d6b8968b90afae3bbc3ca5e73780f0af94b546a8ad2128097d22104a
|
| 3 |
size 988
|
{checkpoint-42600 → checkpoint-56800}/scheduler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7338ad7686598f45591f3dbb5e645c8a345976f35f07fe14f5f9eeea5f0afcbe
|
| 3 |
size 1064
|
{checkpoint-42600 → checkpoint-56800}/trainer_state.json
RENAMED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": 0.711880624294281,
|
| 3 |
"best_model_checkpoint": "JuanPajero/FT-S5-LM/checkpoint-28400",
|
| 4 |
-
"epoch":
|
| 5 |
-
"global_step":
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -96,11 +96,41 @@
|
|
| 96 |
"eval_steps_per_second": 2.033,
|
| 97 |
"eval_wer": 0.2705310068428191,
|
| 98 |
"step": 42600
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 99 |
}
|
| 100 |
],
|
| 101 |
"max_steps": 71900,
|
| 102 |
"num_train_epochs": 10,
|
| 103 |
-
"total_flos":
|
| 104 |
"trial_name": null,
|
| 105 |
"trial_params": null
|
| 106 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": 0.711880624294281,
|
| 3 |
"best_model_checkpoint": "JuanPajero/FT-S5-LM/checkpoint-28400",
|
| 4 |
+
"epoch": 7.899860917941585,
|
| 5 |
+
"global_step": 56800,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 96 |
"eval_steps_per_second": 2.033,
|
| 97 |
"eval_wer": 0.2705310068428191,
|
| 98 |
"step": 42600
|
| 99 |
+
},
|
| 100 |
+
{
|
| 101 |
+
"epoch": 6.91,
|
| 102 |
+
"learning_rate": 1.0300880853036624e-05,
|
| 103 |
+
"loss": 0.2431,
|
| 104 |
+
"step": 49700
|
| 105 |
+
},
|
| 106 |
+
{
|
| 107 |
+
"epoch": 6.91,
|
| 108 |
+
"eval_loss": 0.7319042682647705,
|
| 109 |
+
"eval_runtime": 1221.2572,
|
| 110 |
+
"eval_samples_per_second": 16.318,
|
| 111 |
+
"eval_steps_per_second": 2.04,
|
| 112 |
+
"eval_wer": 0.2662402227230545,
|
| 113 |
+
"step": 49700
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"epoch": 7.9,
|
| 117 |
+
"learning_rate": 7.010662957811776e-06,
|
| 118 |
+
"loss": 0.2315,
|
| 119 |
+
"step": 56800
|
| 120 |
+
},
|
| 121 |
+
{
|
| 122 |
+
"epoch": 7.9,
|
| 123 |
+
"eval_loss": 0.7422261238098145,
|
| 124 |
+
"eval_runtime": 1219.7016,
|
| 125 |
+
"eval_samples_per_second": 16.338,
|
| 126 |
+
"eval_steps_per_second": 2.042,
|
| 127 |
+
"eval_wer": 0.26504196453155754,
|
| 128 |
+
"step": 56800
|
| 129 |
}
|
| 130 |
],
|
| 131 |
"max_steps": 71900,
|
| 132 |
"num_train_epochs": 10,
|
| 133 |
+
"total_flos": 6.787551470604595e+19,
|
| 134 |
"trial_name": null,
|
| 135 |
"trial_params": null
|
| 136 |
}
|
{checkpoint-42600 → checkpoint-56800}/training_args.bin
RENAMED
|
File without changes
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 377673950
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1667da094d4e850422b2a4351a457c341ba3faa9fe24afab30d76557b9cc7783
|
| 3 |
size 377673950
|
runs/Apr02_11-39-56_364af271dda7/events.out.tfevents.1775136463.364af271dda7.26706.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:006688382b8c231881b0a48e551a98d4e1a1f07d7e8f09774bf5c0c73b4c6cf9
|
| 3 |
+
size 6522
|