| { |
| "best_metric": 0.18050541516245489, |
| "best_model_checkpoint": "/content/drive/MyDrive/Fine tune/wav2vec2_R/TestModel6/checkpoint-198", |
| "epoch": 27.0, |
| "eval_steps": 500, |
| "global_step": 243, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "grad_norm": 2.6207005977630615, |
| "learning_rate": 2.0454545454545457e-05, |
| "loss": 1.4468, |
| "step": 9 |
| }, |
| { |
| "epoch": 1.0, |
| "eval_loss": 0.9447698593139648, |
| "eval_runtime": 7.468, |
| "eval_samples_per_second": 1.339, |
| "eval_steps_per_second": 0.268, |
| "eval_wer": 0.3458483754512635, |
| "step": 9 |
| }, |
| { |
| "epoch": 2.0, |
| "grad_norm": 0.9180173873901367, |
| "learning_rate": 4.0909090909090915e-05, |
| "loss": 1.0187, |
| "step": 18 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_loss": 0.7252597808837891, |
| "eval_runtime": 7.0648, |
| "eval_samples_per_second": 1.415, |
| "eval_steps_per_second": 0.283, |
| "eval_wer": 0.2772563176895307, |
| "step": 18 |
| }, |
| { |
| "epoch": 3.0, |
| "grad_norm": 1.0308139324188232, |
| "learning_rate": 4.9978417404589105e-05, |
| "loss": 0.7962, |
| "step": 27 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_loss": 0.5624670386314392, |
| "eval_runtime": 7.0549, |
| "eval_samples_per_second": 1.417, |
| "eval_steps_per_second": 0.283, |
| "eval_wer": 0.30541516245487366, |
| "step": 27 |
| }, |
| { |
| "epoch": 4.0, |
| "grad_norm": 1.6524184942245483, |
| "learning_rate": 4.983095894354858e-05, |
| "loss": 0.6591, |
| "step": 36 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_loss": 0.49896639585494995, |
| "eval_runtime": 6.9528, |
| "eval_samples_per_second": 1.438, |
| "eval_steps_per_second": 0.288, |
| "eval_wer": 0.24332129963898916, |
| "step": 36 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 1.9104937314987183, |
| "learning_rate": 4.954463568772415e-05, |
| "loss": 0.5742, |
| "step": 45 |
| }, |
| { |
| "epoch": 5.0, |
| "eval_loss": 0.4727010130882263, |
| "eval_runtime": 7.6581, |
| "eval_samples_per_second": 1.306, |
| "eval_steps_per_second": 0.261, |
| "eval_wer": 0.23249097472924188, |
| "step": 45 |
| }, |
| { |
| "epoch": 6.0, |
| "grad_norm": 0.7306864261627197, |
| "learning_rate": 4.912104887290587e-05, |
| "loss": 0.5231, |
| "step": 54 |
| }, |
| { |
| "epoch": 6.0, |
| "eval_loss": 0.4486842155456543, |
| "eval_runtime": 7.182, |
| "eval_samples_per_second": 1.392, |
| "eval_steps_per_second": 0.278, |
| "eval_wer": 0.21444043321299638, |
| "step": 54 |
| }, |
| { |
| "epoch": 7.0, |
| "grad_norm": 0.8729464411735535, |
| "learning_rate": 4.856256736838498e-05, |
| "loss": 0.4567, |
| "step": 63 |
| }, |
| { |
| "epoch": 7.0, |
| "eval_loss": 0.45621854066848755, |
| "eval_runtime": 7.0189, |
| "eval_samples_per_second": 1.425, |
| "eval_steps_per_second": 0.285, |
| "eval_wer": 0.21516245487364621, |
| "step": 63 |
| }, |
| { |
| "epoch": 8.0, |
| "grad_norm": 0.9639649987220764, |
| "learning_rate": 4.787231442927587e-05, |
| "loss": 0.4934, |
| "step": 72 |
| }, |
| { |
| "epoch": 8.0, |
| "eval_loss": 0.4438972473144531, |
| "eval_runtime": 7.0861, |
| "eval_samples_per_second": 1.411, |
| "eval_steps_per_second": 0.282, |
| "eval_wer": 0.2108303249097473, |
| "step": 72 |
| }, |
| { |
| "epoch": 9.0, |
| "grad_norm": 1.3746402263641357, |
| "learning_rate": 4.7054150230006604e-05, |
| "loss": 0.4516, |
| "step": 81 |
| }, |
| { |
| "epoch": 9.0, |
| "eval_loss": 0.43273186683654785, |
| "eval_runtime": 7.1786, |
| "eval_samples_per_second": 1.393, |
| "eval_steps_per_second": 0.279, |
| "eval_wer": 0.2043321299638989, |
| "step": 81 |
| }, |
| { |
| "epoch": 10.0, |
| "grad_norm": 0.5043421387672424, |
| "learning_rate": 4.61126502766577e-05, |
| "loss": 0.4069, |
| "step": 90 |
| }, |
| { |
| "epoch": 10.0, |
| "eval_loss": 0.43151745200157166, |
| "eval_runtime": 6.9477, |
| "eval_samples_per_second": 1.439, |
| "eval_steps_per_second": 0.288, |
| "eval_wer": 0.1956678700361011, |
| "step": 90 |
| }, |
| { |
| "epoch": 11.0, |
| "grad_norm": 1.8196316957473755, |
| "learning_rate": 4.50530798188761e-05, |
| "loss": 0.4235, |
| "step": 99 |
| }, |
| { |
| "epoch": 11.0, |
| "eval_loss": 0.4364844858646393, |
| "eval_runtime": 7.1022, |
| "eval_samples_per_second": 1.408, |
| "eval_steps_per_second": 0.282, |
| "eval_wer": 0.20144404332129964, |
| "step": 99 |
| }, |
| { |
| "epoch": 12.0, |
| "grad_norm": 0.22248859703540802, |
| "learning_rate": 4.388136440446337e-05, |
| "loss": 0.4004, |
| "step": 108 |
| }, |
| { |
| "epoch": 12.0, |
| "eval_loss": 0.43696457147598267, |
| "eval_runtime": 7.1886, |
| "eval_samples_per_second": 1.391, |
| "eval_steps_per_second": 0.278, |
| "eval_wer": 0.19855595667870035, |
| "step": 108 |
| }, |
| { |
| "epoch": 13.0, |
| "grad_norm": 1.0341521501541138, |
| "learning_rate": 4.2604056741308796e-05, |
| "loss": 0.3652, |
| "step": 117 |
| }, |
| { |
| "epoch": 13.0, |
| "eval_loss": 0.4320377707481384, |
| "eval_runtime": 7.073, |
| "eval_samples_per_second": 1.414, |
| "eval_steps_per_second": 0.283, |
| "eval_wer": 0.19494584837545126, |
| "step": 117 |
| }, |
| { |
| "epoch": 14.0, |
| "grad_norm": 0.6511925458908081, |
| "learning_rate": 4.12283000519888e-05, |
| "loss": 0.3597, |
| "step": 126 |
| }, |
| { |
| "epoch": 14.0, |
| "eval_loss": 0.4305523931980133, |
| "eval_runtime": 7.0901, |
| "eval_samples_per_second": 1.41, |
| "eval_steps_per_second": 0.282, |
| "eval_wer": 0.19133574007220217, |
| "step": 126 |
| }, |
| { |
| "epoch": 15.0, |
| "grad_norm": 0.897441565990448, |
| "learning_rate": 3.9761788125968744e-05, |
| "loss": 0.3701, |
| "step": 135 |
| }, |
| { |
| "epoch": 15.0, |
| "eval_loss": 0.4407591223716736, |
| "eval_runtime": 6.9823, |
| "eval_samples_per_second": 1.432, |
| "eval_steps_per_second": 0.286, |
| "eval_wer": 0.1891696750902527, |
| "step": 135 |
| }, |
| { |
| "epoch": 16.0, |
| "grad_norm": 1.0737636089324951, |
| "learning_rate": 3.821272229281139e-05, |
| "loss": 0.3348, |
| "step": 144 |
| }, |
| { |
| "epoch": 16.0, |
| "eval_loss": 0.4343787729740143, |
| "eval_runtime": 7.07, |
| "eval_samples_per_second": 1.414, |
| "eval_steps_per_second": 0.283, |
| "eval_wer": 0.18483754512635378, |
| "step": 144 |
| }, |
| { |
| "epoch": 17.0, |
| "grad_norm": 0.5325424671173096, |
| "learning_rate": 3.6589765557015145e-05, |
| "loss": 0.3248, |
| "step": 153 |
| }, |
| { |
| "epoch": 17.0, |
| "eval_loss": 0.42944344878196716, |
| "eval_runtime": 7.0553, |
| "eval_samples_per_second": 1.417, |
| "eval_steps_per_second": 0.283, |
| "eval_wer": 0.1884476534296029, |
| "step": 153 |
| }, |
| { |
| "epoch": 18.0, |
| "grad_norm": 0.6885235905647278, |
| "learning_rate": 3.490199415097892e-05, |
| "loss": 0.3212, |
| "step": 162 |
| }, |
| { |
| "epoch": 18.0, |
| "eval_loss": 0.4301183819770813, |
| "eval_runtime": 6.9613, |
| "eval_samples_per_second": 1.437, |
| "eval_steps_per_second": 0.287, |
| "eval_wer": 0.18483754512635378, |
| "step": 162 |
| }, |
| { |
| "epoch": 19.0, |
| "grad_norm": 0.5315946340560913, |
| "learning_rate": 3.31588467770289e-05, |
| "loss": 0.3484, |
| "step": 171 |
| }, |
| { |
| "epoch": 19.0, |
| "eval_loss": 0.4417332112789154, |
| "eval_runtime": 7.0935, |
| "eval_samples_per_second": 1.41, |
| "eval_steps_per_second": 0.282, |
| "eval_wer": 0.1855595667870036, |
| "step": 171 |
| }, |
| { |
| "epoch": 20.0, |
| "grad_norm": 0.6952418684959412, |
| "learning_rate": 3.137007182236637e-05, |
| "loss": 0.3193, |
| "step": 180 |
| }, |
| { |
| "epoch": 20.0, |
| "eval_loss": 0.4366823732852936, |
| "eval_runtime": 6.9514, |
| "eval_samples_per_second": 1.439, |
| "eval_steps_per_second": 0.288, |
| "eval_wer": 0.19061371841155234, |
| "step": 180 |
| }, |
| { |
| "epoch": 21.0, |
| "grad_norm": 0.3309876024723053, |
| "learning_rate": 2.9545672842132273e-05, |
| "loss": 0.3157, |
| "step": 189 |
| }, |
| { |
| "epoch": 21.0, |
| "eval_loss": 0.45008668303489685, |
| "eval_runtime": 6.9279, |
| "eval_samples_per_second": 1.443, |
| "eval_steps_per_second": 0.289, |
| "eval_wer": 0.18411552346570398, |
| "step": 189 |
| }, |
| { |
| "epoch": 22.0, |
| "grad_norm": 0.49725911021232605, |
| "learning_rate": 2.769585261546897e-05, |
| "loss": 0.2985, |
| "step": 198 |
| }, |
| { |
| "epoch": 22.0, |
| "eval_loss": 0.4500831961631775, |
| "eval_runtime": 6.8409, |
| "eval_samples_per_second": 1.462, |
| "eval_steps_per_second": 0.292, |
| "eval_wer": 0.18050541516245489, |
| "step": 198 |
| }, |
| { |
| "epoch": 23.0, |
| "grad_norm": 0.7141502499580383, |
| "learning_rate": 2.5830956087440665e-05, |
| "loss": 0.3284, |
| "step": 207 |
| }, |
| { |
| "epoch": 23.0, |
| "eval_loss": 0.4402785897254944, |
| "eval_runtime": 6.9521, |
| "eval_samples_per_second": 1.438, |
| "eval_steps_per_second": 0.288, |
| "eval_wer": 0.18483754512635378, |
| "step": 207 |
| }, |
| { |
| "epoch": 24.0, |
| "grad_norm": 0.8570722341537476, |
| "learning_rate": 2.3961412515904336e-05, |
| "loss": 0.3057, |
| "step": 216 |
| }, |
| { |
| "epoch": 24.0, |
| "eval_loss": 0.4428979754447937, |
| "eval_runtime": 6.9014, |
| "eval_samples_per_second": 1.449, |
| "eval_steps_per_second": 0.29, |
| "eval_wer": 0.1884476534296029, |
| "step": 216 |
| }, |
| { |
| "epoch": 25.0, |
| "grad_norm": 0.9306482076644897, |
| "learning_rate": 2.2097677146869242e-05, |
| "loss": 0.3062, |
| "step": 225 |
| }, |
| { |
| "epoch": 25.0, |
| "eval_loss": 0.4460487961769104, |
| "eval_runtime": 6.8059, |
| "eval_samples_per_second": 1.469, |
| "eval_steps_per_second": 0.294, |
| "eval_wer": 0.1855595667870036, |
| "step": 225 |
| }, |
| { |
| "epoch": 26.0, |
| "grad_norm": 0.28782331943511963, |
| "learning_rate": 2.0250172744520258e-05, |
| "loss": 0.2985, |
| "step": 234 |
| }, |
| { |
| "epoch": 26.0, |
| "eval_loss": 0.4484630227088928, |
| "eval_runtime": 6.8287, |
| "eval_samples_per_second": 1.464, |
| "eval_steps_per_second": 0.293, |
| "eval_wer": 0.18411552346570398, |
| "step": 234 |
| }, |
| { |
| "epoch": 27.0, |
| "grad_norm": 0.636001706123352, |
| "learning_rate": 1.842923130289262e-05, |
| "loss": 0.2732, |
| "step": 243 |
| }, |
| { |
| "epoch": 27.0, |
| "eval_loss": 0.449407160282135, |
| "eval_runtime": 6.9231, |
| "eval_samples_per_second": 1.444, |
| "eval_steps_per_second": 0.289, |
| "eval_wer": 0.18050541516245489, |
| "step": 243 |
| } |
| ], |
| "logging_steps": 500, |
| "max_steps": 400, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 50, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "EarlyStoppingCallback": { |
| "args": { |
| "early_stopping_patience": 6, |
| "early_stopping_threshold": 0.0 |
| }, |
| "attributes": { |
| "early_stopping_patience_counter": 5 |
| } |
| }, |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": false |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 3.7013666477539267e+18, |
| "train_batch_size": 4, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|