{ "avg_step_time": 7.642647361755371, "epoch": 0.02, "total_flos": 9621820885958656.0, "total_training_time": 93.81911158561707, "total_training_time_mins": 1.5636518597602844, "train_loss": 3.0537273406982424, "train_runtime": 83.3739, "train_samples_per_second": 9.595, "train_steps_per_second": 0.12 }