{ "epoch": 1.0, "eval_loss": 4.021326541900635, "eval_runtime": 8.2548, "eval_samples_per_second": 1.211, "eval_steps_per_second": 0.363, "perplexity": 55.77504470825612, "total_flos": 1.78310533349376e+18, "train_loss": 3.701560302754243, "train_runtime": 68412.5844, "train_samples_per_second": 28.065, "train_steps_per_second": 7.016 }