{ "epoch": 1.0, "eval_loss": 6.96756649017334, "eval_runtime": 8.0075, "eval_samples_per_second": 0.375, "eval_steps_per_second": 0.125, "perplexity": 1061.6361026099812, "total_flos": 1.6465434123436032e+19, "train_loss": 1.934643552494049, "train_runtime": 49285.6778, "train_samples_per_second": 155.826, "train_steps_per_second": 9.739 }