{ "epoch": 1.0, "eval_loss": 3.1214051246643066, "eval_runtime": 7.9735, "eval_samples_per_second": 0.376, "eval_steps_per_second": 0.125, "perplexity": 22.678222996470602, "total_flos": 1.6465434123436032e+19, "train_loss": 3.1435366572697956, "train_runtime": 166616.0143, "train_samples_per_second": 46.094, "train_steps_per_second": 2.881 }