{ "epoch": 1.0, "eval_loss": 3.381364107131958, "eval_runtime": 8.4739, "eval_samples_per_second": 0.354, "eval_steps_per_second": 0.118, "perplexity": 29.41086333045894, "total_flos": 2.295939729457152e+19, "train_loss": 3.214656148060163, "train_runtime": 141094.738, "train_samples_per_second": 54.432, "train_steps_per_second": 3.402 }