{ "epoch": 1.0, "eval_loss": 3.519840955734253, "eval_runtime": 6.8599, "eval_samples_per_second": 1.458, "eval_steps_per_second": 0.437, "perplexity": 33.77905567149807, "total_flos": 5.9174692061184e+17, "train_loss": 3.8328423178553583, "train_runtime": 75170.0745, "train_samples_per_second": 25.542, "train_steps_per_second": 6.386 }