{ "initial_eval_loss": 0.6070852279663086, "initial_eval_model_preparation_time": 0.0369, "initial_eval_runtime": 351.3242, "initial_eval_samples_per_second": 0.313, "initial_eval_steps_per_second": 0.313, "epoch": 0, "initial_eval_perplexity": 1.8350747712770092 }