{ "epoch": 4.888888888888889, "total_flos": 6.236491392252641e+17, "train_loss": 0.4509546727668948, "train_runtime": 4992.3279, "train_samples_per_second": 5.33, "train_steps": 205, "train_steps_per_second": 0.041 }