{ "epoch": 2.62, "eval_loss": 2.006091594696045, "eval_runtime": 861.4578, "eval_samples": 771820, "eval_samples_per_second": 895.946, "eval_steps_per_second": 55.997, "perplexity": 7.4342046074668735, "train_loss": 2.133689431966146, "train_runtime": 416842.919, "train_samples": 14664588, "train_samples_per_second": 92.121, "train_steps_per_second": 5.758 }