{ "epoch": 5.0, "eval_loss": 1.3518991470336914, "eval_runtime": 4.6868, "eval_samples": 800, "eval_samples_per_second": 170.691, "eval_steps_per_second": 21.336, "perplexity": 3.864758309760122, "train_loss": 1.626130136269521, "train_runtime": 5849.5407, "train_samples": 15300, "train_samples_per_second": 13.078, "train_steps_per_second": 1.635 }