{ "epoch": 3.0, "eval_loss": 1.5619168281555176, "eval_runtime": 63.0861, "eval_samples": 42251, "eval_samples_per_second": 669.735, "eval_steps_per_second": 83.727, "perplexity": 4.76795183577856, "train_loss": 1.8846093698359827, "train_runtime": 20632.0794, "train_samples": 802763, "train_samples_per_second": 116.725, "train_steps_per_second": 14.591 }