{ "epoch": 4.71, "eval_loss": 1.5495115518569946, "eval_runtime": 200.1691, "eval_samples": 181300, "eval_samples_per_second": 905.734, "eval_steps_per_second": 3.542, "perplexity": 4.709169435672752, "train_loss": 0.5639808364868164, "train_runtime": 35161.1614, "train_samples": 4349088, "train_samples_per_second": 582.461, "train_steps_per_second": 0.284 }