{ "epoch": 3.0, "eval_loss": 1.6137232780456543, "eval_runtime": 529.2083, "eval_samples": 9423, "eval_samples_per_second": 17.806, "eval_steps_per_second": 1.113, "perplexity": 5.021472804605811, "train_loss": 1.6269652545171758, "train_runtime": 39015.8853, "train_samples": 102048, "train_samples_per_second": 7.847, "train_steps_per_second": 0.327 }