{ "epoch": 3.0, "eval_loss": 1.920763373374939, "eval_runtime": 81.4759, "eval_samples": 5193, "eval_samples_per_second": 63.737, "eval_steps_per_second": 7.978, "perplexity": 6.826167395302532, "train_loss": 2.110191111022448, "train_runtime": 17635.5568, "train_samples": 98673, "train_samples_per_second": 16.785, "train_steps_per_second": 0.262 }