{ "epoch": 0.85, "eval_accuracy": 0.15112417542322987, "eval_loss": 6.060698509216309, "eval_runtime": 1562.4042, "eval_samples": 308356, "eval_samples_per_second": 197.36, "eval_steps_per_second": 4.112, "perplexity": 428.6747655797377, "train_loss": 6.324463086895448, "train_runtime": 89974.5083, "train_samples": 5858758, "train_samples_per_second": 325.579, "train_steps_per_second": 6.783 }