{ "epoch": 3.02, "eval_accuracy": 0.5056511877490866, "eval_loss": 2.8022732734680176, "eval_runtime": 1319.1397, "eval_samples": 308356, "eval_samples_per_second": 233.755, "eval_steps_per_second": 4.175, "perplexity": 16.48207247360368, "train_loss": 4.694392849819643, "train_runtime": 197999.2569, "train_samples": 5858758, "train_samples_per_second": 2958.98, "train_steps_per_second": 52.839 }