{ "epoch": 2.58, "eval_accuracy": 0.15118347474846977, "eval_loss": 6.042614459991455, "eval_runtime": 1256.9952, "eval_samples": 308356, "eval_samples_per_second": 245.312, "eval_steps_per_second": 4.381, "perplexity": 420.9922647471828, "train_loss": 6.298876106775028, "train_runtime": 198451.5423, "train_samples": 5858758, "train_samples_per_second": 147.612, "train_steps_per_second": 2.636 }