{ "epoch": 1.35, "eval_accuracy": 0.7117631908735097, "eval_loss": 1.3268314599990845, "eval_runtime": 3605.525, "eval_samples": 4955347, "eval_samples_per_second": 1374.376, "eval_steps_per_second": 5.369, "perplexity": 3.769081960487532, "train_loss": 1.5473345408935546, "train_runtime": 243315.0329, "train_samples": 94568241, "train_samples_per_second": 526.067, "train_steps_per_second": 2.055 }