{ "epoch": 3.06, "eval_accuracy": 0.17367944889882433, "eval_loss": 5.767988204956055, "eval_runtime": 1121.2169, "eval_samples": 308356, "eval_samples_per_second": 275.019, "eval_steps_per_second": 4.912, "perplexity": 319.89352464992356, "train_loss": 6.214869752465887, "train_runtime": 199028.524, "train_samples": 5858758, "train_samples_per_second": 147.184, "train_steps_per_second": 2.628 }