{ "epoch": 8.0, "eval_accuracy": 0.16528946828166702, "eval_loss": 6.006351470947266, "eval_runtime": 28.9332, "eval_samples": 4053, "eval_samples_per_second": 140.081, "eval_steps_per_second": 35.046, "perplexity": 405.99931440686527, "total_flos": 4.223778440028365e+16, "train_loss": 2.356345704317949, "train_runtime": 3822.1574, "train_samples": 80219, "train_samples_per_second": 167.903, "train_steps_per_second": 10.495 }