{ "epoch": 0.83, "eval_accuracy": 0.5855461819146771, "eval_loss": 2.197262763977051, "eval_runtime": 1891.0124, "eval_samples": 308356, "eval_samples_per_second": 163.064, "eval_steps_per_second": 3.398, "perplexity": 9.000343686329554, "train_loss": 2.3200887040276985, "train_runtime": 107983.587, "train_samples": 5858758, "train_samples_per_second": 271.28, "train_steps_per_second": 5.652 }