{ "epoch": 3.0, "eval_accuracy": 0.4740019077647743, "eval_loss": 3.1173603534698486, "eval_runtime": 6169.3155, "eval_samples": 2812170, "eval_samples_per_second": 455.832, "eval_steps_per_second": 1.781, "perplexity": 22.586680033328033, "train_loss": 3.5860012905026264, "train_runtime": 1342569.7438, "train_samples": 25309522, "train_samples_per_second": 56.555, "train_steps_per_second": 0.221 }