{ "epoch": 6.67, "eval_accuracy": 0.47417707399571035, "eval_loss": 2.9272146224975586, "eval_runtime": 749.8561, "eval_samples": 308356, "eval_samples_per_second": 411.22, "eval_steps_per_second": 3.739, "perplexity": 18.675539556158554, "train_loss": 3.9441763886343586, "train_runtime": 197998.8709, "train_samples": 5858758, "train_samples_per_second": 2958.986, "train_steps_per_second": 26.9 }