{ "epoch": 15.82, "eval_accuracy": 0.14704149331934327, "eval_loss": 6.142465114593506, "eval_runtime": 406.9014, "eval_samples": 308356, "eval_samples_per_second": 757.815, "eval_steps_per_second": 4.212, "perplexity": 465.1989272263101, "train_loss": 6.343742852633573, "train_runtime": 197999.4151, "train_samples": 5858758, "train_samples_per_second": 2958.977, "train_steps_per_second": 16.439 }