{ "epoch": 167.88, "eval_accuracy": 0.6427141769796747, "eval_loss": NaN, "eval_runtime": 2.1292, "eval_samples": 479, "eval_samples_per_second": 224.97, "eval_steps_per_second": 1.879, "perplexity": NaN, "train_loss": 0.00019481298685073851, "train_runtime": 193101.3534, "train_samples": 228639, "train_samples_per_second": 198.859, "train_steps_per_second": 1.554 }