{ "epoch": 1.72, "eval_accuracy": 0.44304308255003333, "eval_loss": 3.2766900062561035, "eval_runtime": 1728.7154, "eval_samples": 308356, "eval_samples_per_second": 178.373, "eval_steps_per_second": 3.717, "perplexity": 26.487952480866188, "train_loss": 5.009029721765974, "train_runtime": 198560.4752, "train_samples": 5858758, "train_samples_per_second": 147.531, "train_steps_per_second": 3.074 }