{ "epoch": 10.0, "eval_loss": 2.990234375, "eval_runtime": 125.3791, "eval_samples": 240, "eval_samples_per_second": 1.914, "eval_steps_per_second": 0.096, "perplexity": 19.89034374461794, "train_loss": 3.1787637246621623, "train_runtime": 4372.4031, "train_samples": 114248, "train_samples_per_second": 261.293, "train_steps_per_second": 0.254 }