{ "epoch": 5.9, "eval_loss": 1.4719988107681274, "eval_runtime": 5.2039, "eval_samples": 202, "eval_samples_per_second": 38.817, "eval_steps_per_second": 1.345, "perplexity": 4.35793713301621, "train_loss": 0.9728257921006944, "train_runtime": 2307.7787, "train_samples": 3888, "train_samples_per_second": 10.108, "train_steps_per_second": 0.039 }