{ "epoch": 500.0, "eval_loss": 6.0234375, "eval_runtime": 2.3608, "eval_samples": 9, "eval_samples_per_second": 3.812, "eval_steps_per_second": 0.847, "perplexity": 412.9958316281291, "train_loss": 0.36582159678141274, "train_runtime": 9345.1631, "train_samples": 23, "train_samples_per_second": 1.231, "train_steps_per_second": 0.161 }