{ "epoch": 500.0, "eval_loss": 0.038116455078125, "eval_runtime": 2.8548, "eval_samples": 324, "eval_samples_per_second": 113.495, "eval_steps_per_second": 14.362, "perplexity": 1.0388522054491718, "train_loss": 0.09131514180790294, "train_runtime": 19622.0994, "train_samples": 704, "train_samples_per_second": 17.939, "train_steps_per_second": 1.121 }