{ "epoch": 10.11, "eval_loss": 2.560811996459961, "eval_runtime": 225.5262, "eval_samples": 200000, "eval_samples_per_second": 886.815, "eval_steps_per_second": 55.426, "perplexity": 12.94632541910408, "train_loss": 2.9681437548828127, "train_runtime": 221059.9809, "train_samples": 3799999, "train_samples_per_second": 173.709, "train_steps_per_second": 10.857 }