{ "epoch": 1.0, "eval_loss": 2.060576915740967, "eval_runtime": 187.7576, "eval_samples": 100000, "eval_samples_per_second": 532.602, "eval_steps_per_second": 66.575, "perplexity": 7.850497579750318, "train_loss": 0.24544810387602325, "train_runtime": 44838.2229, "train_samples": 64750662, "train_samples_per_second": 1444.095, "train_steps_per_second": 5.641 }