{ "epoch": 1.0, "eval_loss": 2.18013596534729, "eval_runtime": 9.846, "eval_samples_per_second": 22.141, "eval_steps_per_second": 2.844, "perplexity": 8.847509131596244, "total_flos": 2.42426139967488e+16, "train_loss": 2.3308336977473276, "train_runtime": 355.7712, "train_samples_per_second": 7.508, "train_steps_per_second": 3.755 }