{ "epoch": 4.0, "eval_loss": 2.4018473625183105, "eval_runtime": 343.4017, "eval_samples_per_second": 205.89, "eval_steps_per_second": 1.61, "perplexity": 11.043559004771115, "total_flos": 4159012790599680.0, "train_loss": 0.7021765150223461, "train_runtime": 17437.0559, "train_samples_per_second": 145.971, "train_steps_per_second": 2.281 }