{ "epoch": 1.0, "eval_loss": 1.9169865846633911, "eval_runtime": 6.1838, "eval_samples_per_second": 13.746, "eval_steps_per_second": 1.779, "perplexity": 6.800435026787768, "total_flos": 8396029742284800.0, "train_loss": 2.2311009658879533, "train_runtime": 144.4923, "train_samples_per_second": 6.395, "train_steps_per_second": 3.197 }