{ "epoch": 1.0, "eval_loss": 1.750352382659912, "eval_runtime": 1628.7902, "eval_samples_per_second": 76.532, "eval_steps_per_second": 9.567, "perplexity": 5.7566308555301, "total_flos": 7.631778497299481e+18, "train_loss": 2.1485319636500972, "train_runtime": 14119.5859, "train_samples_per_second": 35.382, "train_steps_per_second": 4.423 }