{ "epoch": 1.0, "eval_loss": 2.0019874572753906, "eval_runtime": 54.4001, "eval_samples_per_second": 22.022, "eval_steps_per_second": 2.757, "perplexity": 7.403756135241051, "total_flos": 9.84840481406976e+16, "train_loss": 2.112572115185123, "train_runtime": 1452.1865, "train_samples_per_second": 7.455, "train_steps_per_second": 3.727 }