{ "epoch": 1.0, "eval_loss": 1.9000619649887085, "eval_runtime": 18.3283, "eval_samples_per_second": 21.988, "eval_steps_per_second": 2.783, "perplexity": 6.686308746488937, "total_flos": 5.10776634114048e+16, "train_loss": 2.1906768205718286, "train_runtime": 755.3629, "train_samples_per_second": 7.416, "train_steps_per_second": 3.708 }