{ "epoch": 5.05, "eval_loss": 1.942165732383728, "eval_runtime": 459.5033, "eval_samples": 400000, "eval_samples_per_second": 870.505, "eval_steps_per_second": 54.407, "perplexity": 6.97383809440389, "train_loss": 2.0860133251953124, "train_runtime": 289964.3288, "train_samples": 7600000, "train_samples_per_second": 132.43, "train_steps_per_second": 8.277 }