{ "epoch": 9.83, "eval_loss": 2.4514307975769043, "eval_runtime": 229.7941, "eval_samples": 205510, "eval_samples_per_second": 894.323, "eval_steps_per_second": 55.898, "perplexity": 11.604939165014551, "train_loss": 2.5438934391276042, "train_runtime": 220778.1092, "train_samples": 3904699, "train_samples_per_second": 173.93, "train_steps_per_second": 10.871 }