{ "epoch": 3.0, "eval_loss": 0.7738651633262634, "eval_runtime": 61.8989, "eval_samples": 524, "eval_samples_per_second": 8.465, "eval_steps_per_second": 0.533, "perplexity": 2.1681302568083956, "train_loss": 1.5514631569575188, "train_runtime": 557290.3071, "train_samples": 737503, "train_samples_per_second": 3.97, "train_steps_per_second": 0.031 }