{ "epoch": 4.65, "eval_loss": 1.5519299507141113, "eval_runtime": 106.731, "eval_samples": 181300, "eval_samples_per_second": 1698.662, "eval_steps_per_second": 6.643, "perplexity": 4.720571867911094, "train_loss": 0.5719003509521484, "train_runtime": 13336.4941, "train_samples": 4349088, "train_samples_per_second": 1535.636, "train_steps_per_second": 0.75 }