{ "epoch": 5.0, "eval_loss": 4.238580703735352, "eval_runtime": 104.2188, "eval_samples": 18156, "eval_samples_per_second": 174.21, "eval_steps_per_second": 21.781, "perplexity": 69.30941140849554, "train_loss": 5.372212270862655, "train_runtime": 34970.0124, "train_samples": 369106, "train_samples_per_second": 52.775, "train_steps_per_second": 6.597 }