{ "epoch": 8.0, "eval_loss": 1.9716644287109375, "eval_runtime": 80.7808, "eval_samples": 5193, "eval_samples_per_second": 64.285, "eval_steps_per_second": 8.046, "perplexity": 7.18262150622839, "train_loss": 2.136193385538579, "train_runtime": 46556.9069, "train_samples": 98673, "train_samples_per_second": 16.955, "train_steps_per_second": 0.265 }