{ "epoch": 3.0, "eval_loss": 1.422879934310913, "eval_runtime": 543.4644, "eval_samples": 179869, "eval_samples_per_second": 330.967, "eval_steps_per_second": 5.172, "perplexity": 4.1490522485207775, "train_loss": 1.7074700184427065, "train_runtime": 2192.338, "train_samples": 179869, "train_samples_per_second": 246.133, "train_steps_per_second": 3.847 }