{ "epoch": 4.03, "eval_loss": 1.2611794471740723, "eval_runtime": 25.4151, "eval_samples": 3332, "eval_samples_per_second": 131.103, "eval_steps_per_second": 0.275, "perplexity": 3.5295819888396176, "train_loss": 1.25592919921875, "train_runtime": 8163.1704, "train_samples": 63101, "train_samples_per_second": 154.599, "train_steps_per_second": 0.304 }