{ "epoch": 4.24, "eval_loss": 1.0333222150802612, "eval_runtime": 465.8524, "eval_samples": 181300, "eval_samples_per_second": 389.179, "eval_steps_per_second": 6.081, "perplexity": 2.810387052828362, "train_loss": 0.023931974029541017, "train_runtime": 6473.1334, "train_samples": 4349088, "train_samples_per_second": 3163.846, "train_steps_per_second": 1.545 }