{ "epoch": 3.0, "eval_loss": 3.9845974445343018, "eval_runtime": 1425.6748, "eval_samples": 32253, "eval_samples_per_second": 22.623, "eval_steps_per_second": 3.771, "perplexity": 53.7636422730289, "train_loss": 0.7859680134460877, "train_runtime": 210975.8843, "train_samples": 3196485, "train_samples_per_second": 45.453, "train_steps_per_second": 7.575 }