{ "epoch": 3.0, "eval_loss": 0.6613607406616211, "eval_runtime": 13.2548, "eval_samples": 3200, "eval_samples_per_second": 103.962, "eval_steps_per_second": 0.83, "perplexity": 1.9374268770613925, "train_loss": 0.6159939037574517, "train_runtime": 13745.4884, "train_samples": 344926, "train_samples_per_second": 25.399, "train_steps_per_second": 0.199 }