{ "epoch": 12.0, "eval_loss": 1.9043388366699219, "eval_runtime": 45.4507, "eval_samples": 2933, "eval_samples_per_second": 64.531, "eval_steps_per_second": 8.075, "perplexity": 6.714966470038764, "train_loss": 1.9039230375877523, "train_runtime": 39633.1701, "train_samples": 55736, "train_samples_per_second": 16.876, "train_steps_per_second": 0.264 }