{ "epoch": 53.58, "eval_loss": 0.7302267551422119, "eval_runtime": 3.6523, "eval_samples_per_second": 2738.025, "eval_steps_per_second": 21.63, "perplexity": 2.0755511962245876, "train_loss": 1.193239736328125, "train_runtime": 102111.9968, "train_samples_per_second": 1253.526, "train_steps_per_second": 4.897 }