{ "epoch": 1.0, "eval_loss": 3.6833789348602295, "eval_runtime": 180.5086, "eval_samples": 40311, "eval_samples_per_second": 223.319, "eval_steps_per_second": 18.614, "perplexity": 39.780583236136096, "train_loss": 3.773873895684371, "train_runtime": 142283.9744, "train_samples": 8570756, "train_samples_per_second": 60.237, "train_steps_per_second": 5.02 }