{ "epoch": 3.0, "eval_loss": 1.5925407409667969, "eval_runtime": 2.0229, "eval_samples": 100, "eval_samples_per_second": 49.434, "eval_steps_per_second": 1.977, "perplexity": 4.916223925276727, "train_loss": 1.3950741625133278, "train_runtime": 240198.6559, "train_samples": 500000, "train_samples_per_second": 6.245, "train_steps_per_second": 0.049 }