{ "epoch": 20.0, "eval_accuracy": 0.4055823320854937, "eval_loss": 3.4263744354248047, "eval_runtime": 154.08, "eval_samples": 57918, "eval_samples_per_second": 375.896, "eval_steps_per_second": 5.874, "perplexity": 30.764900174885234, "train_loss": 3.1576745831950372, "train_runtime": 81271.0608, "train_samples": 595038, "train_samples_per_second": 146.433, "train_steps_per_second": 4.576 }