{ "epoch": 3.38, "eval_accuracy": 0.5043557996025465, "eval_loss": 2.814643621444702, "eval_runtime": 1183.0633, "eval_samples": 308356, "eval_samples_per_second": 260.642, "eval_steps_per_second": 4.073, "perplexity": 16.687227750401497, "train_loss": 4.827055456554494, "train_runtime": 197999.4407, "train_samples": 5858758, "train_samples_per_second": 2958.977, "train_steps_per_second": 46.234 }