{ "epoch": 4.0, "eval_loss": 1.6668897867202759, "eval_runtime": 102.7014, "eval_samples": 13319, "eval_samples_per_second": 129.687, "eval_steps_per_second": 16.212, "perplexity": 5.295671489170355, "train_loss": 1.9931427570304485, "train_runtime": 30194.781, "train_samples": 253694, "train_samples_per_second": 33.608, "train_steps_per_second": 0.131 }