{ "epoch": 20.0, "eval_loss": 1.0495083332061768, "eval_runtime": 798.4883, "eval_samples": 77096, "eval_samples_per_second": 96.552, "eval_steps_per_second": 6.035, "perplexity": 2.856246451242393, "train_loss": 0.5992164485148723, "train_runtime": 340057.0464, "train_samples": 1464817, "train_samples_per_second": 86.151, "train_steps_per_second": 0.673 }