{ "epoch": 4.71, "eval_loss": 1.3815752267837524, "eval_runtime": 184.9651, "eval_samples": 181300, "eval_samples_per_second": 980.185, "eval_steps_per_second": 3.833, "perplexity": 3.9811679331316605, "train_loss": 0.00010499673156234791, "train_runtime": 1054.6912, "train_samples": 4349088, "train_samples_per_second": 19418.005, "train_steps_per_second": 9.481 }