{ "epoch": 2.986666666666667, "total_flos": 1.79183583387648e+16, "train_loss": 1.8150039003008889, "train_runtime": 321.7396, "train_samples_per_second": 4.196, "train_steps_per_second": 0.261 }