{ "epoch": 3.0, "total_flos": 1.095858495811584e+16, "train_loss": 5.286988735290586, "train_runtime": 4988.9767, "train_samples_per_second": 4.173, "train_steps_per_second": 2.087 }