{ "epoch": 0.354862233609357, "total_flos": 3.589813132276531e+16, "train_loss": 2.132816611328125, "train_runtime": 15981.9131, "train_samples": 4508785, "train_samples_per_second": 100.113, "train_steps_per_second": 6.257 }