{ "epoch": 100.0, "total_flos": 9.341428686415195e+19, "train_loss": 2.455530970781699, "train_runtime": 21216.8436, "train_samples_per_second": 16.369, "train_steps_per_second": 2.05 }