{ "epoch": 100.0, "total_flos": 1.8667587341684736e+18, "train_loss": 0.16236644983291626, "train_runtime": 1253.5555, "train_samples_per_second": 19.225, "train_steps_per_second": 0.16 }