{ "epoch": 4.0, "total_flos": 1.870424802038661e+18, "train_loss": 0.5094418521630693, "train_runtime": 3760.9881, "train_samples_per_second": 19.953, "train_steps_per_second": 1.248 }