{ "epoch": 4.0, "total_flos": 1.436727240856535e+18, "train_loss": 0.027367618223170524, "train_runtime": 673.711, "train_samples_per_second": 27.519, "train_steps_per_second": 1.722 }