{ "epoch": 71.0, "learning_rate": 1.0000000000000002e-07, "total_flos": 4.157361617896582e+20, "train_loss": 0.13389379075850644, "train_runtime": 24026.1554, "train_samples_per_second": 24.654, "train_steps_per_second": 0.774 }