{ "epoch": 2.99, "total_flos": 1.336513820941394e+18, "train_loss": 0.2994473668617931, "train_runtime": 953.1608, "train_samples_per_second": 66.313, "train_steps_per_second": 0.516 }