{ "epoch": 10.0, "total_flos": 4.4162288418816e+17, "train_loss": 0.14765226224263509, "train_runtime": 28756.843, "train_samples_per_second": 3.13, "train_steps_per_second": 0.391 }