{ "epoch": 2.8, "total_flos": 3.447204447633408e+16, "train_loss": 0.9240701993306478, "train_runtime": 522.1165, "train_samples_per_second": 0.896, "train_steps_per_second": 0.006 }