{ "epoch": 4.0, "total_flos": 3.205097416476426e+17, "train_loss": 0.11964335679434814, "train_runtime": 100.8137, "train_samples_per_second": 41.026, "train_steps_per_second": 2.579 }