{ "epoch": 4.0, "total_flos": 3.205097416476426e+17, "train_loss": 0.12538275879163008, "train_runtime": 253.3958, "train_samples_per_second": 16.322, "train_steps_per_second": 2.052 }