{ "epoch": 8.0, "total_flos": 1.809515998170317e+16, "train_loss": 0.27006837725639343, "train_runtime": 613.5218, "train_samples_per_second": 1.78, "train_steps_per_second": 0.02 }