{ "epoch": 3.0, "total_flos": 1.3233014236495872e+16, "train_loss": 0.3693488495690482, "train_runtime": 207.611, "train_samples_per_second": 12.774, "train_steps_per_second": 0.101 }