{ "epoch": 3.0, "total_flos": 4.15443275785175e+16, "train_loss": 0.3380747139453888, "train_runtime": 1182.7003, "train_samples_per_second": 2.242, "train_steps_per_second": 0.018 }