{ "epoch": 85.0, "learning_rate": 1.0000000000000002e-07, "total_flos": 1.1045912459199104e+21, "train_loss": 0.0019856175725272715, "train_runtime": 5622.9029, "train_samples_per_second": 132.483, "train_steps_per_second": 4.142 }