{ "epoch": 2.0, "train_loss": 3.16140578525316, "train_runtime": 93885.6881, "train_samples": 946752, "train_samples_per_second": 20.168, "train_steps_per_second": 0.63 }