{ "epoch": 3.0, "train_loss": 1.3950741625133278, "train_runtime": 240198.6559, "train_samples": 500000, "train_samples_per_second": 6.245, "train_steps_per_second": 0.049 }