{ "epoch": 5.0, "train_loss": 4.472965654296875, "train_runtime": 2699.6495, "train_samples": 10000, "train_samples_per_second": 18.521, "train_steps_per_second": 4.63 }