epoch = 3.0 train_loss = 0.5495197716846489 train_runtime = 1839.8406 train_samples_per_second = 449.388 train_steps_per_second = 1.754