epoch = 3.0 train_loss = 0.3217803806246462 train_runtime = 6847.4259 train_samples_per_second = 120.747 train_steps_per_second = 0.943