epoch = 3.0 train_loss = 0.526550701855136 train_runtime = 2225.4543 train_samples_per_second = 371.521 train_steps_per_second = 1.45