epoch = 3.0 train_loss = 0.4807460529653556 train_runtime = 2232.8308 train_samples_per_second = 370.294 train_steps_per_second = 1.446