epoch = 3.0 train_loss = 0.3537116788234259 train_runtime = 3231.8718 train_samples_per_second = 255.828 train_steps_per_second = 1.999