epoch = 4.0 train_loss = 2.6336010373971255 train_runtime = 9376.0618 train_samples = 42367 train_samples_per_second = 18.075 train_steps_per_second = 9.037