epoch = 3.0 train_loss = 1.8377529225624027 train_runtime = 9670.2298 train_samples_per_second = 75.23 train_steps_per_second = 9.404