epoch = 5.0 train_loss = 2.009976102938465 train_runtime = 3338.0012 train_samples = 42367 train_samples_per_second = 63.462 train_steps_per_second = 1.983