epoch = 3.0 train_loss = 0.48864371005487267 train_runtime = 2988.0593 train_samples_per_second = 276.702 train_steps_per_second = 1.08