{ "epoch": 2.0, "train_loss": 2.223597173579037, "train_runtime": 8040.0291, "train_samples": 16416, "train_samples_per_second": 4.084, "train_steps_per_second": 0.064, "train_tokens_per_second": 8363.146 }