{ "epoch": 1.6, "total_flos": 364154381869824.0, "train_loss": 0.6259692611694336, "train_runtime": 219.9954, "train_samples": 10000, "train_samples_per_second": 72.729, "train_steps_per_second": 4.546 }