{ "epoch": 1.6, "eval_loss": 0.5873731970787048, "eval_runtime": 1.7661, "eval_samples": 1000, "eval_samples_per_second": 566.226, "eval_steps_per_second": 35.672, "total_flos": 364154381869824.0, "train_loss": 0.6259692611694336, "train_runtime": 219.9954, "train_samples": 10000, "train_samples_per_second": 72.729, "train_steps_per_second": 4.546 }