{ "epoch": 3.0, "eval_loss": 0.059506773948669434, "eval_runtime": 88.8314, "eval_samples_per_second": 203.791, "eval_steps_per_second": 0.405, "total_flos": 3375200049561600.0, "train_loss": 0.5100103264290189, "train_runtime": 14999.08, "train_samples_per_second": 68.795, "train_steps_per_second": 0.017 }