{"train/loss": 0.073, "train/learning_rate": 2.2037037037037038e-05, "train/epoch": 3.0, "train/global_step": 354, "_timestamp": 1713959114.6460462, "_runtime": 12046.784997224808, "_step": 5, "eval/loss": 0.08488664031028748, "eval/runtime": 37.5454, "eval/samples_per_second": 0.692, "eval/steps_per_second": 0.346} |