gemma-2b-it-math / trainer_log.jsonl
tjluyao's picture
Upload 13 files
1ecc8d5 verified
raw
history blame contribute delete
No virus
3.61 kB
{"current_steps": 10, "total_steps": 170, "loss": 1.6736, "learning_rate": 9.91645696388268e-05, "epoch": 0.08849557522123894, "percentage": 5.88, "elapsed_time": "0:00:09", "remaining_time": "0:02:30"}
{"current_steps": 20, "total_steps": 170, "loss": 1.1231, "learning_rate": 9.665301848904975e-05, "epoch": 0.17699115044247787, "percentage": 11.76, "elapsed_time": "0:00:17", "remaining_time": "0:02:08"}
{"current_steps": 30, "total_steps": 170, "loss": 1.0192, "learning_rate": 9.255088935784784e-05, "epoch": 0.26548672566371684, "percentage": 17.65, "elapsed_time": "0:00:24", "remaining_time": "0:01:56"}
{"current_steps": 40, "total_steps": 170, "loss": 0.8938, "learning_rate": 8.699803935381485e-05, "epoch": 0.35398230088495575, "percentage": 23.53, "elapsed_time": "0:00:33", "remaining_time": "0:01:50"}
{"current_steps": 50, "total_steps": 170, "loss": 0.9706, "learning_rate": 8.018378615106108e-05, "epoch": 0.4424778761061947, "percentage": 29.41, "elapsed_time": "0:00:42", "remaining_time": "0:01:40"}
{"current_steps": 60, "total_steps": 170, "loss": 0.8909, "learning_rate": 7.23404534331376e-05, "epoch": 0.5309734513274337, "percentage": 35.29, "elapsed_time": "0:00:49", "remaining_time": "0:01:30"}
{"current_steps": 70, "total_steps": 170, "loss": 0.8943, "learning_rate": 6.373545009932168e-05, "epoch": 0.6194690265486725, "percentage": 41.18, "elapsed_time": "0:00:56", "remaining_time": "0:01:21"}
{"current_steps": 80, "total_steps": 170, "loss": 0.873, "learning_rate": 5.466215328310079e-05, "epoch": 0.7079646017699115, "percentage": 47.06, "elapsed_time": "0:01:04", "remaining_time": "0:01:12"}
{"current_steps": 90, "total_steps": 170, "loss": 0.8852, "learning_rate": 4.542990601526297e-05, "epoch": 0.7964601769911505, "percentage": 52.94, "elapsed_time": "0:01:11", "remaining_time": "0:01:03"}
{"current_steps": 100, "total_steps": 170, "loss": 0.8028, "learning_rate": 3.635347054911746e-05, "epoch": 0.8849557522123894, "percentage": 58.82, "elapsed_time": "0:01:21", "remaining_time": "0:00:57"}
{"current_steps": 110, "total_steps": 170, "loss": 0.7924, "learning_rate": 2.774229692390805e-05, "epoch": 0.9734513274336283, "percentage": 64.71, "elapsed_time": "0:01:31", "remaining_time": "0:00:49"}
{"current_steps": 120, "total_steps": 170, "loss": 0.7311, "learning_rate": 1.9889972641710248e-05, "epoch": 1.0619469026548674, "percentage": 70.59, "elapsed_time": "0:01:38", "remaining_time": "0:00:41"}
{"current_steps": 130, "total_steps": 170, "loss": 0.7295, "learning_rate": 1.3064213158260386e-05, "epoch": 1.1504424778761062, "percentage": 76.47, "elapsed_time": "0:01:46", "remaining_time": "0:00:32"}
{"current_steps": 140, "total_steps": 170, "loss": 0.7283, "learning_rate": 7.497734449769639e-06, "epoch": 1.238938053097345, "percentage": 82.35, "elapsed_time": "0:01:57", "remaining_time": "0:00:25"}
{"current_steps": 150, "total_steps": 170, "loss": 0.7425, "learning_rate": 3.380318844467728e-06, "epoch": 1.3274336283185841, "percentage": 88.24, "elapsed_time": "0:02:06", "remaining_time": "0:00:16"}
{"current_steps": 160, "total_steps": 170, "loss": 0.7629, "learning_rate": 8.523446247096445e-07, "epoch": 1.415929203539823, "percentage": 94.12, "elapsed_time": "0:02:15", "remaining_time": "0:00:08"}
{"current_steps": 170, "total_steps": 170, "loss": 0.6129, "learning_rate": 0.0, "epoch": 1.504424778761062, "percentage": 100.0, "elapsed_time": "0:02:24", "remaining_time": "0:00:00"}
{"current_steps": 170, "total_steps": 170, "epoch": 1.504424778761062, "percentage": 100.0, "elapsed_time": "0:02:24", "remaining_time": "0:00:00"}