seed_math_automathtext / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 3
0423a8f verified
raw
history blame
2.58 kB
{"current_steps": 10, "total_steps": 117, "loss": 0.6037, "lr": 5e-06, "epoch": 0.2564102564102564, "percentage": 8.55, "elapsed_time": "0:09:40", "remaining_time": "1:43:27"}
{"current_steps": 20, "total_steps": 117, "loss": 0.5362, "lr": 5e-06, "epoch": 0.5128205128205128, "percentage": 17.09, "elapsed_time": "0:19:15", "remaining_time": "1:33:22"}
{"current_steps": 30, "total_steps": 117, "loss": 0.5112, "lr": 5e-06, "epoch": 0.7692307692307693, "percentage": 25.64, "elapsed_time": "0:28:50", "remaining_time": "1:23:37"}
{"current_steps": 39, "total_steps": 117, "eval_loss": 0.4971420168876648, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:38:10", "remaining_time": "1:16:20"}
{"current_steps": 40, "total_steps": 117, "loss": 0.4974, "lr": 5e-06, "epoch": 1.0256410256410255, "percentage": 34.19, "elapsed_time": "0:40:13", "remaining_time": "1:17:25"}
{"current_steps": 50, "total_steps": 117, "loss": 0.4671, "lr": 5e-06, "epoch": 1.282051282051282, "percentage": 42.74, "elapsed_time": "0:49:48", "remaining_time": "1:06:45"}
{"current_steps": 60, "total_steps": 117, "loss": 0.47, "lr": 5e-06, "epoch": 1.5384615384615383, "percentage": 51.28, "elapsed_time": "0:59:24", "remaining_time": "0:56:25"}
{"current_steps": 70, "total_steps": 117, "loss": 0.4657, "lr": 5e-06, "epoch": 1.7948717948717947, "percentage": 59.83, "elapsed_time": "1:08:59", "remaining_time": "0:46:19"}
{"current_steps": 78, "total_steps": 117, "eval_loss": 0.48121070861816406, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:17:21", "remaining_time": "0:38:40"}
{"current_steps": 80, "total_steps": 117, "loss": 0.4509, "lr": 5e-06, "epoch": 2.051282051282051, "percentage": 68.38, "elapsed_time": "1:20:27", "remaining_time": "0:37:12"}
{"current_steps": 90, "total_steps": 117, "loss": 0.4352, "lr": 5e-06, "epoch": 2.3076923076923075, "percentage": 76.92, "elapsed_time": "1:30:03", "remaining_time": "0:27:01"}
{"current_steps": 100, "total_steps": 117, "loss": 0.4268, "lr": 5e-06, "epoch": 2.564102564102564, "percentage": 85.47, "elapsed_time": "1:39:40", "remaining_time": "0:16:56"}
{"current_steps": 110, "total_steps": 117, "loss": 0.4298, "lr": 5e-06, "epoch": 2.8205128205128203, "percentage": 94.02, "elapsed_time": "1:49:16", "remaining_time": "0:06:57"}
{"current_steps": 117, "total_steps": 117, "eval_loss": 0.4801027178764343, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:57:53", "remaining_time": "0:00:00"}
{"current_steps": 117, "total_steps": 117, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:59:07", "remaining_time": "0:00:00"}