LLaMA3-70B-qlora-bnb-G06F17-30 / trainer_log.jsonl
bzhang0426's picture
Upload 14 files
08970ad verified
{"current_steps": 10, "total_steps": 222, "loss": 12.2081, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.9977474155117045e-05, "epoch": 0.13377926421404682, "percentage": 4.5, "elapsed_time": "0:11:22", "remaining_time": "4:01:12"}
{"current_steps": 20, "total_steps": 222, "loss": 9.9449, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.9640397758692715e-05, "epoch": 0.26755852842809363, "percentage": 9.01, "elapsed_time": "0:22:55", "remaining_time": "3:51:27"}
{"current_steps": 30, "total_steps": 222, "loss": 6.0546, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.8798182638228166e-05, "epoch": 0.4013377926421405, "percentage": 13.51, "elapsed_time": "0:33:35", "remaining_time": "3:34:58"}
{"current_steps": 40, "total_steps": 222, "loss": 1.4872, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.748018037239592e-05, "epoch": 0.5351170568561873, "percentage": 18.02, "elapsed_time": "0:44:37", "remaining_time": "3:23:04"}
{"current_steps": 50, "total_steps": 222, "loss": 0.378, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.571274123109606e-05, "epoch": 0.6688963210702341, "percentage": 22.52, "elapsed_time": "0:55:36", "remaining_time": "3:11:16"}
{"current_steps": 60, "total_steps": 222, "loss": 0.3846, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.353120088833501e-05, "epoch": 0.802675585284281, "percentage": 27.03, "elapsed_time": "1:06:08", "remaining_time": "2:58:36"}
{"current_steps": 70, "total_steps": 222, "loss": 0.3639, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.0979173970824626e-05, "epoch": 0.9364548494983278, "percentage": 31.53, "elapsed_time": "1:17:22", "remaining_time": "2:48:01"}
{"current_steps": 80, "total_steps": 222, "loss": 0.3366, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 3.8107682088930794e-05, "epoch": 1.0702341137123745, "percentage": 36.04, "elapsed_time": "1:27:56", "remaining_time": "2:36:05"}
{"current_steps": 90, "total_steps": 222, "loss": 0.3343, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 3.497413378288541e-05, "epoch": 1.2040133779264215, "percentage": 40.54, "elapsed_time": "1:38:45", "remaining_time": "2:24:50"}
{"current_steps": 100, "total_steps": 222, "loss": 0.3548, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 3.164117677777191e-05, "epoch": 1.3377926421404682, "percentage": 45.05, "elapsed_time": "1:49:41", "remaining_time": "2:13:49"}
{"current_steps": 100, "total_steps": 222, "loss": null, "eval_loss": 0.3387661278247833, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 1.3377926421404682, "percentage": 45.05, "elapsed_time": "1:49:41", "remaining_time": "2:13:49"}
{"current_steps": 110, "total_steps": 222, "loss": 0.4054, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.8175445493671972e-05, "epoch": 1.471571906354515, "percentage": 49.55, "elapsed_time": "2:04:43", "remaining_time": "2:06:59"}
{"current_steps": 120, "total_steps": 222, "loss": 0.3489, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.4646228851480956e-05, "epoch": 1.605351170568562, "percentage": 54.05, "elapsed_time": "2:15:44", "remaining_time": "1:55:23"}
{"current_steps": 130, "total_steps": 222, "loss": 0.3078, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.1124085008395054e-05, "epoch": 1.7391304347826086, "percentage": 58.56, "elapsed_time": "2:26:56", "remaining_time": "1:43:59"}
{"current_steps": 140, "total_steps": 222, "loss": 0.3377, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 1.7679430718086243e-05, "epoch": 1.8729096989966556, "percentage": 63.06, "elapsed_time": "2:37:38", "remaining_time": "1:32:20"}
{"current_steps": 150, "total_steps": 222, "loss": 0.2855, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 1.4381133517898804e-05, "epoch": 2.0066889632107023, "percentage": 67.57, "elapsed_time": "2:48:56", "remaining_time": "1:21:05"}
{"current_steps": 160, "total_steps": 222, "loss": 0.2867, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 1.1295134888882258e-05, "epoch": 2.140468227424749, "percentage": 72.07, "elapsed_time": "3:00:01", "remaining_time": "1:09:45"}
{"current_steps": 170, "total_steps": 222, "loss": 0.3044, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 8.483131915247968e-06, "epoch": 2.274247491638796, "percentage": 76.58, "elapsed_time": "3:11:16", "remaining_time": "0:58:30"}
{"current_steps": 180, "total_steps": 222, "loss": 0.28, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 6.001343800282569e-06, "epoch": 2.408026755852843, "percentage": 81.08, "elapsed_time": "3:22:06", "remaining_time": "0:47:09"}
{"current_steps": 190, "total_steps": 222, "loss": 0.2838, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 3.8993878992512415e-06, "epoch": 2.5418060200668897, "percentage": 85.59, "elapsed_time": "3:32:59", "remaining_time": "0:35:52"}
{"current_steps": 200, "total_steps": 222, "loss": 0.271, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.219287740296605e-06, "epoch": 2.6755852842809364, "percentage": 90.09, "elapsed_time": "3:43:42", "remaining_time": "0:24:36"}
{"current_steps": 200, "total_steps": 222, "loss": null, "eval_loss": 0.3382669687271118, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 2.6755852842809364, "percentage": 90.09, "elapsed_time": "3:43:42", "remaining_time": "0:24:36"}
{"current_steps": 210, "total_steps": 222, "loss": 0.2943, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 9.946328655577624e-07, "epoch": 2.809364548494983, "percentage": 94.59, "elapsed_time": "3:58:43", "remaining_time": "0:13:38"}
{"current_steps": 220, "total_steps": 222, "loss": 0.2605, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.499072894559057e-07, "epoch": 2.94314381270903, "percentage": 99.1, "elapsed_time": "4:09:38", "remaining_time": "0:02:16"}
{"current_steps": 222, "total_steps": 222, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 2.9698996655518393, "percentage": 100.0, "elapsed_time": "4:12:02", "remaining_time": "0:00:00"}
{"current_steps": 67, "total_steps": 67, "loss": null, "eval_loss": 0.3382669687271118, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 2.9698996655518393, "percentage": 100.0, "elapsed_time": "4:15:58", "remaining_time": "0:00:00"}