LLaMA3-70B-qlora-bnb-A61K-15950 / trainer_log.jsonl
bzhang0426's picture
Upload 15 files
162c34b verified
raw
history blame contribute delete
No virus
6.68 kB
{"current_steps": 10, "total_steps": 202, "loss": 12.5496, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 9.523809523809523e-06, "epoch": 0.04938271604938271, "percentage": 4.95, "elapsed_time": "0:21:11", "remaining_time": "6:46:54"}
{"current_steps": 20, "total_steps": 202, "loss": 11.9318, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 5.714285714285714e-05, "epoch": 0.09876543209876543, "percentage": 9.9, "elapsed_time": "0:40:51", "remaining_time": "6:11:48"}
{"current_steps": 30, "total_steps": 202, "loss": 7.8505, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 9.999246866958692e-05, "epoch": 0.14814814814814814, "percentage": 14.85, "elapsed_time": "1:00:42", "remaining_time": "5:48:03"}
{"current_steps": 40, "total_steps": 202, "loss": 1.2163, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 9.909145108993794e-05, "epoch": 0.19753086419753085, "percentage": 19.8, "elapsed_time": "1:21:55", "remaining_time": "5:31:48"}
{"current_steps": 50, "total_steps": 202, "loss": 0.4577, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 9.67152097716334e-05, "epoch": 0.24691358024691357, "percentage": 24.75, "elapsed_time": "1:42:44", "remaining_time": "5:12:21"}
{"current_steps": 60, "total_steps": 202, "loss": 0.3768, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 9.29351520070574e-05, "epoch": 0.2962962962962963, "percentage": 29.7, "elapsed_time": "2:03:42", "remaining_time": "4:52:45"}
{"current_steps": 70, "total_steps": 202, "loss": 0.4593, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 8.786487050581583e-05, "epoch": 0.345679012345679, "percentage": 34.65, "elapsed_time": "2:23:56", "remaining_time": "4:31:25"}
{"current_steps": 80, "total_steps": 202, "loss": 0.4234, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 8.165672987449962e-05, "epoch": 0.3950617283950617, "percentage": 39.6, "elapsed_time": "2:44:08", "remaining_time": "4:10:19"}
{"current_steps": 90, "total_steps": 202, "loss": 0.3857, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 7.449728798069864e-05, "epoch": 0.4444444444444444, "percentage": 44.55, "elapsed_time": "3:03:31", "remaining_time": "3:48:23"}
{"current_steps": 100, "total_steps": 202, "loss": 0.3663, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 6.66016897916682e-05, "epoch": 0.49382716049382713, "percentage": 49.5, "elapsed_time": "3:23:41", "remaining_time": "3:27:46"}
{"current_steps": 100, "total_steps": 202, "loss": null, "eval_loss": 0.35489073395729065, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.49382716049382713, "percentage": 49.5, "elapsed_time": "3:23:41", "remaining_time": "3:27:46"}
{"current_steps": 110, "total_steps": 202, "loss": 0.37, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 5.820720215572375e-05, "epoch": 0.5432098765432098, "percentage": 54.46, "elapsed_time": "4:04:58", "remaining_time": "3:24:52"}
{"current_steps": 120, "total_steps": 202, "loss": 0.3788, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.956608380955877e-05, "epoch": 0.5925925925925926, "percentage": 59.41, "elapsed_time": "4:26:23", "remaining_time": "3:02:01"}
{"current_steps": 130, "total_steps": 202, "loss": 0.401, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.093800487148857e-05, "epoch": 0.6419753086419753, "percentage": 64.36, "elapsed_time": "4:46:53", "remaining_time": "2:38:53"}
{"current_steps": 140, "total_steps": 202, "loss": 0.3944, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 3.258224361880657e-05, "epoch": 0.691358024691358, "percentage": 69.31, "elapsed_time": "5:07:33", "remaining_time": "2:16:12"}
{"current_steps": 150, "total_steps": 202, "loss": 0.3521, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.474989504016798e-05, "epoch": 0.7407407407407407, "percentage": 74.26, "elapsed_time": "5:26:36", "remaining_time": "1:53:13"}
{"current_steps": 160, "total_steps": 202, "loss": 0.3425, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 1.7676325300069825e-05, "epoch": 0.7901234567901234, "percentage": 79.21, "elapsed_time": "5:45:49", "remaining_time": "1:30:46"}
{"current_steps": 170, "total_steps": 202, "loss": 0.3548, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 1.1574098862709992e-05, "epoch": 0.8395061728395061, "percentage": 84.16, "elapsed_time": "6:07:10", "remaining_time": "1:09:06"}
{"current_steps": 180, "total_steps": 202, "loss": 0.3404, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 6.626590818846162e-06, "epoch": 0.8888888888888888, "percentage": 89.11, "elapsed_time": "6:27:49", "remaining_time": "0:47:24"}
{"current_steps": 190, "total_steps": 202, "loss": 0.3374, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.9824763685681766e-06, "epoch": 0.9382716049382716, "percentage": 94.06, "elapsed_time": "6:47:00", "remaining_time": "0:25:42"}
{"current_steps": 200, "total_steps": 202, "loss": 0.3383, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 7.512630539036502e-07, "epoch": 0.9876543209876543, "percentage": 99.01, "elapsed_time": "7:07:29", "remaining_time": "0:04:16"}
{"current_steps": 200, "total_steps": 202, "loss": null, "eval_loss": 0.35073795914649963, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.9876543209876543, "percentage": 99.01, "elapsed_time": "7:07:29", "remaining_time": "0:04:16"}
{"current_steps": 202, "total_steps": 202, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.9975308641975309, "percentage": 100.0, "elapsed_time": "7:33:40", "remaining_time": "0:00:00"}
{"current_steps": 180, "total_steps": 180, "loss": null, "eval_loss": 0.35073795914649963, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.9975308641975309, "percentage": 100.0, "elapsed_time": "7:55:37", "remaining_time": "0:00:00"}