Llama-3-lora / trainer_log.jsonl
xi0v's picture
Upload folder using huggingface_hub
ec9bb8b verified
{"current_steps": 10, "total_steps": 408, "loss": 1.493, "learning_rate": 1.2195121951219513e-05, "epoch": 0.07326007326007326, "percentage": 2.45, "elapsed_time": "0:01:34", "remaining_time": "1:02:31"}
{"current_steps": 20, "total_steps": 408, "loss": 1.1235, "learning_rate": 2.4390243902439026e-05, "epoch": 0.14652014652014653, "percentage": 4.9, "elapsed_time": "0:03:13", "remaining_time": "1:02:28"}
{"current_steps": 30, "total_steps": 408, "loss": 1.1219, "learning_rate": 3.6585365853658535e-05, "epoch": 0.21978021978021978, "percentage": 7.35, "elapsed_time": "0:04:53", "remaining_time": "1:01:32"}
{"current_steps": 40, "total_steps": 408, "loss": 1.1664, "learning_rate": 4.878048780487805e-05, "epoch": 0.29304029304029305, "percentage": 9.8, "elapsed_time": "0:06:29", "remaining_time": "0:59:42"}
{"current_steps": 50, "total_steps": 408, "loss": 1.0602, "learning_rate": 4.992584373844853e-05, "epoch": 0.3663003663003663, "percentage": 12.25, "elapsed_time": "0:08:11", "remaining_time": "0:58:40"}
{"current_steps": 60, "total_steps": 408, "loss": 1.0122, "learning_rate": 4.9670065861258264e-05, "epoch": 0.43956043956043955, "percentage": 14.71, "elapsed_time": "0:09:45", "remaining_time": "0:56:34"}
{"current_steps": 70, "total_steps": 408, "loss": 1.1042, "learning_rate": 4.9233623530708587e-05, "epoch": 0.5128205128205128, "percentage": 17.16, "elapsed_time": "0:11:20", "remaining_time": "0:54:48"}
{"current_steps": 80, "total_steps": 408, "loss": 0.9888, "learning_rate": 4.861971291236772e-05, "epoch": 0.5860805860805861, "percentage": 19.61, "elapsed_time": "0:12:57", "remaining_time": "0:53:08"}
{"current_steps": 90, "total_steps": 408, "loss": 1.0949, "learning_rate": 4.7832829812079794e-05, "epoch": 0.6593406593406593, "percentage": 22.06, "elapsed_time": "0:14:32", "remaining_time": "0:51:23"}
{"current_steps": 100, "total_steps": 408, "loss": 1.0847, "learning_rate": 4.687873675216522e-05, "epoch": 0.7326007326007326, "percentage": 24.51, "elapsed_time": "0:16:15", "remaining_time": "0:50:05"}
{"current_steps": 110, "total_steps": 408, "loss": 1.0386, "learning_rate": 4.576442077117073e-05, "epoch": 0.8058608058608059, "percentage": 26.96, "elapsed_time": "0:17:54", "remaining_time": "0:48:31"}
{"current_steps": 120, "total_steps": 408, "loss": 1.0071, "learning_rate": 4.4498042256211164e-05, "epoch": 0.8791208791208791, "percentage": 29.41, "elapsed_time": "0:19:23", "remaining_time": "0:46:32"}
{"current_steps": 130, "total_steps": 408, "loss": 0.9977, "learning_rate": 4.308887518261507e-05, "epoch": 0.9523809523809523, "percentage": 31.86, "elapsed_time": "0:21:00", "remaining_time": "0:44:55"}
{"current_steps": 140, "total_steps": 408, "loss": 1.0333, "learning_rate": 4.154723919851291e-05, "epoch": 1.0256410256410255, "percentage": 34.31, "elapsed_time": "0:22:37", "remaining_time": "0:43:19"}
{"current_steps": 150, "total_steps": 408, "loss": 0.8241, "learning_rate": 3.9884424051727556e-05, "epoch": 1.098901098901099, "percentage": 36.76, "elapsed_time": "0:24:11", "remaining_time": "0:41:36"}
{"current_steps": 160, "total_steps": 408, "loss": 0.7771, "learning_rate": 3.8112606912406044e-05, "epoch": 1.1721611721611722, "percentage": 39.22, "elapsed_time": "0:25:59", "remaining_time": "0:40:17"}
{"current_steps": 170, "total_steps": 408, "loss": 0.7341, "learning_rate": 3.624476319685771e-05, "epoch": 1.2454212454212454, "percentage": 41.67, "elapsed_time": "0:27:35", "remaining_time": "0:38:38"}
{"current_steps": 180, "total_steps": 408, "loss": 0.7059, "learning_rate": 3.429457154565565e-05, "epoch": 1.3186813186813187, "percentage": 44.12, "elapsed_time": "0:29:18", "remaining_time": "0:37:07"}
{"current_steps": 190, "total_steps": 408, "loss": 0.7403, "learning_rate": 3.227631365186836e-05, "epoch": 1.3919413919413919, "percentage": 46.57, "elapsed_time": "0:30:54", "remaining_time": "0:35:27"}
{"current_steps": 200, "total_steps": 408, "loss": 0.7738, "learning_rate": 3.020476967300212e-05, "epoch": 1.4652014652014653, "percentage": 49.02, "elapsed_time": "0:32:27", "remaining_time": "0:33:45"}
{"current_steps": 210, "total_steps": 408, "loss": 0.6995, "learning_rate": 2.8095109992575823e-05, "epoch": 1.5384615384615383, "percentage": 51.47, "elapsed_time": "0:34:03", "remaining_time": "0:32:06"}
{"current_steps": 220, "total_steps": 408, "loss": 0.7363, "learning_rate": 2.5962784123982843e-05, "epoch": 1.6117216117216118, "percentage": 53.92, "elapsed_time": "0:35:35", "remaining_time": "0:30:24"}
{"current_steps": 230, "total_steps": 408, "loss": 0.7735, "learning_rate": 2.3823407570221813e-05, "epoch": 1.684981684981685, "percentage": 56.37, "elapsed_time": "0:37:22", "remaining_time": "0:28:55"}
{"current_steps": 240, "total_steps": 408, "loss": 0.6975, "learning_rate": 2.1692647468048236e-05, "epoch": 1.7582417582417582, "percentage": 58.82, "elapsed_time": "0:38:59", "remaining_time": "0:27:17"}
{"current_steps": 250, "total_steps": 408, "loss": 0.7239, "learning_rate": 1.9586107854000326e-05, "epoch": 1.8315018315018317, "percentage": 61.27, "elapsed_time": "0:40:42", "remaining_time": "0:25:43"}
{"current_steps": 260, "total_steps": 408, "loss": 0.7285, "learning_rate": 1.7519215392522025e-05, "epoch": 1.9047619047619047, "percentage": 63.73, "elapsed_time": "0:42:16", "remaining_time": "0:24:03"}
{"current_steps": 270, "total_steps": 408, "loss": 0.7415, "learning_rate": 1.5507106403021894e-05, "epoch": 1.978021978021978, "percentage": 66.18, "elapsed_time": "0:43:53", "remaining_time": "0:22:26"}
{"current_steps": 280, "total_steps": 408, "loss": 0.5019, "learning_rate": 1.3564516013194023e-05, "epoch": 2.051282051282051, "percentage": 68.63, "elapsed_time": "0:45:24", "remaining_time": "0:20:45"}
{"current_steps": 290, "total_steps": 408, "loss": 0.5581, "learning_rate": 1.1705670250356415e-05, "epoch": 2.1245421245421245, "percentage": 71.08, "elapsed_time": "0:47:06", "remaining_time": "0:19:10"}
{"current_steps": 300, "total_steps": 408, "loss": 0.495, "learning_rate": 9.944181861046186e-06, "epoch": 2.197802197802198, "percentage": 73.53, "elapsed_time": "0:48:43", "remaining_time": "0:17:32"}
{"current_steps": 310, "total_steps": 408, "loss": 0.5017, "learning_rate": 8.292950621808022e-06, "epoch": 2.271062271062271, "percentage": 75.98, "elapsed_time": "0:50:21", "remaining_time": "0:15:55"}
{"current_steps": 320, "total_steps": 408, "loss": 0.5482, "learning_rate": 6.764068871222826e-06, "epoch": 2.3443223443223444, "percentage": 78.43, "elapsed_time": "0:52:05", "remaining_time": "0:14:19"}
{"current_steps": 330, "total_steps": 408, "loss": 0.4744, "learning_rate": 5.368732954986388e-06, "epoch": 2.4175824175824174, "percentage": 80.88, "elapsed_time": "0:53:39", "remaining_time": "0:12:40"}
{"current_steps": 340, "total_steps": 408, "loss": 0.5586, "learning_rate": 4.117161232546024e-06, "epoch": 2.490842490842491, "percentage": 83.33, "elapsed_time": "0:55:19", "remaining_time": "0:11:03"}
{"current_steps": 350, "total_steps": 408, "loss": 0.4924, "learning_rate": 3.0185192457509894e-06, "epoch": 2.564102564102564, "percentage": 85.78, "elapsed_time": "0:56:57", "remaining_time": "0:09:26"}
{"current_steps": 360, "total_steps": 408, "loss": 0.4985, "learning_rate": 2.0808525975233805e-06, "epoch": 2.6373626373626373, "percentage": 88.24, "elapsed_time": "0:58:34", "remaining_time": "0:07:48"}
{"current_steps": 370, "total_steps": 408, "loss": 0.4771, "learning_rate": 1.311028032094369e-06, "epoch": 2.7106227106227108, "percentage": 90.69, "elapsed_time": "1:00:07", "remaining_time": "0:06:10"}
{"current_steps": 380, "total_steps": 408, "loss": 0.4619, "learning_rate": 7.146831482883115e-07, "epoch": 2.7838827838827838, "percentage": 93.14, "elapsed_time": "1:01:49", "remaining_time": "0:04:33"}
{"current_steps": 390, "total_steps": 408, "loss": 0.5103, "learning_rate": 2.961851141157046e-07, "epoch": 2.857142857142857, "percentage": 95.59, "elapsed_time": "1:03:27", "remaining_time": "0:02:55"}
{"current_steps": 400, "total_steps": 408, "loss": 0.5113, "learning_rate": 5.85986850174608e-08, "epoch": 2.9304029304029307, "percentage": 98.04, "elapsed_time": "1:05:02", "remaining_time": "0:01:18"}
{"current_steps": 408, "total_steps": 408, "epoch": 2.989010989010989, "percentage": 100.0, "elapsed_time": "1:06:16", "remaining_time": "0:00:00"}