Boffl's picture
Upload trainer_log.jsonl with huggingface_hub
c92743b verified
raw
history blame
8.57 kB
{"current_steps": 10, "total_steps": 410, "loss": 3.3584, "learning_rate": 1.0975609756097562e-05, "epoch": 0.02437538086532602, "percentage": 2.44, "elapsed_time": "0:14:01", "remaining_time": "9:21:08"}
{"current_steps": 20, "total_steps": 410, "loss": 3.1749, "learning_rate": 2.1951219512195124e-05, "epoch": 0.04875076173065204, "percentage": 4.88, "elapsed_time": "0:28:04", "remaining_time": "9:07:30"}
{"current_steps": 30, "total_steps": 410, "loss": 2.9963, "learning_rate": 3.292682926829269e-05, "epoch": 0.07312614259597806, "percentage": 7.32, "elapsed_time": "0:42:05", "remaining_time": "8:53:10"}
{"current_steps": 40, "total_steps": 410, "loss": 2.8865, "learning_rate": 4.51219512195122e-05, "epoch": 0.09750152346130408, "percentage": 9.76, "elapsed_time": "0:56:07", "remaining_time": "8:39:06"}
{"current_steps": 50, "total_steps": 410, "loss": 2.8482, "learning_rate": 4.996738892723075e-05, "epoch": 0.1218769043266301, "percentage": 12.2, "elapsed_time": "1:10:08", "remaining_time": "8:25:01"}
{"current_steps": 60, "total_steps": 410, "loss": 2.8334, "learning_rate": 4.976840705816688e-05, "epoch": 0.14625228519195613, "percentage": 14.63, "elapsed_time": "1:24:09", "remaining_time": "8:10:55"}
{"current_steps": 70, "total_steps": 410, "loss": 2.7419, "learning_rate": 4.939000027687756e-05, "epoch": 0.17062766605728213, "percentage": 17.07, "elapsed_time": "1:38:13", "remaining_time": "7:57:05"}
{"current_steps": 80, "total_steps": 410, "loss": 2.6897, "learning_rate": 4.8834909801373264e-05, "epoch": 0.19500304692260817, "percentage": 19.51, "elapsed_time": "1:52:16", "remaining_time": "7:43:08"}
{"current_steps": 90, "total_steps": 410, "loss": 2.6547, "learning_rate": 4.810715676468894e-05, "epoch": 0.21937842778793418, "percentage": 21.95, "elapsed_time": "2:06:19", "remaining_time": "7:29:11"}
{"current_steps": 100, "total_steps": 410, "loss": 2.6865, "learning_rate": 4.7212013085378824e-05, "epoch": 0.2437538086532602, "percentage": 24.39, "elapsed_time": "2:20:23", "remaining_time": "7:15:13"}
{"current_steps": 110, "total_steps": 410, "loss": 2.6123, "learning_rate": 4.615596327719111e-05, "epoch": 0.2681291895185862, "percentage": 26.83, "elapsed_time": "2:34:29", "remaining_time": "7:01:20"}
{"current_steps": 120, "total_steps": 410, "loss": 2.5791, "learning_rate": 4.507424333013069e-05, "epoch": 0.29250457038391225, "percentage": 29.27, "elapsed_time": "2:48:33", "remaining_time": "6:47:19"}
{"current_steps": 130, "total_steps": 410, "loss": 2.5722, "learning_rate": 4.373446685572683e-05, "epoch": 0.3168799512492383, "percentage": 31.71, "elapsed_time": "3:02:36", "remaining_time": "6:33:19"}
{"current_steps": 140, "total_steps": 410, "loss": 2.5763, "learning_rate": 4.225897595837744e-05, "epoch": 0.34125533211456427, "percentage": 34.15, "elapsed_time": "3:16:38", "remaining_time": "6:19:14"}
{"current_steps": 150, "total_steps": 410, "loss": 2.5901, "learning_rate": 4.0658459247330766e-05, "epoch": 0.3656307129798903, "percentage": 36.59, "elapsed_time": "3:30:41", "remaining_time": "6:05:11"}
{"current_steps": 160, "total_steps": 410, "loss": 2.5185, "learning_rate": 3.8944511031809865e-05, "epoch": 0.39000609384521634, "percentage": 39.02, "elapsed_time": "3:44:44", "remaining_time": "5:51:08"}
{"current_steps": 170, "total_steps": 410, "loss": 2.4729, "learning_rate": 3.712954733063284e-05, "epoch": 0.4143814747105424, "percentage": 41.46, "elapsed_time": "3:58:47", "remaining_time": "5:37:07"}
{"current_steps": 180, "total_steps": 410, "loss": 2.5748, "learning_rate": 3.5226715929283506e-05, "epoch": 0.43875685557586835, "percentage": 43.9, "elapsed_time": "4:12:50", "remaining_time": "5:23:04"}
{"current_steps": 190, "total_steps": 410, "loss": 2.5046, "learning_rate": 3.324980113598824e-05, "epoch": 0.4631322364411944, "percentage": 46.34, "elapsed_time": "4:26:52", "remaining_time": "5:09:01"}
{"current_steps": 200, "total_steps": 410, "loss": 2.5345, "learning_rate": 3.121312392675618e-05, "epoch": 0.4875076173065204, "percentage": 48.78, "elapsed_time": "4:40:55", "remaining_time": "4:54:58"}
{"current_steps": 210, "total_steps": 410, "loss": 2.4931, "learning_rate": 2.9131438202742124e-05, "epoch": 0.5118829981718465, "percentage": 51.22, "elapsed_time": "4:55:00", "remaining_time": "4:40:57"}
{"current_steps": 220, "total_steps": 410, "loss": 2.4892, "learning_rate": 2.7019823911454812e-05, "epoch": 0.5362583790371724, "percentage": 53.66, "elapsed_time": "5:09:02", "remaining_time": "4:26:54"}
{"current_steps": 230, "total_steps": 410, "loss": 2.5281, "learning_rate": 2.4893577806051537e-05, "epoch": 0.5606337599024985, "percentage": 56.1, "elapsed_time": "5:23:05", "remaining_time": "4:12:51"}
{"current_steps": 240, "total_steps": 410, "loss": 2.4737, "learning_rate": 2.2768102634070147e-05, "epoch": 0.5850091407678245, "percentage": 58.54, "elapsed_time": "5:37:07", "remaining_time": "3:58:47"}
{"current_steps": 250, "total_steps": 410, "loss": 2.4923, "learning_rate": 2.0658795558326743e-05, "epoch": 0.6093845216331505, "percentage": 60.98, "elapsed_time": "5:51:09", "remaining_time": "3:44:44"}
{"current_steps": 260, "total_steps": 410, "loss": 2.4491, "learning_rate": 1.8580936618269696e-05, "epoch": 0.6337599024984766, "percentage": 63.41, "elapsed_time": "6:05:12", "remaining_time": "3:30:42"}
{"current_steps": 270, "total_steps": 410, "loss": 2.5303, "learning_rate": 1.6549578039787436e-05, "epoch": 0.6581352833638026, "percentage": 65.85, "elapsed_time": "6:19:15", "remaining_time": "3:16:39"}
{"current_steps": 280, "total_steps": 410, "loss": 2.4304, "learning_rate": 1.4579435195321434e-05, "epoch": 0.6825106642291285, "percentage": 68.29, "elapsed_time": "6:33:19", "remaining_time": "3:02:36"}
{"current_steps": 290, "total_steps": 410, "loss": 2.4408, "learning_rate": 1.2684780004180414e-05, "epoch": 0.7068860450944546, "percentage": 70.73, "elapsed_time": "6:47:22", "remaining_time": "2:48:34"}
{"current_steps": 300, "total_steps": 410, "loss": 2.4091, "learning_rate": 1.0879337545275165e-05, "epoch": 0.7312614259597806, "percentage": 73.17, "elapsed_time": "7:01:25", "remaining_time": "2:34:31"}
{"current_steps": 310, "total_steps": 410, "loss": 2.3872, "learning_rate": 9.176186631221958e-06, "epoch": 0.7556368068251066, "percentage": 75.61, "elapsed_time": "7:15:30", "remaining_time": "2:20:29"}
{"current_steps": 320, "total_steps": 410, "loss": 2.4045, "learning_rate": 7.587665064066085e-06, "epoch": 0.7800121876904327, "percentage": 78.05, "elapsed_time": "7:29:33", "remaining_time": "2:06:26"}
{"current_steps": 330, "total_steps": 410, "loss": 2.4953, "learning_rate": 6.125280258962873e-06, "epoch": 0.8043875685557587, "percentage": 80.49, "elapsed_time": "7:43:35", "remaining_time": "1:52:23"}
{"current_steps": 340, "total_steps": 410, "loss": 2.3752, "learning_rate": 4.799625883267672e-06, "epoch": 0.8287629494210847, "percentage": 82.93, "elapsed_time": "7:57:38", "remaining_time": "1:38:20"}
{"current_steps": 350, "total_steps": 410, "loss": 2.3658, "learning_rate": 3.6203051149095973e-06, "epoch": 0.8531383302864107, "percentage": 85.37, "elapsed_time": "8:11:40", "remaining_time": "1:24:17"}
{"current_steps": 360, "total_steps": 410, "loss": 2.4198, "learning_rate": 2.595861075973613e-06, "epoch": 0.8775137111517367, "percentage": 87.8, "elapsed_time": "8:25:42", "remaining_time": "1:10:14"}
{"current_steps": 370, "total_steps": 410, "loss": 2.4113, "learning_rate": 1.733714945437212e-06, "epoch": 0.9018890920170628, "percentage": 90.24, "elapsed_time": "8:39:43", "remaining_time": "0:56:11"}
{"current_steps": 380, "total_steps": 410, "loss": 2.4011, "learning_rate": 1.0401121993794033e-06, "epoch": 0.9262644728823888, "percentage": 92.68, "elapsed_time": "8:53:46", "remaining_time": "0:42:08"}
{"current_steps": 390, "total_steps": 410, "loss": 2.4523, "learning_rate": 5.20077368103597e-07, "epoch": 0.9506398537477148, "percentage": 95.12, "elapsed_time": "9:07:49", "remaining_time": "0:28:05"}
{"current_steps": 400, "total_steps": 410, "loss": 2.4289, "learning_rate": 1.77377637918405e-07, "epoch": 0.9750152346130408, "percentage": 97.56, "elapsed_time": "9:21:52", "remaining_time": "0:14:02"}
{"current_steps": 410, "total_steps": 410, "loss": 2.4421, "learning_rate": 1.4495561248931145e-08, "epoch": 0.9993906154783668, "percentage": 100.0, "elapsed_time": "9:35:56", "remaining_time": "0:00:00"}
{"current_steps": 410, "total_steps": 410, "epoch": 0.9993906154783668, "percentage": 100.0, "elapsed_time": "9:35:59", "remaining_time": "0:00:00"}