Danny-Test / trainer_log.jsonl
Delta-Vector's picture
Upload folder using huggingface_hub
f8e98cd verified
raw
history blame
18.6 kB
{"current_steps": 10, "total_steps": 908, "loss": 1.4512, "learning_rate": 3.296703296703297e-07, "epoch": 0.04405286343612335, "percentage": 1.1, "elapsed_time": "0:00:44", "remaining_time": "1:06:25"}
{"current_steps": 20, "total_steps": 908, "loss": 1.4723, "learning_rate": 6.593406593406594e-07, "epoch": 0.0881057268722467, "percentage": 2.2, "elapsed_time": "0:01:27", "remaining_time": "1:04:32"}
{"current_steps": 30, "total_steps": 908, "loss": 1.3932, "learning_rate": 9.890109890109891e-07, "epoch": 0.13215859030837004, "percentage": 3.3, "elapsed_time": "0:02:10", "remaining_time": "1:03:24"}
{"current_steps": 40, "total_steps": 908, "loss": 1.3093, "learning_rate": 1.3186813186813187e-06, "epoch": 0.1762114537444934, "percentage": 4.41, "elapsed_time": "0:02:52", "remaining_time": "1:02:26"}
{"current_steps": 50, "total_steps": 908, "loss": 1.2687, "learning_rate": 1.6483516483516486e-06, "epoch": 0.22026431718061673, "percentage": 5.51, "elapsed_time": "0:03:35", "remaining_time": "1:01:34"}
{"current_steps": 60, "total_steps": 908, "loss": 1.2427, "learning_rate": 1.9780219780219782e-06, "epoch": 0.2643171806167401, "percentage": 6.61, "elapsed_time": "0:04:17", "remaining_time": "1:00:46"}
{"current_steps": 70, "total_steps": 908, "loss": 1.2286, "learning_rate": 2.307692307692308e-06, "epoch": 0.30837004405286345, "percentage": 7.71, "elapsed_time": "0:05:00", "remaining_time": "0:59:59"}
{"current_steps": 80, "total_steps": 908, "loss": 1.1827, "learning_rate": 2.6373626373626375e-06, "epoch": 0.3524229074889868, "percentage": 8.81, "elapsed_time": "0:05:43", "remaining_time": "0:59:13"}
{"current_steps": 90, "total_steps": 908, "loss": 1.1941, "learning_rate": 2.9670329670329673e-06, "epoch": 0.3964757709251101, "percentage": 9.91, "elapsed_time": "0:06:26", "remaining_time": "0:58:29"}
{"current_steps": 100, "total_steps": 908, "loss": 1.1731, "learning_rate": 2.999101829950985e-06, "epoch": 0.44052863436123346, "percentage": 11.01, "elapsed_time": "0:07:08", "remaining_time": "0:57:45"}
{"current_steps": 110, "total_steps": 908, "loss": 1.1148, "learning_rate": 2.9959984254953274e-06, "epoch": 0.4845814977973568, "percentage": 12.11, "elapsed_time": "0:07:51", "remaining_time": "0:57:01"}
{"current_steps": 120, "total_steps": 908, "loss": 1.191, "learning_rate": 2.9906832852013294e-06, "epoch": 0.5286343612334802, "percentage": 13.22, "elapsed_time": "0:08:34", "remaining_time": "0:56:17"}
{"current_steps": 130, "total_steps": 908, "loss": 1.1818, "learning_rate": 2.9831642671563205e-06, "epoch": 0.5726872246696035, "percentage": 14.32, "elapsed_time": "0:09:17", "remaining_time": "0:55:33"}
{"current_steps": 140, "total_steps": 908, "loss": 1.1969, "learning_rate": 2.9734524877367604e-06, "epoch": 0.6167400881057269, "percentage": 15.42, "elapsed_time": "0:09:59", "remaining_time": "0:54:50"}
{"current_steps": 150, "total_steps": 908, "loss": 1.1203, "learning_rate": 2.961562305173399e-06, "epoch": 0.6607929515418502, "percentage": 16.52, "elapsed_time": "0:10:42", "remaining_time": "0:54:06"}
{"current_steps": 160, "total_steps": 908, "loss": 1.2301, "learning_rate": 2.9475112983235753e-06, "epoch": 0.7048458149779736, "percentage": 17.62, "elapsed_time": "0:11:25", "remaining_time": "0:53:23"}
{"current_steps": 170, "total_steps": 908, "loss": 1.183, "learning_rate": 2.9313202406820232e-06, "epoch": 0.748898678414097, "percentage": 18.72, "elapsed_time": "0:12:07", "remaining_time": "0:52:39"}
{"current_steps": 180, "total_steps": 908, "loss": 1.1304, "learning_rate": 2.9130130696686196e-06, "epoch": 0.7929515418502202, "percentage": 19.82, "elapsed_time": "0:12:50", "remaining_time": "0:51:56"}
{"current_steps": 190, "total_steps": 908, "loss": 1.1618, "learning_rate": 2.8926168512384744e-06, "epoch": 0.8370044052863436, "percentage": 20.93, "elapsed_time": "0:13:33", "remaining_time": "0:51:13"}
{"current_steps": 200, "total_steps": 908, "loss": 1.1491, "learning_rate": 2.870161739866686e-06, "epoch": 0.8810572687224669, "percentage": 22.03, "elapsed_time": "0:14:15", "remaining_time": "0:50:30"}
{"current_steps": 210, "total_steps": 908, "loss": 1.145, "learning_rate": 2.845680933966922e-06, "epoch": 0.9251101321585903, "percentage": 23.13, "elapsed_time": "0:14:58", "remaining_time": "0:49:46"}
{"current_steps": 220, "total_steps": 908, "loss": 1.2206, "learning_rate": 2.8192106268097337e-06, "epoch": 0.9691629955947136, "percentage": 24.23, "elapsed_time": "0:15:41", "remaining_time": "0:49:03"}
{"current_steps": 230, "total_steps": 908, "loss": 1.133, "learning_rate": 2.7907899530131763e-06, "epoch": 1.013215859030837, "percentage": 25.33, "elapsed_time": "0:16:23", "remaining_time": "0:48:20"}
{"current_steps": 240, "total_steps": 908, "loss": 1.0399, "learning_rate": 2.7604609306848312e-06, "epoch": 1.0572687224669604, "percentage": 26.43, "elapsed_time": "0:17:06", "remaining_time": "0:47:37"}
{"current_steps": 250, "total_steps": 908, "loss": 1.007, "learning_rate": 2.7282683993007865e-06, "epoch": 1.1013215859030836, "percentage": 27.53, "elapsed_time": "0:17:49", "remaining_time": "0:46:54"}
{"current_steps": 260, "total_steps": 908, "loss": 1.0139, "learning_rate": 2.6942599534133987e-06, "epoch": 1.145374449339207, "percentage": 28.63, "elapsed_time": "0:18:31", "remaining_time": "0:46:11"}
{"current_steps": 270, "total_steps": 908, "loss": 1.0493, "learning_rate": 2.658485872285863e-06, "epoch": 1.1894273127753303, "percentage": 29.74, "elapsed_time": "0:19:14", "remaining_time": "0:45:28"}
{"current_steps": 280, "total_steps": 908, "loss": 0.9478, "learning_rate": 2.6209990455576105e-06, "epoch": 1.2334801762114538, "percentage": 30.84, "elapsed_time": "0:19:57", "remaining_time": "0:44:44"}
{"current_steps": 290, "total_steps": 908, "loss": 1.0108, "learning_rate": 2.5818548950504342e-06, "epoch": 1.277533039647577, "percentage": 31.94, "elapsed_time": "0:20:39", "remaining_time": "0:44:01"}
{"current_steps": 300, "total_steps": 908, "loss": 1.0294, "learning_rate": 2.541111292830951e-06, "epoch": 1.3215859030837005, "percentage": 33.04, "elapsed_time": "0:21:22", "remaining_time": "0:43:18"}
{"current_steps": 310, "total_steps": 908, "loss": 0.9748, "learning_rate": 2.4988284756505333e-06, "epoch": 1.3656387665198237, "percentage": 34.14, "elapsed_time": "0:22:04", "remaining_time": "0:42:35"}
{"current_steps": 320, "total_steps": 908, "loss": 1.0054, "learning_rate": 2.455068955889216e-06, "epoch": 1.4096916299559472, "percentage": 35.24, "elapsed_time": "0:22:47", "remaining_time": "0:41:52"}
{"current_steps": 330, "total_steps": 908, "loss": 1.0155, "learning_rate": 2.4098974291352257e-06, "epoch": 1.4537444933920705, "percentage": 36.34, "elapsed_time": "0:23:30", "remaining_time": "0:41:09"}
{"current_steps": 340, "total_steps": 908, "loss": 1.0677, "learning_rate": 2.3633806785367873e-06, "epoch": 1.497797356828194, "percentage": 37.44, "elapsed_time": "0:24:12", "remaining_time": "0:40:26"}
{"current_steps": 350, "total_steps": 908, "loss": 0.987, "learning_rate": 2.315587476067607e-06, "epoch": 1.5418502202643172, "percentage": 38.55, "elapsed_time": "0:24:55", "remaining_time": "0:39:43"}
{"current_steps": 360, "total_steps": 908, "loss": 1.0526, "learning_rate": 2.2665884808520048e-06, "epoch": 1.5859030837004404, "percentage": 39.65, "elapsed_time": "0:25:37", "remaining_time": "0:39:00"}
{"current_steps": 370, "total_steps": 908, "loss": 1.0304, "learning_rate": 2.2164561347000213e-06, "epoch": 1.6299559471365639, "percentage": 40.75, "elapsed_time": "0:26:20", "remaining_time": "0:38:17"}
{"current_steps": 380, "total_steps": 908, "loss": 0.9921, "learning_rate": 2.1652645550069394e-06, "epoch": 1.6740088105726874, "percentage": 41.85, "elapsed_time": "0:27:02", "remaining_time": "0:37:34"}
{"current_steps": 390, "total_steps": 908, "loss": 1.0062, "learning_rate": 2.113089425175561e-06, "epoch": 1.7180616740088106, "percentage": 42.95, "elapsed_time": "0:27:45", "remaining_time": "0:36:51"}
{"current_steps": 400, "total_steps": 908, "loss": 0.993, "learning_rate": 2.0600078827232473e-06, "epoch": 1.7621145374449338, "percentage": 44.05, "elapsed_time": "0:28:27", "remaining_time": "0:36:09"}
{"current_steps": 410, "total_steps": 908, "loss": 0.989, "learning_rate": 2.006098405239142e-06, "epoch": 1.8061674008810573, "percentage": 45.15, "elapsed_time": "0:29:10", "remaining_time": "0:35:26"}
{"current_steps": 420, "total_steps": 908, "loss": 1.0184, "learning_rate": 1.95144069436019e-06, "epoch": 1.8502202643171806, "percentage": 46.26, "elapsed_time": "0:29:53", "remaining_time": "0:34:43"}
{"current_steps": 430, "total_steps": 908, "loss": 1.0655, "learning_rate": 1.896115557937476e-06, "epoch": 1.894273127753304, "percentage": 47.36, "elapsed_time": "0:30:35", "remaining_time": "0:34:00"}
{"current_steps": 440, "total_steps": 908, "loss": 1.0139, "learning_rate": 1.8402047905671065e-06, "epoch": 1.9383259911894273, "percentage": 48.46, "elapsed_time": "0:31:18", "remaining_time": "0:33:17"}
{"current_steps": 450, "total_steps": 908, "loss": 1.0103, "learning_rate": 1.7837910526622437e-06, "epoch": 1.9823788546255505, "percentage": 49.56, "elapsed_time": "0:32:00", "remaining_time": "0:32:34"}
{"current_steps": 460, "total_steps": 908, "loss": 0.8977, "learning_rate": 1.726957748245093e-06, "epoch": 2.026431718061674, "percentage": 50.66, "elapsed_time": "0:32:43", "remaining_time": "0:31:52"}
{"current_steps": 470, "total_steps": 908, "loss": 0.8438, "learning_rate": 1.6697889016395088e-06, "epoch": 2.0704845814977975, "percentage": 51.76, "elapsed_time": "0:33:25", "remaining_time": "0:31:09"}
{"current_steps": 480, "total_steps": 908, "loss": 0.9008, "learning_rate": 1.6123690332465296e-06, "epoch": 2.1145374449339207, "percentage": 52.86, "elapsed_time": "0:34:08", "remaining_time": "0:30:26"}
{"current_steps": 490, "total_steps": 908, "loss": 0.8176, "learning_rate": 1.5547830345864886e-06, "epoch": 2.158590308370044, "percentage": 53.96, "elapsed_time": "0:34:50", "remaining_time": "0:29:43"}
{"current_steps": 500, "total_steps": 908, "loss": 0.8901, "learning_rate": 1.4971160427924554e-06, "epoch": 2.202643171806167, "percentage": 55.07, "elapsed_time": "0:35:33", "remaining_time": "0:29:00"}
{"current_steps": 510, "total_steps": 908, "loss": 0.8247, "learning_rate": 1.439453314740552e-06, "epoch": 2.246696035242291, "percentage": 56.17, "elapsed_time": "0:36:22", "remaining_time": "0:28:23"}
{"current_steps": 520, "total_steps": 908, "loss": 0.8294, "learning_rate": 1.381880101003235e-06, "epoch": 2.290748898678414, "percentage": 57.27, "elapsed_time": "0:37:04", "remaining_time": "0:27:40"}
{"current_steps": 530, "total_steps": 908, "loss": 0.9032, "learning_rate": 1.3244815198119024e-06, "epoch": 2.3348017621145374, "percentage": 58.37, "elapsed_time": "0:37:47", "remaining_time": "0:26:57"}
{"current_steps": 540, "total_steps": 908, "loss": 0.8862, "learning_rate": 1.2673424312151519e-06, "epoch": 2.3788546255506606, "percentage": 59.47, "elapsed_time": "0:38:29", "remaining_time": "0:26:14"}
{"current_steps": 550, "total_steps": 908, "loss": 0.894, "learning_rate": 1.2105473116187517e-06, "epoch": 2.4229074889867843, "percentage": 60.57, "elapsed_time": "0:39:12", "remaining_time": "0:25:31"}
{"current_steps": 560, "total_steps": 908, "loss": 0.8126, "learning_rate": 1.154180128892796e-06, "epoch": 2.4669603524229076, "percentage": 61.67, "elapsed_time": "0:39:54", "remaining_time": "0:24:48"}
{"current_steps": 570, "total_steps": 908, "loss": 0.8059, "learning_rate": 1.0983242182307033e-06, "epoch": 2.511013215859031, "percentage": 62.78, "elapsed_time": "0:40:37", "remaining_time": "0:24:05"}
{"current_steps": 580, "total_steps": 908, "loss": 0.8959, "learning_rate": 1.0430621589435803e-06, "epoch": 2.555066079295154, "percentage": 63.88, "elapsed_time": "0:41:20", "remaining_time": "0:23:22"}
{"current_steps": 590, "total_steps": 908, "loss": 0.8393, "learning_rate": 9.884756523721117e-07, "epoch": 2.5991189427312777, "percentage": 64.98, "elapsed_time": "0:42:02", "remaining_time": "0:22:39"}
{"current_steps": 600, "total_steps": 908, "loss": 0.862, "learning_rate": 9.346454010964724e-07, "epoch": 2.643171806167401, "percentage": 66.08, "elapsed_time": "0:42:45", "remaining_time": "0:21:56"}
{"current_steps": 610, "total_steps": 908, "loss": 0.859, "learning_rate": 8.816509896228376e-07, "epoch": 2.6872246696035242, "percentage": 67.18, "elapsed_time": "0:43:27", "remaining_time": "0:21:13"}
{"current_steps": 620, "total_steps": 908, "loss": 0.8348, "learning_rate": 8.295707667228987e-07, "epoch": 2.7312775330396475, "percentage": 68.28, "elapsed_time": "0:44:10", "remaining_time": "0:20:31"}
{"current_steps": 630, "total_steps": 908, "loss": 0.8668, "learning_rate": 7.784817296003237e-07, "epoch": 2.7753303964757707, "percentage": 69.38, "elapsed_time": "0:44:52", "remaining_time": "0:19:48"}
{"current_steps": 640, "total_steps": 908, "loss": 0.8627, "learning_rate": 7.284594100554311e-07, "epoch": 2.8193832599118944, "percentage": 70.48, "elapsed_time": "0:45:35", "remaining_time": "0:19:05"}
{"current_steps": 650, "total_steps": 908, "loss": 0.855, "learning_rate": 6.7957776281636e-07, "epoch": 2.8634361233480177, "percentage": 71.59, "elapsed_time": "0:46:17", "remaining_time": "0:18:22"}
{"current_steps": 660, "total_steps": 908, "loss": 0.8849, "learning_rate": 6.31909056201842e-07, "epoch": 2.907488986784141, "percentage": 72.69, "elapsed_time": "0:47:00", "remaining_time": "0:17:39"}
{"current_steps": 670, "total_steps": 908, "loss": 0.8629, "learning_rate": 5.855237652772183e-07, "epoch": 2.951541850220264, "percentage": 73.79, "elapsed_time": "0:47:43", "remaining_time": "0:16:57"}
{"current_steps": 680, "total_steps": 908, "loss": 0.8796, "learning_rate": 5.404904676616635e-07, "epoch": 2.995594713656388, "percentage": 74.89, "elapsed_time": "0:48:25", "remaining_time": "0:16:14"}
{"current_steps": 690, "total_steps": 908, "loss": 0.779, "learning_rate": 4.968757421406609e-07, "epoch": 3.039647577092511, "percentage": 75.99, "elapsed_time": "0:49:08", "remaining_time": "0:15:31"}
{"current_steps": 700, "total_steps": 908, "loss": 0.7582, "learning_rate": 4.547440702336238e-07, "epoch": 3.0837004405286343, "percentage": 77.09, "elapsed_time": "0:49:50", "remaining_time": "0:14:48"}
{"current_steps": 710, "total_steps": 908, "loss": 0.7063, "learning_rate": 4.1415774086218277e-07, "epoch": 3.1277533039647576, "percentage": 78.19, "elapsed_time": "0:50:33", "remaining_time": "0:14:05"}
{"current_steps": 720, "total_steps": 908, "loss": 0.752, "learning_rate": 3.7517675826009083e-07, "epoch": 3.171806167400881, "percentage": 79.3, "elapsed_time": "0:51:15", "remaining_time": "0:13:23"}
{"current_steps": 730, "total_steps": 908, "loss": 0.7829, "learning_rate": 3.378587532608872e-07, "epoch": 3.2158590308370045, "percentage": 80.4, "elapsed_time": "0:51:58", "remaining_time": "0:12:40"}
{"current_steps": 740, "total_steps": 908, "loss": 0.72, "learning_rate": 3.0225889809447925e-07, "epoch": 3.2599118942731278, "percentage": 81.5, "elapsed_time": "0:52:41", "remaining_time": "0:11:57"}
{"current_steps": 750, "total_steps": 908, "loss": 0.7852, "learning_rate": 2.684298248186077e-07, "epoch": 3.303964757709251, "percentage": 82.6, "elapsed_time": "0:53:23", "remaining_time": "0:11:14"}
{"current_steps": 760, "total_steps": 908, "loss": 0.7912, "learning_rate": 2.3642154750579275e-07, "epoch": 3.3480176211453743, "percentage": 83.7, "elapsed_time": "0:54:06", "remaining_time": "0:10:32"}
{"current_steps": 770, "total_steps": 908, "loss": 0.7456, "learning_rate": 2.0628138830079696e-07, "epoch": 3.392070484581498, "percentage": 84.8, "elapsed_time": "0:54:48", "remaining_time": "0:09:49"}
{"current_steps": 780, "total_steps": 908, "loss": 0.7654, "learning_rate": 1.7805390745792993e-07, "epoch": 3.436123348017621, "percentage": 85.9, "elapsed_time": "0:55:31", "remaining_time": "0:09:06"}
{"current_steps": 790, "total_steps": 908, "loss": 0.7437, "learning_rate": 1.5178083746162667e-07, "epoch": 3.4801762114537445, "percentage": 87.0, "elapsed_time": "0:56:13", "remaining_time": "0:08:23"}
{"current_steps": 800, "total_steps": 908, "loss": 0.7834, "learning_rate": 1.2750102132769738e-07, "epoch": 3.5242290748898677, "percentage": 88.11, "elapsed_time": "0:56:56", "remaining_time": "0:07:41"}
{"current_steps": 810, "total_steps": 908, "loss": 0.7943, "learning_rate": 1.0525035517647014e-07, "epoch": 3.568281938325991, "percentage": 89.21, "elapsed_time": "0:57:39", "remaining_time": "0:06:58"}
{"current_steps": 820, "total_steps": 908, "loss": 0.7826, "learning_rate": 8.50617351627232e-08, "epoch": 3.6123348017621146, "percentage": 90.31, "elapsed_time": "0:58:21", "remaining_time": "0:06:15"}
{"current_steps": 830, "total_steps": 908, "loss": 0.8379, "learning_rate": 6.696500884087259e-08, "epoch": 3.656387665198238, "percentage": 91.41, "elapsed_time": "0:59:04", "remaining_time": "0:05:33"}
{"current_steps": 840, "total_steps": 908, "loss": 0.7614, "learning_rate": 5.0986931037314666e-08, "epoch": 3.700440528634361, "percentage": 92.51, "elapsed_time": "0:59:46", "remaining_time": "0:04:50"}
{"current_steps": 850, "total_steps": 908, "loss": 0.8152, "learning_rate": 3.7151124295163374e-08, "epoch": 3.744493392070485, "percentage": 93.61, "elapsed_time": "1:00:29", "remaining_time": "0:04:07"}
{"current_steps": 860, "total_steps": 908, "loss": 0.7517, "learning_rate": 2.5478043949868192e-08, "epoch": 3.788546255506608, "percentage": 94.71, "elapsed_time": "1:01:12", "remaining_time": "0:03:24"}
{"current_steps": 870, "total_steps": 908, "loss": 0.7697, "learning_rate": 1.5984947887334623e-08, "epoch": 3.8325991189427313, "percentage": 95.81, "elapsed_time": "1:01:54", "remaining_time": "0:02:42"}
{"current_steps": 880, "total_steps": 908, "loss": 0.7506, "learning_rate": 8.685871029272318e-09, "epoch": 3.8766519823788546, "percentage": 96.92, "elapsed_time": "1:02:37", "remaining_time": "0:01:59"}
{"current_steps": 890, "total_steps": 908, "loss": 0.7273, "learning_rate": 3.5916045834781253e-09, "epoch": 3.920704845814978, "percentage": 98.02, "elapsed_time": "1:03:19", "remaining_time": "0:01:16"}
{"current_steps": 900, "total_steps": 908, "loss": 0.8123, "learning_rate": 7.096800897425371e-10, "epoch": 3.964757709251101, "percentage": 99.12, "elapsed_time": "1:04:02", "remaining_time": "0:00:34"}
{"current_steps": 908, "total_steps": 908, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "1:04:42", "remaining_time": "0:00:00"}