diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,14368 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 29.885057471264368, + "global_step": 20800, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.01, + "learning_rate": 4.8e-06, + "loss": 24.5479, + "step": 10 + }, + { + "epoch": 0.03, + "learning_rate": 1.0799999999999998e-05, + "loss": 24.3336, + "step": 20 + }, + { + "epoch": 0.04, + "learning_rate": 1.68e-05, + "loss": 23.7501, + "step": 30 + }, + { + "epoch": 0.06, + "learning_rate": 2.28e-05, + "loss": 22.2394, + "step": 40 + }, + { + "epoch": 0.07, + "learning_rate": 2.88e-05, + "loss": 22.1365, + "step": 50 + }, + { + "epoch": 0.09, + "learning_rate": 3.42e-05, + "loss": 20.337, + "step": 60 + }, + { + "epoch": 0.1, + "learning_rate": 4.02e-05, + "loss": 19.8122, + "step": 70 + }, + { + "epoch": 0.11, + "learning_rate": 4.62e-05, + "loss": 19.0623, + "step": 80 + }, + { + "epoch": 0.13, + "learning_rate": 5.2199999999999995e-05, + "loss": 16.9603, + "step": 90 + }, + { + "epoch": 0.14, + "learning_rate": 5.82e-05, + "loss": 15.8856, + "step": 100 + }, + { + "epoch": 0.14, + "eval_loss": 15.38314151763916, + "eval_runtime": 39.1757, + "eval_samples_per_second": 11.665, + "eval_steps_per_second": 1.481, + "eval_wer": 1.0, + "step": 100 + }, + { + "epoch": 0.16, + "learning_rate": 6.419999999999999e-05, + "loss": 14.1248, + "step": 110 + }, + { + "epoch": 0.17, + "learning_rate": 7.02e-05, + "loss": 12.634, + "step": 120 + }, + { + "epoch": 0.19, + "learning_rate": 7.62e-05, + "loss": 10.9827, + "step": 130 + }, + { + "epoch": 0.2, + "learning_rate": 8.22e-05, + "loss": 9.6156, + "step": 140 + }, + { + "epoch": 0.22, + "learning_rate": 8.819999999999999e-05, + "loss": 8.3307, + "step": 150 + }, + { + "epoch": 0.23, + "learning_rate": 9.419999999999999e-05, + "loss": 7.1401, + "step": 160 + }, + { + "epoch": 0.24, + "learning_rate": 0.0001002, + "loss": 6.2121, + "step": 170 + }, + { + "epoch": 0.26, + "learning_rate": 0.00010619999999999998, + "loss": 5.5431, + "step": 180 + }, + { + "epoch": 0.27, + "learning_rate": 0.00011219999999999999, + "loss": 5.1547, + "step": 190 + }, + { + "epoch": 0.29, + "learning_rate": 0.0001182, + "loss": 4.9694, + "step": 200 + }, + { + "epoch": 0.29, + "eval_loss": 4.939667701721191, + "eval_runtime": 39.3067, + "eval_samples_per_second": 11.627, + "eval_steps_per_second": 1.476, + "eval_wer": 1.0, + "step": 200 + }, + { + "epoch": 0.3, + "learning_rate": 0.00012419999999999998, + "loss": 4.8874, + "step": 210 + }, + { + "epoch": 0.32, + "learning_rate": 0.0001302, + "loss": 4.8633, + "step": 220 + }, + { + "epoch": 0.33, + "learning_rate": 0.0001362, + "loss": 4.8666, + "step": 230 + }, + { + "epoch": 0.34, + "learning_rate": 0.0001422, + "loss": 4.8345, + "step": 240 + }, + { + "epoch": 0.36, + "learning_rate": 0.0001482, + "loss": 4.8414, + "step": 250 + }, + { + "epoch": 0.37, + "learning_rate": 0.00015419999999999998, + "loss": 4.8116, + "step": 260 + }, + { + "epoch": 0.39, + "learning_rate": 0.0001602, + "loss": 4.7888, + "step": 270 + }, + { + "epoch": 0.4, + "learning_rate": 0.0001662, + "loss": 4.7886, + "step": 280 + }, + { + "epoch": 0.42, + "learning_rate": 0.00017219999999999998, + "loss": 4.7816, + "step": 290 + }, + { + "epoch": 0.43, + "learning_rate": 0.00017819999999999997, + "loss": 4.8183, + "step": 300 + }, + { + "epoch": 0.43, + "eval_loss": 4.77665901184082, + "eval_runtime": 39.6162, + "eval_samples_per_second": 11.536, + "eval_steps_per_second": 1.464, + "eval_wer": 1.0, + "step": 300 + }, + { + "epoch": 0.45, + "learning_rate": 0.00018419999999999998, + "loss": 4.7999, + "step": 310 + }, + { + "epoch": 0.46, + "learning_rate": 0.0001902, + "loss": 4.7751, + "step": 320 + }, + { + "epoch": 0.47, + "learning_rate": 0.0001962, + "loss": 4.7608, + "step": 330 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002022, + "loss": 4.743, + "step": 340 + }, + { + "epoch": 0.5, + "learning_rate": 0.00020819999999999996, + "loss": 4.7291, + "step": 350 + }, + { + "epoch": 0.52, + "learning_rate": 0.00021419999999999998, + "loss": 4.7118, + "step": 360 + }, + { + "epoch": 0.53, + "learning_rate": 0.00022019999999999999, + "loss": 4.7286, + "step": 370 + }, + { + "epoch": 0.55, + "learning_rate": 0.00022619999999999997, + "loss": 4.715, + "step": 380 + }, + { + "epoch": 0.56, + "learning_rate": 0.00023219999999999998, + "loss": 4.709, + "step": 390 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002382, + "loss": 4.683, + "step": 400 + }, + { + "epoch": 0.57, + "eval_loss": 4.713740348815918, + "eval_runtime": 39.3947, + "eval_samples_per_second": 11.601, + "eval_steps_per_second": 1.472, + "eval_wer": 1.0, + "step": 400 + }, + { + "epoch": 0.59, + "learning_rate": 0.00024419999999999997, + "loss": 4.7096, + "step": 410 + }, + { + "epoch": 0.6, + "learning_rate": 0.00025019999999999996, + "loss": 4.7024, + "step": 420 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002562, + "loss": 4.7074, + "step": 430 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002622, + "loss": 4.7047, + "step": 440 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026819999999999996, + "loss": 4.6906, + "step": 450 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002742, + "loss": 4.6973, + "step": 460 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002802, + "loss": 4.6773, + "step": 470 + }, + { + "epoch": 0.69, + "learning_rate": 0.00028619999999999996, + "loss": 4.6905, + "step": 480 + }, + { + "epoch": 0.7, + "learning_rate": 0.00029219999999999995, + "loss": 4.6664, + "step": 490 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002982, + "loss": 4.6742, + "step": 500 + }, + { + "epoch": 0.72, + "eval_loss": 4.695952415466309, + "eval_runtime": 39.4463, + "eval_samples_per_second": 11.585, + "eval_steps_per_second": 1.47, + "eval_wer": 1.0, + "step": 500 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002998969578017664, + "loss": 4.7007, + "step": 510 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002997497546614327, + "loss": 4.6779, + "step": 520 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002996025515210991, + "loss": 4.6749, + "step": 530 + }, + { + "epoch": 0.78, + "learning_rate": 0.00029945534838076544, + "loss": 4.6655, + "step": 540 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002993081452404318, + "loss": 4.6543, + "step": 550 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002991609421000981, + "loss": 4.6716, + "step": 560 + }, + { + "epoch": 0.82, + "learning_rate": 0.00029901373895976446, + "loss": 4.6725, + "step": 570 + }, + { + "epoch": 0.83, + "learning_rate": 0.00029886653581943077, + "loss": 4.6846, + "step": 580 + }, + { + "epoch": 0.85, + "learning_rate": 0.00029871933267909713, + "loss": 4.6431, + "step": 590 + }, + { + "epoch": 0.86, + "learning_rate": 0.00029857212953876344, + "loss": 4.6485, + "step": 600 + }, + { + "epoch": 0.86, + "eval_loss": 4.668909072875977, + "eval_runtime": 39.3362, + "eval_samples_per_second": 11.618, + "eval_steps_per_second": 1.474, + "eval_wer": 1.0, + "step": 600 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002984249263984298, + "loss": 4.6752, + "step": 610 + }, + { + "epoch": 0.89, + "learning_rate": 0.00029827772325809616, + "loss": 4.6491, + "step": 620 + }, + { + "epoch": 0.91, + "learning_rate": 0.00029813052011776246, + "loss": 4.6515, + "step": 630 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002979833169774288, + "loss": 4.6491, + "step": 640 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002978361138370952, + "loss": 4.6027, + "step": 650 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002976889106967615, + "loss": 4.6736, + "step": 660 + }, + { + "epoch": 0.96, + "learning_rate": 0.00029754170755642785, + "loss": 4.6461, + "step": 670 + }, + { + "epoch": 0.98, + "learning_rate": 0.00029739450441609416, + "loss": 4.6184, + "step": 680 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002972473012757605, + "loss": 4.6395, + "step": 690 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002971000981354269, + "loss": 4.6174, + "step": 700 + }, + { + "epoch": 1.01, + "eval_loss": 4.663065433502197, + "eval_runtime": 39.4396, + "eval_samples_per_second": 11.587, + "eval_steps_per_second": 1.471, + "eval_wer": 0.9998494202680319, + "step": 700 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002969528949950932, + "loss": 4.6355, + "step": 710 + }, + { + "epoch": 1.03, + "learning_rate": 0.00029680569185475955, + "loss": 4.611, + "step": 720 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002966584887144259, + "loss": 4.6402, + "step": 730 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002965112855740922, + "loss": 4.6334, + "step": 740 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002963640824337586, + "loss": 4.6247, + "step": 750 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002962168792934249, + "loss": 4.6173, + "step": 760 + }, + { + "epoch": 1.11, + "learning_rate": 0.00029606967615309124, + "loss": 4.5934, + "step": 770 + }, + { + "epoch": 1.12, + "learning_rate": 0.00029592247301275755, + "loss": 4.6392, + "step": 780 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002957752698724239, + "loss": 4.5958, + "step": 790 + }, + { + "epoch": 1.15, + "learning_rate": 0.00029562806673209027, + "loss": 4.5931, + "step": 800 + }, + { + "epoch": 1.15, + "eval_loss": 4.590127944946289, + "eval_runtime": 39.464, + "eval_samples_per_second": 11.58, + "eval_steps_per_second": 1.47, + "eval_wer": 0.9968378256286704, + "step": 800 + }, + { + "epoch": 1.16, + "learning_rate": 0.00029548086359175663, + "loss": 4.5797, + "step": 810 + }, + { + "epoch": 1.18, + "learning_rate": 0.00029533366045142293, + "loss": 4.5442, + "step": 820 + }, + { + "epoch": 1.19, + "learning_rate": 0.0002951864573110893, + "loss": 4.5553, + "step": 830 + }, + { + "epoch": 1.21, + "learning_rate": 0.0002950392541707556, + "loss": 4.5279, + "step": 840 + }, + { + "epoch": 1.22, + "learning_rate": 0.00029489205103042196, + "loss": 4.5188, + "step": 850 + }, + { + "epoch": 1.24, + "learning_rate": 0.00029474484789008827, + "loss": 4.5404, + "step": 860 + }, + { + "epoch": 1.25, + "learning_rate": 0.00029459764474975463, + "loss": 4.5379, + "step": 870 + }, + { + "epoch": 1.26, + "learning_rate": 0.000294450441609421, + "loss": 4.4347, + "step": 880 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002943032384690873, + "loss": 4.4093, + "step": 890 + }, + { + "epoch": 1.29, + "learning_rate": 0.00029415603532875366, + "loss": 4.3427, + "step": 900 + }, + { + "epoch": 1.29, + "eval_loss": 4.386187553405762, + "eval_runtime": 39.5926, + "eval_samples_per_second": 11.543, + "eval_steps_per_second": 1.465, + "eval_wer": 1.0, + "step": 900 + }, + { + "epoch": 1.31, + "learning_rate": 0.00029400883218842, + "loss": 4.28, + "step": 910 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002938616290480863, + "loss": 4.1754, + "step": 920 + }, + { + "epoch": 1.34, + "learning_rate": 0.0002937144259077527, + "loss": 4.0524, + "step": 930 + }, + { + "epoch": 1.35, + "learning_rate": 0.000293567222767419, + "loss": 3.8665, + "step": 940 + }, + { + "epoch": 1.36, + "learning_rate": 0.00029342001962708535, + "loss": 3.786, + "step": 950 + }, + { + "epoch": 1.38, + "learning_rate": 0.0002932728164867517, + "loss": 3.4787, + "step": 960 + }, + { + "epoch": 1.39, + "learning_rate": 0.000293125613346418, + "loss": 3.2242, + "step": 970 + }, + { + "epoch": 1.41, + "learning_rate": 0.0002929784102060844, + "loss": 2.9959, + "step": 980 + }, + { + "epoch": 1.42, + "learning_rate": 0.00029283120706575074, + "loss": 2.8204, + "step": 990 + }, + { + "epoch": 1.44, + "learning_rate": 0.00029268400392541704, + "loss": 2.6594, + "step": 1000 + }, + { + "epoch": 1.44, + "eval_loss": 2.4058356285095215, + "eval_runtime": 39.9286, + "eval_samples_per_second": 11.445, + "eval_steps_per_second": 1.453, + "eval_wer": 0.9799728956482457, + "step": 1000 + }, + { + "epoch": 1.45, + "learning_rate": 0.0002925368007850834, + "loss": 2.527, + "step": 1010 + }, + { + "epoch": 1.47, + "learning_rate": 0.0002923895976447497, + "loss": 2.371, + "step": 1020 + }, + { + "epoch": 1.48, + "learning_rate": 0.00029224239450441607, + "loss": 2.271, + "step": 1030 + }, + { + "epoch": 1.49, + "learning_rate": 0.0002920951913640824, + "loss": 2.185, + "step": 1040 + }, + { + "epoch": 1.51, + "learning_rate": 0.00029194798822374874, + "loss": 2.167, + "step": 1050 + }, + { + "epoch": 1.52, + "learning_rate": 0.0002918007850834151, + "loss": 2.0004, + "step": 1060 + }, + { + "epoch": 1.54, + "learning_rate": 0.00029165358194308146, + "loss": 1.9067, + "step": 1070 + }, + { + "epoch": 1.55, + "learning_rate": 0.00029150637880274777, + "loss": 1.8721, + "step": 1080 + }, + { + "epoch": 1.57, + "learning_rate": 0.0002913591756624141, + "loss": 1.7606, + "step": 1090 + }, + { + "epoch": 1.58, + "learning_rate": 0.00029121197252208043, + "loss": 1.729, + "step": 1100 + }, + { + "epoch": 1.58, + "eval_loss": 1.5358420610427856, + "eval_runtime": 39.5025, + "eval_samples_per_second": 11.569, + "eval_steps_per_second": 1.468, + "eval_wer": 0.8920343321788887, + "step": 1100 + }, + { + "epoch": 1.59, + "learning_rate": 0.0002910647693817468, + "loss": 1.621, + "step": 1110 + }, + { + "epoch": 1.61, + "learning_rate": 0.0002909175662414131, + "loss": 1.6394, + "step": 1120 + }, + { + "epoch": 1.62, + "learning_rate": 0.00029077036310107946, + "loss": 1.626, + "step": 1130 + }, + { + "epoch": 1.64, + "learning_rate": 0.0002906231599607458, + "loss": 1.5561, + "step": 1140 + }, + { + "epoch": 1.65, + "learning_rate": 0.0002904759568204122, + "loss": 1.5221, + "step": 1150 + }, + { + "epoch": 1.67, + "learning_rate": 0.0002903287536800785, + "loss": 1.4047, + "step": 1160 + }, + { + "epoch": 1.68, + "learning_rate": 0.00029018155053974485, + "loss": 1.4521, + "step": 1170 + }, + { + "epoch": 1.7, + "learning_rate": 0.00029003434739941115, + "loss": 1.3526, + "step": 1180 + }, + { + "epoch": 1.71, + "learning_rate": 0.00028988714425907746, + "loss": 1.2765, + "step": 1190 + }, + { + "epoch": 1.72, + "learning_rate": 0.0002897399411187438, + "loss": 1.3998, + "step": 1200 + }, + { + "epoch": 1.72, + "eval_loss": 1.1598572731018066, + "eval_runtime": 39.5369, + "eval_samples_per_second": 11.559, + "eval_steps_per_second": 1.467, + "eval_wer": 0.8021382321939466, + "step": 1200 + }, + { + "epoch": 1.74, + "learning_rate": 0.0002895927379784102, + "loss": 1.2611, + "step": 1210 + }, + { + "epoch": 1.75, + "learning_rate": 0.00028944553483807654, + "loss": 1.2765, + "step": 1220 + }, + { + "epoch": 1.77, + "learning_rate": 0.00028929833169774285, + "loss": 1.1803, + "step": 1230 + }, + { + "epoch": 1.78, + "learning_rate": 0.0002891511285574092, + "loss": 1.2348, + "step": 1240 + }, + { + "epoch": 1.8, + "learning_rate": 0.00028900392541707557, + "loss": 1.1927, + "step": 1250 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002888567222767419, + "loss": 1.141, + "step": 1260 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002887095191364082, + "loss": 1.2261, + "step": 1270 + }, + { + "epoch": 1.84, + "learning_rate": 0.00028856231599607454, + "loss": 1.1062, + "step": 1280 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002884151128557409, + "loss": 1.095, + "step": 1290 + }, + { + "epoch": 1.87, + "learning_rate": 0.00028826790971540726, + "loss": 1.1236, + "step": 1300 + }, + { + "epoch": 1.87, + "eval_loss": 0.9830673336982727, + "eval_runtime": 39.4178, + "eval_samples_per_second": 11.594, + "eval_steps_per_second": 1.471, + "eval_wer": 0.7566631531395874, + "step": 1300 + }, + { + "epoch": 1.88, + "learning_rate": 0.00028812070657507357, + "loss": 1.0961, + "step": 1310 + }, + { + "epoch": 1.9, + "learning_rate": 0.00028797350343473993, + "loss": 1.09, + "step": 1320 + }, + { + "epoch": 1.91, + "learning_rate": 0.0002878263002944063, + "loss": 1.0263, + "step": 1330 + }, + { + "epoch": 1.93, + "learning_rate": 0.0002876790971540726, + "loss": 1.0797, + "step": 1340 + }, + { + "epoch": 1.94, + "learning_rate": 0.0002875318940137389, + "loss": 1.0631, + "step": 1350 + }, + { + "epoch": 1.95, + "learning_rate": 0.00028738469087340526, + "loss": 0.9842, + "step": 1360 + }, + { + "epoch": 1.97, + "learning_rate": 0.0002872374877330716, + "loss": 1.129, + "step": 1370 + }, + { + "epoch": 1.98, + "learning_rate": 0.00028709028459273793, + "loss": 0.9745, + "step": 1380 + }, + { + "epoch": 2.0, + "learning_rate": 0.0002869430814524043, + "loss": 0.9876, + "step": 1390 + }, + { + "epoch": 2.01, + "learning_rate": 0.00028679587831207065, + "loss": 1.0142, + "step": 1400 + }, + { + "epoch": 2.01, + "eval_loss": 0.8522623181343079, + "eval_runtime": 39.9987, + "eval_samples_per_second": 11.425, + "eval_steps_per_second": 1.45, + "eval_wer": 0.6712844451136877, + "step": 1400 + }, + { + "epoch": 2.03, + "learning_rate": 0.000286648675171737, + "loss": 0.9384, + "step": 1410 + }, + { + "epoch": 2.04, + "learning_rate": 0.0002865014720314033, + "loss": 0.9115, + "step": 1420 + }, + { + "epoch": 2.05, + "learning_rate": 0.0002863542688910696, + "loss": 0.9601, + "step": 1430 + }, + { + "epoch": 2.07, + "learning_rate": 0.000286207065750736, + "loss": 0.9199, + "step": 1440 + }, + { + "epoch": 2.08, + "learning_rate": 0.00028605986261040234, + "loss": 0.9359, + "step": 1450 + }, + { + "epoch": 2.1, + "learning_rate": 0.00028591265947006865, + "loss": 0.9353, + "step": 1460 + }, + { + "epoch": 2.11, + "learning_rate": 0.000285765456329735, + "loss": 0.8925, + "step": 1470 + }, + { + "epoch": 2.13, + "learning_rate": 0.00028561825318940137, + "loss": 0.9429, + "step": 1480 + }, + { + "epoch": 2.14, + "learning_rate": 0.0002854710500490677, + "loss": 0.8772, + "step": 1490 + }, + { + "epoch": 2.16, + "learning_rate": 0.00028532384690873404, + "loss": 0.9132, + "step": 1500 + }, + { + "epoch": 2.16, + "eval_loss": 0.802708089351654, + "eval_runtime": 39.7319, + "eval_samples_per_second": 11.502, + "eval_steps_per_second": 1.46, + "eval_wer": 0.6539677759373589, + "step": 1500 + }, + { + "epoch": 2.17, + "learning_rate": 0.00028517664376840035, + "loss": 0.8947, + "step": 1510 + }, + { + "epoch": 2.18, + "learning_rate": 0.0002850294406280667, + "loss": 0.8716, + "step": 1520 + }, + { + "epoch": 2.2, + "learning_rate": 0.000284882237487733, + "loss": 0.8453, + "step": 1530 + }, + { + "epoch": 2.21, + "learning_rate": 0.00028473503434739937, + "loss": 0.8724, + "step": 1540 + }, + { + "epoch": 2.23, + "learning_rate": 0.00028458783120706573, + "loss": 0.835, + "step": 1550 + }, + { + "epoch": 2.24, + "learning_rate": 0.0002844406280667321, + "loss": 0.8617, + "step": 1560 + }, + { + "epoch": 2.26, + "learning_rate": 0.0002842934249263984, + "loss": 0.8362, + "step": 1570 + }, + { + "epoch": 2.27, + "learning_rate": 0.00028414622178606476, + "loss": 0.7738, + "step": 1580 + }, + { + "epoch": 2.28, + "learning_rate": 0.00028399901864573107, + "loss": 0.8412, + "step": 1590 + }, + { + "epoch": 2.3, + "learning_rate": 0.0002838518155053974, + "loss": 0.8157, + "step": 1600 + }, + { + "epoch": 2.3, + "eval_loss": 0.7228513956069946, + "eval_runtime": 39.6806, + "eval_samples_per_second": 11.517, + "eval_steps_per_second": 1.462, + "eval_wer": 0.6179792199969885, + "step": 1600 + }, + { + "epoch": 2.31, + "learning_rate": 0.00028370461236506373, + "loss": 0.7675, + "step": 1610 + }, + { + "epoch": 2.33, + "learning_rate": 0.0002835574092247301, + "loss": 0.8323, + "step": 1620 + }, + { + "epoch": 2.34, + "learning_rate": 0.00028341020608439645, + "loss": 0.784, + "step": 1630 + }, + { + "epoch": 2.36, + "learning_rate": 0.00028326300294406276, + "loss": 0.782, + "step": 1640 + }, + { + "epoch": 2.37, + "learning_rate": 0.0002831157998037291, + "loss": 0.7919, + "step": 1650 + }, + { + "epoch": 2.39, + "learning_rate": 0.0002829685966633955, + "loss": 0.7782, + "step": 1660 + }, + { + "epoch": 2.4, + "learning_rate": 0.0002828213935230618, + "loss": 0.8246, + "step": 1670 + }, + { + "epoch": 2.41, + "learning_rate": 0.00028267419038272815, + "loss": 0.7631, + "step": 1680 + }, + { + "epoch": 2.43, + "learning_rate": 0.00028252698724239445, + "loss": 0.7991, + "step": 1690 + }, + { + "epoch": 2.44, + "learning_rate": 0.0002823797841020608, + "loss": 0.8154, + "step": 1700 + }, + { + "epoch": 2.44, + "eval_loss": 0.6884952783584595, + "eval_runtime": 39.9781, + "eval_samples_per_second": 11.431, + "eval_steps_per_second": 1.451, + "eval_wer": 0.6060834211715103, + "step": 1700 + }, + { + "epoch": 2.46, + "learning_rate": 0.0002822325809617272, + "loss": 0.7625, + "step": 1710 + }, + { + "epoch": 2.47, + "learning_rate": 0.0002820853778213935, + "loss": 0.7888, + "step": 1720 + }, + { + "epoch": 2.49, + "learning_rate": 0.00028193817468105984, + "loss": 0.7091, + "step": 1730 + }, + { + "epoch": 2.5, + "learning_rate": 0.0002817909715407262, + "loss": 0.7846, + "step": 1740 + }, + { + "epoch": 2.51, + "learning_rate": 0.0002816437684003925, + "loss": 0.7651, + "step": 1750 + }, + { + "epoch": 2.53, + "learning_rate": 0.00028149656526005887, + "loss": 0.6977, + "step": 1760 + }, + { + "epoch": 2.54, + "learning_rate": 0.0002813493621197252, + "loss": 0.7321, + "step": 1770 + }, + { + "epoch": 2.56, + "learning_rate": 0.00028120215897939154, + "loss": 0.6753, + "step": 1780 + }, + { + "epoch": 2.57, + "learning_rate": 0.00028105495583905784, + "loss": 0.7269, + "step": 1790 + }, + { + "epoch": 2.59, + "learning_rate": 0.0002809077526987242, + "loss": 0.7424, + "step": 1800 + }, + { + "epoch": 2.59, + "eval_loss": 0.6070171594619751, + "eval_runtime": 39.745, + "eval_samples_per_second": 11.498, + "eval_steps_per_second": 1.459, + "eval_wer": 0.5691913868393315, + "step": 1800 + }, + { + "epoch": 2.6, + "learning_rate": 0.00028076054955839056, + "loss": 0.6781, + "step": 1810 + }, + { + "epoch": 2.61, + "learning_rate": 0.0002806133464180569, + "loss": 0.7446, + "step": 1820 + }, + { + "epoch": 2.63, + "learning_rate": 0.00028046614327772323, + "loss": 0.7286, + "step": 1830 + }, + { + "epoch": 2.64, + "learning_rate": 0.0002803189401373896, + "loss": 0.707, + "step": 1840 + }, + { + "epoch": 2.66, + "learning_rate": 0.0002801717369970559, + "loss": 0.7032, + "step": 1850 + }, + { + "epoch": 2.67, + "learning_rate": 0.00028002453385672226, + "loss": 0.7005, + "step": 1860 + }, + { + "epoch": 2.69, + "learning_rate": 0.00027987733071638856, + "loss": 0.6833, + "step": 1870 + }, + { + "epoch": 2.7, + "learning_rate": 0.0002797301275760549, + "loss": 0.6812, + "step": 1880 + }, + { + "epoch": 2.72, + "learning_rate": 0.0002795829244357213, + "loss": 0.6614, + "step": 1890 + }, + { + "epoch": 2.73, + "learning_rate": 0.00027943572129538765, + "loss": 0.6949, + "step": 1900 + }, + { + "epoch": 2.73, + "eval_loss": 0.5801286697387695, + "eval_runtime": 39.6689, + "eval_samples_per_second": 11.52, + "eval_steps_per_second": 1.462, + "eval_wer": 0.5460021081162475, + "step": 1900 + }, + { + "epoch": 2.74, + "learning_rate": 0.00027928851815505395, + "loss": 0.676, + "step": 1910 + }, + { + "epoch": 2.76, + "learning_rate": 0.0002791413150147203, + "loss": 0.7185, + "step": 1920 + }, + { + "epoch": 2.77, + "learning_rate": 0.0002789941118743866, + "loss": 0.6175, + "step": 1930 + }, + { + "epoch": 2.79, + "learning_rate": 0.000278846908734053, + "loss": 0.6519, + "step": 1940 + }, + { + "epoch": 2.8, + "learning_rate": 0.0002786997055937193, + "loss": 0.662, + "step": 1950 + }, + { + "epoch": 2.82, + "learning_rate": 0.00027855250245338565, + "loss": 0.6317, + "step": 1960 + }, + { + "epoch": 2.83, + "learning_rate": 0.000278405299313052, + "loss": 0.6532, + "step": 1970 + }, + { + "epoch": 2.84, + "learning_rate": 0.0002782580961727183, + "loss": 0.6097, + "step": 1980 + }, + { + "epoch": 2.86, + "learning_rate": 0.0002781108930323847, + "loss": 0.6441, + "step": 1990 + }, + { + "epoch": 2.87, + "learning_rate": 0.00027796368989205103, + "loss": 0.6748, + "step": 2000 + }, + { + "epoch": 2.87, + "eval_loss": 0.5619427561759949, + "eval_runtime": 39.9278, + "eval_samples_per_second": 11.446, + "eval_steps_per_second": 1.453, + "eval_wer": 0.5387742809817798, + "step": 2000 + }, + { + "epoch": 2.89, + "learning_rate": 0.00027781648675171734, + "loss": 0.6749, + "step": 2010 + }, + { + "epoch": 2.9, + "learning_rate": 0.0002776692836113837, + "loss": 0.6225, + "step": 2020 + }, + { + "epoch": 2.92, + "learning_rate": 0.00027752208047105, + "loss": 0.592, + "step": 2030 + }, + { + "epoch": 2.93, + "learning_rate": 0.00027737487733071637, + "loss": 0.6007, + "step": 2040 + }, + { + "epoch": 2.95, + "learning_rate": 0.00027722767419038273, + "loss": 0.6488, + "step": 2050 + }, + { + "epoch": 2.96, + "learning_rate": 0.00027708047105004903, + "loss": 0.6334, + "step": 2060 + }, + { + "epoch": 2.97, + "learning_rate": 0.0002769332679097154, + "loss": 0.6266, + "step": 2070 + }, + { + "epoch": 2.99, + "learning_rate": 0.00027678606476938175, + "loss": 0.5994, + "step": 2080 + }, + { + "epoch": 3.0, + "learning_rate": 0.00027663886162904806, + "loss": 0.6151, + "step": 2090 + }, + { + "epoch": 3.02, + "learning_rate": 0.0002764916584887144, + "loss": 0.5569, + "step": 2100 + }, + { + "epoch": 3.02, + "eval_loss": 0.5206429958343506, + "eval_runtime": 39.8569, + "eval_samples_per_second": 11.466, + "eval_steps_per_second": 1.455, + "eval_wer": 0.5130251468152387, + "step": 2100 + }, + { + "epoch": 3.03, + "learning_rate": 0.00027634445534838073, + "loss": 0.5417, + "step": 2110 + }, + { + "epoch": 3.05, + "learning_rate": 0.0002761972522080471, + "loss": 0.6448, + "step": 2120 + }, + { + "epoch": 3.06, + "learning_rate": 0.0002760500490677134, + "loss": 0.5474, + "step": 2130 + }, + { + "epoch": 3.07, + "learning_rate": 0.00027590284592737976, + "loss": 0.5912, + "step": 2140 + }, + { + "epoch": 3.09, + "learning_rate": 0.0002757556427870461, + "loss": 0.5482, + "step": 2150 + }, + { + "epoch": 3.1, + "learning_rate": 0.0002756084396467125, + "loss": 0.5619, + "step": 2160 + }, + { + "epoch": 3.12, + "learning_rate": 0.0002754612365063788, + "loss": 0.581, + "step": 2170 + }, + { + "epoch": 3.13, + "learning_rate": 0.00027531403336604514, + "loss": 0.5275, + "step": 2180 + }, + { + "epoch": 3.15, + "learning_rate": 0.00027516683022571145, + "loss": 0.5497, + "step": 2190 + }, + { + "epoch": 3.16, + "learning_rate": 0.0002750196270853778, + "loss": 0.5584, + "step": 2200 + }, + { + "epoch": 3.16, + "eval_loss": 0.4875911772251129, + "eval_runtime": 39.9849, + "eval_samples_per_second": 11.429, + "eval_steps_per_second": 1.451, + "eval_wer": 0.49028760728805904, + "step": 2200 + }, + { + "epoch": 3.18, + "learning_rate": 0.0002748724239450441, + "loss": 0.5276, + "step": 2210 + }, + { + "epoch": 3.19, + "learning_rate": 0.0002747252208047105, + "loss": 0.5582, + "step": 2220 + }, + { + "epoch": 3.2, + "learning_rate": 0.00027457801766437684, + "loss": 0.5294, + "step": 2230 + }, + { + "epoch": 3.22, + "learning_rate": 0.00027443081452404314, + "loss": 0.5978, + "step": 2240 + }, + { + "epoch": 3.23, + "learning_rate": 0.0002742836113837095, + "loss": 0.5331, + "step": 2250 + }, + { + "epoch": 3.25, + "learning_rate": 0.00027413640824337586, + "loss": 0.5714, + "step": 2260 + }, + { + "epoch": 3.26, + "learning_rate": 0.00027398920510304217, + "loss": 0.549, + "step": 2270 + }, + { + "epoch": 3.28, + "learning_rate": 0.0002738420019627085, + "loss": 0.5706, + "step": 2280 + }, + { + "epoch": 3.29, + "learning_rate": 0.00027369479882237484, + "loss": 0.5235, + "step": 2290 + }, + { + "epoch": 3.3, + "learning_rate": 0.0002735475956820412, + "loss": 0.5333, + "step": 2300 + }, + { + "epoch": 3.3, + "eval_loss": 0.46249067783355713, + "eval_runtime": 40.1021, + "eval_samples_per_second": 11.396, + "eval_steps_per_second": 1.446, + "eval_wer": 0.4661948501731667, + "step": 2300 + }, + { + "epoch": 3.32, + "learning_rate": 0.00027340039254170756, + "loss": 0.5333, + "step": 2310 + }, + { + "epoch": 3.33, + "learning_rate": 0.00027325318940137386, + "loss": 0.578, + "step": 2320 + }, + { + "epoch": 3.35, + "learning_rate": 0.0002731059862610402, + "loss": 0.5243, + "step": 2330 + }, + { + "epoch": 3.36, + "learning_rate": 0.0002729587831207066, + "loss": 0.5668, + "step": 2340 + }, + { + "epoch": 3.38, + "learning_rate": 0.0002728115799803729, + "loss": 0.5112, + "step": 2350 + }, + { + "epoch": 3.39, + "learning_rate": 0.0002726643768400392, + "loss": 0.5039, + "step": 2360 + }, + { + "epoch": 3.41, + "learning_rate": 0.00027251717369970556, + "loss": 0.5342, + "step": 2370 + }, + { + "epoch": 3.42, + "learning_rate": 0.0002723699705593719, + "loss": 0.4879, + "step": 2380 + }, + { + "epoch": 3.43, + "learning_rate": 0.0002722227674190382, + "loss": 0.5277, + "step": 2390 + }, + { + "epoch": 3.45, + "learning_rate": 0.0002720755642787046, + "loss": 0.5277, + "step": 2400 + }, + { + "epoch": 3.45, + "eval_loss": 0.4557473361492157, + "eval_runtime": 39.6153, + "eval_samples_per_second": 11.536, + "eval_steps_per_second": 1.464, + "eval_wer": 0.4631832555338051, + "step": 2400 + }, + { + "epoch": 3.46, + "learning_rate": 0.00027192836113837095, + "loss": 0.5052, + "step": 2410 + }, + { + "epoch": 3.48, + "learning_rate": 0.0002717811579980373, + "loss": 0.5292, + "step": 2420 + }, + { + "epoch": 3.49, + "learning_rate": 0.0002716339548577036, + "loss": 0.5448, + "step": 2430 + }, + { + "epoch": 3.51, + "learning_rate": 0.0002714867517173699, + "loss": 0.5089, + "step": 2440 + }, + { + "epoch": 3.52, + "learning_rate": 0.0002713395485770363, + "loss": 0.5381, + "step": 2450 + }, + { + "epoch": 3.53, + "learning_rate": 0.00027119234543670264, + "loss": 0.5119, + "step": 2460 + }, + { + "epoch": 3.55, + "learning_rate": 0.00027104514229636895, + "loss": 0.5093, + "step": 2470 + }, + { + "epoch": 3.56, + "learning_rate": 0.0002708979391560353, + "loss": 0.4931, + "step": 2480 + }, + { + "epoch": 3.58, + "learning_rate": 0.00027075073601570167, + "loss": 0.4823, + "step": 2490 + }, + { + "epoch": 3.59, + "learning_rate": 0.000270603532875368, + "loss": 0.479, + "step": 2500 + }, + { + "epoch": 3.59, + "eval_loss": 0.42780354619026184, + "eval_runtime": 39.8004, + "eval_samples_per_second": 11.482, + "eval_steps_per_second": 1.457, + "eval_wer": 0.44421020930582744, + "step": 2500 + }, + { + "epoch": 3.61, + "learning_rate": 0.00027045632973503433, + "loss": 0.4703, + "step": 2510 + }, + { + "epoch": 3.62, + "learning_rate": 0.00027030912659470064, + "loss": 0.4812, + "step": 2520 + }, + { + "epoch": 3.64, + "learning_rate": 0.000270161923454367, + "loss": 0.5042, + "step": 2530 + }, + { + "epoch": 3.65, + "learning_rate": 0.0002700147203140333, + "loss": 0.486, + "step": 2540 + }, + { + "epoch": 3.66, + "learning_rate": 0.00026986751717369967, + "loss": 0.4923, + "step": 2550 + }, + { + "epoch": 3.68, + "learning_rate": 0.00026972031403336603, + "loss": 0.4595, + "step": 2560 + }, + { + "epoch": 3.69, + "learning_rate": 0.0002695731108930324, + "loss": 0.6039, + "step": 2570 + }, + { + "epoch": 3.71, + "learning_rate": 0.0002694259077526987, + "loss": 0.4577, + "step": 2580 + }, + { + "epoch": 3.72, + "learning_rate": 0.00026927870461236506, + "loss": 0.4911, + "step": 2590 + }, + { + "epoch": 3.74, + "learning_rate": 0.00026913150147203136, + "loss": 0.5368, + "step": 2600 + }, + { + "epoch": 3.74, + "eval_loss": 0.43260544538497925, + "eval_runtime": 39.7779, + "eval_samples_per_second": 11.489, + "eval_steps_per_second": 1.458, + "eval_wer": 0.44677006474928477, + "step": 2600 + }, + { + "epoch": 3.75, + "learning_rate": 0.0002689842983316977, + "loss": 0.4625, + "step": 2610 + }, + { + "epoch": 3.76, + "learning_rate": 0.00026883709519136403, + "loss": 0.5655, + "step": 2620 + }, + { + "epoch": 3.78, + "learning_rate": 0.0002686898920510304, + "loss": 0.4575, + "step": 2630 + }, + { + "epoch": 3.79, + "learning_rate": 0.00026854268891069675, + "loss": 0.5072, + "step": 2640 + }, + { + "epoch": 3.81, + "learning_rate": 0.00026839548577036306, + "loss": 0.4799, + "step": 2650 + }, + { + "epoch": 3.82, + "learning_rate": 0.0002682482826300294, + "loss": 0.4849, + "step": 2660 + }, + { + "epoch": 3.84, + "learning_rate": 0.0002681010794896958, + "loss": 0.5101, + "step": 2670 + }, + { + "epoch": 3.85, + "learning_rate": 0.0002679538763493621, + "loss": 0.4985, + "step": 2680 + }, + { + "epoch": 3.86, + "learning_rate": 0.00026780667320902844, + "loss": 0.4664, + "step": 2690 + }, + { + "epoch": 3.88, + "learning_rate": 0.00026765947006869475, + "loss": 0.5113, + "step": 2700 + }, + { + "epoch": 3.88, + "eval_loss": 0.40216904878616333, + "eval_runtime": 40.3356, + "eval_samples_per_second": 11.33, + "eval_steps_per_second": 1.438, + "eval_wer": 0.4338202078000301, + "step": 2700 + }, + { + "epoch": 3.89, + "learning_rate": 0.0002675122669283611, + "loss": 0.4684, + "step": 2710 + }, + { + "epoch": 3.91, + "learning_rate": 0.00026736506378802747, + "loss": 0.4687, + "step": 2720 + }, + { + "epoch": 3.92, + "learning_rate": 0.0002672178606476938, + "loss": 0.4609, + "step": 2730 + }, + { + "epoch": 3.94, + "learning_rate": 0.00026707065750736014, + "loss": 0.4715, + "step": 2740 + }, + { + "epoch": 3.95, + "learning_rate": 0.0002669234543670265, + "loss": 0.5112, + "step": 2750 + }, + { + "epoch": 3.97, + "learning_rate": 0.0002667762512266928, + "loss": 0.4614, + "step": 2760 + }, + { + "epoch": 3.98, + "learning_rate": 0.00026662904808635917, + "loss": 0.4613, + "step": 2770 + }, + { + "epoch": 3.99, + "learning_rate": 0.00026648184494602547, + "loss": 0.4496, + "step": 2780 + }, + { + "epoch": 4.01, + "learning_rate": 0.00026633464180569183, + "loss": 0.4614, + "step": 2790 + }, + { + "epoch": 4.02, + "learning_rate": 0.00026618743866535814, + "loss": 0.4377, + "step": 2800 + }, + { + "epoch": 4.02, + "eval_loss": 0.3904813528060913, + "eval_runtime": 40.1396, + "eval_samples_per_second": 11.385, + "eval_steps_per_second": 1.445, + "eval_wer": 0.42824875771721127, + "step": 2800 + }, + { + "epoch": 4.04, + "learning_rate": 0.0002660402355250245, + "loss": 0.4191, + "step": 2810 + }, + { + "epoch": 4.05, + "learning_rate": 0.00026589303238469086, + "loss": 0.3959, + "step": 2820 + }, + { + "epoch": 4.07, + "learning_rate": 0.0002657458292443572, + "loss": 0.4222, + "step": 2830 + }, + { + "epoch": 4.08, + "learning_rate": 0.0002655986261040235, + "loss": 0.3959, + "step": 2840 + }, + { + "epoch": 4.09, + "learning_rate": 0.0002654514229636899, + "loss": 0.3709, + "step": 2850 + }, + { + "epoch": 4.11, + "learning_rate": 0.0002653042198233562, + "loss": 0.4196, + "step": 2860 + }, + { + "epoch": 4.12, + "learning_rate": 0.00026515701668302255, + "loss": 0.4266, + "step": 2870 + }, + { + "epoch": 4.14, + "learning_rate": 0.00026500981354268886, + "loss": 0.4069, + "step": 2880 + }, + { + "epoch": 4.15, + "learning_rate": 0.0002648626104023552, + "loss": 0.4123, + "step": 2890 + }, + { + "epoch": 4.17, + "learning_rate": 0.0002647154072620216, + "loss": 0.3715, + "step": 2900 + }, + { + "epoch": 4.17, + "eval_loss": 0.3695952892303467, + "eval_runtime": 39.8629, + "eval_samples_per_second": 11.464, + "eval_steps_per_second": 1.455, + "eval_wer": 0.40581237765396777, + "step": 2900 + }, + { + "epoch": 4.18, + "learning_rate": 0.00026456820412168794, + "loss": 0.4446, + "step": 2910 + }, + { + "epoch": 4.2, + "learning_rate": 0.00026442100098135425, + "loss": 0.4482, + "step": 2920 + }, + { + "epoch": 4.21, + "learning_rate": 0.0002642737978410206, + "loss": 0.4032, + "step": 2930 + }, + { + "epoch": 4.22, + "learning_rate": 0.0002641265947006869, + "loss": 0.425, + "step": 2940 + }, + { + "epoch": 4.24, + "learning_rate": 0.0002639793915603533, + "loss": 0.3987, + "step": 2950 + }, + { + "epoch": 4.25, + "learning_rate": 0.0002638321884200196, + "loss": 0.3933, + "step": 2960 + }, + { + "epoch": 4.27, + "learning_rate": 0.00026368498527968594, + "loss": 0.4381, + "step": 2970 + }, + { + "epoch": 4.28, + "learning_rate": 0.0002635377821393523, + "loss": 0.3662, + "step": 2980 + }, + { + "epoch": 4.3, + "learning_rate": 0.0002633905789990186, + "loss": 0.4008, + "step": 2990 + }, + { + "epoch": 4.31, + "learning_rate": 0.00026324337585868497, + "loss": 0.3764, + "step": 3000 + }, + { + "epoch": 4.31, + "eval_loss": 0.36124685406684875, + "eval_runtime": 39.8744, + "eval_samples_per_second": 11.461, + "eval_steps_per_second": 1.455, + "eval_wer": 0.3918084625809366, + "step": 3000 + }, + { + "epoch": 4.32, + "learning_rate": 0.00026309617271835133, + "loss": 0.4272, + "step": 3010 + }, + { + "epoch": 4.34, + "learning_rate": 0.00026294896957801764, + "loss": 0.4066, + "step": 3020 + }, + { + "epoch": 4.35, + "learning_rate": 0.000262801766437684, + "loss": 0.3517, + "step": 3030 + }, + { + "epoch": 4.37, + "learning_rate": 0.0002626545632973503, + "loss": 0.4108, + "step": 3040 + }, + { + "epoch": 4.38, + "learning_rate": 0.00026250736015701666, + "loss": 0.3775, + "step": 3050 + }, + { + "epoch": 4.4, + "learning_rate": 0.000262360157016683, + "loss": 0.3643, + "step": 3060 + }, + { + "epoch": 4.41, + "learning_rate": 0.00026221295387634933, + "loss": 0.395, + "step": 3070 + }, + { + "epoch": 4.43, + "learning_rate": 0.0002620657507360157, + "loss": 0.3699, + "step": 3080 + }, + { + "epoch": 4.44, + "learning_rate": 0.00026191854759568205, + "loss": 0.3657, + "step": 3090 + }, + { + "epoch": 4.45, + "learning_rate": 0.00026177134445534836, + "loss": 0.3915, + "step": 3100 + }, + { + "epoch": 4.45, + "eval_loss": 0.3556678593158722, + "eval_runtime": 39.9374, + "eval_samples_per_second": 11.443, + "eval_steps_per_second": 1.452, + "eval_wer": 0.384731215178437, + "step": 3100 + }, + { + "epoch": 4.47, + "learning_rate": 0.00026162414131501466, + "loss": 0.3968, + "step": 3110 + }, + { + "epoch": 4.48, + "learning_rate": 0.000261476938174681, + "loss": 0.4099, + "step": 3120 + }, + { + "epoch": 4.5, + "learning_rate": 0.0002613297350343474, + "loss": 0.422, + "step": 3130 + }, + { + "epoch": 4.51, + "learning_rate": 0.0002611825318940137, + "loss": 0.4122, + "step": 3140 + }, + { + "epoch": 4.53, + "learning_rate": 0.00026103532875368005, + "loss": 0.3962, + "step": 3150 + }, + { + "epoch": 4.54, + "learning_rate": 0.0002608881256133464, + "loss": 0.3721, + "step": 3160 + }, + { + "epoch": 4.55, + "learning_rate": 0.00026074092247301277, + "loss": 0.468, + "step": 3170 + }, + { + "epoch": 4.57, + "learning_rate": 0.0002605937193326791, + "loss": 0.3766, + "step": 3180 + }, + { + "epoch": 4.58, + "learning_rate": 0.0002604465161923454, + "loss": 0.3768, + "step": 3190 + }, + { + "epoch": 4.6, + "learning_rate": 0.00026029931305201175, + "loss": 0.369, + "step": 3200 + }, + { + "epoch": 4.6, + "eval_loss": 0.36044731736183167, + "eval_runtime": 39.912, + "eval_samples_per_second": 11.45, + "eval_steps_per_second": 1.453, + "eval_wer": 0.39286252070471317, + "step": 3200 + }, + { + "epoch": 4.61, + "learning_rate": 0.0002601521099116781, + "loss": 0.4042, + "step": 3210 + }, + { + "epoch": 4.63, + "learning_rate": 0.0002600049067713444, + "loss": 0.3628, + "step": 3220 + }, + { + "epoch": 4.64, + "learning_rate": 0.00025985770363101077, + "loss": 0.3977, + "step": 3230 + }, + { + "epoch": 4.66, + "learning_rate": 0.00025971050049067713, + "loss": 0.4106, + "step": 3240 + }, + { + "epoch": 4.67, + "learning_rate": 0.00025956329735034344, + "loss": 0.3944, + "step": 3250 + }, + { + "epoch": 4.68, + "learning_rate": 0.0002594160942100098, + "loss": 0.3964, + "step": 3260 + }, + { + "epoch": 4.7, + "learning_rate": 0.0002592688910696761, + "loss": 0.3937, + "step": 3270 + }, + { + "epoch": 4.71, + "learning_rate": 0.00025912168792934247, + "loss": 0.33, + "step": 3280 + }, + { + "epoch": 4.73, + "learning_rate": 0.00025897448478900877, + "loss": 0.4144, + "step": 3290 + }, + { + "epoch": 4.74, + "learning_rate": 0.00025882728164867513, + "loss": 0.3644, + "step": 3300 + }, + { + "epoch": 4.74, + "eval_loss": 0.3271957039833069, + "eval_runtime": 39.9356, + "eval_samples_per_second": 11.443, + "eval_steps_per_second": 1.452, + "eval_wer": 0.3604878783315766, + "step": 3300 + }, + { + "epoch": 4.76, + "learning_rate": 0.0002586800785083415, + "loss": 0.3605, + "step": 3310 + }, + { + "epoch": 4.77, + "learning_rate": 0.00025853287536800785, + "loss": 0.3926, + "step": 3320 + }, + { + "epoch": 4.78, + "learning_rate": 0.00025838567222767416, + "loss": 0.3565, + "step": 3330 + }, + { + "epoch": 4.8, + "learning_rate": 0.0002582384690873405, + "loss": 0.3856, + "step": 3340 + }, + { + "epoch": 4.81, + "learning_rate": 0.00025809126594700683, + "loss": 0.3295, + "step": 3350 + }, + { + "epoch": 4.83, + "learning_rate": 0.0002579440628066732, + "loss": 0.3327, + "step": 3360 + }, + { + "epoch": 4.84, + "learning_rate": 0.0002577968596663395, + "loss": 0.374, + "step": 3370 + }, + { + "epoch": 4.86, + "learning_rate": 0.00025764965652600585, + "loss": 0.3291, + "step": 3380 + }, + { + "epoch": 4.87, + "learning_rate": 0.0002575024533856722, + "loss": 0.3902, + "step": 3390 + }, + { + "epoch": 4.89, + "learning_rate": 0.0002573552502453385, + "loss": 0.3959, + "step": 3400 + }, + { + "epoch": 4.89, + "eval_loss": 0.3158166706562042, + "eval_runtime": 40.0972, + "eval_samples_per_second": 11.397, + "eval_steps_per_second": 1.446, + "eval_wer": 0.36681222707423583, + "step": 3400 + }, + { + "epoch": 4.9, + "learning_rate": 0.0002572080471050049, + "loss": 0.3636, + "step": 3410 + }, + { + "epoch": 4.91, + "learning_rate": 0.00025706084396467124, + "loss": 0.3581, + "step": 3420 + }, + { + "epoch": 4.93, + "learning_rate": 0.00025691364082433755, + "loss": 0.3505, + "step": 3430 + }, + { + "epoch": 4.94, + "learning_rate": 0.0002567664376840039, + "loss": 0.3967, + "step": 3440 + }, + { + "epoch": 4.96, + "learning_rate": 0.0002566192345436702, + "loss": 0.3328, + "step": 3450 + }, + { + "epoch": 4.97, + "learning_rate": 0.0002564720314033366, + "loss": 0.3625, + "step": 3460 + }, + { + "epoch": 4.99, + "learning_rate": 0.00025632482826300294, + "loss": 0.386, + "step": 3470 + }, + { + "epoch": 5.0, + "learning_rate": 0.00025617762512266924, + "loss": 0.3102, + "step": 3480 + }, + { + "epoch": 5.01, + "learning_rate": 0.0002560304219823356, + "loss": 0.3945, + "step": 3490 + }, + { + "epoch": 5.03, + "learning_rate": 0.00025588321884200196, + "loss": 0.3307, + "step": 3500 + }, + { + "epoch": 5.03, + "eval_loss": 0.32223132252693176, + "eval_runtime": 40.0169, + "eval_samples_per_second": 11.42, + "eval_steps_per_second": 1.449, + "eval_wer": 0.35702454449631077, + "step": 3500 + }, + { + "epoch": 5.04, + "learning_rate": 0.00025573601570166827, + "loss": 0.3412, + "step": 3510 + }, + { + "epoch": 5.06, + "learning_rate": 0.00025558881256133463, + "loss": 0.3243, + "step": 3520 + }, + { + "epoch": 5.07, + "learning_rate": 0.00025544160942100094, + "loss": 0.3513, + "step": 3530 + }, + { + "epoch": 5.09, + "learning_rate": 0.0002552944062806673, + "loss": 0.3336, + "step": 3540 + }, + { + "epoch": 5.1, + "learning_rate": 0.0002551472031403336, + "loss": 0.318, + "step": 3550 + }, + { + "epoch": 5.11, + "learning_rate": 0.00025499999999999996, + "loss": 0.3662, + "step": 3560 + }, + { + "epoch": 5.13, + "learning_rate": 0.0002548527968596663, + "loss": 0.3265, + "step": 3570 + }, + { + "epoch": 5.14, + "learning_rate": 0.0002547055937193327, + "loss": 0.2784, + "step": 3580 + }, + { + "epoch": 5.16, + "learning_rate": 0.000254558390578999, + "loss": 0.3218, + "step": 3590 + }, + { + "epoch": 5.17, + "learning_rate": 0.00025441118743866535, + "loss": 0.3283, + "step": 3600 + }, + { + "epoch": 5.17, + "eval_loss": 0.3063613176345825, + "eval_runtime": 40.0819, + "eval_samples_per_second": 11.402, + "eval_steps_per_second": 1.447, + "eval_wer": 0.3576268634241831, + "step": 3600 + }, + { + "epoch": 5.19, + "learning_rate": 0.00025426398429833166, + "loss": 0.3153, + "step": 3610 + }, + { + "epoch": 5.2, + "learning_rate": 0.000254116781157998, + "loss": 0.2926, + "step": 3620 + }, + { + "epoch": 5.22, + "learning_rate": 0.0002539695780176643, + "loss": 0.3065, + "step": 3630 + }, + { + "epoch": 5.23, + "learning_rate": 0.0002538223748773307, + "loss": 0.3656, + "step": 3640 + }, + { + "epoch": 5.24, + "learning_rate": 0.00025367517173699705, + "loss": 0.2764, + "step": 3650 + }, + { + "epoch": 5.26, + "learning_rate": 0.0002535279685966634, + "loss": 0.3197, + "step": 3660 + }, + { + "epoch": 5.27, + "learning_rate": 0.0002533807654563297, + "loss": 0.3113, + "step": 3670 + }, + { + "epoch": 5.29, + "learning_rate": 0.0002532335623159961, + "loss": 0.3154, + "step": 3680 + }, + { + "epoch": 5.3, + "learning_rate": 0.0002530863591756624, + "loss": 0.3771, + "step": 3690 + }, + { + "epoch": 5.32, + "learning_rate": 0.00025293915603532874, + "loss": 0.2934, + "step": 3700 + }, + { + "epoch": 5.32, + "eval_loss": 0.30499157309532166, + "eval_runtime": 39.856, + "eval_samples_per_second": 11.466, + "eval_steps_per_second": 1.455, + "eval_wer": 0.34829092004216233, + "step": 3700 + }, + { + "epoch": 5.33, + "learning_rate": 0.00025279195289499505, + "loss": 0.3419, + "step": 3710 + }, + { + "epoch": 5.34, + "learning_rate": 0.0002526447497546614, + "loss": 0.3312, + "step": 3720 + }, + { + "epoch": 5.36, + "learning_rate": 0.00025249754661432777, + "loss": 0.2881, + "step": 3730 + }, + { + "epoch": 5.37, + "learning_rate": 0.0002523503434739941, + "loss": 0.3223, + "step": 3740 + }, + { + "epoch": 5.39, + "learning_rate": 0.00025220314033366043, + "loss": 0.3118, + "step": 3750 + }, + { + "epoch": 5.4, + "learning_rate": 0.0002520559371933268, + "loss": 0.3139, + "step": 3760 + }, + { + "epoch": 5.42, + "learning_rate": 0.0002519087340529931, + "loss": 0.3198, + "step": 3770 + }, + { + "epoch": 5.43, + "learning_rate": 0.00025176153091265946, + "loss": 0.2908, + "step": 3780 + }, + { + "epoch": 5.45, + "learning_rate": 0.00025161432777232577, + "loss": 0.3446, + "step": 3790 + }, + { + "epoch": 5.46, + "learning_rate": 0.00025146712463199213, + "loss": 0.3015, + "step": 3800 + }, + { + "epoch": 5.46, + "eval_loss": 0.28972870111465454, + "eval_runtime": 40.1556, + "eval_samples_per_second": 11.381, + "eval_steps_per_second": 1.444, + "eval_wer": 0.3416654118355669, + "step": 3800 + }, + { + "epoch": 5.47, + "learning_rate": 0.0002513199214916585, + "loss": 0.3488, + "step": 3810 + }, + { + "epoch": 5.49, + "learning_rate": 0.0002511727183513248, + "loss": 0.2873, + "step": 3820 + }, + { + "epoch": 5.5, + "learning_rate": 0.00025102551521099116, + "loss": 0.2951, + "step": 3830 + }, + { + "epoch": 5.52, + "learning_rate": 0.0002508783120706575, + "loss": 0.3305, + "step": 3840 + }, + { + "epoch": 5.53, + "learning_rate": 0.0002507311089303238, + "loss": 0.3062, + "step": 3850 + }, + { + "epoch": 5.55, + "learning_rate": 0.0002505839057899902, + "loss": 0.3912, + "step": 3860 + }, + { + "epoch": 5.56, + "learning_rate": 0.0002504367026496565, + "loss": 0.2884, + "step": 3870 + }, + { + "epoch": 5.57, + "learning_rate": 0.00025028949950932285, + "loss": 0.3128, + "step": 3880 + }, + { + "epoch": 5.59, + "learning_rate": 0.00025014229636898916, + "loss": 0.3343, + "step": 3890 + }, + { + "epoch": 5.6, + "learning_rate": 0.0002499950932286555, + "loss": 0.2929, + "step": 3900 + }, + { + "epoch": 5.6, + "eval_loss": 0.28876641392707825, + "eval_runtime": 40.338, + "eval_samples_per_second": 11.329, + "eval_steps_per_second": 1.438, + "eval_wer": 0.31862671284445115, + "step": 3900 + }, + { + "epoch": 5.62, + "learning_rate": 0.0002498478900883219, + "loss": 0.3341, + "step": 3910 + }, + { + "epoch": 5.63, + "learning_rate": 0.00024970068694798824, + "loss": 0.3196, + "step": 3920 + }, + { + "epoch": 5.65, + "learning_rate": 0.00024955348380765454, + "loss": 0.3025, + "step": 3930 + }, + { + "epoch": 5.66, + "learning_rate": 0.0002494062806673209, + "loss": 0.3231, + "step": 3940 + }, + { + "epoch": 5.68, + "learning_rate": 0.0002492590775269872, + "loss": 0.2989, + "step": 3950 + }, + { + "epoch": 5.69, + "learning_rate": 0.00024911187438665357, + "loss": 0.304, + "step": 3960 + }, + { + "epoch": 5.7, + "learning_rate": 0.0002489646712463199, + "loss": 0.2816, + "step": 3970 + }, + { + "epoch": 5.72, + "learning_rate": 0.00024881746810598624, + "loss": 0.3096, + "step": 3980 + }, + { + "epoch": 5.73, + "learning_rate": 0.0002486702649656526, + "loss": 0.3, + "step": 3990 + }, + { + "epoch": 5.75, + "learning_rate": 0.0002485230618253189, + "loss": 0.2815, + "step": 4000 + }, + { + "epoch": 5.75, + "eval_loss": 0.28788086771965027, + "eval_runtime": 40.0114, + "eval_samples_per_second": 11.422, + "eval_steps_per_second": 1.45, + "eval_wer": 0.31666917632886615, + "step": 4000 + }, + { + "epoch": 5.76, + "learning_rate": 0.00024837585868498526, + "loss": 0.3083, + "step": 4010 + }, + { + "epoch": 5.78, + "learning_rate": 0.0002482286555446516, + "loss": 0.2857, + "step": 4020 + }, + { + "epoch": 5.79, + "learning_rate": 0.00024808145240431793, + "loss": 0.3066, + "step": 4030 + }, + { + "epoch": 5.8, + "learning_rate": 0.00024793424926398424, + "loss": 0.2842, + "step": 4040 + }, + { + "epoch": 5.82, + "learning_rate": 0.0002477870461236506, + "loss": 0.2664, + "step": 4050 + }, + { + "epoch": 5.83, + "learning_rate": 0.00024763984298331696, + "loss": 0.3455, + "step": 4060 + }, + { + "epoch": 5.85, + "learning_rate": 0.0002474926398429833, + "loss": 0.2824, + "step": 4070 + }, + { + "epoch": 5.86, + "learning_rate": 0.0002473454367026496, + "loss": 0.2934, + "step": 4080 + }, + { + "epoch": 5.88, + "learning_rate": 0.000247198233562316, + "loss": 0.3343, + "step": 4090 + }, + { + "epoch": 5.89, + "learning_rate": 0.00024705103042198235, + "loss": 0.2778, + "step": 4100 + }, + { + "epoch": 5.89, + "eval_loss": 0.2641572952270508, + "eval_runtime": 39.8509, + "eval_samples_per_second": 11.468, + "eval_steps_per_second": 1.455, + "eval_wer": 0.3136575816895046, + "step": 4100 + }, + { + "epoch": 5.91, + "learning_rate": 0.00024690382728164865, + "loss": 0.2685, + "step": 4110 + }, + { + "epoch": 5.92, + "learning_rate": 0.00024675662414131496, + "loss": 0.3127, + "step": 4120 + }, + { + "epoch": 5.93, + "learning_rate": 0.0002466094210009813, + "loss": 0.2618, + "step": 4130 + }, + { + "epoch": 5.95, + "learning_rate": 0.0002464622178606477, + "loss": 0.3303, + "step": 4140 + }, + { + "epoch": 5.96, + "learning_rate": 0.000246315014720314, + "loss": 0.2635, + "step": 4150 + }, + { + "epoch": 5.98, + "learning_rate": 0.00024616781157998035, + "loss": 0.3033, + "step": 4160 + }, + { + "epoch": 5.99, + "learning_rate": 0.0002460206084396467, + "loss": 0.2614, + "step": 4170 + }, + { + "epoch": 6.01, + "learning_rate": 0.00024587340529931307, + "loss": 0.2824, + "step": 4180 + }, + { + "epoch": 6.02, + "learning_rate": 0.0002457262021589794, + "loss": 0.247, + "step": 4190 + }, + { + "epoch": 6.03, + "learning_rate": 0.0002455789990186457, + "loss": 0.2822, + "step": 4200 + }, + { + "epoch": 6.03, + "eval_loss": 0.2591544985771179, + "eval_runtime": 40.0116, + "eval_samples_per_second": 11.422, + "eval_steps_per_second": 1.45, + "eval_wer": 0.29920192742056917, + "step": 4200 + }, + { + "epoch": 6.05, + "learning_rate": 0.00024543179587831204, + "loss": 0.2866, + "step": 4210 + }, + { + "epoch": 6.06, + "learning_rate": 0.0002452845927379784, + "loss": 0.24, + "step": 4220 + }, + { + "epoch": 6.08, + "learning_rate": 0.0002451373895976447, + "loss": 0.249, + "step": 4230 + }, + { + "epoch": 6.09, + "learning_rate": 0.00024499018645731107, + "loss": 0.2542, + "step": 4240 + }, + { + "epoch": 6.11, + "learning_rate": 0.00024484298331697743, + "loss": 0.2672, + "step": 4250 + }, + { + "epoch": 6.12, + "learning_rate": 0.0002446957801766438, + "loss": 0.3306, + "step": 4260 + }, + { + "epoch": 6.14, + "learning_rate": 0.0002445485770363101, + "loss": 0.2413, + "step": 4270 + }, + { + "epoch": 6.15, + "learning_rate": 0.0002444013738959764, + "loss": 0.2675, + "step": 4280 + }, + { + "epoch": 6.16, + "learning_rate": 0.00024425417075564276, + "loss": 0.2492, + "step": 4290 + }, + { + "epoch": 6.18, + "learning_rate": 0.0002441069676153091, + "loss": 0.2343, + "step": 4300 + }, + { + "epoch": 6.18, + "eval_loss": 0.2688565254211426, + "eval_runtime": 39.6355, + "eval_samples_per_second": 11.53, + "eval_steps_per_second": 1.463, + "eval_wer": 0.294835115193495, + "step": 4300 + }, + { + "epoch": 6.19, + "learning_rate": 0.00024395976447497543, + "loss": 0.3075, + "step": 4310 + }, + { + "epoch": 6.21, + "learning_rate": 0.0002438125613346418, + "loss": 0.2398, + "step": 4320 + }, + { + "epoch": 6.22, + "learning_rate": 0.00024366535819430812, + "loss": 0.2782, + "step": 4330 + }, + { + "epoch": 6.24, + "learning_rate": 0.00024351815505397446, + "loss": 0.2511, + "step": 4340 + }, + { + "epoch": 6.25, + "learning_rate": 0.0002433709519136408, + "loss": 0.234, + "step": 4350 + }, + { + "epoch": 6.26, + "learning_rate": 0.00024322374877330715, + "loss": 0.2972, + "step": 4360 + }, + { + "epoch": 6.28, + "learning_rate": 0.00024307654563297348, + "loss": 0.2553, + "step": 4370 + }, + { + "epoch": 6.29, + "learning_rate": 0.00024292934249263982, + "loss": 0.2697, + "step": 4380 + }, + { + "epoch": 6.31, + "learning_rate": 0.00024278213935230615, + "loss": 0.2303, + "step": 4390 + }, + { + "epoch": 6.32, + "learning_rate": 0.0002426349362119725, + "loss": 0.2556, + "step": 4400 + }, + { + "epoch": 6.32, + "eval_loss": 0.2687687575817108, + "eval_runtime": 40.0355, + "eval_samples_per_second": 11.415, + "eval_steps_per_second": 1.449, + "eval_wer": 0.28896250564674, + "step": 4400 + }, + { + "epoch": 6.34, + "learning_rate": 0.00024248773307163884, + "loss": 0.2581, + "step": 4410 + }, + { + "epoch": 6.35, + "learning_rate": 0.00024234052993130518, + "loss": 0.2807, + "step": 4420 + }, + { + "epoch": 6.36, + "learning_rate": 0.0002421933267909715, + "loss": 0.2925, + "step": 4430 + }, + { + "epoch": 6.38, + "learning_rate": 0.00024204612365063787, + "loss": 0.2417, + "step": 4440 + }, + { + "epoch": 6.39, + "learning_rate": 0.00024189892051030418, + "loss": 0.2539, + "step": 4450 + }, + { + "epoch": 6.41, + "learning_rate": 0.00024175171736997054, + "loss": 0.2756, + "step": 4460 + }, + { + "epoch": 6.42, + "learning_rate": 0.00024160451422963687, + "loss": 0.223, + "step": 4470 + }, + { + "epoch": 6.44, + "learning_rate": 0.00024145731108930323, + "loss": 0.2717, + "step": 4480 + }, + { + "epoch": 6.45, + "learning_rate": 0.00024131010794896954, + "loss": 0.2731, + "step": 4490 + }, + { + "epoch": 6.47, + "learning_rate": 0.0002411629048086359, + "loss": 0.2437, + "step": 4500 + }, + { + "epoch": 6.47, + "eval_loss": 0.2555336654186249, + "eval_runtime": 40.1329, + "eval_samples_per_second": 11.387, + "eval_steps_per_second": 1.445, + "eval_wer": 0.28760728805902724, + "step": 4500 + }, + { + "epoch": 6.48, + "learning_rate": 0.00024101570166830223, + "loss": 0.2746, + "step": 4510 + }, + { + "epoch": 6.49, + "learning_rate": 0.0002408684985279686, + "loss": 0.2506, + "step": 4520 + }, + { + "epoch": 6.51, + "learning_rate": 0.0002407212953876349, + "loss": 0.2604, + "step": 4530 + }, + { + "epoch": 6.52, + "learning_rate": 0.00024057409224730126, + "loss": 0.2634, + "step": 4540 + }, + { + "epoch": 6.54, + "learning_rate": 0.0002404268891069676, + "loss": 0.2561, + "step": 4550 + }, + { + "epoch": 6.55, + "learning_rate": 0.00024027968596663395, + "loss": 0.2648, + "step": 4560 + }, + { + "epoch": 6.57, + "learning_rate": 0.00024013248282630026, + "loss": 0.2446, + "step": 4570 + }, + { + "epoch": 6.58, + "learning_rate": 0.00023998527968596662, + "loss": 0.2685, + "step": 4580 + }, + { + "epoch": 6.59, + "learning_rate": 0.00023983807654563295, + "loss": 0.2434, + "step": 4590 + }, + { + "epoch": 6.61, + "learning_rate": 0.0002396908734052993, + "loss": 0.237, + "step": 4600 + }, + { + "epoch": 6.61, + "eval_loss": 0.2497735321521759, + "eval_runtime": 40.0633, + "eval_samples_per_second": 11.407, + "eval_steps_per_second": 1.448, + "eval_wer": 0.28233699744014457, + "step": 4600 + }, + { + "epoch": 6.62, + "learning_rate": 0.00023954367026496562, + "loss": 0.2712, + "step": 4610 + }, + { + "epoch": 6.64, + "learning_rate": 0.00023939646712463198, + "loss": 0.2464, + "step": 4620 + }, + { + "epoch": 6.65, + "learning_rate": 0.00023924926398429831, + "loss": 0.2903, + "step": 4630 + }, + { + "epoch": 6.67, + "learning_rate": 0.00023910206084396465, + "loss": 0.2472, + "step": 4640 + }, + { + "epoch": 6.68, + "learning_rate": 0.00023895485770363098, + "loss": 0.2602, + "step": 4650 + }, + { + "epoch": 6.7, + "learning_rate": 0.00023880765456329734, + "loss": 0.2728, + "step": 4660 + }, + { + "epoch": 6.71, + "learning_rate": 0.00023866045142296368, + "loss": 0.2636, + "step": 4670 + }, + { + "epoch": 6.72, + "learning_rate": 0.00023851324828263, + "loss": 0.2515, + "step": 4680 + }, + { + "epoch": 6.74, + "learning_rate": 0.00023836604514229634, + "loss": 0.2602, + "step": 4690 + }, + { + "epoch": 6.75, + "learning_rate": 0.0002382188420019627, + "loss": 0.2375, + "step": 4700 + }, + { + "epoch": 6.75, + "eval_loss": 0.2609308660030365, + "eval_runtime": 39.7988, + "eval_samples_per_second": 11.483, + "eval_steps_per_second": 1.457, + "eval_wer": 0.29363047733775033, + "step": 4700 + }, + { + "epoch": 6.77, + "learning_rate": 0.00023807163886162904, + "loss": 0.2602, + "step": 4710 + }, + { + "epoch": 6.78, + "learning_rate": 0.00023792443572129537, + "loss": 0.2384, + "step": 4720 + }, + { + "epoch": 6.8, + "learning_rate": 0.0002377772325809617, + "loss": 0.2466, + "step": 4730 + }, + { + "epoch": 6.81, + "learning_rate": 0.00023763002944062806, + "loss": 0.2674, + "step": 4740 + }, + { + "epoch": 6.82, + "learning_rate": 0.00023748282630029437, + "loss": 0.2497, + "step": 4750 + }, + { + "epoch": 6.84, + "learning_rate": 0.00023733562315996073, + "loss": 0.2771, + "step": 4760 + }, + { + "epoch": 6.85, + "learning_rate": 0.00023718842001962706, + "loss": 0.2276, + "step": 4770 + }, + { + "epoch": 6.87, + "learning_rate": 0.00023704121687929342, + "loss": 0.2459, + "step": 4780 + }, + { + "epoch": 6.88, + "learning_rate": 0.00023689401373895973, + "loss": 0.2425, + "step": 4790 + }, + { + "epoch": 6.9, + "learning_rate": 0.0002367468105986261, + "loss": 0.2361, + "step": 4800 + }, + { + "epoch": 6.9, + "eval_loss": 0.2400684505701065, + "eval_runtime": 39.986, + "eval_samples_per_second": 11.429, + "eval_steps_per_second": 1.451, + "eval_wer": 0.28037946092455956, + "step": 4800 + }, + { + "epoch": 6.91, + "learning_rate": 0.00023659960745829242, + "loss": 0.2473, + "step": 4810 + }, + { + "epoch": 6.93, + "learning_rate": 0.00023645240431795878, + "loss": 0.2144, + "step": 4820 + }, + { + "epoch": 6.94, + "learning_rate": 0.0002363052011776251, + "loss": 0.2641, + "step": 4830 + }, + { + "epoch": 6.95, + "learning_rate": 0.00023615799803729145, + "loss": 0.2559, + "step": 4840 + }, + { + "epoch": 6.97, + "learning_rate": 0.00023601079489695778, + "loss": 0.2404, + "step": 4850 + }, + { + "epoch": 6.98, + "learning_rate": 0.0002358635917566241, + "loss": 0.2533, + "step": 4860 + }, + { + "epoch": 7.0, + "learning_rate": 0.00023571638861629045, + "loss": 0.2301, + "step": 4870 + }, + { + "epoch": 7.01, + "learning_rate": 0.0002355691854759568, + "loss": 0.2553, + "step": 4880 + }, + { + "epoch": 7.03, + "learning_rate": 0.00023542198233562315, + "loss": 0.2102, + "step": 4890 + }, + { + "epoch": 7.04, + "learning_rate": 0.00023527477919528945, + "loss": 0.2266, + "step": 4900 + }, + { + "epoch": 7.04, + "eval_loss": 0.2387649267911911, + "eval_runtime": 40.0231, + "eval_samples_per_second": 11.418, + "eval_steps_per_second": 1.449, + "eval_wer": 0.2708929378105707, + "step": 4900 + }, + { + "epoch": 7.05, + "learning_rate": 0.0002351275760549558, + "loss": 0.2141, + "step": 4910 + }, + { + "epoch": 7.07, + "learning_rate": 0.00023498037291462217, + "loss": 0.2192, + "step": 4920 + }, + { + "epoch": 7.08, + "learning_rate": 0.0002348331697742885, + "loss": 0.2375, + "step": 4930 + }, + { + "epoch": 7.1, + "learning_rate": 0.0002346859666339548, + "loss": 0.2104, + "step": 4940 + }, + { + "epoch": 7.11, + "learning_rate": 0.00023453876349362117, + "loss": 0.2054, + "step": 4950 + }, + { + "epoch": 7.13, + "learning_rate": 0.00023439156035328753, + "loss": 0.2081, + "step": 4960 + }, + { + "epoch": 7.14, + "learning_rate": 0.00023424435721295387, + "loss": 0.2141, + "step": 4970 + }, + { + "epoch": 7.16, + "learning_rate": 0.00023409715407262017, + "loss": 0.2106, + "step": 4980 + }, + { + "epoch": 7.17, + "learning_rate": 0.00023394995093228653, + "loss": 0.1952, + "step": 4990 + }, + { + "epoch": 7.18, + "learning_rate": 0.0002338027477919529, + "loss": 0.2299, + "step": 5000 + }, + { + "epoch": 7.18, + "eval_loss": 0.24284440279006958, + "eval_runtime": 39.8933, + "eval_samples_per_second": 11.456, + "eval_steps_per_second": 1.454, + "eval_wer": 0.2772172865532299, + "step": 5000 + }, + { + "epoch": 7.2, + "learning_rate": 0.0002336555446516192, + "loss": 0.2312, + "step": 5010 + }, + { + "epoch": 7.21, + "learning_rate": 0.00023350834151128553, + "loss": 0.2173, + "step": 5020 + }, + { + "epoch": 7.23, + "learning_rate": 0.0002333611383709519, + "loss": 0.2383, + "step": 5030 + }, + { + "epoch": 7.24, + "learning_rate": 0.00023321393523061825, + "loss": 0.2071, + "step": 5040 + }, + { + "epoch": 7.26, + "learning_rate": 0.00023306673209028456, + "loss": 0.2402, + "step": 5050 + }, + { + "epoch": 7.27, + "learning_rate": 0.0002329195289499509, + "loss": 0.2559, + "step": 5060 + }, + { + "epoch": 7.28, + "learning_rate": 0.00023277232580961725, + "loss": 0.2094, + "step": 5070 + }, + { + "epoch": 7.3, + "learning_rate": 0.00023262512266928362, + "loss": 0.2216, + "step": 5080 + }, + { + "epoch": 7.31, + "learning_rate": 0.00023247791952894992, + "loss": 0.2184, + "step": 5090 + }, + { + "epoch": 7.33, + "learning_rate": 0.00023233071638861625, + "loss": 0.2322, + "step": 5100 + }, + { + "epoch": 7.33, + "eval_loss": 0.24409331381320953, + "eval_runtime": 40.158, + "eval_samples_per_second": 11.38, + "eval_steps_per_second": 1.444, + "eval_wer": 0.27450685137780456, + "step": 5100 + }, + { + "epoch": 7.34, + "learning_rate": 0.00023218351324828262, + "loss": 0.2169, + "step": 5110 + }, + { + "epoch": 7.36, + "learning_rate": 0.00023203631010794898, + "loss": 0.243, + "step": 5120 + }, + { + "epoch": 7.37, + "learning_rate": 0.00023188910696761528, + "loss": 0.2499, + "step": 5130 + }, + { + "epoch": 7.39, + "learning_rate": 0.00023174190382728162, + "loss": 0.2151, + "step": 5140 + }, + { + "epoch": 7.4, + "learning_rate": 0.00023159470068694798, + "loss": 0.2384, + "step": 5150 + }, + { + "epoch": 7.41, + "learning_rate": 0.00023144749754661428, + "loss": 0.2193, + "step": 5160 + }, + { + "epoch": 7.43, + "learning_rate": 0.00023130029440628064, + "loss": 0.214, + "step": 5170 + }, + { + "epoch": 7.44, + "learning_rate": 0.00023115309126594698, + "loss": 0.2394, + "step": 5180 + }, + { + "epoch": 7.46, + "learning_rate": 0.00023100588812561334, + "loss": 0.1871, + "step": 5190 + }, + { + "epoch": 7.47, + "learning_rate": 0.00023085868498527964, + "loss": 0.214, + "step": 5200 + }, + { + "epoch": 7.47, + "eval_loss": 0.24094292521476746, + "eval_runtime": 40.0199, + "eval_samples_per_second": 11.419, + "eval_steps_per_second": 1.449, + "eval_wer": 0.2722481553982834, + "step": 5200 + }, + { + "epoch": 7.49, + "learning_rate": 0.000230711481844946, + "loss": 0.2096, + "step": 5210 + }, + { + "epoch": 7.5, + "learning_rate": 0.00023056427870461234, + "loss": 0.2079, + "step": 5220 + }, + { + "epoch": 7.51, + "learning_rate": 0.0002304170755642787, + "loss": 0.233, + "step": 5230 + }, + { + "epoch": 7.53, + "learning_rate": 0.000230269872423945, + "loss": 0.244, + "step": 5240 + }, + { + "epoch": 7.54, + "learning_rate": 0.00023012266928361136, + "loss": 0.2502, + "step": 5250 + }, + { + "epoch": 7.56, + "learning_rate": 0.0002299754661432777, + "loss": 0.2079, + "step": 5260 + }, + { + "epoch": 7.57, + "learning_rate": 0.00022982826300294406, + "loss": 0.2067, + "step": 5270 + }, + { + "epoch": 7.59, + "learning_rate": 0.00022968105986261036, + "loss": 0.2274, + "step": 5280 + }, + { + "epoch": 7.6, + "learning_rate": 0.00022953385672227672, + "loss": 0.2019, + "step": 5290 + }, + { + "epoch": 7.61, + "learning_rate": 0.00022938665358194306, + "loss": 0.2223, + "step": 5300 + }, + { + "epoch": 7.61, + "eval_loss": 0.24156498908996582, + "eval_runtime": 39.8819, + "eval_samples_per_second": 11.459, + "eval_steps_per_second": 1.454, + "eval_wer": 0.26923656075892183, + "step": 5300 + }, + { + "epoch": 7.63, + "learning_rate": 0.0002292394504416094, + "loss": 0.2297, + "step": 5310 + }, + { + "epoch": 7.64, + "learning_rate": 0.00022909224730127573, + "loss": 0.1978, + "step": 5320 + }, + { + "epoch": 7.66, + "learning_rate": 0.00022894504416094209, + "loss": 0.2437, + "step": 5330 + }, + { + "epoch": 7.67, + "learning_rate": 0.00022879784102060842, + "loss": 0.2047, + "step": 5340 + }, + { + "epoch": 7.69, + "learning_rate": 0.00022865063788027475, + "loss": 0.2329, + "step": 5350 + }, + { + "epoch": 7.7, + "learning_rate": 0.00022850343473994109, + "loss": 0.2225, + "step": 5360 + }, + { + "epoch": 7.72, + "learning_rate": 0.00022835623159960745, + "loss": 0.2198, + "step": 5370 + }, + { + "epoch": 7.73, + "learning_rate": 0.00022820902845927378, + "loss": 0.2289, + "step": 5380 + }, + { + "epoch": 7.74, + "learning_rate": 0.0002280618253189401, + "loss": 0.2167, + "step": 5390 + }, + { + "epoch": 7.76, + "learning_rate": 0.00022791462217860645, + "loss": 0.2201, + "step": 5400 + }, + { + "epoch": 7.76, + "eval_loss": 0.22141778469085693, + "eval_runtime": 39.8574, + "eval_samples_per_second": 11.466, + "eval_steps_per_second": 1.455, + "eval_wer": 0.2546303267580184, + "step": 5400 + }, + { + "epoch": 7.77, + "learning_rate": 0.0002277674190382728, + "loss": 0.2066, + "step": 5410 + }, + { + "epoch": 7.79, + "learning_rate": 0.00022762021589793914, + "loss": 0.2034, + "step": 5420 + }, + { + "epoch": 7.8, + "learning_rate": 0.00022747301275760547, + "loss": 0.2038, + "step": 5430 + }, + { + "epoch": 7.82, + "learning_rate": 0.0002273258096172718, + "loss": 0.2034, + "step": 5440 + }, + { + "epoch": 7.83, + "learning_rate": 0.00022717860647693817, + "loss": 0.2328, + "step": 5450 + }, + { + "epoch": 7.84, + "learning_rate": 0.00022703140333660447, + "loss": 0.1861, + "step": 5460 + }, + { + "epoch": 7.86, + "learning_rate": 0.00022688420019627083, + "loss": 0.2146, + "step": 5470 + }, + { + "epoch": 7.87, + "learning_rate": 0.00022673699705593717, + "loss": 0.2463, + "step": 5480 + }, + { + "epoch": 7.89, + "learning_rate": 0.00022658979391560353, + "loss": 0.1953, + "step": 5490 + }, + { + "epoch": 7.9, + "learning_rate": 0.00022644259077526983, + "loss": 0.2225, + "step": 5500 + }, + { + "epoch": 7.9, + "eval_loss": 0.22256095707416534, + "eval_runtime": 39.882, + "eval_samples_per_second": 11.459, + "eval_steps_per_second": 1.454, + "eval_wer": 0.2653214877277518, + "step": 5500 + }, + { + "epoch": 7.92, + "learning_rate": 0.0002262953876349362, + "loss": 0.2189, + "step": 5510 + }, + { + "epoch": 7.93, + "learning_rate": 0.00022614818449460253, + "loss": 0.1998, + "step": 5520 + }, + { + "epoch": 7.95, + "learning_rate": 0.0002260009813542689, + "loss": 0.2587, + "step": 5530 + }, + { + "epoch": 7.96, + "learning_rate": 0.0002258537782139352, + "loss": 0.2029, + "step": 5540 + }, + { + "epoch": 7.97, + "learning_rate": 0.00022570657507360156, + "loss": 0.1974, + "step": 5550 + }, + { + "epoch": 7.99, + "learning_rate": 0.0002255593719332679, + "loss": 0.2219, + "step": 5560 + }, + { + "epoch": 8.0, + "learning_rate": 0.00022541216879293425, + "loss": 0.2126, + "step": 5570 + }, + { + "epoch": 8.02, + "learning_rate": 0.00022526496565260056, + "loss": 0.2219, + "step": 5580 + }, + { + "epoch": 8.03, + "learning_rate": 0.00022511776251226692, + "loss": 0.1896, + "step": 5590 + }, + { + "epoch": 8.05, + "learning_rate": 0.00022497055937193325, + "loss": 0.2159, + "step": 5600 + }, + { + "epoch": 8.05, + "eval_loss": 0.21107521653175354, + "eval_runtime": 40.0872, + "eval_samples_per_second": 11.4, + "eval_steps_per_second": 1.447, + "eval_wer": 0.24318626712844452, + "step": 5600 + }, + { + "epoch": 8.06, + "learning_rate": 0.00022482335623159958, + "loss": 0.1805, + "step": 5610 + }, + { + "epoch": 8.07, + "learning_rate": 0.00022467615309126592, + "loss": 0.1778, + "step": 5620 + }, + { + "epoch": 8.09, + "learning_rate": 0.00022452894995093228, + "loss": 0.1797, + "step": 5630 + }, + { + "epoch": 8.1, + "learning_rate": 0.0002243817468105986, + "loss": 0.1686, + "step": 5640 + }, + { + "epoch": 8.12, + "learning_rate": 0.00022423454367026494, + "loss": 0.1895, + "step": 5650 + }, + { + "epoch": 8.13, + "learning_rate": 0.00022408734052993128, + "loss": 0.1648, + "step": 5660 + }, + { + "epoch": 8.15, + "learning_rate": 0.00022394013738959764, + "loss": 0.2194, + "step": 5670 + }, + { + "epoch": 8.16, + "learning_rate": 0.00022379293424926397, + "loss": 0.1901, + "step": 5680 + }, + { + "epoch": 8.18, + "learning_rate": 0.0002236457311089303, + "loss": 0.1913, + "step": 5690 + }, + { + "epoch": 8.19, + "learning_rate": 0.00022349852796859664, + "loss": 0.2291, + "step": 5700 + }, + { + "epoch": 8.19, + "eval_loss": 0.20670226216316223, + "eval_runtime": 40.0404, + "eval_samples_per_second": 11.413, + "eval_steps_per_second": 1.449, + "eval_wer": 0.24680018069567836, + "step": 5700 + }, + { + "epoch": 8.2, + "learning_rate": 0.000223351324828263, + "loss": 0.1716, + "step": 5710 + }, + { + "epoch": 8.22, + "learning_rate": 0.00022320412168792933, + "loss": 0.1894, + "step": 5720 + }, + { + "epoch": 8.23, + "learning_rate": 0.00022305691854759567, + "loss": 0.2024, + "step": 5730 + }, + { + "epoch": 8.25, + "learning_rate": 0.000222909715407262, + "loss": 0.1778, + "step": 5740 + }, + { + "epoch": 8.26, + "learning_rate": 0.00022276251226692836, + "loss": 0.2244, + "step": 5750 + }, + { + "epoch": 8.28, + "learning_rate": 0.00022261530912659467, + "loss": 0.2153, + "step": 5760 + }, + { + "epoch": 8.29, + "learning_rate": 0.00022246810598626103, + "loss": 0.2085, + "step": 5770 + }, + { + "epoch": 8.3, + "learning_rate": 0.00022232090284592736, + "loss": 0.1727, + "step": 5780 + }, + { + "epoch": 8.32, + "learning_rate": 0.00022217369970559372, + "loss": 0.1769, + "step": 5790 + }, + { + "epoch": 8.33, + "learning_rate": 0.00022202649656526003, + "loss": 0.2067, + "step": 5800 + }, + { + "epoch": 8.33, + "eval_loss": 0.2133297473192215, + "eval_runtime": 40.2177, + "eval_samples_per_second": 11.363, + "eval_steps_per_second": 1.442, + "eval_wer": 0.23701249811775335, + "step": 5800 + }, + { + "epoch": 8.35, + "learning_rate": 0.00022187929342492639, + "loss": 0.1915, + "step": 5810 + }, + { + "epoch": 8.36, + "learning_rate": 0.00022173209028459272, + "loss": 0.1666, + "step": 5820 + }, + { + "epoch": 8.38, + "learning_rate": 0.00022158488714425908, + "loss": 0.2038, + "step": 5830 + }, + { + "epoch": 8.39, + "learning_rate": 0.0002214376840039254, + "loss": 0.1724, + "step": 5840 + }, + { + "epoch": 8.41, + "learning_rate": 0.00022129048086359175, + "loss": 0.2457, + "step": 5850 + }, + { + "epoch": 8.42, + "learning_rate": 0.00022114327772325808, + "loss": 0.1776, + "step": 5860 + }, + { + "epoch": 8.43, + "learning_rate": 0.00022099607458292444, + "loss": 0.1952, + "step": 5870 + }, + { + "epoch": 8.45, + "learning_rate": 0.00022084887144259075, + "loss": 0.2253, + "step": 5880 + }, + { + "epoch": 8.46, + "learning_rate": 0.0002207016683022571, + "loss": 0.1772, + "step": 5890 + }, + { + "epoch": 8.48, + "learning_rate": 0.00022055446516192344, + "loss": 0.1882, + "step": 5900 + }, + { + "epoch": 8.48, + "eval_loss": 0.21073894202709198, + "eval_runtime": 39.9763, + "eval_samples_per_second": 11.432, + "eval_steps_per_second": 1.451, + "eval_wer": 0.23520554133413643, + "step": 5900 + }, + { + "epoch": 8.49, + "learning_rate": 0.00022040726202158975, + "loss": 0.1848, + "step": 5910 + }, + { + "epoch": 8.51, + "learning_rate": 0.0002202600588812561, + "loss": 0.1788, + "step": 5920 + }, + { + "epoch": 8.52, + "learning_rate": 0.00022011285574092247, + "loss": 0.2083, + "step": 5930 + }, + { + "epoch": 8.53, + "learning_rate": 0.0002199656526005888, + "loss": 0.206, + "step": 5940 + }, + { + "epoch": 8.55, + "learning_rate": 0.0002198184494602551, + "loss": 0.2169, + "step": 5950 + }, + { + "epoch": 8.56, + "learning_rate": 0.00021967124631992147, + "loss": 0.1949, + "step": 5960 + }, + { + "epoch": 8.58, + "learning_rate": 0.00021952404317958783, + "loss": 0.1824, + "step": 5970 + }, + { + "epoch": 8.59, + "learning_rate": 0.00021937684003925416, + "loss": 0.2049, + "step": 5980 + }, + { + "epoch": 8.61, + "learning_rate": 0.00021922963689892047, + "loss": 0.166, + "step": 5990 + }, + { + "epoch": 8.62, + "learning_rate": 0.00021908243375858683, + "loss": 0.2055, + "step": 6000 + }, + { + "epoch": 8.62, + "eval_loss": 0.21278780698776245, + "eval_runtime": 39.9574, + "eval_samples_per_second": 11.437, + "eval_steps_per_second": 1.452, + "eval_wer": 0.2550820659539226, + "step": 6000 + }, + { + "epoch": 8.64, + "learning_rate": 0.0002189352306182532, + "loss": 0.1874, + "step": 6010 + }, + { + "epoch": 8.65, + "learning_rate": 0.00021878802747791952, + "loss": 0.1799, + "step": 6020 + }, + { + "epoch": 8.66, + "learning_rate": 0.00021864082433758583, + "loss": 0.2084, + "step": 6030 + }, + { + "epoch": 8.68, + "learning_rate": 0.0002184936211972522, + "loss": 0.207, + "step": 6040 + }, + { + "epoch": 8.69, + "learning_rate": 0.00021834641805691855, + "loss": 0.215, + "step": 6050 + }, + { + "epoch": 8.71, + "learning_rate": 0.00021819921491658486, + "loss": 0.1749, + "step": 6060 + }, + { + "epoch": 8.72, + "learning_rate": 0.0002180520117762512, + "loss": 0.1796, + "step": 6070 + }, + { + "epoch": 8.74, + "learning_rate": 0.00021790480863591755, + "loss": 0.1734, + "step": 6080 + }, + { + "epoch": 8.75, + "learning_rate": 0.0002177576054955839, + "loss": 0.1894, + "step": 6090 + }, + { + "epoch": 8.76, + "learning_rate": 0.00021761040235525022, + "loss": 0.2144, + "step": 6100 + }, + { + "epoch": 8.76, + "eval_loss": 0.20413599908351898, + "eval_runtime": 40.0035, + "eval_samples_per_second": 11.424, + "eval_steps_per_second": 1.45, + "eval_wer": 0.2302364101791899, + "step": 6100 + }, + { + "epoch": 8.78, + "learning_rate": 0.00021746319921491655, + "loss": 0.2061, + "step": 6110 + }, + { + "epoch": 8.79, + "learning_rate": 0.0002173159960745829, + "loss": 0.1862, + "step": 6120 + }, + { + "epoch": 8.81, + "learning_rate": 0.00021716879293424927, + "loss": 0.2183, + "step": 6130 + }, + { + "epoch": 8.82, + "learning_rate": 0.00021702158979391558, + "loss": 0.1819, + "step": 6140 + }, + { + "epoch": 8.84, + "learning_rate": 0.0002168743866535819, + "loss": 0.2072, + "step": 6150 + }, + { + "epoch": 8.85, + "learning_rate": 0.00021672718351324827, + "loss": 0.1876, + "step": 6160 + }, + { + "epoch": 8.86, + "learning_rate": 0.0002165799803729146, + "loss": 0.2077, + "step": 6170 + }, + { + "epoch": 8.88, + "learning_rate": 0.00021643277723258094, + "loss": 0.2064, + "step": 6180 + }, + { + "epoch": 8.89, + "learning_rate": 0.00021628557409224727, + "loss": 0.1796, + "step": 6190 + }, + { + "epoch": 8.91, + "learning_rate": 0.00021613837095191363, + "loss": 0.1948, + "step": 6200 + }, + { + "epoch": 8.91, + "eval_loss": 0.207631453871727, + "eval_runtime": 39.8141, + "eval_samples_per_second": 11.478, + "eval_steps_per_second": 1.457, + "eval_wer": 0.2347538021382322, + "step": 6200 + }, + { + "epoch": 8.92, + "learning_rate": 0.00021599116781157994, + "loss": 0.1759, + "step": 6210 + }, + { + "epoch": 8.94, + "learning_rate": 0.0002158439646712463, + "loss": 0.2199, + "step": 6220 + }, + { + "epoch": 8.95, + "learning_rate": 0.00021569676153091263, + "loss": 0.1782, + "step": 6230 + }, + { + "epoch": 8.97, + "learning_rate": 0.000215549558390579, + "loss": 0.1646, + "step": 6240 + }, + { + "epoch": 8.98, + "learning_rate": 0.0002154023552502453, + "loss": 0.203, + "step": 6250 + }, + { + "epoch": 8.99, + "learning_rate": 0.00021525515210991166, + "loss": 0.185, + "step": 6260 + }, + { + "epoch": 9.01, + "learning_rate": 0.000215107948969578, + "loss": 0.1783, + "step": 6270 + }, + { + "epoch": 9.02, + "learning_rate": 0.00021496074582924435, + "loss": 0.163, + "step": 6280 + }, + { + "epoch": 9.04, + "learning_rate": 0.00021481354268891066, + "loss": 0.1734, + "step": 6290 + }, + { + "epoch": 9.05, + "learning_rate": 0.00021466633954857702, + "loss": 0.176, + "step": 6300 + }, + { + "epoch": 9.05, + "eval_loss": 0.20396728813648224, + "eval_runtime": 39.8795, + "eval_samples_per_second": 11.46, + "eval_steps_per_second": 1.454, + "eval_wer": 0.22933293178738143, + "step": 6300 + }, + { + "epoch": 9.07, + "learning_rate": 0.00021451913640824335, + "loss": 0.1499, + "step": 6310 + }, + { + "epoch": 9.08, + "learning_rate": 0.00021437193326790971, + "loss": 0.1693, + "step": 6320 + }, + { + "epoch": 9.09, + "learning_rate": 0.00021422473012757602, + "loss": 0.1554, + "step": 6330 + }, + { + "epoch": 9.11, + "learning_rate": 0.00021407752698724238, + "loss": 0.158, + "step": 6340 + }, + { + "epoch": 9.12, + "learning_rate": 0.00021393032384690871, + "loss": 0.1957, + "step": 6350 + }, + { + "epoch": 9.14, + "learning_rate": 0.00021378312070657505, + "loss": 0.1862, + "step": 6360 + }, + { + "epoch": 9.15, + "learning_rate": 0.00021363591756624138, + "loss": 0.1581, + "step": 6370 + }, + { + "epoch": 9.17, + "learning_rate": 0.00021348871442590774, + "loss": 0.133, + "step": 6380 + }, + { + "epoch": 9.18, + "learning_rate": 0.00021334151128557408, + "loss": 0.1534, + "step": 6390 + }, + { + "epoch": 9.2, + "learning_rate": 0.0002131943081452404, + "loss": 0.1892, + "step": 6400 + }, + { + "epoch": 9.2, + "eval_loss": 0.1975768804550171, + "eval_runtime": 39.8911, + "eval_samples_per_second": 11.456, + "eval_steps_per_second": 1.454, + "eval_wer": 0.22466496009637102, + "step": 6400 + }, + { + "epoch": 9.21, + "learning_rate": 0.00021304710500490674, + "loss": 0.146, + "step": 6410 + }, + { + "epoch": 9.22, + "learning_rate": 0.0002128999018645731, + "loss": 0.1676, + "step": 6420 + }, + { + "epoch": 9.24, + "learning_rate": 0.00021275269872423944, + "loss": 0.135, + "step": 6430 + }, + { + "epoch": 9.25, + "learning_rate": 0.00021260549558390577, + "loss": 0.1776, + "step": 6440 + }, + { + "epoch": 9.27, + "learning_rate": 0.0002124582924435721, + "loss": 0.155, + "step": 6450 + }, + { + "epoch": 9.28, + "learning_rate": 0.00021231108930323846, + "loss": 0.1667, + "step": 6460 + }, + { + "epoch": 9.3, + "learning_rate": 0.0002121638861629048, + "loss": 0.1514, + "step": 6470 + }, + { + "epoch": 9.31, + "learning_rate": 0.00021201668302257113, + "loss": 0.1718, + "step": 6480 + }, + { + "epoch": 9.32, + "learning_rate": 0.00021186947988223746, + "loss": 0.1912, + "step": 6490 + }, + { + "epoch": 9.34, + "learning_rate": 0.00021172227674190382, + "loss": 0.1645, + "step": 6500 + }, + { + "epoch": 9.34, + "eval_loss": 0.19538117945194244, + "eval_runtime": 40.169, + "eval_samples_per_second": 11.377, + "eval_steps_per_second": 1.444, + "eval_wer": 0.21547959644631834, + "step": 6500 + }, + { + "epoch": 9.35, + "learning_rate": 0.00021157507360157013, + "loss": 0.1581, + "step": 6510 + }, + { + "epoch": 9.37, + "learning_rate": 0.0002114278704612365, + "loss": 0.1781, + "step": 6520 + }, + { + "epoch": 9.38, + "learning_rate": 0.00021128066732090282, + "loss": 0.1437, + "step": 6530 + }, + { + "epoch": 9.4, + "learning_rate": 0.00021113346418056918, + "loss": 0.1538, + "step": 6540 + }, + { + "epoch": 9.41, + "learning_rate": 0.0002109862610402355, + "loss": 0.1945, + "step": 6550 + }, + { + "epoch": 9.43, + "learning_rate": 0.00021083905789990185, + "loss": 0.1629, + "step": 6560 + }, + { + "epoch": 9.44, + "learning_rate": 0.00021069185475956818, + "loss": 0.1905, + "step": 6570 + }, + { + "epoch": 9.45, + "learning_rate": 0.00021054465161923455, + "loss": 0.1688, + "step": 6580 + }, + { + "epoch": 9.47, + "learning_rate": 0.00021039744847890085, + "loss": 0.1678, + "step": 6590 + }, + { + "epoch": 9.48, + "learning_rate": 0.0002102502453385672, + "loss": 0.1723, + "step": 6600 + }, + { + "epoch": 9.48, + "eval_loss": 0.19737230241298676, + "eval_runtime": 40.207, + "eval_samples_per_second": 11.366, + "eval_steps_per_second": 1.443, + "eval_wer": 0.2215027857250414, + "step": 6600 + }, + { + "epoch": 9.5, + "learning_rate": 0.00021010304219823355, + "loss": 0.1664, + "step": 6610 + }, + { + "epoch": 9.51, + "learning_rate": 0.0002099558390578999, + "loss": 0.1783, + "step": 6620 + }, + { + "epoch": 9.53, + "learning_rate": 0.0002098086359175662, + "loss": 0.1776, + "step": 6630 + }, + { + "epoch": 9.54, + "learning_rate": 0.00020966143277723257, + "loss": 0.1511, + "step": 6640 + }, + { + "epoch": 9.55, + "learning_rate": 0.0002095142296368989, + "loss": 0.1905, + "step": 6650 + }, + { + "epoch": 9.57, + "learning_rate": 0.00020936702649656524, + "loss": 0.1478, + "step": 6660 + }, + { + "epoch": 9.58, + "learning_rate": 0.00020921982335623157, + "loss": 0.1802, + "step": 6670 + }, + { + "epoch": 9.6, + "learning_rate": 0.00020907262021589793, + "loss": 0.1668, + "step": 6680 + }, + { + "epoch": 9.61, + "learning_rate": 0.00020892541707556427, + "loss": 0.1529, + "step": 6690 + }, + { + "epoch": 9.63, + "learning_rate": 0.0002087782139352306, + "loss": 0.1685, + "step": 6700 + }, + { + "epoch": 9.63, + "eval_loss": 0.20146189630031586, + "eval_runtime": 39.9776, + "eval_samples_per_second": 11.431, + "eval_steps_per_second": 1.451, + "eval_wer": 0.21773829242583947, + "step": 6700 + }, + { + "epoch": 9.64, + "learning_rate": 0.00020863101079489693, + "loss": 0.1339, + "step": 6710 + }, + { + "epoch": 9.66, + "learning_rate": 0.0002084838076545633, + "loss": 0.175, + "step": 6720 + }, + { + "epoch": 9.67, + "learning_rate": 0.00020833660451422963, + "loss": 0.1607, + "step": 6730 + }, + { + "epoch": 9.68, + "learning_rate": 0.00020818940137389596, + "loss": 0.1571, + "step": 6740 + }, + { + "epoch": 9.7, + "learning_rate": 0.0002080421982335623, + "loss": 0.1678, + "step": 6750 + }, + { + "epoch": 9.71, + "learning_rate": 0.00020789499509322865, + "loss": 0.1585, + "step": 6760 + }, + { + "epoch": 9.73, + "learning_rate": 0.000207747791952895, + "loss": 0.2009, + "step": 6770 + }, + { + "epoch": 9.74, + "learning_rate": 0.00020760058881256132, + "loss": 0.1597, + "step": 6780 + }, + { + "epoch": 9.76, + "learning_rate": 0.00020745338567222765, + "loss": 0.1763, + "step": 6790 + }, + { + "epoch": 9.77, + "learning_rate": 0.00020730618253189402, + "loss": 0.1617, + "step": 6800 + }, + { + "epoch": 9.77, + "eval_loss": 0.20486493408679962, + "eval_runtime": 39.9706, + "eval_samples_per_second": 11.433, + "eval_steps_per_second": 1.451, + "eval_wer": 0.22195452492094564, + "step": 6800 + }, + { + "epoch": 9.78, + "learning_rate": 0.00020715897939156032, + "loss": 0.1613, + "step": 6810 + }, + { + "epoch": 9.8, + "learning_rate": 0.00020701177625122666, + "loss": 0.1911, + "step": 6820 + }, + { + "epoch": 9.81, + "learning_rate": 0.00020686457311089302, + "loss": 0.1849, + "step": 6830 + }, + { + "epoch": 9.83, + "learning_rate": 0.00020671736997055938, + "loss": 0.1719, + "step": 6840 + }, + { + "epoch": 9.84, + "learning_rate": 0.00020657016683022568, + "loss": 0.1817, + "step": 6850 + }, + { + "epoch": 9.86, + "learning_rate": 0.00020642296368989202, + "loss": 0.1575, + "step": 6860 + }, + { + "epoch": 9.87, + "learning_rate": 0.00020627576054955838, + "loss": 0.1655, + "step": 6870 + }, + { + "epoch": 9.89, + "learning_rate": 0.00020612855740922474, + "loss": 0.1773, + "step": 6880 + }, + { + "epoch": 9.9, + "learning_rate": 0.00020598135426889104, + "loss": 0.1749, + "step": 6890 + }, + { + "epoch": 9.91, + "learning_rate": 0.00020583415112855738, + "loss": 0.1669, + "step": 6900 + }, + { + "epoch": 9.91, + "eval_loss": 0.19124703109264374, + "eval_runtime": 39.8375, + "eval_samples_per_second": 11.472, + "eval_steps_per_second": 1.456, + "eval_wer": 0.21547959644631834, + "step": 6900 + }, + { + "epoch": 9.93, + "learning_rate": 0.00020568694798822374, + "loss": 0.1504, + "step": 6910 + }, + { + "epoch": 9.94, + "learning_rate": 0.0002055397448478901, + "loss": 0.1713, + "step": 6920 + }, + { + "epoch": 9.96, + "learning_rate": 0.0002053925417075564, + "loss": 0.1773, + "step": 6930 + }, + { + "epoch": 9.97, + "learning_rate": 0.00020524533856722274, + "loss": 0.158, + "step": 6940 + }, + { + "epoch": 9.99, + "learning_rate": 0.0002050981354268891, + "loss": 0.1632, + "step": 6950 + }, + { + "epoch": 10.0, + "learning_rate": 0.0002049509322865554, + "loss": 0.1622, + "step": 6960 + }, + { + "epoch": 10.01, + "learning_rate": 0.00020480372914622176, + "loss": 0.1693, + "step": 6970 + }, + { + "epoch": 10.03, + "learning_rate": 0.0002046565260058881, + "loss": 0.1505, + "step": 6980 + }, + { + "epoch": 10.04, + "learning_rate": 0.00020450932286555446, + "loss": 0.1477, + "step": 6990 + }, + { + "epoch": 10.06, + "learning_rate": 0.00020436211972522076, + "loss": 0.1504, + "step": 7000 + }, + { + "epoch": 10.06, + "eval_loss": 0.1917961686849594, + "eval_runtime": 40.0723, + "eval_samples_per_second": 11.404, + "eval_steps_per_second": 1.447, + "eval_wer": 0.21547959644631834, + "step": 7000 + }, + { + "epoch": 10.07, + "learning_rate": 0.00020421491658488713, + "loss": 0.121, + "step": 7010 + }, + { + "epoch": 10.09, + "learning_rate": 0.00020406771344455346, + "loss": 0.1654, + "step": 7020 + }, + { + "epoch": 10.1, + "learning_rate": 0.00020392051030421982, + "loss": 0.1567, + "step": 7030 + }, + { + "epoch": 10.11, + "learning_rate": 0.00020377330716388613, + "loss": 0.1748, + "step": 7040 + }, + { + "epoch": 10.13, + "learning_rate": 0.00020362610402355249, + "loss": 0.1355, + "step": 7050 + }, + { + "epoch": 10.14, + "learning_rate": 0.00020347890088321882, + "loss": 0.1484, + "step": 7060 + }, + { + "epoch": 10.16, + "learning_rate": 0.00020333169774288518, + "loss": 0.1646, + "step": 7070 + }, + { + "epoch": 10.17, + "learning_rate": 0.00020318449460255149, + "loss": 0.1906, + "step": 7080 + }, + { + "epoch": 10.19, + "learning_rate": 0.00020303729146221785, + "loss": 0.1629, + "step": 7090 + }, + { + "epoch": 10.2, + "learning_rate": 0.00020289008832188418, + "loss": 0.1715, + "step": 7100 + }, + { + "epoch": 10.2, + "eval_loss": 0.20631931722164154, + "eval_runtime": 40.224, + "eval_samples_per_second": 11.361, + "eval_steps_per_second": 1.442, + "eval_wer": 0.2124680018069568, + "step": 7100 + }, + { + "epoch": 10.22, + "learning_rate": 0.0002027428851815505, + "loss": 0.1555, + "step": 7110 + }, + { + "epoch": 10.23, + "learning_rate": 0.00020259568204121685, + "loss": 0.1834, + "step": 7120 + }, + { + "epoch": 10.24, + "learning_rate": 0.0002024484789008832, + "loss": 0.1437, + "step": 7130 + }, + { + "epoch": 10.26, + "learning_rate": 0.00020230127576054954, + "loss": 0.1608, + "step": 7140 + }, + { + "epoch": 10.27, + "learning_rate": 0.00020215407262021587, + "loss": 0.159, + "step": 7150 + }, + { + "epoch": 10.29, + "learning_rate": 0.0002020068694798822, + "loss": 0.1512, + "step": 7160 + }, + { + "epoch": 10.3, + "learning_rate": 0.00020185966633954857, + "loss": 0.1701, + "step": 7170 + }, + { + "epoch": 10.32, + "learning_rate": 0.0002017124631992149, + "loss": 0.1324, + "step": 7180 + }, + { + "epoch": 10.33, + "learning_rate": 0.00020156526005888123, + "loss": 0.1629, + "step": 7190 + }, + { + "epoch": 10.34, + "learning_rate": 0.00020141805691854757, + "loss": 0.1604, + "step": 7200 + }, + { + "epoch": 10.34, + "eval_loss": 0.1930931955575943, + "eval_runtime": 40.1705, + "eval_samples_per_second": 11.377, + "eval_steps_per_second": 1.444, + "eval_wer": 0.21261858153892485, + "step": 7200 + }, + { + "epoch": 10.36, + "learning_rate": 0.00020127085377821393, + "loss": 0.1234, + "step": 7210 + }, + { + "epoch": 10.37, + "learning_rate": 0.00020112365063788026, + "loss": 0.1739, + "step": 7220 + }, + { + "epoch": 10.39, + "learning_rate": 0.0002009764474975466, + "loss": 0.1482, + "step": 7230 + }, + { + "epoch": 10.4, + "learning_rate": 0.00020082924435721293, + "loss": 0.1717, + "step": 7240 + }, + { + "epoch": 10.42, + "learning_rate": 0.0002006820412168793, + "loss": 0.1697, + "step": 7250 + }, + { + "epoch": 10.43, + "learning_rate": 0.0002005348380765456, + "loss": 0.1609, + "step": 7260 + }, + { + "epoch": 10.45, + "learning_rate": 0.00020038763493621196, + "loss": 0.1583, + "step": 7270 + }, + { + "epoch": 10.46, + "learning_rate": 0.0002002404317958783, + "loss": 0.1319, + "step": 7280 + }, + { + "epoch": 10.47, + "learning_rate": 0.00020009322865554465, + "loss": 0.1548, + "step": 7290 + }, + { + "epoch": 10.49, + "learning_rate": 0.00019994602551521096, + "loss": 0.1296, + "step": 7300 + }, + { + "epoch": 10.49, + "eval_loss": 0.1908556967973709, + "eval_runtime": 39.9017, + "eval_samples_per_second": 11.453, + "eval_steps_per_second": 1.454, + "eval_wer": 0.21261858153892485, + "step": 7300 + }, + { + "epoch": 10.5, + "learning_rate": 0.00019979882237487732, + "loss": 0.1352, + "step": 7310 + }, + { + "epoch": 10.52, + "learning_rate": 0.00019965161923454365, + "loss": 0.1664, + "step": 7320 + }, + { + "epoch": 10.53, + "learning_rate": 0.00019950441609421, + "loss": 0.1202, + "step": 7330 + }, + { + "epoch": 10.55, + "learning_rate": 0.00019935721295387632, + "loss": 0.1642, + "step": 7340 + }, + { + "epoch": 10.56, + "learning_rate": 0.00019921000981354268, + "loss": 0.1413, + "step": 7350 + }, + { + "epoch": 10.57, + "learning_rate": 0.000199062806673209, + "loss": 0.1233, + "step": 7360 + }, + { + "epoch": 10.59, + "learning_rate": 0.00019891560353287537, + "loss": 0.1356, + "step": 7370 + }, + { + "epoch": 10.6, + "learning_rate": 0.00019876840039254168, + "loss": 0.1423, + "step": 7380 + }, + { + "epoch": 10.62, + "learning_rate": 0.00019862119725220804, + "loss": 0.1568, + "step": 7390 + }, + { + "epoch": 10.63, + "learning_rate": 0.00019847399411187437, + "loss": 0.1405, + "step": 7400 + }, + { + "epoch": 10.63, + "eval_loss": 0.19520747661590576, + "eval_runtime": 39.9029, + "eval_samples_per_second": 11.453, + "eval_steps_per_second": 1.454, + "eval_wer": 0.21066104502333985, + "step": 7400 + }, + { + "epoch": 10.65, + "learning_rate": 0.0001983267909715407, + "loss": 0.1478, + "step": 7410 + }, + { + "epoch": 10.66, + "learning_rate": 0.00019817958783120704, + "loss": 0.1633, + "step": 7420 + }, + { + "epoch": 10.68, + "learning_rate": 0.0001980323846908734, + "loss": 0.1438, + "step": 7430 + }, + { + "epoch": 10.69, + "learning_rate": 0.00019788518155053973, + "loss": 0.1668, + "step": 7440 + }, + { + "epoch": 10.7, + "learning_rate": 0.00019773797841020607, + "loss": 0.1472, + "step": 7450 + }, + { + "epoch": 10.72, + "learning_rate": 0.0001975907752698724, + "loss": 0.1323, + "step": 7460 + }, + { + "epoch": 10.73, + "learning_rate": 0.00019744357212953876, + "loss": 0.1607, + "step": 7470 + }, + { + "epoch": 10.75, + "learning_rate": 0.0001972963689892051, + "loss": 0.1649, + "step": 7480 + }, + { + "epoch": 10.76, + "learning_rate": 0.00019714916584887143, + "loss": 0.1469, + "step": 7490 + }, + { + "epoch": 10.78, + "learning_rate": 0.00019700196270853776, + "loss": 0.1423, + "step": 7500 + }, + { + "epoch": 10.78, + "eval_loss": 0.20175614953041077, + "eval_runtime": 39.9105, + "eval_samples_per_second": 11.451, + "eval_steps_per_second": 1.453, + "eval_wer": 0.2096069868995633, + "step": 7500 + }, + { + "epoch": 10.79, + "learning_rate": 0.00019685475956820412, + "loss": 0.1369, + "step": 7510 + }, + { + "epoch": 10.8, + "learning_rate": 0.00019670755642787043, + "loss": 0.1513, + "step": 7520 + }, + { + "epoch": 10.82, + "learning_rate": 0.0001965603532875368, + "loss": 0.1426, + "step": 7530 + }, + { + "epoch": 10.83, + "learning_rate": 0.00019641315014720312, + "loss": 0.182, + "step": 7540 + }, + { + "epoch": 10.85, + "learning_rate": 0.00019626594700686948, + "loss": 0.1548, + "step": 7550 + }, + { + "epoch": 10.86, + "learning_rate": 0.0001961187438665358, + "loss": 0.1208, + "step": 7560 + }, + { + "epoch": 10.88, + "learning_rate": 0.00019597154072620215, + "loss": 0.1596, + "step": 7570 + }, + { + "epoch": 10.89, + "learning_rate": 0.00019582433758586848, + "loss": 0.1369, + "step": 7580 + }, + { + "epoch": 10.91, + "learning_rate": 0.00019567713444553484, + "loss": 0.1583, + "step": 7590 + }, + { + "epoch": 10.92, + "learning_rate": 0.00019552993130520115, + "loss": 0.1434, + "step": 7600 + }, + { + "epoch": 10.92, + "eval_loss": 0.18903155624866486, + "eval_runtime": 40.197, + "eval_samples_per_second": 11.369, + "eval_steps_per_second": 1.443, + "eval_wer": 0.2064448125282337, + "step": 7600 + }, + { + "epoch": 10.93, + "learning_rate": 0.0001953827281648675, + "loss": 0.1513, + "step": 7610 + }, + { + "epoch": 10.95, + "learning_rate": 0.00019523552502453384, + "loss": 0.1791, + "step": 7620 + }, + { + "epoch": 10.96, + "learning_rate": 0.0001950883218842002, + "loss": 0.1272, + "step": 7630 + }, + { + "epoch": 10.98, + "learning_rate": 0.0001949411187438665, + "loss": 0.1441, + "step": 7640 + }, + { + "epoch": 10.99, + "learning_rate": 0.00019479391560353287, + "loss": 0.1205, + "step": 7650 + }, + { + "epoch": 11.01, + "learning_rate": 0.0001946467124631992, + "loss": 0.151, + "step": 7660 + }, + { + "epoch": 11.02, + "learning_rate": 0.0001944995093228655, + "loss": 0.136, + "step": 7670 + }, + { + "epoch": 11.03, + "learning_rate": 0.00019435230618253187, + "loss": 0.1342, + "step": 7680 + }, + { + "epoch": 11.05, + "learning_rate": 0.00019420510304219823, + "loss": 0.1474, + "step": 7690 + }, + { + "epoch": 11.06, + "learning_rate": 0.00019405789990186456, + "loss": 0.1439, + "step": 7700 + }, + { + "epoch": 11.06, + "eval_loss": 0.1940617859363556, + "eval_runtime": 39.8635, + "eval_samples_per_second": 11.464, + "eval_steps_per_second": 1.455, + "eval_wer": 0.20268031922903176, + "step": 7700 + }, + { + "epoch": 11.08, + "learning_rate": 0.00019391069676153087, + "loss": 0.1328, + "step": 7710 + }, + { + "epoch": 11.09, + "learning_rate": 0.00019376349362119723, + "loss": 0.1136, + "step": 7720 + }, + { + "epoch": 11.11, + "learning_rate": 0.0001936162904808636, + "loss": 0.1119, + "step": 7730 + }, + { + "epoch": 11.12, + "learning_rate": 0.00019346908734052992, + "loss": 0.1645, + "step": 7740 + }, + { + "epoch": 11.14, + "learning_rate": 0.00019332188420019623, + "loss": 0.1351, + "step": 7750 + }, + { + "epoch": 11.15, + "learning_rate": 0.0001931746810598626, + "loss": 0.1427, + "step": 7760 + }, + { + "epoch": 11.16, + "learning_rate": 0.00019302747791952895, + "loss": 0.1949, + "step": 7770 + }, + { + "epoch": 11.18, + "learning_rate": 0.00019288027477919528, + "loss": 0.1581, + "step": 7780 + }, + { + "epoch": 11.19, + "learning_rate": 0.0001927330716388616, + "loss": 0.1372, + "step": 7790 + }, + { + "epoch": 11.21, + "learning_rate": 0.00019258586849852795, + "loss": 0.1415, + "step": 7800 + }, + { + "epoch": 11.21, + "eval_loss": 0.18760690093040466, + "eval_runtime": 40.0158, + "eval_samples_per_second": 11.42, + "eval_steps_per_second": 1.449, + "eval_wer": 0.20268031922903176, + "step": 7800 + }, + { + "epoch": 11.22, + "learning_rate": 0.0001924386653581943, + "loss": 0.1523, + "step": 7810 + }, + { + "epoch": 11.24, + "learning_rate": 0.00019229146221786062, + "loss": 0.1295, + "step": 7820 + }, + { + "epoch": 11.25, + "learning_rate": 0.00019214425907752695, + "loss": 0.1288, + "step": 7830 + }, + { + "epoch": 11.26, + "learning_rate": 0.0001919970559371933, + "loss": 0.1567, + "step": 7840 + }, + { + "epoch": 11.28, + "learning_rate": 0.00019184985279685967, + "loss": 0.1315, + "step": 7850 + }, + { + "epoch": 11.29, + "learning_rate": 0.00019170264965652598, + "loss": 0.153, + "step": 7860 + }, + { + "epoch": 11.31, + "learning_rate": 0.0001915554465161923, + "loss": 0.1413, + "step": 7870 + }, + { + "epoch": 11.32, + "learning_rate": 0.00019140824337585867, + "loss": 0.1203, + "step": 7880 + }, + { + "epoch": 11.34, + "learning_rate": 0.00019126104023552503, + "loss": 0.1459, + "step": 7890 + }, + { + "epoch": 11.35, + "learning_rate": 0.00019111383709519134, + "loss": 0.1289, + "step": 7900 + }, + { + "epoch": 11.35, + "eval_loss": 0.18372580409049988, + "eval_runtime": 40.1863, + "eval_samples_per_second": 11.372, + "eval_steps_per_second": 1.443, + "eval_wer": 0.20629423279626563, + "step": 7900 + }, + { + "epoch": 11.36, + "learning_rate": 0.00019096663395485767, + "loss": 0.138, + "step": 7910 + }, + { + "epoch": 11.38, + "learning_rate": 0.00019081943081452403, + "loss": 0.1593, + "step": 7920 + }, + { + "epoch": 11.39, + "learning_rate": 0.0001906722276741904, + "loss": 0.1145, + "step": 7930 + }, + { + "epoch": 11.41, + "learning_rate": 0.0001905250245338567, + "loss": 0.1582, + "step": 7940 + }, + { + "epoch": 11.42, + "learning_rate": 0.00019037782139352303, + "loss": 0.1597, + "step": 7950 + }, + { + "epoch": 11.44, + "learning_rate": 0.0001902306182531894, + "loss": 0.1344, + "step": 7960 + }, + { + "epoch": 11.45, + "learning_rate": 0.0001900834151128557, + "loss": 0.1387, + "step": 7970 + }, + { + "epoch": 11.47, + "learning_rate": 0.00018993621197252206, + "loss": 0.1321, + "step": 7980 + }, + { + "epoch": 11.48, + "learning_rate": 0.00018980372914622178, + "loss": 0.1783, + "step": 7990 + }, + { + "epoch": 11.49, + "learning_rate": 0.00018965652600588809, + "loss": 0.1268, + "step": 8000 + }, + { + "epoch": 11.49, + "eval_loss": 0.17705726623535156, + "eval_runtime": 39.9982, + "eval_samples_per_second": 11.426, + "eval_steps_per_second": 1.45, + "eval_wer": 0.20358379762084022, + "step": 8000 + }, + { + "epoch": 11.51, + "learning_rate": 0.00018950932286555445, + "loss": 0.1468, + "step": 8010 + }, + { + "epoch": 11.52, + "learning_rate": 0.0001893621197252208, + "loss": 0.1278, + "step": 8020 + }, + { + "epoch": 11.54, + "learning_rate": 0.00018921491658488714, + "loss": 0.1432, + "step": 8030 + }, + { + "epoch": 11.55, + "learning_rate": 0.00018906771344455345, + "loss": 0.1383, + "step": 8040 + }, + { + "epoch": 11.57, + "learning_rate": 0.0001889205103042198, + "loss": 0.1267, + "step": 8050 + }, + { + "epoch": 11.58, + "learning_rate": 0.00018877330716388617, + "loss": 0.1315, + "step": 8060 + }, + { + "epoch": 11.59, + "learning_rate": 0.00018862610402355247, + "loss": 0.1618, + "step": 8070 + }, + { + "epoch": 11.61, + "learning_rate": 0.0001884789008832188, + "loss": 0.144, + "step": 8080 + }, + { + "epoch": 11.62, + "learning_rate": 0.00018833169774288517, + "loss": 0.1267, + "step": 8090 + }, + { + "epoch": 11.64, + "learning_rate": 0.00018818449460255153, + "loss": 0.1335, + "step": 8100 + }, + { + "epoch": 11.64, + "eval_loss": 0.1754847913980484, + "eval_runtime": 39.9481, + "eval_samples_per_second": 11.44, + "eval_steps_per_second": 1.452, + "eval_wer": 0.20087336244541484, + "step": 8100 + }, + { + "epoch": 11.65, + "learning_rate": 0.00018803729146221783, + "loss": 0.1241, + "step": 8110 + }, + { + "epoch": 11.67, + "learning_rate": 0.00018789008832188417, + "loss": 0.1458, + "step": 8120 + }, + { + "epoch": 11.68, + "learning_rate": 0.00018774288518155053, + "loss": 0.1269, + "step": 8130 + }, + { + "epoch": 11.7, + "learning_rate": 0.0001875956820412169, + "loss": 0.1547, + "step": 8140 + }, + { + "epoch": 11.71, + "learning_rate": 0.0001874484789008832, + "loss": 0.138, + "step": 8150 + }, + { + "epoch": 11.72, + "learning_rate": 0.00018730127576054953, + "loss": 0.1513, + "step": 8160 + }, + { + "epoch": 11.74, + "learning_rate": 0.0001871540726202159, + "loss": 0.1523, + "step": 8170 + }, + { + "epoch": 11.75, + "learning_rate": 0.00018700686947988225, + "loss": 0.1463, + "step": 8180 + }, + { + "epoch": 11.77, + "learning_rate": 0.00018685966633954856, + "loss": 0.1541, + "step": 8190 + }, + { + "epoch": 11.78, + "learning_rate": 0.0001867124631992149, + "loss": 0.1136, + "step": 8200 + }, + { + "epoch": 11.78, + "eval_loss": 0.19131112098693848, + "eval_runtime": 40.2824, + "eval_samples_per_second": 11.345, + "eval_steps_per_second": 1.44, + "eval_wer": 0.205089594940521, + "step": 8200 + }, + { + "epoch": 11.8, + "learning_rate": 0.00018656526005888125, + "loss": 0.1186, + "step": 8210 + }, + { + "epoch": 11.81, + "learning_rate": 0.00018641805691854756, + "loss": 0.151, + "step": 8220 + }, + { + "epoch": 11.82, + "learning_rate": 0.00018627085377821392, + "loss": 0.1311, + "step": 8230 + }, + { + "epoch": 11.84, + "learning_rate": 0.00018612365063788025, + "loss": 0.1507, + "step": 8240 + }, + { + "epoch": 11.85, + "learning_rate": 0.0001859764474975466, + "loss": 0.1305, + "step": 8250 + }, + { + "epoch": 11.87, + "learning_rate": 0.00018582924435721292, + "loss": 0.1331, + "step": 8260 + }, + { + "epoch": 11.88, + "learning_rate": 0.00018568204121687928, + "loss": 0.1288, + "step": 8270 + }, + { + "epoch": 11.9, + "learning_rate": 0.0001855348380765456, + "loss": 0.1305, + "step": 8280 + }, + { + "epoch": 11.91, + "learning_rate": 0.00018538763493621197, + "loss": 0.1492, + "step": 8290 + }, + { + "epoch": 11.93, + "learning_rate": 0.00018524043179587828, + "loss": 0.1321, + "step": 8300 + }, + { + "epoch": 11.93, + "eval_loss": 0.1786966621875763, + "eval_runtime": 39.7362, + "eval_samples_per_second": 11.501, + "eval_steps_per_second": 1.46, + "eval_wer": 0.201174521909351, + "step": 8300 + }, + { + "epoch": 11.94, + "learning_rate": 0.00018509322865554464, + "loss": 0.1387, + "step": 8310 + }, + { + "epoch": 11.95, + "learning_rate": 0.00018494602551521097, + "loss": 0.1183, + "step": 8320 + }, + { + "epoch": 11.97, + "learning_rate": 0.00018479882237487733, + "loss": 0.1429, + "step": 8330 + }, + { + "epoch": 11.98, + "learning_rate": 0.00018465161923454364, + "loss": 0.142, + "step": 8340 + }, + { + "epoch": 12.0, + "learning_rate": 0.00018450441609421, + "loss": 0.1511, + "step": 8350 + }, + { + "epoch": 12.01, + "learning_rate": 0.00018435721295387633, + "loss": 0.1594, + "step": 8360 + }, + { + "epoch": 12.03, + "learning_rate": 0.00018421000981354266, + "loss": 0.1273, + "step": 8370 + }, + { + "epoch": 12.04, + "learning_rate": 0.000184062806673209, + "loss": 0.1324, + "step": 8380 + }, + { + "epoch": 12.05, + "learning_rate": 0.00018391560353287536, + "loss": 0.1219, + "step": 8390 + }, + { + "epoch": 12.07, + "learning_rate": 0.0001837684003925417, + "loss": 0.1088, + "step": 8400 + }, + { + "epoch": 12.07, + "eval_loss": 0.19158530235290527, + "eval_runtime": 39.7742, + "eval_samples_per_second": 11.49, + "eval_steps_per_second": 1.458, + "eval_wer": 0.19966872458967022, + "step": 8400 + }, + { + "epoch": 12.08, + "learning_rate": 0.00018362119725220803, + "loss": 0.1208, + "step": 8410 + }, + { + "epoch": 12.1, + "learning_rate": 0.00018347399411187436, + "loss": 0.1286, + "step": 8420 + }, + { + "epoch": 12.11, + "learning_rate": 0.00018332679097154072, + "loss": 0.1394, + "step": 8430 + }, + { + "epoch": 12.13, + "learning_rate": 0.00018317958783120705, + "loss": 0.1601, + "step": 8440 + }, + { + "epoch": 12.14, + "learning_rate": 0.00018303238469087339, + "loss": 0.1211, + "step": 8450 + }, + { + "epoch": 12.16, + "learning_rate": 0.00018288518155053972, + "loss": 0.1519, + "step": 8460 + }, + { + "epoch": 12.17, + "learning_rate": 0.00018273797841020608, + "loss": 0.1015, + "step": 8470 + }, + { + "epoch": 12.18, + "learning_rate": 0.0001825907752698724, + "loss": 0.1214, + "step": 8480 + }, + { + "epoch": 12.2, + "learning_rate": 0.00018244357212953875, + "loss": 0.1315, + "step": 8490 + }, + { + "epoch": 12.21, + "learning_rate": 0.00018229636898920508, + "loss": 0.1319, + "step": 8500 + }, + { + "epoch": 12.21, + "eval_loss": 0.178669735789299, + "eval_runtime": 39.4909, + "eval_samples_per_second": 11.572, + "eval_steps_per_second": 1.469, + "eval_wer": 0.20252973949706368, + "step": 8500 + }, + { + "epoch": 12.23, + "learning_rate": 0.00018214916584887144, + "loss": 0.1498, + "step": 8510 + }, + { + "epoch": 12.24, + "learning_rate": 0.00018200196270853775, + "loss": 0.1089, + "step": 8520 + }, + { + "epoch": 12.26, + "learning_rate": 0.0001818547595682041, + "loss": 0.1212, + "step": 8530 + }, + { + "epoch": 12.27, + "learning_rate": 0.00018170755642787044, + "loss": 0.1483, + "step": 8540 + }, + { + "epoch": 12.28, + "learning_rate": 0.0001815603532875368, + "loss": 0.1295, + "step": 8550 + }, + { + "epoch": 12.3, + "learning_rate": 0.0001814131501472031, + "loss": 0.1221, + "step": 8560 + }, + { + "epoch": 12.31, + "learning_rate": 0.00018126594700686947, + "loss": 0.1058, + "step": 8570 + }, + { + "epoch": 12.33, + "learning_rate": 0.0001811187438665358, + "loss": 0.1259, + "step": 8580 + }, + { + "epoch": 12.34, + "learning_rate": 0.00018097154072620216, + "loss": 0.1267, + "step": 8590 + }, + { + "epoch": 12.36, + "learning_rate": 0.00018082433758586847, + "loss": 0.1274, + "step": 8600 + }, + { + "epoch": 12.36, + "eval_loss": 0.18227306008338928, + "eval_runtime": 40.0342, + "eval_samples_per_second": 11.415, + "eval_steps_per_second": 1.449, + "eval_wer": 0.2044872760126487, + "step": 8600 + }, + { + "epoch": 12.37, + "learning_rate": 0.00018067713444553483, + "loss": 0.1318, + "step": 8610 + }, + { + "epoch": 12.39, + "learning_rate": 0.00018052993130520116, + "loss": 0.1286, + "step": 8620 + }, + { + "epoch": 12.4, + "learning_rate": 0.0001803827281648675, + "loss": 0.1115, + "step": 8630 + }, + { + "epoch": 12.41, + "learning_rate": 0.00018023552502453383, + "loss": 0.1283, + "step": 8640 + }, + { + "epoch": 12.43, + "learning_rate": 0.0001800883218842002, + "loss": 0.1297, + "step": 8650 + }, + { + "epoch": 12.44, + "learning_rate": 0.00017994111874386652, + "loss": 0.1287, + "step": 8660 + }, + { + "epoch": 12.46, + "learning_rate": 0.00017979391560353286, + "loss": 0.1334, + "step": 8670 + }, + { + "epoch": 12.47, + "learning_rate": 0.0001796467124631992, + "loss": 0.1264, + "step": 8680 + }, + { + "epoch": 12.49, + "learning_rate": 0.00017949950932286555, + "loss": 0.1287, + "step": 8690 + }, + { + "epoch": 12.5, + "learning_rate": 0.00017935230618253188, + "loss": 0.1361, + "step": 8700 + }, + { + "epoch": 12.5, + "eval_loss": 0.1859862059354782, + "eval_runtime": 39.6559, + "eval_samples_per_second": 11.524, + "eval_steps_per_second": 1.463, + "eval_wer": 0.20749887065201025, + "step": 8700 + }, + { + "epoch": 12.51, + "learning_rate": 0.00017920510304219822, + "loss": 0.1718, + "step": 8710 + }, + { + "epoch": 12.53, + "learning_rate": 0.00017905789990186455, + "loss": 0.1127, + "step": 8720 + }, + { + "epoch": 12.54, + "learning_rate": 0.0001789106967615309, + "loss": 0.1558, + "step": 8730 + }, + { + "epoch": 12.56, + "learning_rate": 0.00017876349362119724, + "loss": 0.1398, + "step": 8740 + }, + { + "epoch": 12.57, + "learning_rate": 0.00017861629048086358, + "loss": 0.1351, + "step": 8750 + }, + { + "epoch": 12.59, + "learning_rate": 0.0001784690873405299, + "loss": 0.1291, + "step": 8760 + }, + { + "epoch": 12.6, + "learning_rate": 0.00017832188420019627, + "loss": 0.1339, + "step": 8770 + }, + { + "epoch": 12.61, + "learning_rate": 0.00017817468105986258, + "loss": 0.152, + "step": 8780 + }, + { + "epoch": 12.63, + "learning_rate": 0.00017802747791952894, + "loss": 0.1313, + "step": 8790 + }, + { + "epoch": 12.64, + "learning_rate": 0.00017788027477919527, + "loss": 0.1541, + "step": 8800 + }, + { + "epoch": 12.64, + "eval_loss": 0.1849740892648697, + "eval_runtime": 39.6506, + "eval_samples_per_second": 11.526, + "eval_steps_per_second": 1.463, + "eval_wer": 0.20283089896099984, + "step": 8800 + }, + { + "epoch": 12.66, + "learning_rate": 0.00017773307163886163, + "loss": 0.1601, + "step": 8810 + }, + { + "epoch": 12.67, + "learning_rate": 0.00017758586849852794, + "loss": 0.123, + "step": 8820 + }, + { + "epoch": 12.69, + "learning_rate": 0.0001774386653581943, + "loss": 0.134, + "step": 8830 + }, + { + "epoch": 12.7, + "learning_rate": 0.00017729146221786063, + "loss": 0.1273, + "step": 8840 + }, + { + "epoch": 12.72, + "learning_rate": 0.000177144259077527, + "loss": 0.1085, + "step": 8850 + }, + { + "epoch": 12.73, + "learning_rate": 0.0001769970559371933, + "loss": 0.1438, + "step": 8860 + }, + { + "epoch": 12.74, + "learning_rate": 0.00017684985279685966, + "loss": 0.1215, + "step": 8870 + }, + { + "epoch": 12.76, + "learning_rate": 0.000176702649656526, + "loss": 0.1301, + "step": 8880 + }, + { + "epoch": 12.77, + "learning_rate": 0.00017655544651619235, + "loss": 0.118, + "step": 8890 + }, + { + "epoch": 12.79, + "learning_rate": 0.00017640824337585866, + "loss": 0.0957, + "step": 8900 + }, + { + "epoch": 12.79, + "eval_loss": 0.1861564964056015, + "eval_runtime": 39.7711, + "eval_samples_per_second": 11.491, + "eval_steps_per_second": 1.458, + "eval_wer": 0.19469959343472368, + "step": 8900 + }, + { + "epoch": 12.8, + "learning_rate": 0.00017626104023552502, + "loss": 0.1277, + "step": 8910 + }, + { + "epoch": 12.82, + "learning_rate": 0.00017611383709519135, + "loss": 0.1311, + "step": 8920 + }, + { + "epoch": 12.83, + "learning_rate": 0.00017596663395485766, + "loss": 0.1545, + "step": 8930 + }, + { + "epoch": 12.84, + "learning_rate": 0.00017581943081452402, + "loss": 0.1182, + "step": 8940 + }, + { + "epoch": 12.86, + "learning_rate": 0.00017567222767419038, + "loss": 0.12, + "step": 8950 + }, + { + "epoch": 12.87, + "learning_rate": 0.00017552502453385671, + "loss": 0.1413, + "step": 8960 + }, + { + "epoch": 12.89, + "learning_rate": 0.00017537782139352302, + "loss": 0.1131, + "step": 8970 + }, + { + "epoch": 12.9, + "learning_rate": 0.00017523061825318938, + "loss": 0.124, + "step": 8980 + }, + { + "epoch": 12.92, + "learning_rate": 0.00017508341511285574, + "loss": 0.122, + "step": 8990 + }, + { + "epoch": 12.93, + "learning_rate": 0.00017493621197252208, + "loss": 0.1139, + "step": 9000 + }, + { + "epoch": 12.93, + "eval_loss": 0.17861497402191162, + "eval_runtime": 39.712, + "eval_samples_per_second": 11.508, + "eval_steps_per_second": 1.461, + "eval_wer": 0.18310495407318175, + "step": 9000 + }, + { + "epoch": 12.95, + "learning_rate": 0.00017478900883218838, + "loss": 0.1459, + "step": 9010 + }, + { + "epoch": 12.96, + "learning_rate": 0.00017464180569185474, + "loss": 0.1092, + "step": 9020 + }, + { + "epoch": 12.97, + "learning_rate": 0.0001744946025515211, + "loss": 0.1329, + "step": 9030 + }, + { + "epoch": 12.99, + "learning_rate": 0.00017434739941118744, + "loss": 0.1047, + "step": 9040 + }, + { + "epoch": 13.0, + "learning_rate": 0.00017420019627085374, + "loss": 0.1094, + "step": 9050 + }, + { + "epoch": 13.02, + "learning_rate": 0.0001740529931305201, + "loss": 0.1347, + "step": 9060 + }, + { + "epoch": 13.03, + "learning_rate": 0.00017390578999018646, + "loss": 0.1158, + "step": 9070 + }, + { + "epoch": 13.05, + "learning_rate": 0.00017375858684985277, + "loss": 0.1443, + "step": 9080 + }, + { + "epoch": 13.06, + "learning_rate": 0.0001736113837095191, + "loss": 0.1027, + "step": 9090 + }, + { + "epoch": 13.07, + "learning_rate": 0.00017346418056918546, + "loss": 0.107, + "step": 9100 + }, + { + "epoch": 13.07, + "eval_loss": 0.18377935886383057, + "eval_runtime": 39.9042, + "eval_samples_per_second": 11.452, + "eval_steps_per_second": 1.453, + "eval_wer": 0.1959042312904683, + "step": 9100 + }, + { + "epoch": 13.09, + "learning_rate": 0.00017331697742885182, + "loss": 0.1134, + "step": 9110 + }, + { + "epoch": 13.1, + "learning_rate": 0.00017316977428851813, + "loss": 0.1044, + "step": 9120 + }, + { + "epoch": 13.12, + "learning_rate": 0.00017302257114818446, + "loss": 0.1194, + "step": 9130 + }, + { + "epoch": 13.13, + "learning_rate": 0.00017287536800785082, + "loss": 0.1139, + "step": 9140 + }, + { + "epoch": 13.15, + "learning_rate": 0.00017272816486751718, + "loss": 0.1271, + "step": 9150 + }, + { + "epoch": 13.16, + "learning_rate": 0.0001725809617271835, + "loss": 0.1207, + "step": 9160 + }, + { + "epoch": 13.18, + "learning_rate": 0.00017243375858684982, + "loss": 0.117, + "step": 9170 + }, + { + "epoch": 13.19, + "learning_rate": 0.00017228655544651618, + "loss": 0.1332, + "step": 9180 + }, + { + "epoch": 13.2, + "learning_rate": 0.00017213935230618255, + "loss": 0.1186, + "step": 9190 + }, + { + "epoch": 13.22, + "learning_rate": 0.00017199214916584885, + "loss": 0.1103, + "step": 9200 + }, + { + "epoch": 13.22, + "eval_loss": 0.1748352199792862, + "eval_runtime": 39.9358, + "eval_samples_per_second": 11.443, + "eval_steps_per_second": 1.452, + "eval_wer": 0.18732118656828792, + "step": 9200 + }, + { + "epoch": 13.23, + "learning_rate": 0.00017184494602551518, + "loss": 0.1177, + "step": 9210 + }, + { + "epoch": 13.25, + "learning_rate": 0.00017169774288518155, + "loss": 0.1022, + "step": 9220 + }, + { + "epoch": 13.26, + "learning_rate": 0.00017155053974484785, + "loss": 0.1417, + "step": 9230 + }, + { + "epoch": 13.28, + "learning_rate": 0.0001714033366045142, + "loss": 0.1326, + "step": 9240 + }, + { + "epoch": 13.29, + "learning_rate": 0.00017125613346418055, + "loss": 0.1207, + "step": 9250 + }, + { + "epoch": 13.3, + "learning_rate": 0.0001711089303238469, + "loss": 0.1132, + "step": 9260 + }, + { + "epoch": 13.32, + "learning_rate": 0.0001709617271835132, + "loss": 0.097, + "step": 9270 + }, + { + "epoch": 13.33, + "learning_rate": 0.00017081452404317957, + "loss": 0.1492, + "step": 9280 + }, + { + "epoch": 13.35, + "learning_rate": 0.0001706673209028459, + "loss": 0.1272, + "step": 9290 + }, + { + "epoch": 13.36, + "learning_rate": 0.00017052011776251227, + "loss": 0.1274, + "step": 9300 + }, + { + "epoch": 13.36, + "eval_loss": 0.17697954177856445, + "eval_runtime": 39.8577, + "eval_samples_per_second": 11.466, + "eval_steps_per_second": 1.455, + "eval_wer": 0.19771118807408522, + "step": 9300 + }, + { + "epoch": 13.38, + "learning_rate": 0.00017037291462217857, + "loss": 0.1162, + "step": 9310 + }, + { + "epoch": 13.39, + "learning_rate": 0.00017022571148184493, + "loss": 0.1054, + "step": 9320 + }, + { + "epoch": 13.41, + "learning_rate": 0.00017007850834151127, + "loss": 0.1115, + "step": 9330 + }, + { + "epoch": 13.42, + "learning_rate": 0.00016993130520117763, + "loss": 0.103, + "step": 9340 + }, + { + "epoch": 13.43, + "learning_rate": 0.00016978410206084393, + "loss": 0.1359, + "step": 9350 + }, + { + "epoch": 13.45, + "learning_rate": 0.0001696368989205103, + "loss": 0.1019, + "step": 9360 + }, + { + "epoch": 13.46, + "learning_rate": 0.00016948969578017663, + "loss": 0.1107, + "step": 9370 + }, + { + "epoch": 13.48, + "learning_rate": 0.00016934249263984296, + "loss": 0.126, + "step": 9380 + }, + { + "epoch": 13.49, + "learning_rate": 0.0001691952894995093, + "loss": 0.1239, + "step": 9390 + }, + { + "epoch": 13.51, + "learning_rate": 0.00016904808635917565, + "loss": 0.1243, + "step": 9400 + }, + { + "epoch": 13.51, + "eval_loss": 0.17389988899230957, + "eval_runtime": 39.7378, + "eval_samples_per_second": 11.5, + "eval_steps_per_second": 1.46, + "eval_wer": 0.19349495557897908, + "step": 9400 + }, + { + "epoch": 13.52, + "learning_rate": 0.000168900883218842, + "loss": 0.1237, + "step": 9410 + }, + { + "epoch": 13.53, + "learning_rate": 0.00016875368007850832, + "loss": 0.1058, + "step": 9420 + }, + { + "epoch": 13.55, + "learning_rate": 0.00016860647693817465, + "loss": 0.1313, + "step": 9430 + }, + { + "epoch": 13.56, + "learning_rate": 0.00016845927379784102, + "loss": 0.1101, + "step": 9440 + }, + { + "epoch": 13.58, + "learning_rate": 0.00016831207065750735, + "loss": 0.1158, + "step": 9450 + }, + { + "epoch": 13.59, + "learning_rate": 0.00016816486751717368, + "loss": 0.1189, + "step": 9460 + }, + { + "epoch": 13.61, + "learning_rate": 0.00016801766437684002, + "loss": 0.1178, + "step": 9470 + }, + { + "epoch": 13.62, + "learning_rate": 0.00016787046123650638, + "loss": 0.1273, + "step": 9480 + }, + { + "epoch": 13.64, + "learning_rate": 0.0001677232580961727, + "loss": 0.1302, + "step": 9490 + }, + { + "epoch": 13.65, + "learning_rate": 0.00016757605495583904, + "loss": 0.0975, + "step": 9500 + }, + { + "epoch": 13.65, + "eval_loss": 0.17656183242797852, + "eval_runtime": 39.8815, + "eval_samples_per_second": 11.459, + "eval_steps_per_second": 1.454, + "eval_wer": 0.19816292726998946, + "step": 9500 + }, + { + "epoch": 13.66, + "learning_rate": 0.00016742885181550538, + "loss": 0.1057, + "step": 9510 + }, + { + "epoch": 13.68, + "learning_rate": 0.00016728164867517174, + "loss": 0.1182, + "step": 9520 + }, + { + "epoch": 13.69, + "learning_rate": 0.00016713444553483804, + "loss": 0.111, + "step": 9530 + }, + { + "epoch": 13.71, + "learning_rate": 0.0001669872423945044, + "loss": 0.128, + "step": 9540 + }, + { + "epoch": 13.72, + "learning_rate": 0.00016684003925417074, + "loss": 0.095, + "step": 9550 + }, + { + "epoch": 13.74, + "learning_rate": 0.0001666928361138371, + "loss": 0.1286, + "step": 9560 + }, + { + "epoch": 13.75, + "learning_rate": 0.0001665456329735034, + "loss": 0.1028, + "step": 9570 + }, + { + "epoch": 13.76, + "learning_rate": 0.00016639842983316976, + "loss": 0.1336, + "step": 9580 + }, + { + "epoch": 13.78, + "learning_rate": 0.0001662512266928361, + "loss": 0.095, + "step": 9590 + }, + { + "epoch": 13.79, + "learning_rate": 0.00016610402355250246, + "loss": 0.1093, + "step": 9600 + }, + { + "epoch": 13.79, + "eval_loss": 0.1793922334909439, + "eval_runtime": 40.0085, + "eval_samples_per_second": 11.423, + "eval_steps_per_second": 1.45, + "eval_wer": 0.1959042312904683, + "step": 9600 + }, + { + "epoch": 13.81, + "learning_rate": 0.00016595682041216876, + "loss": 0.1257, + "step": 9610 + }, + { + "epoch": 13.82, + "learning_rate": 0.00016580961727183512, + "loss": 0.0955, + "step": 9620 + }, + { + "epoch": 13.84, + "learning_rate": 0.00016566241413150146, + "loss": 0.1234, + "step": 9630 + }, + { + "epoch": 13.85, + "learning_rate": 0.00016551521099116782, + "loss": 0.0953, + "step": 9640 + }, + { + "epoch": 13.86, + "learning_rate": 0.00016536800785083412, + "loss": 0.1147, + "step": 9650 + }, + { + "epoch": 13.88, + "learning_rate": 0.00016522080471050049, + "loss": 0.1232, + "step": 9660 + }, + { + "epoch": 13.89, + "learning_rate": 0.00016507360157016682, + "loss": 0.1264, + "step": 9670 + }, + { + "epoch": 13.91, + "learning_rate": 0.00016492639842983315, + "loss": 0.1401, + "step": 9680 + }, + { + "epoch": 13.92, + "learning_rate": 0.00016477919528949949, + "loss": 0.1071, + "step": 9690 + }, + { + "epoch": 13.94, + "learning_rate": 0.00016463199214916585, + "loss": 0.1123, + "step": 9700 + }, + { + "epoch": 13.94, + "eval_loss": 0.16937404870986938, + "eval_runtime": 40.1681, + "eval_samples_per_second": 11.377, + "eval_steps_per_second": 1.444, + "eval_wer": 0.193344375847011, + "step": 9700 + }, + { + "epoch": 13.95, + "learning_rate": 0.00016448478900883218, + "loss": 0.13, + "step": 9710 + }, + { + "epoch": 13.97, + "learning_rate": 0.0001643375858684985, + "loss": 0.1109, + "step": 9720 + }, + { + "epoch": 13.98, + "learning_rate": 0.00016419038272816485, + "loss": 0.1241, + "step": 9730 + }, + { + "epoch": 13.99, + "learning_rate": 0.0001640431795878312, + "loss": 0.115, + "step": 9740 + }, + { + "epoch": 14.01, + "learning_rate": 0.00016389597644749754, + "loss": 0.11, + "step": 9750 + }, + { + "epoch": 14.02, + "learning_rate": 0.00016374877330716387, + "loss": 0.1115, + "step": 9760 + }, + { + "epoch": 14.04, + "learning_rate": 0.0001636015701668302, + "loss": 0.0945, + "step": 9770 + }, + { + "epoch": 14.05, + "learning_rate": 0.00016345436702649657, + "loss": 0.1122, + "step": 9780 + }, + { + "epoch": 14.07, + "learning_rate": 0.0001633071638861629, + "loss": 0.0999, + "step": 9790 + }, + { + "epoch": 14.08, + "learning_rate": 0.00016315996074582923, + "loss": 0.1401, + "step": 9800 + }, + { + "epoch": 14.08, + "eval_loss": 0.17904061079025269, + "eval_runtime": 39.9612, + "eval_samples_per_second": 11.436, + "eval_steps_per_second": 1.451, + "eval_wer": 0.19093510013552176, + "step": 9800 + }, + { + "epoch": 14.09, + "learning_rate": 0.00016301275760549557, + "loss": 0.1179, + "step": 9810 + }, + { + "epoch": 14.11, + "learning_rate": 0.00016286555446516193, + "loss": 0.1311, + "step": 9820 + }, + { + "epoch": 14.12, + "learning_rate": 0.00016271835132482823, + "loss": 0.1111, + "step": 9830 + }, + { + "epoch": 14.14, + "learning_rate": 0.0001625711481844946, + "loss": 0.1112, + "step": 9840 + }, + { + "epoch": 14.15, + "learning_rate": 0.00016242394504416093, + "loss": 0.1189, + "step": 9850 + }, + { + "epoch": 14.17, + "learning_rate": 0.0001622767419038273, + "loss": 0.1143, + "step": 9860 + }, + { + "epoch": 14.18, + "learning_rate": 0.0001621295387634936, + "loss": 0.1192, + "step": 9870 + }, + { + "epoch": 14.2, + "learning_rate": 0.00016198233562315996, + "loss": 0.1224, + "step": 9880 + }, + { + "epoch": 14.21, + "learning_rate": 0.0001618351324828263, + "loss": 0.1, + "step": 9890 + }, + { + "epoch": 14.22, + "learning_rate": 0.00016168792934249265, + "loss": 0.1255, + "step": 9900 + }, + { + "epoch": 14.22, + "eval_loss": 0.17239724099636078, + "eval_runtime": 40.3402, + "eval_samples_per_second": 11.329, + "eval_steps_per_second": 1.438, + "eval_wer": 0.18822466496009638, + "step": 9900 + }, + { + "epoch": 14.24, + "learning_rate": 0.00016154072620215896, + "loss": 0.0956, + "step": 9910 + }, + { + "epoch": 14.25, + "learning_rate": 0.00016139352306182532, + "loss": 0.1031, + "step": 9920 + }, + { + "epoch": 14.27, + "learning_rate": 0.00016124631992149165, + "loss": 0.1059, + "step": 9930 + }, + { + "epoch": 14.28, + "learning_rate": 0.000161099116781158, + "loss": 0.1004, + "step": 9940 + }, + { + "epoch": 14.3, + "learning_rate": 0.00016095191364082432, + "loss": 0.1064, + "step": 9950 + }, + { + "epoch": 14.31, + "learning_rate": 0.00016080471050049065, + "loss": 0.1167, + "step": 9960 + }, + { + "epoch": 14.32, + "learning_rate": 0.000160657507360157, + "loss": 0.1056, + "step": 9970 + }, + { + "epoch": 14.34, + "learning_rate": 0.00016051030421982332, + "loss": 0.128, + "step": 9980 + }, + { + "epoch": 14.35, + "learning_rate": 0.00016036310107948968, + "loss": 0.1267, + "step": 9990 + }, + { + "epoch": 14.37, + "learning_rate": 0.000160215897939156, + "loss": 0.1126, + "step": 10000 + }, + { + "epoch": 14.37, + "eval_loss": 0.1660313904285431, + "eval_runtime": 40.0416, + "eval_samples_per_second": 11.413, + "eval_steps_per_second": 1.448, + "eval_wer": 0.18882698388796867, + "step": 10000 + }, + { + "epoch": 14.38, + "learning_rate": 0.00016006869479882237, + "loss": 0.0972, + "step": 10010 + }, + { + "epoch": 14.4, + "learning_rate": 0.00015992149165848868, + "loss": 0.0785, + "step": 10020 + }, + { + "epoch": 14.41, + "learning_rate": 0.00015977428851815504, + "loss": 0.1162, + "step": 10030 + }, + { + "epoch": 14.43, + "learning_rate": 0.00015962708537782137, + "loss": 0.1037, + "step": 10040 + }, + { + "epoch": 14.44, + "learning_rate": 0.00015947988223748773, + "loss": 0.1261, + "step": 10050 + }, + { + "epoch": 14.45, + "learning_rate": 0.00015933267909715404, + "loss": 0.1, + "step": 10060 + }, + { + "epoch": 14.47, + "learning_rate": 0.0001591854759568204, + "loss": 0.1175, + "step": 10070 + }, + { + "epoch": 14.48, + "learning_rate": 0.00015903827281648673, + "loss": 0.1218, + "step": 10080 + }, + { + "epoch": 14.5, + "learning_rate": 0.0001588910696761531, + "loss": 0.0957, + "step": 10090 + }, + { + "epoch": 14.51, + "learning_rate": 0.0001587438665358194, + "loss": 0.1241, + "step": 10100 + }, + { + "epoch": 14.51, + "eval_loss": 0.16984562575817108, + "eval_runtime": 40.0158, + "eval_samples_per_second": 11.42, + "eval_steps_per_second": 1.449, + "eval_wer": 0.19048336093961754, + "step": 10100 + }, + { + "epoch": 14.53, + "learning_rate": 0.00015859666339548576, + "loss": 0.0949, + "step": 10110 + }, + { + "epoch": 14.54, + "learning_rate": 0.0001584494602551521, + "loss": 0.1353, + "step": 10120 + }, + { + "epoch": 14.55, + "learning_rate": 0.00015830225711481843, + "loss": 0.1164, + "step": 10130 + }, + { + "epoch": 14.57, + "learning_rate": 0.00015815505397448476, + "loss": 0.0954, + "step": 10140 + }, + { + "epoch": 14.58, + "learning_rate": 0.00015800785083415112, + "loss": 0.1477, + "step": 10150 + }, + { + "epoch": 14.6, + "learning_rate": 0.00015786064769381745, + "loss": 0.1094, + "step": 10160 + }, + { + "epoch": 14.61, + "learning_rate": 0.0001577134445534838, + "loss": 0.0973, + "step": 10170 + }, + { + "epoch": 14.63, + "learning_rate": 0.00015756624141315012, + "loss": 0.1124, + "step": 10180 + }, + { + "epoch": 14.64, + "learning_rate": 0.00015741903827281648, + "loss": 0.1131, + "step": 10190 + }, + { + "epoch": 14.66, + "learning_rate": 0.00015727183513248281, + "loss": 0.1147, + "step": 10200 + }, + { + "epoch": 14.66, + "eval_loss": 0.16483080387115479, + "eval_runtime": 39.9302, + "eval_samples_per_second": 11.445, + "eval_steps_per_second": 1.453, + "eval_wer": 0.1802439391657883, + "step": 10200 + }, + { + "epoch": 14.67, + "learning_rate": 0.00015712463199214915, + "loss": 0.1111, + "step": 10210 + }, + { + "epoch": 14.68, + "learning_rate": 0.00015697742885181548, + "loss": 0.1048, + "step": 10220 + }, + { + "epoch": 14.7, + "learning_rate": 0.00015683022571148184, + "loss": 0.1285, + "step": 10230 + }, + { + "epoch": 14.71, + "learning_rate": 0.00015668302257114817, + "loss": 0.092, + "step": 10240 + }, + { + "epoch": 14.73, + "learning_rate": 0.0001565358194308145, + "loss": 0.1086, + "step": 10250 + }, + { + "epoch": 14.74, + "learning_rate": 0.00015638861629048084, + "loss": 0.1002, + "step": 10260 + }, + { + "epoch": 14.76, + "learning_rate": 0.0001562414131501472, + "loss": 0.1148, + "step": 10270 + }, + { + "epoch": 14.77, + "learning_rate": 0.0001560942100098135, + "loss": 0.1267, + "step": 10280 + }, + { + "epoch": 14.78, + "learning_rate": 0.00015594700686947987, + "loss": 0.1025, + "step": 10290 + }, + { + "epoch": 14.8, + "learning_rate": 0.0001557998037291462, + "loss": 0.115, + "step": 10300 + }, + { + "epoch": 14.8, + "eval_loss": 0.1692885160446167, + "eval_runtime": 40.0262, + "eval_samples_per_second": 11.418, + "eval_steps_per_second": 1.449, + "eval_wer": 0.18581538924860713, + "step": 10300 + }, + { + "epoch": 14.81, + "learning_rate": 0.00015565260058881256, + "loss": 0.0927, + "step": 10310 + }, + { + "epoch": 14.83, + "learning_rate": 0.00015550539744847887, + "loss": 0.1171, + "step": 10320 + }, + { + "epoch": 14.84, + "learning_rate": 0.00015535819430814523, + "loss": 0.1267, + "step": 10330 + }, + { + "epoch": 14.86, + "learning_rate": 0.00015521099116781156, + "loss": 0.1005, + "step": 10340 + }, + { + "epoch": 14.87, + "learning_rate": 0.00015506378802747792, + "loss": 0.117, + "step": 10350 + }, + { + "epoch": 14.89, + "learning_rate": 0.00015491658488714423, + "loss": 0.0975, + "step": 10360 + }, + { + "epoch": 14.9, + "learning_rate": 0.0001547693817468106, + "loss": 0.1131, + "step": 10370 + }, + { + "epoch": 14.91, + "learning_rate": 0.00015462217860647692, + "loss": 0.1209, + "step": 10380 + }, + { + "epoch": 14.93, + "learning_rate": 0.00015447497546614328, + "loss": 0.105, + "step": 10390 + }, + { + "epoch": 14.94, + "learning_rate": 0.0001543277723258096, + "loss": 0.1078, + "step": 10400 + }, + { + "epoch": 14.94, + "eval_loss": 0.16425766050815582, + "eval_runtime": 39.9939, + "eval_samples_per_second": 11.427, + "eval_steps_per_second": 1.45, + "eval_wer": 0.18385785273302213, + "step": 10400 + }, + { + "epoch": 14.96, + "learning_rate": 0.00015418056918547595, + "loss": 0.1102, + "step": 10410 + }, + { + "epoch": 14.97, + "learning_rate": 0.00015403336604514228, + "loss": 0.1, + "step": 10420 + }, + { + "epoch": 14.99, + "learning_rate": 0.00015388616290480862, + "loss": 0.0944, + "step": 10430 + }, + { + "epoch": 15.0, + "learning_rate": 0.00015373895976447495, + "loss": 0.1232, + "step": 10440 + }, + { + "epoch": 15.01, + "learning_rate": 0.0001535917566241413, + "loss": 0.1017, + "step": 10450 + }, + { + "epoch": 15.03, + "learning_rate": 0.00015344455348380764, + "loss": 0.0991, + "step": 10460 + }, + { + "epoch": 15.04, + "learning_rate": 0.00015329735034347398, + "loss": 0.0986, + "step": 10470 + }, + { + "epoch": 15.06, + "learning_rate": 0.0001531501472031403, + "loss": 0.1012, + "step": 10480 + }, + { + "epoch": 15.07, + "learning_rate": 0.00015300294406280667, + "loss": 0.0992, + "step": 10490 + }, + { + "epoch": 15.09, + "learning_rate": 0.000152855740922473, + "loss": 0.107, + "step": 10500 + }, + { + "epoch": 15.09, + "eval_loss": 0.169921875, + "eval_runtime": 39.8342, + "eval_samples_per_second": 11.473, + "eval_steps_per_second": 1.456, + "eval_wer": 0.17964162023791597, + "step": 10500 + }, + { + "epoch": 15.1, + "learning_rate": 0.00015270853778213934, + "loss": 0.0901, + "step": 10510 + }, + { + "epoch": 15.11, + "learning_rate": 0.00015256133464180567, + "loss": 0.1056, + "step": 10520 + }, + { + "epoch": 15.13, + "learning_rate": 0.00015241413150147203, + "loss": 0.1044, + "step": 10530 + }, + { + "epoch": 15.14, + "learning_rate": 0.00015226692836113837, + "loss": 0.0921, + "step": 10540 + }, + { + "epoch": 15.16, + "learning_rate": 0.0001521197252208047, + "loss": 0.1146, + "step": 10550 + }, + { + "epoch": 15.17, + "learning_rate": 0.00015197252208047103, + "loss": 0.0826, + "step": 10560 + }, + { + "epoch": 15.19, + "learning_rate": 0.0001518253189401374, + "loss": 0.1078, + "step": 10570 + }, + { + "epoch": 15.2, + "learning_rate": 0.0001516781157998037, + "loss": 0.1036, + "step": 10580 + }, + { + "epoch": 15.22, + "learning_rate": 0.00015153091265947006, + "loss": 0.0755, + "step": 10590 + }, + { + "epoch": 15.23, + "learning_rate": 0.0001513837095191364, + "loss": 0.0966, + "step": 10600 + }, + { + "epoch": 15.23, + "eval_loss": 0.1691877841949463, + "eval_runtime": 40.0386, + "eval_samples_per_second": 11.414, + "eval_steps_per_second": 1.449, + "eval_wer": 0.1802439391657883, + "step": 10600 + }, + { + "epoch": 15.24, + "learning_rate": 0.00015123650637880275, + "loss": 0.087, + "step": 10610 + }, + { + "epoch": 15.26, + "learning_rate": 0.00015108930323846906, + "loss": 0.1237, + "step": 10620 + }, + { + "epoch": 15.27, + "learning_rate": 0.00015094210009813542, + "loss": 0.087, + "step": 10630 + }, + { + "epoch": 15.29, + "learning_rate": 0.00015079489695780175, + "loss": 0.0968, + "step": 10640 + }, + { + "epoch": 15.3, + "learning_rate": 0.00015064769381746811, + "loss": 0.1188, + "step": 10650 + }, + { + "epoch": 15.32, + "learning_rate": 0.00015050049067713442, + "loss": 0.0945, + "step": 10660 + }, + { + "epoch": 15.33, + "learning_rate": 0.00015035328753680078, + "loss": 0.1007, + "step": 10670 + }, + { + "epoch": 15.34, + "learning_rate": 0.00015020608439646711, + "loss": 0.0988, + "step": 10680 + }, + { + "epoch": 15.36, + "learning_rate": 0.00015005888125613348, + "loss": 0.0876, + "step": 10690 + }, + { + "epoch": 15.37, + "learning_rate": 0.00014991167811579978, + "loss": 0.0931, + "step": 10700 + }, + { + "epoch": 15.37, + "eval_loss": 0.16350314021110535, + "eval_runtime": 39.8693, + "eval_samples_per_second": 11.462, + "eval_steps_per_second": 1.455, + "eval_wer": 0.17753350399036288, + "step": 10700 + }, + { + "epoch": 15.39, + "learning_rate": 0.00014976447497546614, + "loss": 0.0825, + "step": 10710 + }, + { + "epoch": 15.4, + "learning_rate": 0.00014961727183513248, + "loss": 0.1109, + "step": 10720 + }, + { + "epoch": 15.42, + "learning_rate": 0.0001494700686947988, + "loss": 0.095, + "step": 10730 + }, + { + "epoch": 15.43, + "learning_rate": 0.00014932286555446514, + "loss": 0.1073, + "step": 10740 + }, + { + "epoch": 15.45, + "learning_rate": 0.0001491756624141315, + "loss": 0.111, + "step": 10750 + }, + { + "epoch": 15.46, + "learning_rate": 0.00014902845927379784, + "loss": 0.0962, + "step": 10760 + }, + { + "epoch": 15.47, + "learning_rate": 0.00014888125613346417, + "loss": 0.096, + "step": 10770 + }, + { + "epoch": 15.49, + "learning_rate": 0.0001487340529931305, + "loss": 0.0717, + "step": 10780 + }, + { + "epoch": 15.5, + "learning_rate": 0.00014858684985279686, + "loss": 0.0893, + "step": 10790 + }, + { + "epoch": 15.52, + "learning_rate": 0.0001484396467124632, + "loss": 0.1068, + "step": 10800 + }, + { + "epoch": 15.52, + "eval_loss": 0.16544069349765778, + "eval_runtime": 39.8983, + "eval_samples_per_second": 11.454, + "eval_steps_per_second": 1.454, + "eval_wer": 0.17407017015509713, + "step": 10800 + }, + { + "epoch": 15.53, + "learning_rate": 0.00014829244357212953, + "loss": 0.0968, + "step": 10810 + }, + { + "epoch": 15.55, + "learning_rate": 0.00014814524043179586, + "loss": 0.0907, + "step": 10820 + }, + { + "epoch": 15.56, + "learning_rate": 0.00014799803729146222, + "loss": 0.0836, + "step": 10830 + }, + { + "epoch": 15.57, + "learning_rate": 0.00014785083415112856, + "loss": 0.0866, + "step": 10840 + }, + { + "epoch": 15.59, + "learning_rate": 0.00014770363101079486, + "loss": 0.1004, + "step": 10850 + }, + { + "epoch": 15.6, + "learning_rate": 0.00014755642787046122, + "loss": 0.0972, + "step": 10860 + }, + { + "epoch": 15.62, + "learning_rate": 0.00014740922473012756, + "loss": 0.1118, + "step": 10870 + }, + { + "epoch": 15.63, + "learning_rate": 0.00014726202158979392, + "loss": 0.1021, + "step": 10880 + }, + { + "epoch": 15.65, + "learning_rate": 0.00014711481844946022, + "loss": 0.0791, + "step": 10890 + }, + { + "epoch": 15.66, + "learning_rate": 0.00014696761530912658, + "loss": 0.1224, + "step": 10900 + }, + { + "epoch": 15.66, + "eval_loss": 0.16307871043682098, + "eval_runtime": 40.0248, + "eval_samples_per_second": 11.418, + "eval_steps_per_second": 1.449, + "eval_wer": 0.1767806053305225, + "step": 10900 + }, + { + "epoch": 15.68, + "learning_rate": 0.00014682041216879292, + "loss": 0.0825, + "step": 10910 + }, + { + "epoch": 15.69, + "learning_rate": 0.00014667320902845928, + "loss": 0.0958, + "step": 10920 + }, + { + "epoch": 15.7, + "learning_rate": 0.00014652600588812558, + "loss": 0.112, + "step": 10930 + }, + { + "epoch": 15.72, + "learning_rate": 0.00014637880274779195, + "loss": 0.0934, + "step": 10940 + }, + { + "epoch": 15.73, + "learning_rate": 0.00014623159960745828, + "loss": 0.0917, + "step": 10950 + }, + { + "epoch": 15.75, + "learning_rate": 0.00014608439646712464, + "loss": 0.0813, + "step": 10960 + }, + { + "epoch": 15.76, + "learning_rate": 0.00014593719332679095, + "loss": 0.1391, + "step": 10970 + }, + { + "epoch": 15.78, + "learning_rate": 0.0001457899901864573, + "loss": 0.1232, + "step": 10980 + }, + { + "epoch": 15.79, + "learning_rate": 0.00014564278704612364, + "loss": 0.1132, + "step": 10990 + }, + { + "epoch": 15.8, + "learning_rate": 0.00014549558390578997, + "loss": 0.0999, + "step": 11000 + }, + { + "epoch": 15.8, + "eval_loss": 0.15900734066963196, + "eval_runtime": 40.0131, + "eval_samples_per_second": 11.421, + "eval_steps_per_second": 1.45, + "eval_wer": 0.17663002559855442, + "step": 11000 + }, + { + "epoch": 15.82, + "learning_rate": 0.0001453483807654563, + "loss": 0.079, + "step": 11010 + }, + { + "epoch": 15.83, + "learning_rate": 0.00014520117762512264, + "loss": 0.102, + "step": 11020 + }, + { + "epoch": 15.85, + "learning_rate": 0.000145053974484789, + "loss": 0.088, + "step": 11030 + }, + { + "epoch": 15.86, + "learning_rate": 0.00014490677134445533, + "loss": 0.0976, + "step": 11040 + }, + { + "epoch": 15.88, + "learning_rate": 0.00014475956820412167, + "loss": 0.1118, + "step": 11050 + }, + { + "epoch": 15.89, + "learning_rate": 0.000144612365063788, + "loss": 0.0847, + "step": 11060 + }, + { + "epoch": 15.91, + "learning_rate": 0.00014446516192345436, + "loss": 0.0962, + "step": 11070 + }, + { + "epoch": 15.92, + "learning_rate": 0.0001443179587831207, + "loss": 0.1053, + "step": 11080 + }, + { + "epoch": 15.93, + "learning_rate": 0.00014417075564278703, + "loss": 0.1131, + "step": 11090 + }, + { + "epoch": 15.95, + "learning_rate": 0.00014402355250245336, + "loss": 0.0879, + "step": 11100 + }, + { + "epoch": 15.95, + "eval_loss": 0.16153839230537415, + "eval_runtime": 40.5046, + "eval_samples_per_second": 11.283, + "eval_steps_per_second": 1.432, + "eval_wer": 0.17196205390754404, + "step": 11100 + }, + { + "epoch": 15.96, + "learning_rate": 0.00014387634936211972, + "loss": 0.1013, + "step": 11110 + }, + { + "epoch": 15.98, + "learning_rate": 0.00014372914622178605, + "loss": 0.1083, + "step": 11120 + }, + { + "epoch": 15.99, + "learning_rate": 0.0001435819430814524, + "loss": 0.1037, + "step": 11130 + }, + { + "epoch": 16.01, + "learning_rate": 0.00014343473994111872, + "loss": 0.0954, + "step": 11140 + }, + { + "epoch": 16.02, + "learning_rate": 0.00014328753680078506, + "loss": 0.0845, + "step": 11150 + }, + { + "epoch": 16.03, + "learning_rate": 0.00014314033366045142, + "loss": 0.0827, + "step": 11160 + }, + { + "epoch": 16.05, + "learning_rate": 0.00014299313052011775, + "loss": 0.1113, + "step": 11170 + }, + { + "epoch": 16.06, + "learning_rate": 0.00014284592737978408, + "loss": 0.0934, + "step": 11180 + }, + { + "epoch": 16.08, + "learning_rate": 0.00014269872423945042, + "loss": 0.0903, + "step": 11190 + }, + { + "epoch": 16.09, + "learning_rate": 0.00014255152109911678, + "loss": 0.0761, + "step": 11200 + }, + { + "epoch": 16.09, + "eval_loss": 0.16535413265228271, + "eval_runtime": 40.0395, + "eval_samples_per_second": 11.414, + "eval_steps_per_second": 1.449, + "eval_wer": 0.17497364854690559, + "step": 11200 + }, + { + "epoch": 16.11, + "learning_rate": 0.0001424043179587831, + "loss": 0.0709, + "step": 11210 + }, + { + "epoch": 16.12, + "learning_rate": 0.00014225711481844944, + "loss": 0.1006, + "step": 11220 + }, + { + "epoch": 16.14, + "learning_rate": 0.00014210991167811578, + "loss": 0.1218, + "step": 11230 + }, + { + "epoch": 16.15, + "learning_rate": 0.00014196270853778214, + "loss": 0.0994, + "step": 11240 + }, + { + "epoch": 16.16, + "learning_rate": 0.00014181550539744847, + "loss": 0.0986, + "step": 11250 + }, + { + "epoch": 16.18, + "learning_rate": 0.0001416683022571148, + "loss": 0.0789, + "step": 11260 + }, + { + "epoch": 16.19, + "learning_rate": 0.00014152109911678114, + "loss": 0.1026, + "step": 11270 + }, + { + "epoch": 16.21, + "learning_rate": 0.0001413738959764475, + "loss": 0.0982, + "step": 11280 + }, + { + "epoch": 16.22, + "learning_rate": 0.00014122669283611383, + "loss": 0.1112, + "step": 11290 + }, + { + "epoch": 16.24, + "learning_rate": 0.00014107948969578016, + "loss": 0.0821, + "step": 11300 + }, + { + "epoch": 16.24, + "eval_loss": 0.15813738107681274, + "eval_runtime": 39.8582, + "eval_samples_per_second": 11.466, + "eval_steps_per_second": 1.455, + "eval_wer": 0.17452190935100134, + "step": 11300 + }, + { + "epoch": 16.25, + "learning_rate": 0.0001409322865554465, + "loss": 0.0935, + "step": 11310 + }, + { + "epoch": 16.26, + "learning_rate": 0.00014078508341511283, + "loss": 0.1029, + "step": 11320 + }, + { + "epoch": 16.28, + "learning_rate": 0.0001406378802747792, + "loss": 0.1002, + "step": 11330 + }, + { + "epoch": 16.29, + "learning_rate": 0.00014049067713444553, + "loss": 0.095, + "step": 11340 + }, + { + "epoch": 16.31, + "learning_rate": 0.00014034347399411186, + "loss": 0.1028, + "step": 11350 + }, + { + "epoch": 16.32, + "learning_rate": 0.0001401962708537782, + "loss": 0.079, + "step": 11360 + }, + { + "epoch": 16.34, + "learning_rate": 0.00014004906771344455, + "loss": 0.0941, + "step": 11370 + }, + { + "epoch": 16.35, + "learning_rate": 0.00013990186457311089, + "loss": 0.0839, + "step": 11380 + }, + { + "epoch": 16.36, + "learning_rate": 0.00013975466143277722, + "loss": 0.0976, + "step": 11390 + }, + { + "epoch": 16.38, + "learning_rate": 0.00013960745829244355, + "loss": 0.0984, + "step": 11400 + }, + { + "epoch": 16.38, + "eval_loss": 0.16124248504638672, + "eval_runtime": 40.0383, + "eval_samples_per_second": 11.414, + "eval_steps_per_second": 1.449, + "eval_wer": 0.16940219846408675, + "step": 11400 + }, + { + "epoch": 16.39, + "learning_rate": 0.0001394602551521099, + "loss": 0.0889, + "step": 11410 + }, + { + "epoch": 16.41, + "learning_rate": 0.00013931305201177625, + "loss": 0.0951, + "step": 11420 + }, + { + "epoch": 16.42, + "learning_rate": 0.00013916584887144258, + "loss": 0.075, + "step": 11430 + }, + { + "epoch": 16.44, + "learning_rate": 0.0001390186457311089, + "loss": 0.1025, + "step": 11440 + }, + { + "epoch": 16.45, + "learning_rate": 0.00013887144259077525, + "loss": 0.0838, + "step": 11450 + }, + { + "epoch": 16.47, + "learning_rate": 0.0001387242394504416, + "loss": 0.093, + "step": 11460 + }, + { + "epoch": 16.48, + "learning_rate": 0.00013857703631010794, + "loss": 0.1044, + "step": 11470 + }, + { + "epoch": 16.49, + "learning_rate": 0.00013842983316977427, + "loss": 0.0944, + "step": 11480 + }, + { + "epoch": 16.51, + "learning_rate": 0.0001382826300294406, + "loss": 0.0967, + "step": 11490 + }, + { + "epoch": 16.52, + "learning_rate": 0.00013813542688910697, + "loss": 0.0815, + "step": 11500 + }, + { + "epoch": 16.52, + "eval_loss": 0.16426511108875275, + "eval_runtime": 39.87, + "eval_samples_per_second": 11.462, + "eval_steps_per_second": 1.455, + "eval_wer": 0.17361843095919288, + "step": 11500 + }, + { + "epoch": 16.54, + "learning_rate": 0.0001379882237487733, + "loss": 0.1004, + "step": 11510 + }, + { + "epoch": 16.55, + "learning_rate": 0.00013784102060843963, + "loss": 0.0916, + "step": 11520 + }, + { + "epoch": 16.57, + "learning_rate": 0.00013769381746810597, + "loss": 0.0947, + "step": 11530 + }, + { + "epoch": 16.58, + "learning_rate": 0.00013754661432777233, + "loss": 0.0905, + "step": 11540 + }, + { + "epoch": 16.59, + "learning_rate": 0.00013739941118743866, + "loss": 0.0864, + "step": 11550 + }, + { + "epoch": 16.61, + "learning_rate": 0.000137252208047105, + "loss": 0.0852, + "step": 11560 + }, + { + "epoch": 16.62, + "learning_rate": 0.00013710500490677133, + "loss": 0.1071, + "step": 11570 + }, + { + "epoch": 16.64, + "learning_rate": 0.0001369578017664377, + "loss": 0.0939, + "step": 11580 + }, + { + "epoch": 16.65, + "learning_rate": 0.00013681059862610402, + "loss": 0.1154, + "step": 11590 + }, + { + "epoch": 16.67, + "learning_rate": 0.00013666339548577036, + "loss": 0.0898, + "step": 11600 + }, + { + "epoch": 16.67, + "eval_loss": 0.16324785351753235, + "eval_runtime": 39.9344, + "eval_samples_per_second": 11.444, + "eval_steps_per_second": 1.452, + "eval_wer": 0.17723234452642675, + "step": 11600 + }, + { + "epoch": 16.68, + "learning_rate": 0.0001365161923454367, + "loss": 0.0818, + "step": 11610 + }, + { + "epoch": 16.7, + "learning_rate": 0.00013636898920510302, + "loss": 0.0951, + "step": 11620 + }, + { + "epoch": 16.71, + "learning_rate": 0.00013622178606476938, + "loss": 0.1037, + "step": 11630 + }, + { + "epoch": 16.72, + "learning_rate": 0.00013607458292443572, + "loss": 0.0855, + "step": 11640 + }, + { + "epoch": 16.74, + "learning_rate": 0.00013592737978410205, + "loss": 0.0795, + "step": 11650 + }, + { + "epoch": 16.75, + "learning_rate": 0.00013578017664376838, + "loss": 0.0877, + "step": 11660 + }, + { + "epoch": 16.77, + "learning_rate": 0.00013563297350343474, + "loss": 0.1126, + "step": 11670 + }, + { + "epoch": 16.78, + "learning_rate": 0.00013548577036310108, + "loss": 0.0809, + "step": 11680 + }, + { + "epoch": 16.8, + "learning_rate": 0.0001353385672227674, + "loss": 0.1051, + "step": 11690 + }, + { + "epoch": 16.81, + "learning_rate": 0.00013519136408243374, + "loss": 0.0958, + "step": 11700 + }, + { + "epoch": 16.81, + "eval_loss": 0.159054696559906, + "eval_runtime": 40.0796, + "eval_samples_per_second": 11.402, + "eval_steps_per_second": 1.447, + "eval_wer": 0.17467248908296942, + "step": 11700 + }, + { + "epoch": 16.82, + "learning_rate": 0.0001350441609421001, + "loss": 0.0972, + "step": 11710 + }, + { + "epoch": 16.84, + "learning_rate": 0.00013489695780176644, + "loss": 0.0908, + "step": 11720 + }, + { + "epoch": 16.85, + "learning_rate": 0.00013474975466143274, + "loss": 0.1005, + "step": 11730 + }, + { + "epoch": 16.87, + "learning_rate": 0.0001346025515210991, + "loss": 0.1101, + "step": 11740 + }, + { + "epoch": 16.88, + "learning_rate": 0.00013445534838076544, + "loss": 0.1086, + "step": 11750 + }, + { + "epoch": 16.9, + "learning_rate": 0.0001343081452404318, + "loss": 0.0864, + "step": 11760 + }, + { + "epoch": 16.91, + "learning_rate": 0.0001341609421000981, + "loss": 0.1002, + "step": 11770 + }, + { + "epoch": 16.93, + "learning_rate": 0.00013401373895976447, + "loss": 0.1145, + "step": 11780 + }, + { + "epoch": 16.94, + "learning_rate": 0.0001338665358194308, + "loss": 0.0848, + "step": 11790 + }, + { + "epoch": 16.95, + "learning_rate": 0.00013371933267909716, + "loss": 0.0986, + "step": 11800 + }, + { + "epoch": 16.95, + "eval_loss": 0.16650956869125366, + "eval_runtime": 40.0741, + "eval_samples_per_second": 11.404, + "eval_steps_per_second": 1.447, + "eval_wer": 0.17331727149525675, + "step": 11800 + }, + { + "epoch": 16.97, + "learning_rate": 0.00013357212953876347, + "loss": 0.0942, + "step": 11810 + }, + { + "epoch": 16.98, + "learning_rate": 0.00013342492639842983, + "loss": 0.0868, + "step": 11820 + }, + { + "epoch": 17.0, + "learning_rate": 0.00013327772325809616, + "loss": 0.0857, + "step": 11830 + }, + { + "epoch": 17.01, + "learning_rate": 0.00013313052011776252, + "loss": 0.0911, + "step": 11840 + }, + { + "epoch": 17.03, + "learning_rate": 0.00013298331697742883, + "loss": 0.0743, + "step": 11850 + }, + { + "epoch": 17.04, + "learning_rate": 0.0001328361138370952, + "loss": 0.0727, + "step": 11860 + }, + { + "epoch": 17.05, + "learning_rate": 0.00013268891069676152, + "loss": 0.0905, + "step": 11870 + }, + { + "epoch": 17.07, + "learning_rate": 0.00013254170755642785, + "loss": 0.0724, + "step": 11880 + }, + { + "epoch": 17.08, + "learning_rate": 0.0001323945044160942, + "loss": 0.0872, + "step": 11890 + }, + { + "epoch": 17.1, + "learning_rate": 0.00013224730127576052, + "loss": 0.0843, + "step": 11900 + }, + { + "epoch": 17.1, + "eval_loss": 0.16180233657360077, + "eval_runtime": 40.2757, + "eval_samples_per_second": 11.347, + "eval_steps_per_second": 1.44, + "eval_wer": 0.17256437283541634, + "step": 11900 + }, + { + "epoch": 17.11, + "learning_rate": 0.00013210009813542688, + "loss": 0.1044, + "step": 11910 + }, + { + "epoch": 17.13, + "learning_rate": 0.00013195289499509321, + "loss": 0.1075, + "step": 11920 + }, + { + "epoch": 17.14, + "learning_rate": 0.00013180569185475955, + "loss": 0.0632, + "step": 11930 + }, + { + "epoch": 17.16, + "learning_rate": 0.00013165848871442588, + "loss": 0.1181, + "step": 11940 + }, + { + "epoch": 17.17, + "learning_rate": 0.00013151128557409224, + "loss": 0.0798, + "step": 11950 + }, + { + "epoch": 17.18, + "learning_rate": 0.00013136408243375857, + "loss": 0.0976, + "step": 11960 + }, + { + "epoch": 17.2, + "learning_rate": 0.0001312168792934249, + "loss": 0.1028, + "step": 11970 + }, + { + "epoch": 17.21, + "learning_rate": 0.00013106967615309124, + "loss": 0.0819, + "step": 11980 + }, + { + "epoch": 17.23, + "learning_rate": 0.0001309224730127576, + "loss": 0.0977, + "step": 11990 + }, + { + "epoch": 17.24, + "learning_rate": 0.00013077526987242394, + "loss": 0.0888, + "step": 12000 + }, + { + "epoch": 17.24, + "eval_loss": 0.1597016453742981, + "eval_runtime": 40.0997, + "eval_samples_per_second": 11.397, + "eval_steps_per_second": 1.446, + "eval_wer": 0.16985393765999096, + "step": 12000 + }, + { + "epoch": 17.26, + "learning_rate": 0.00013062806673209027, + "loss": 0.0903, + "step": 12010 + }, + { + "epoch": 17.27, + "learning_rate": 0.0001304808635917566, + "loss": 0.0879, + "step": 12020 + }, + { + "epoch": 17.28, + "learning_rate": 0.00013033366045142294, + "loss": 0.0902, + "step": 12030 + }, + { + "epoch": 17.3, + "learning_rate": 0.0001301864573110893, + "loss": 0.0922, + "step": 12040 + }, + { + "epoch": 17.31, + "learning_rate": 0.00013003925417075563, + "loss": 0.0705, + "step": 12050 + }, + { + "epoch": 17.33, + "learning_rate": 0.00012989205103042196, + "loss": 0.0861, + "step": 12060 + }, + { + "epoch": 17.34, + "learning_rate": 0.0001297448478900883, + "loss": 0.0923, + "step": 12070 + }, + { + "epoch": 17.36, + "learning_rate": 0.00012959764474975466, + "loss": 0.0776, + "step": 12080 + }, + { + "epoch": 17.37, + "learning_rate": 0.000129450441609421, + "loss": 0.1092, + "step": 12090 + }, + { + "epoch": 17.39, + "learning_rate": 0.00012930323846908732, + "loss": 0.0851, + "step": 12100 + }, + { + "epoch": 17.39, + "eval_loss": 0.15801562368869781, + "eval_runtime": 40.1138, + "eval_samples_per_second": 11.393, + "eval_steps_per_second": 1.446, + "eval_wer": 0.1704562565878633, + "step": 12100 + }, + { + "epoch": 17.4, + "learning_rate": 0.00012915603532875366, + "loss": 0.0997, + "step": 12110 + }, + { + "epoch": 17.41, + "learning_rate": 0.00012900883218842002, + "loss": 0.0931, + "step": 12120 + }, + { + "epoch": 17.43, + "learning_rate": 0.00012886162904808635, + "loss": 0.0745, + "step": 12130 + }, + { + "epoch": 17.44, + "learning_rate": 0.00012871442590775268, + "loss": 0.0965, + "step": 12140 + }, + { + "epoch": 17.46, + "learning_rate": 0.00012856722276741902, + "loss": 0.0909, + "step": 12150 + }, + { + "epoch": 17.47, + "learning_rate": 0.00012842001962708538, + "loss": 0.1066, + "step": 12160 + }, + { + "epoch": 17.49, + "learning_rate": 0.0001282728164867517, + "loss": 0.0924, + "step": 12170 + }, + { + "epoch": 17.5, + "learning_rate": 0.00012812561334641804, + "loss": 0.0757, + "step": 12180 + }, + { + "epoch": 17.51, + "learning_rate": 0.00012797841020608438, + "loss": 0.0849, + "step": 12190 + }, + { + "epoch": 17.53, + "learning_rate": 0.0001278459273797841, + "loss": 0.0928, + "step": 12200 + }, + { + "epoch": 17.53, + "eval_loss": 0.16045060753822327, + "eval_runtime": 40.0909, + "eval_samples_per_second": 11.399, + "eval_steps_per_second": 1.447, + "eval_wer": 0.1695527781960548, + "step": 12200 + }, + { + "epoch": 17.54, + "learning_rate": 0.00012769872423945043, + "loss": 0.1008, + "step": 12210 + }, + { + "epoch": 17.56, + "learning_rate": 0.00012755152109911676, + "loss": 0.1008, + "step": 12220 + }, + { + "epoch": 17.57, + "learning_rate": 0.0001274043179587831, + "loss": 0.0863, + "step": 12230 + }, + { + "epoch": 17.59, + "learning_rate": 0.00012725711481844946, + "loss": 0.0996, + "step": 12240 + }, + { + "epoch": 17.6, + "learning_rate": 0.0001271099116781158, + "loss": 0.067, + "step": 12250 + }, + { + "epoch": 17.61, + "learning_rate": 0.00012696270853778212, + "loss": 0.0988, + "step": 12260 + }, + { + "epoch": 17.63, + "learning_rate": 0.00012681550539744846, + "loss": 0.0883, + "step": 12270 + }, + { + "epoch": 17.64, + "learning_rate": 0.0001266683022571148, + "loss": 0.0811, + "step": 12280 + }, + { + "epoch": 17.66, + "learning_rate": 0.00012652109911678115, + "loss": 0.0999, + "step": 12290 + }, + { + "epoch": 17.67, + "learning_rate": 0.00012637389597644749, + "loss": 0.0886, + "step": 12300 + }, + { + "epoch": 17.67, + "eval_loss": 0.1619402915239334, + "eval_runtime": 40.3366, + "eval_samples_per_second": 11.33, + "eval_steps_per_second": 1.438, + "eval_wer": 0.16940219846408675, + "step": 12300 + }, + { + "epoch": 17.69, + "learning_rate": 0.00012622669283611382, + "loss": 0.0936, + "step": 12310 + }, + { + "epoch": 17.7, + "learning_rate": 0.00012607948969578015, + "loss": 0.1139, + "step": 12320 + }, + { + "epoch": 17.72, + "learning_rate": 0.0001259322865554465, + "loss": 0.0851, + "step": 12330 + }, + { + "epoch": 17.73, + "learning_rate": 0.00012578508341511285, + "loss": 0.1101, + "step": 12340 + }, + { + "epoch": 17.74, + "learning_rate": 0.00012563788027477918, + "loss": 0.0792, + "step": 12350 + }, + { + "epoch": 17.76, + "learning_rate": 0.0001254906771344455, + "loss": 0.0789, + "step": 12360 + }, + { + "epoch": 17.77, + "learning_rate": 0.00012534347399411187, + "loss": 0.1043, + "step": 12370 + }, + { + "epoch": 17.79, + "learning_rate": 0.0001251962708537782, + "loss": 0.0701, + "step": 12380 + }, + { + "epoch": 17.8, + "learning_rate": 0.00012504906771344454, + "loss": 0.0817, + "step": 12390 + }, + { + "epoch": 17.82, + "learning_rate": 0.00012490186457311087, + "loss": 0.0931, + "step": 12400 + }, + { + "epoch": 17.82, + "eval_loss": 0.15292048454284668, + "eval_runtime": 40.0068, + "eval_samples_per_second": 11.423, + "eval_steps_per_second": 1.45, + "eval_wer": 0.16819756060834212, + "step": 12400 + }, + { + "epoch": 17.83, + "learning_rate": 0.0001247546614327772, + "loss": 0.1021, + "step": 12410 + }, + { + "epoch": 17.84, + "learning_rate": 0.00012460745829244357, + "loss": 0.0851, + "step": 12420 + }, + { + "epoch": 17.86, + "learning_rate": 0.0001244602551521099, + "loss": 0.07, + "step": 12430 + }, + { + "epoch": 17.87, + "learning_rate": 0.00012431305201177623, + "loss": 0.108, + "step": 12440 + }, + { + "epoch": 17.89, + "learning_rate": 0.00012416584887144257, + "loss": 0.0826, + "step": 12450 + }, + { + "epoch": 17.9, + "learning_rate": 0.00012401864573110893, + "loss": 0.0834, + "step": 12460 + }, + { + "epoch": 17.92, + "learning_rate": 0.00012387144259077526, + "loss": 0.082, + "step": 12470 + }, + { + "epoch": 17.93, + "learning_rate": 0.0001237242394504416, + "loss": 0.0886, + "step": 12480 + }, + { + "epoch": 17.95, + "learning_rate": 0.00012357703631010793, + "loss": 0.0873, + "step": 12490 + }, + { + "epoch": 17.96, + "learning_rate": 0.0001234298331697743, + "loss": 0.0747, + "step": 12500 + }, + { + "epoch": 17.96, + "eval_loss": 0.14587688446044922, + "eval_runtime": 40.2304, + "eval_samples_per_second": 11.36, + "eval_steps_per_second": 1.442, + "eval_wer": 0.16277669025749134, + "step": 12500 + }, + { + "epoch": 17.97, + "learning_rate": 0.00012328263002944062, + "loss": 0.0806, + "step": 12510 + }, + { + "epoch": 17.99, + "learning_rate": 0.00012313542688910696, + "loss": 0.0835, + "step": 12520 + }, + { + "epoch": 18.0, + "learning_rate": 0.0001229882237487733, + "loss": 0.0926, + "step": 12530 + }, + { + "epoch": 18.02, + "learning_rate": 0.00012284102060843965, + "loss": 0.0802, + "step": 12540 + }, + { + "epoch": 18.03, + "learning_rate": 0.00012269381746810598, + "loss": 0.0666, + "step": 12550 + }, + { + "epoch": 18.05, + "learning_rate": 0.00012254661432777232, + "loss": 0.0892, + "step": 12560 + }, + { + "epoch": 18.06, + "learning_rate": 0.00012239941118743865, + "loss": 0.0741, + "step": 12570 + }, + { + "epoch": 18.07, + "learning_rate": 0.00012225220804710498, + "loss": 0.0788, + "step": 12580 + }, + { + "epoch": 18.09, + "learning_rate": 0.00012210500490677134, + "loss": 0.0796, + "step": 12590 + }, + { + "epoch": 18.1, + "learning_rate": 0.00012195780176643766, + "loss": 0.1014, + "step": 12600 + }, + { + "epoch": 18.1, + "eval_loss": 0.15678279101848602, + "eval_runtime": 40.1685, + "eval_samples_per_second": 11.377, + "eval_steps_per_second": 1.444, + "eval_wer": 0.16608944436078904, + "step": 12600 + }, + { + "epoch": 18.12, + "learning_rate": 0.00012181059862610401, + "loss": 0.0859, + "step": 12610 + }, + { + "epoch": 18.13, + "learning_rate": 0.00012166339548577034, + "loss": 0.0854, + "step": 12620 + }, + { + "epoch": 18.15, + "learning_rate": 0.00012151619234543669, + "loss": 0.078, + "step": 12630 + }, + { + "epoch": 18.16, + "learning_rate": 0.00012136898920510302, + "loss": 0.0905, + "step": 12640 + }, + { + "epoch": 18.18, + "learning_rate": 0.00012122178606476937, + "loss": 0.0968, + "step": 12650 + }, + { + "epoch": 18.19, + "learning_rate": 0.0001210745829244357, + "loss": 0.0987, + "step": 12660 + }, + { + "epoch": 18.2, + "learning_rate": 0.00012092737978410205, + "loss": 0.0743, + "step": 12670 + }, + { + "epoch": 18.22, + "learning_rate": 0.00012078017664376838, + "loss": 0.0799, + "step": 12680 + }, + { + "epoch": 18.23, + "learning_rate": 0.00012063297350343472, + "loss": 0.087, + "step": 12690 + }, + { + "epoch": 18.25, + "learning_rate": 0.00012048577036310106, + "loss": 0.0729, + "step": 12700 + }, + { + "epoch": 18.25, + "eval_loss": 0.1656101793050766, + "eval_runtime": 39.9566, + "eval_samples_per_second": 11.437, + "eval_steps_per_second": 1.452, + "eval_wer": 0.17120915524770366, + "step": 12700 + }, + { + "epoch": 18.26, + "learning_rate": 0.0001203385672227674, + "loss": 0.0898, + "step": 12710 + }, + { + "epoch": 18.28, + "learning_rate": 0.00012019136408243375, + "loss": 0.0798, + "step": 12720 + }, + { + "epoch": 18.29, + "learning_rate": 0.00012004416094210008, + "loss": 0.0952, + "step": 12730 + }, + { + "epoch": 18.3, + "learning_rate": 0.00011989695780176643, + "loss": 0.0874, + "step": 12740 + }, + { + "epoch": 18.32, + "learning_rate": 0.00011974975466143276, + "loss": 0.0713, + "step": 12750 + }, + { + "epoch": 18.33, + "learning_rate": 0.0001196025515210991, + "loss": 0.0865, + "step": 12760 + }, + { + "epoch": 18.35, + "learning_rate": 0.00011945534838076544, + "loss": 0.073, + "step": 12770 + }, + { + "epoch": 18.36, + "learning_rate": 0.00011930814524043179, + "loss": 0.0902, + "step": 12780 + }, + { + "epoch": 18.38, + "learning_rate": 0.00011916094210009812, + "loss": 0.0766, + "step": 12790 + }, + { + "epoch": 18.39, + "learning_rate": 0.00011901373895976447, + "loss": 0.0884, + "step": 12800 + }, + { + "epoch": 18.39, + "eval_loss": 0.15617236495018005, + "eval_runtime": 40.4371, + "eval_samples_per_second": 11.302, + "eval_steps_per_second": 1.434, + "eval_wer": 0.16789640114440596, + "step": 12800 + }, + { + "epoch": 18.41, + "learning_rate": 0.0001188665358194308, + "loss": 0.0802, + "step": 12810 + }, + { + "epoch": 18.42, + "learning_rate": 0.00011871933267909715, + "loss": 0.0701, + "step": 12820 + }, + { + "epoch": 18.43, + "learning_rate": 0.00011857212953876348, + "loss": 0.0678, + "step": 12830 + }, + { + "epoch": 18.45, + "learning_rate": 0.00011842492639842981, + "loss": 0.08, + "step": 12840 + }, + { + "epoch": 18.46, + "learning_rate": 0.00011827772325809616, + "loss": 0.0661, + "step": 12850 + }, + { + "epoch": 18.48, + "learning_rate": 0.0001181305201177625, + "loss": 0.0891, + "step": 12860 + }, + { + "epoch": 18.49, + "learning_rate": 0.00011798331697742884, + "loss": 0.0792, + "step": 12870 + }, + { + "epoch": 18.51, + "learning_rate": 0.00011783611383709517, + "loss": 0.0976, + "step": 12880 + }, + { + "epoch": 18.52, + "learning_rate": 0.00011768891069676152, + "loss": 0.0936, + "step": 12890 + }, + { + "epoch": 18.53, + "learning_rate": 0.00011754170755642785, + "loss": 0.0823, + "step": 12900 + }, + { + "epoch": 18.53, + "eval_loss": 0.15830214321613312, + "eval_runtime": 40.3114, + "eval_samples_per_second": 11.337, + "eval_steps_per_second": 1.439, + "eval_wer": 0.16970335792802288, + "step": 12900 + }, + { + "epoch": 18.55, + "learning_rate": 0.0001173945044160942, + "loss": 0.0743, + "step": 12910 + }, + { + "epoch": 18.56, + "learning_rate": 0.00011724730127576054, + "loss": 0.0868, + "step": 12920 + }, + { + "epoch": 18.58, + "learning_rate": 0.00011710009813542688, + "loss": 0.0812, + "step": 12930 + }, + { + "epoch": 18.59, + "learning_rate": 0.00011695289499509322, + "loss": 0.0652, + "step": 12940 + }, + { + "epoch": 18.61, + "learning_rate": 0.00011680569185475956, + "loss": 0.0738, + "step": 12950 + }, + { + "epoch": 18.62, + "learning_rate": 0.0001166584887144259, + "loss": 0.1027, + "step": 12960 + }, + { + "epoch": 18.64, + "learning_rate": 0.00011651128557409224, + "loss": 0.0777, + "step": 12970 + }, + { + "epoch": 18.65, + "learning_rate": 0.00011636408243375858, + "loss": 0.1243, + "step": 12980 + }, + { + "epoch": 18.66, + "learning_rate": 0.00011621687929342491, + "loss": 0.092, + "step": 12990 + }, + { + "epoch": 18.68, + "learning_rate": 0.00011606967615309126, + "loss": 0.066, + "step": 13000 + }, + { + "epoch": 18.68, + "eval_loss": 0.1592216044664383, + "eval_runtime": 40.6807, + "eval_samples_per_second": 11.234, + "eval_steps_per_second": 1.426, + "eval_wer": 0.17166089444360788, + "step": 13000 + }, + { + "epoch": 18.69, + "learning_rate": 0.00011592247301275759, + "loss": 0.08, + "step": 13010 + }, + { + "epoch": 18.71, + "learning_rate": 0.00011577526987242394, + "loss": 0.0768, + "step": 13020 + }, + { + "epoch": 18.72, + "learning_rate": 0.00011562806673209027, + "loss": 0.078, + "step": 13030 + }, + { + "epoch": 18.74, + "learning_rate": 0.00011548086359175662, + "loss": 0.0931, + "step": 13040 + }, + { + "epoch": 18.75, + "learning_rate": 0.00011533366045142295, + "loss": 0.0784, + "step": 13050 + }, + { + "epoch": 18.76, + "learning_rate": 0.0001151864573110893, + "loss": 0.0902, + "step": 13060 + }, + { + "epoch": 18.78, + "learning_rate": 0.00011503925417075563, + "loss": 0.0885, + "step": 13070 + }, + { + "epoch": 18.79, + "learning_rate": 0.00011489205103042198, + "loss": 0.0786, + "step": 13080 + }, + { + "epoch": 18.81, + "learning_rate": 0.00011474484789008831, + "loss": 0.0763, + "step": 13090 + }, + { + "epoch": 18.82, + "learning_rate": 0.00011459764474975466, + "loss": 0.0849, + "step": 13100 + }, + { + "epoch": 18.82, + "eval_loss": 0.15664438903331757, + "eval_runtime": 40.0732, + "eval_samples_per_second": 11.404, + "eval_steps_per_second": 1.447, + "eval_wer": 0.16684234302062942, + "step": 13100 + }, + { + "epoch": 18.84, + "learning_rate": 0.00011445044160942099, + "loss": 0.0843, + "step": 13110 + }, + { + "epoch": 18.85, + "learning_rate": 0.00011430323846908734, + "loss": 0.0776, + "step": 13120 + }, + { + "epoch": 18.86, + "learning_rate": 0.00011415603532875367, + "loss": 0.0597, + "step": 13130 + }, + { + "epoch": 18.88, + "learning_rate": 0.00011400883218842, + "loss": 0.0803, + "step": 13140 + }, + { + "epoch": 18.89, + "learning_rate": 0.00011386162904808635, + "loss": 0.0802, + "step": 13150 + }, + { + "epoch": 18.91, + "learning_rate": 0.00011371442590775269, + "loss": 0.0719, + "step": 13160 + }, + { + "epoch": 18.92, + "learning_rate": 0.00011356722276741903, + "loss": 0.0707, + "step": 13170 + }, + { + "epoch": 18.94, + "learning_rate": 0.00011342001962708537, + "loss": 0.0741, + "step": 13180 + }, + { + "epoch": 18.95, + "learning_rate": 0.00011327281648675171, + "loss": 0.0834, + "step": 13190 + }, + { + "epoch": 18.97, + "learning_rate": 0.00011312561334641805, + "loss": 0.0706, + "step": 13200 + }, + { + "epoch": 18.97, + "eval_loss": 0.16251307725906372, + "eval_runtime": 39.9205, + "eval_samples_per_second": 11.448, + "eval_steps_per_second": 1.453, + "eval_wer": 0.16774582141243788, + "step": 13200 + }, + { + "epoch": 18.98, + "learning_rate": 0.00011297841020608439, + "loss": 0.0606, + "step": 13210 + }, + { + "epoch": 18.99, + "learning_rate": 0.00011283120706575073, + "loss": 0.0619, + "step": 13220 + }, + { + "epoch": 19.01, + "learning_rate": 0.00011268400392541707, + "loss": 0.0671, + "step": 13230 + }, + { + "epoch": 19.02, + "learning_rate": 0.00011253680078508341, + "loss": 0.0765, + "step": 13240 + }, + { + "epoch": 19.04, + "learning_rate": 0.00011238959764474975, + "loss": 0.0798, + "step": 13250 + }, + { + "epoch": 19.05, + "learning_rate": 0.00011224239450441609, + "loss": 0.0822, + "step": 13260 + }, + { + "epoch": 19.07, + "learning_rate": 0.00011209519136408243, + "loss": 0.0743, + "step": 13270 + }, + { + "epoch": 19.08, + "learning_rate": 0.00011194798822374877, + "loss": 0.0842, + "step": 13280 + }, + { + "epoch": 19.09, + "learning_rate": 0.0001118007850834151, + "loss": 0.08, + "step": 13290 + }, + { + "epoch": 19.11, + "learning_rate": 0.00011165358194308145, + "loss": 0.0693, + "step": 13300 + }, + { + "epoch": 19.11, + "eval_loss": 0.16297851502895355, + "eval_runtime": 40.169, + "eval_samples_per_second": 11.377, + "eval_steps_per_second": 1.444, + "eval_wer": 0.16910103900015058, + "step": 13300 + }, + { + "epoch": 19.12, + "learning_rate": 0.00011150637880274778, + "loss": 0.0847, + "step": 13310 + }, + { + "epoch": 19.14, + "learning_rate": 0.00011135917566241413, + "loss": 0.0775, + "step": 13320 + }, + { + "epoch": 19.15, + "learning_rate": 0.00011121197252208046, + "loss": 0.0876, + "step": 13330 + }, + { + "epoch": 19.17, + "learning_rate": 0.00011106476938174681, + "loss": 0.0912, + "step": 13340 + }, + { + "epoch": 19.18, + "learning_rate": 0.00011091756624141314, + "loss": 0.0635, + "step": 13350 + }, + { + "epoch": 19.2, + "learning_rate": 0.00011077036310107949, + "loss": 0.0762, + "step": 13360 + }, + { + "epoch": 19.21, + "learning_rate": 0.00011062315996074582, + "loss": 0.0885, + "step": 13370 + }, + { + "epoch": 19.22, + "learning_rate": 0.00011047595682041217, + "loss": 0.0821, + "step": 13380 + }, + { + "epoch": 19.24, + "learning_rate": 0.0001103287536800785, + "loss": 0.0731, + "step": 13390 + }, + { + "epoch": 19.25, + "learning_rate": 0.00011018155053974485, + "loss": 0.0736, + "step": 13400 + }, + { + "epoch": 19.25, + "eval_loss": 0.16010314226150513, + "eval_runtime": 40.0705, + "eval_samples_per_second": 11.405, + "eval_steps_per_second": 1.447, + "eval_wer": 0.16714350248456558, + "step": 13400 + }, + { + "epoch": 19.27, + "learning_rate": 0.00011003434739941118, + "loss": 0.0817, + "step": 13410 + }, + { + "epoch": 19.28, + "learning_rate": 0.00010988714425907753, + "loss": 0.0842, + "step": 13420 + }, + { + "epoch": 19.3, + "learning_rate": 0.00010973994111874386, + "loss": 0.0852, + "step": 13430 + }, + { + "epoch": 19.31, + "learning_rate": 0.00010959273797841018, + "loss": 0.0867, + "step": 13440 + }, + { + "epoch": 19.32, + "learning_rate": 0.00010944553483807654, + "loss": 0.0984, + "step": 13450 + }, + { + "epoch": 19.34, + "learning_rate": 0.00010929833169774286, + "loss": 0.0867, + "step": 13460 + }, + { + "epoch": 19.35, + "learning_rate": 0.00010915112855740922, + "loss": 0.0619, + "step": 13470 + }, + { + "epoch": 19.37, + "learning_rate": 0.00010900392541707554, + "loss": 0.089, + "step": 13480 + }, + { + "epoch": 19.38, + "learning_rate": 0.0001088567222767419, + "loss": 0.0666, + "step": 13490 + }, + { + "epoch": 19.4, + "learning_rate": 0.00010870951913640822, + "loss": 0.0877, + "step": 13500 + }, + { + "epoch": 19.4, + "eval_loss": 0.16647975146770477, + "eval_runtime": 39.9295, + "eval_samples_per_second": 11.445, + "eval_steps_per_second": 1.453, + "eval_wer": 0.1689504592681825, + "step": 13500 + }, + { + "epoch": 19.41, + "learning_rate": 0.00010856231599607458, + "loss": 0.0905, + "step": 13510 + }, + { + "epoch": 19.43, + "learning_rate": 0.0001084151128557409, + "loss": 0.0656, + "step": 13520 + }, + { + "epoch": 19.44, + "learning_rate": 0.00010826790971540726, + "loss": 0.0834, + "step": 13530 + }, + { + "epoch": 19.45, + "learning_rate": 0.00010812070657507358, + "loss": 0.0769, + "step": 13540 + }, + { + "epoch": 19.47, + "learning_rate": 0.00010797350343473995, + "loss": 0.0981, + "step": 13550 + }, + { + "epoch": 19.48, + "learning_rate": 0.00010782630029440627, + "loss": 0.1006, + "step": 13560 + }, + { + "epoch": 19.5, + "learning_rate": 0.00010767909715407263, + "loss": 0.0693, + "step": 13570 + }, + { + "epoch": 19.51, + "learning_rate": 0.00010753189401373895, + "loss": 0.0747, + "step": 13580 + }, + { + "epoch": 19.53, + "learning_rate": 0.00010738469087340528, + "loss": 0.077, + "step": 13590 + }, + { + "epoch": 19.54, + "learning_rate": 0.00010723748773307163, + "loss": 0.0735, + "step": 13600 + }, + { + "epoch": 19.54, + "eval_loss": 0.16026227176189423, + "eval_runtime": 39.8849, + "eval_samples_per_second": 11.458, + "eval_steps_per_second": 1.454, + "eval_wer": 0.1675952416804698, + "step": 13600 + }, + { + "epoch": 19.55, + "learning_rate": 0.00010709028459273796, + "loss": 0.1046, + "step": 13610 + }, + { + "epoch": 19.57, + "learning_rate": 0.0001069430814524043, + "loss": 0.0685, + "step": 13620 + }, + { + "epoch": 19.58, + "learning_rate": 0.00010679587831207064, + "loss": 0.0856, + "step": 13630 + }, + { + "epoch": 19.6, + "learning_rate": 0.00010664867517173699, + "loss": 0.0621, + "step": 13640 + }, + { + "epoch": 19.61, + "learning_rate": 0.00010650147203140332, + "loss": 0.0743, + "step": 13650 + }, + { + "epoch": 19.63, + "learning_rate": 0.00010635426889106967, + "loss": 0.0899, + "step": 13660 + }, + { + "epoch": 19.64, + "learning_rate": 0.000106207065750736, + "loss": 0.0761, + "step": 13670 + }, + { + "epoch": 19.66, + "learning_rate": 0.00010605986261040235, + "loss": 0.0887, + "step": 13680 + }, + { + "epoch": 19.67, + "learning_rate": 0.00010591265947006868, + "loss": 0.082, + "step": 13690 + }, + { + "epoch": 19.68, + "learning_rate": 0.00010576545632973503, + "loss": 0.0804, + "step": 13700 + }, + { + "epoch": 19.68, + "eval_loss": 0.16200566291809082, + "eval_runtime": 40.0981, + "eval_samples_per_second": 11.397, + "eval_steps_per_second": 1.446, + "eval_wer": 0.17060683631983134, + "step": 13700 + }, + { + "epoch": 19.7, + "learning_rate": 0.00010561825318940136, + "loss": 0.08, + "step": 13710 + }, + { + "epoch": 19.71, + "learning_rate": 0.00010547105004906771, + "loss": 0.0683, + "step": 13720 + }, + { + "epoch": 19.73, + "learning_rate": 0.00010532384690873404, + "loss": 0.0769, + "step": 13730 + }, + { + "epoch": 19.74, + "learning_rate": 0.00010517664376840037, + "loss": 0.0768, + "step": 13740 + }, + { + "epoch": 19.76, + "learning_rate": 0.00010502944062806672, + "loss": 0.0666, + "step": 13750 + }, + { + "epoch": 19.77, + "learning_rate": 0.00010488223748773305, + "loss": 0.0676, + "step": 13760 + }, + { + "epoch": 19.78, + "learning_rate": 0.0001047350343473994, + "loss": 0.0745, + "step": 13770 + }, + { + "epoch": 19.8, + "learning_rate": 0.00010458783120706574, + "loss": 0.0802, + "step": 13780 + }, + { + "epoch": 19.81, + "learning_rate": 0.00010444062806673208, + "loss": 0.0733, + "step": 13790 + }, + { + "epoch": 19.83, + "learning_rate": 0.00010429342492639842, + "loss": 0.0871, + "step": 13800 + }, + { + "epoch": 19.83, + "eval_loss": 0.1567193865776062, + "eval_runtime": 39.8991, + "eval_samples_per_second": 11.454, + "eval_steps_per_second": 1.454, + "eval_wer": 0.1644330673091402, + "step": 13800 + }, + { + "epoch": 19.84, + "learning_rate": 0.00010414622178606476, + "loss": 0.0767, + "step": 13810 + }, + { + "epoch": 19.86, + "learning_rate": 0.0001039990186457311, + "loss": 0.0782, + "step": 13820 + }, + { + "epoch": 19.87, + "learning_rate": 0.00010385181550539744, + "loss": 0.077, + "step": 13830 + }, + { + "epoch": 19.89, + "learning_rate": 0.00010370461236506378, + "loss": 0.0592, + "step": 13840 + }, + { + "epoch": 19.9, + "learning_rate": 0.00010355740922473012, + "loss": 0.0768, + "step": 13850 + }, + { + "epoch": 19.91, + "learning_rate": 0.00010341020608439646, + "loss": 0.0797, + "step": 13860 + }, + { + "epoch": 19.93, + "learning_rate": 0.0001032630029440628, + "loss": 0.0721, + "step": 13870 + }, + { + "epoch": 19.94, + "learning_rate": 0.00010311579980372914, + "loss": 0.0699, + "step": 13880 + }, + { + "epoch": 19.96, + "learning_rate": 0.00010296859666339547, + "loss": 0.0656, + "step": 13890 + }, + { + "epoch": 19.97, + "learning_rate": 0.00010282139352306182, + "loss": 0.0822, + "step": 13900 + }, + { + "epoch": 19.97, + "eval_loss": 0.1556914746761322, + "eval_runtime": 40.153, + "eval_samples_per_second": 11.381, + "eval_steps_per_second": 1.444, + "eval_wer": 0.16578828489685288, + "step": 13900 + }, + { + "epoch": 19.99, + "learning_rate": 0.00010267419038272815, + "loss": 0.0944, + "step": 13910 + }, + { + "epoch": 20.0, + "learning_rate": 0.0001025269872423945, + "loss": 0.0612, + "step": 13920 + }, + { + "epoch": 20.01, + "learning_rate": 0.00010237978410206083, + "loss": 0.082, + "step": 13930 + }, + { + "epoch": 20.03, + "learning_rate": 0.00010224730127576054, + "loss": 0.0691, + "step": 13940 + }, + { + "epoch": 20.04, + "learning_rate": 0.00010210009813542687, + "loss": 0.068, + "step": 13950 + }, + { + "epoch": 20.06, + "learning_rate": 0.00010195289499509322, + "loss": 0.0663, + "step": 13960 + }, + { + "epoch": 20.07, + "learning_rate": 0.00010180569185475955, + "loss": 0.0654, + "step": 13970 + }, + { + "epoch": 20.09, + "learning_rate": 0.0001016584887144259, + "loss": 0.091, + "step": 13980 + }, + { + "epoch": 20.1, + "learning_rate": 0.00010151128557409223, + "loss": 0.075, + "step": 13990 + }, + { + "epoch": 20.11, + "learning_rate": 0.00010136408243375858, + "loss": 0.0784, + "step": 14000 + }, + { + "epoch": 20.11, + "eval_loss": 0.16241466999053955, + "eval_runtime": 39.9865, + "eval_samples_per_second": 11.429, + "eval_steps_per_second": 1.45, + "eval_wer": 0.16187321186568288, + "step": 14000 + }, + { + "epoch": 20.13, + "learning_rate": 0.00010121687929342491, + "loss": 0.0876, + "step": 14010 + }, + { + "epoch": 20.14, + "learning_rate": 0.00010106967615309126, + "loss": 0.0809, + "step": 14020 + }, + { + "epoch": 20.16, + "learning_rate": 0.00010092247301275759, + "loss": 0.0855, + "step": 14030 + }, + { + "epoch": 20.17, + "learning_rate": 0.00010077526987242394, + "loss": 0.0702, + "step": 14040 + }, + { + "epoch": 20.19, + "learning_rate": 0.00010062806673209027, + "loss": 0.0846, + "step": 14050 + }, + { + "epoch": 20.2, + "learning_rate": 0.00010048086359175662, + "loss": 0.0724, + "step": 14060 + }, + { + "epoch": 20.22, + "learning_rate": 0.00010033366045142295, + "loss": 0.0664, + "step": 14070 + }, + { + "epoch": 20.23, + "learning_rate": 0.0001001864573110893, + "loss": 0.0825, + "step": 14080 + }, + { + "epoch": 20.24, + "learning_rate": 0.00010003925417075563, + "loss": 0.0651, + "step": 14090 + }, + { + "epoch": 20.26, + "learning_rate": 9.989205103042197e-05, + "loss": 0.0822, + "step": 14100 + }, + { + "epoch": 20.26, + "eval_loss": 0.16037575900554657, + "eval_runtime": 39.914, + "eval_samples_per_second": 11.45, + "eval_steps_per_second": 1.453, + "eval_wer": 0.1617226321337148, + "step": 14100 + }, + { + "epoch": 20.27, + "learning_rate": 9.974484789008831e-05, + "loss": 0.0743, + "step": 14110 + }, + { + "epoch": 20.29, + "learning_rate": 9.959764474975465e-05, + "loss": 0.0709, + "step": 14120 + }, + { + "epoch": 20.3, + "learning_rate": 9.945044160942099e-05, + "loss": 0.068, + "step": 14130 + }, + { + "epoch": 20.32, + "learning_rate": 9.930323846908733e-05, + "loss": 0.067, + "step": 14140 + }, + { + "epoch": 20.33, + "learning_rate": 9.915603532875367e-05, + "loss": 0.0749, + "step": 14150 + }, + { + "epoch": 20.34, + "learning_rate": 9.900883218842e-05, + "loss": 0.0676, + "step": 14160 + }, + { + "epoch": 20.36, + "learning_rate": 9.886162904808635e-05, + "loss": 0.0652, + "step": 14170 + }, + { + "epoch": 20.37, + "learning_rate": 9.871442590775269e-05, + "loss": 0.0841, + "step": 14180 + }, + { + "epoch": 20.39, + "learning_rate": 9.856722276741903e-05, + "loss": 0.0779, + "step": 14190 + }, + { + "epoch": 20.4, + "learning_rate": 9.842001962708537e-05, + "loss": 0.0694, + "step": 14200 + }, + { + "epoch": 20.4, + "eval_loss": 0.14927269518375397, + "eval_runtime": 40.1956, + "eval_samples_per_second": 11.369, + "eval_steps_per_second": 1.443, + "eval_wer": 0.16142147266977866, + "step": 14200 + }, + { + "epoch": 20.42, + "learning_rate": 9.827281648675171e-05, + "loss": 0.0796, + "step": 14210 + }, + { + "epoch": 20.43, + "learning_rate": 9.812561334641805e-05, + "loss": 0.0779, + "step": 14220 + }, + { + "epoch": 20.45, + "learning_rate": 9.79784102060844e-05, + "loss": 0.0788, + "step": 14230 + }, + { + "epoch": 20.46, + "learning_rate": 9.783120706575073e-05, + "loss": 0.0567, + "step": 14240 + }, + { + "epoch": 20.47, + "learning_rate": 9.768400392541706e-05, + "loss": 0.0715, + "step": 14250 + }, + { + "epoch": 20.49, + "learning_rate": 9.753680078508341e-05, + "loss": 0.0744, + "step": 14260 + }, + { + "epoch": 20.5, + "learning_rate": 9.738959764474974e-05, + "loss": 0.0641, + "step": 14270 + }, + { + "epoch": 20.52, + "learning_rate": 9.724239450441609e-05, + "loss": 0.0776, + "step": 14280 + }, + { + "epoch": 20.53, + "learning_rate": 9.709519136408242e-05, + "loss": 0.0637, + "step": 14290 + }, + { + "epoch": 20.55, + "learning_rate": 9.694798822374877e-05, + "loss": 0.0775, + "step": 14300 + }, + { + "epoch": 20.55, + "eval_loss": 0.1541454941034317, + "eval_runtime": 39.9553, + "eval_samples_per_second": 11.438, + "eval_steps_per_second": 1.452, + "eval_wer": 0.16081915374190633, + "step": 14300 + }, + { + "epoch": 20.56, + "learning_rate": 9.68007850834151e-05, + "loss": 0.0805, + "step": 14310 + }, + { + "epoch": 20.57, + "learning_rate": 9.665358194308145e-05, + "loss": 0.0722, + "step": 14320 + }, + { + "epoch": 20.59, + "learning_rate": 9.650637880274778e-05, + "loss": 0.0682, + "step": 14330 + }, + { + "epoch": 20.6, + "learning_rate": 9.635917566241413e-05, + "loss": 0.0724, + "step": 14340 + }, + { + "epoch": 20.62, + "learning_rate": 9.621197252208046e-05, + "loss": 0.0834, + "step": 14350 + }, + { + "epoch": 20.63, + "learning_rate": 9.606476938174681e-05, + "loss": 0.0795, + "step": 14360 + }, + { + "epoch": 20.65, + "learning_rate": 9.591756624141314e-05, + "loss": 0.0874, + "step": 14370 + }, + { + "epoch": 20.66, + "learning_rate": 9.577036310107949e-05, + "loss": 0.0689, + "step": 14380 + }, + { + "epoch": 20.68, + "learning_rate": 9.562315996074582e-05, + "loss": 0.0669, + "step": 14390 + }, + { + "epoch": 20.69, + "learning_rate": 9.547595682041216e-05, + "loss": 0.0747, + "step": 14400 + }, + { + "epoch": 20.69, + "eval_loss": 0.15958380699157715, + "eval_runtime": 40.1805, + "eval_samples_per_second": 11.374, + "eval_steps_per_second": 1.443, + "eval_wer": 0.1624755307935552, + "step": 14400 + }, + { + "epoch": 20.7, + "learning_rate": 9.53287536800785e-05, + "loss": 0.0737, + "step": 14410 + }, + { + "epoch": 20.72, + "learning_rate": 9.518155053974484e-05, + "loss": 0.0717, + "step": 14420 + }, + { + "epoch": 20.73, + "learning_rate": 9.503434739941118e-05, + "loss": 0.0923, + "step": 14430 + }, + { + "epoch": 20.75, + "learning_rate": 9.488714425907752e-05, + "loss": 0.0623, + "step": 14440 + }, + { + "epoch": 20.76, + "learning_rate": 9.473994111874386e-05, + "loss": 0.0658, + "step": 14450 + }, + { + "epoch": 20.78, + "learning_rate": 9.45927379784102e-05, + "loss": 0.0658, + "step": 14460 + }, + { + "epoch": 20.79, + "learning_rate": 9.444553483807654e-05, + "loss": 0.068, + "step": 14470 + }, + { + "epoch": 20.8, + "learning_rate": 9.429833169774288e-05, + "loss": 0.0697, + "step": 14480 + }, + { + "epoch": 20.82, + "learning_rate": 9.415112855740923e-05, + "loss": 0.0618, + "step": 14490 + }, + { + "epoch": 20.83, + "learning_rate": 9.400392541707556e-05, + "loss": 0.0701, + "step": 14500 + }, + { + "epoch": 20.83, + "eval_loss": 0.15933384001255035, + "eval_runtime": 40.0625, + "eval_samples_per_second": 11.407, + "eval_steps_per_second": 1.448, + "eval_wer": 0.16081915374190633, + "step": 14500 + }, + { + "epoch": 20.85, + "learning_rate": 9.38567222767419e-05, + "loss": 0.0737, + "step": 14510 + }, + { + "epoch": 20.86, + "learning_rate": 9.370951913640824e-05, + "loss": 0.0772, + "step": 14520 + }, + { + "epoch": 20.88, + "learning_rate": 9.356231599607459e-05, + "loss": 0.0846, + "step": 14530 + }, + { + "epoch": 20.89, + "learning_rate": 9.341511285574092e-05, + "loss": 0.0514, + "step": 14540 + }, + { + "epoch": 20.91, + "learning_rate": 9.326790971540725e-05, + "loss": 0.0853, + "step": 14550 + }, + { + "epoch": 20.92, + "learning_rate": 9.31207065750736e-05, + "loss": 0.0715, + "step": 14560 + }, + { + "epoch": 20.93, + "learning_rate": 9.297350343473993e-05, + "loss": 0.0635, + "step": 14570 + }, + { + "epoch": 20.95, + "learning_rate": 9.282630029440628e-05, + "loss": 0.0978, + "step": 14580 + }, + { + "epoch": 20.96, + "learning_rate": 9.267909715407261e-05, + "loss": 0.0803, + "step": 14590 + }, + { + "epoch": 20.98, + "learning_rate": 9.253189401373896e-05, + "loss": 0.0698, + "step": 14600 + }, + { + "epoch": 20.98, + "eval_loss": 0.15506555140018463, + "eval_runtime": 40.1892, + "eval_samples_per_second": 11.371, + "eval_steps_per_second": 1.443, + "eval_wer": 0.16081915374190633, + "step": 14600 + }, + { + "epoch": 20.99, + "learning_rate": 9.23846908734053e-05, + "loss": 0.0791, + "step": 14610 + }, + { + "epoch": 21.01, + "learning_rate": 9.223748773307164e-05, + "loss": 0.0568, + "step": 14620 + }, + { + "epoch": 21.02, + "learning_rate": 9.209028459273797e-05, + "loss": 0.0696, + "step": 14630 + }, + { + "epoch": 21.03, + "learning_rate": 9.194308145240432e-05, + "loss": 0.082, + "step": 14640 + }, + { + "epoch": 21.05, + "learning_rate": 9.179587831207065e-05, + "loss": 0.0648, + "step": 14650 + }, + { + "epoch": 21.06, + "learning_rate": 9.1648675171737e-05, + "loss": 0.056, + "step": 14660 + }, + { + "epoch": 21.08, + "learning_rate": 9.150147203140332e-05, + "loss": 0.0694, + "step": 14670 + }, + { + "epoch": 21.09, + "learning_rate": 9.135426889106968e-05, + "loss": 0.0662, + "step": 14680 + }, + { + "epoch": 21.11, + "learning_rate": 9.1207065750736e-05, + "loss": 0.0671, + "step": 14690 + }, + { + "epoch": 21.12, + "learning_rate": 9.105986261040233e-05, + "loss": 0.0785, + "step": 14700 + }, + { + "epoch": 21.12, + "eval_loss": 0.15715524554252625, + "eval_runtime": 40.3412, + "eval_samples_per_second": 11.328, + "eval_steps_per_second": 1.438, + "eval_wer": 0.1636801686492998, + "step": 14700 + }, + { + "epoch": 21.14, + "learning_rate": 9.091265947006868e-05, + "loss": 0.0661, + "step": 14710 + }, + { + "epoch": 21.15, + "learning_rate": 9.076545632973502e-05, + "loss": 0.0702, + "step": 14720 + }, + { + "epoch": 21.16, + "learning_rate": 9.061825318940136e-05, + "loss": 0.0671, + "step": 14730 + }, + { + "epoch": 21.18, + "learning_rate": 9.04710500490677e-05, + "loss": 0.0707, + "step": 14740 + }, + { + "epoch": 21.19, + "learning_rate": 9.032384690873404e-05, + "loss": 0.0559, + "step": 14750 + }, + { + "epoch": 21.21, + "learning_rate": 9.017664376840038e-05, + "loss": 0.068, + "step": 14760 + }, + { + "epoch": 21.22, + "learning_rate": 9.002944062806672e-05, + "loss": 0.0817, + "step": 14770 + }, + { + "epoch": 21.24, + "learning_rate": 8.988223748773306e-05, + "loss": 0.0792, + "step": 14780 + }, + { + "epoch": 21.25, + "learning_rate": 8.97350343473994e-05, + "loss": 0.054, + "step": 14790 + }, + { + "epoch": 21.26, + "learning_rate": 8.958783120706574e-05, + "loss": 0.0975, + "step": 14800 + }, + { + "epoch": 21.26, + "eval_loss": 0.16008907556533813, + "eval_runtime": 40.1457, + "eval_samples_per_second": 11.384, + "eval_steps_per_second": 1.445, + "eval_wer": 0.16322842945339558, + "step": 14800 + }, + { + "epoch": 21.28, + "learning_rate": 8.944062806673208e-05, + "loss": 0.0653, + "step": 14810 + }, + { + "epoch": 21.29, + "learning_rate": 8.929342492639842e-05, + "loss": 0.0675, + "step": 14820 + }, + { + "epoch": 21.31, + "learning_rate": 8.914622178606476e-05, + "loss": 0.0676, + "step": 14830 + }, + { + "epoch": 21.32, + "learning_rate": 8.89990186457311e-05, + "loss": 0.0631, + "step": 14840 + }, + { + "epoch": 21.34, + "learning_rate": 8.885181550539743e-05, + "loss": 0.0625, + "step": 14850 + }, + { + "epoch": 21.35, + "learning_rate": 8.870461236506378e-05, + "loss": 0.071, + "step": 14860 + }, + { + "epoch": 21.36, + "learning_rate": 8.855740922473011e-05, + "loss": 0.0684, + "step": 14870 + }, + { + "epoch": 21.38, + "learning_rate": 8.841020608439646e-05, + "loss": 0.0656, + "step": 14880 + }, + { + "epoch": 21.39, + "learning_rate": 8.826300294406279e-05, + "loss": 0.0609, + "step": 14890 + }, + { + "epoch": 21.41, + "learning_rate": 8.811579980372914e-05, + "loss": 0.0697, + "step": 14900 + }, + { + "epoch": 21.41, + "eval_loss": 0.15438880026340485, + "eval_runtime": 40.0849, + "eval_samples_per_second": 11.401, + "eval_steps_per_second": 1.447, + "eval_wer": 0.15931335642222558, + "step": 14900 + }, + { + "epoch": 21.42, + "learning_rate": 8.796859666339547e-05, + "loss": 0.0698, + "step": 14910 + }, + { + "epoch": 21.44, + "learning_rate": 8.782139352306182e-05, + "loss": 0.0645, + "step": 14920 + }, + { + "epoch": 21.45, + "learning_rate": 8.767419038272815e-05, + "loss": 0.0664, + "step": 14930 + }, + { + "epoch": 21.47, + "learning_rate": 8.75269872423945e-05, + "loss": 0.0682, + "step": 14940 + }, + { + "epoch": 21.48, + "learning_rate": 8.737978410206083e-05, + "loss": 0.0693, + "step": 14950 + }, + { + "epoch": 21.49, + "learning_rate": 8.723258096172718e-05, + "loss": 0.0717, + "step": 14960 + }, + { + "epoch": 21.51, + "learning_rate": 8.708537782139351e-05, + "loss": 0.0818, + "step": 14970 + }, + { + "epoch": 21.52, + "learning_rate": 8.693817468105985e-05, + "loss": 0.0579, + "step": 14980 + }, + { + "epoch": 21.54, + "learning_rate": 8.679097154072619e-05, + "loss": 0.0598, + "step": 14990 + }, + { + "epoch": 21.55, + "learning_rate": 8.664376840039253e-05, + "loss": 0.0638, + "step": 15000 + }, + { + "epoch": 21.55, + "eval_loss": 0.14896854758262634, + "eval_runtime": 40.2901, + "eval_samples_per_second": 11.343, + "eval_steps_per_second": 1.44, + "eval_wer": 0.1572052401746725, + "step": 15000 + }, + { + "epoch": 21.57, + "learning_rate": 8.649656526005887e-05, + "loss": 0.07, + "step": 15010 + }, + { + "epoch": 21.58, + "learning_rate": 8.63493621197252e-05, + "loss": 0.0689, + "step": 15020 + }, + { + "epoch": 21.59, + "learning_rate": 8.620215897939155e-05, + "loss": 0.064, + "step": 15030 + }, + { + "epoch": 21.61, + "learning_rate": 8.605495583905789e-05, + "loss": 0.0582, + "step": 15040 + }, + { + "epoch": 21.62, + "learning_rate": 8.590775269872423e-05, + "loss": 0.0626, + "step": 15050 + }, + { + "epoch": 21.64, + "learning_rate": 8.576054955839057e-05, + "loss": 0.0564, + "step": 15060 + }, + { + "epoch": 21.65, + "learning_rate": 8.561334641805691e-05, + "loss": 0.0642, + "step": 15070 + }, + { + "epoch": 21.67, + "learning_rate": 8.546614327772325e-05, + "loss": 0.056, + "step": 15080 + }, + { + "epoch": 21.68, + "learning_rate": 8.53189401373896e-05, + "loss": 0.064, + "step": 15090 + }, + { + "epoch": 21.7, + "learning_rate": 8.517173699705593e-05, + "loss": 0.0665, + "step": 15100 + }, + { + "epoch": 21.7, + "eval_loss": 0.15601423382759094, + "eval_runtime": 40.1857, + "eval_samples_per_second": 11.372, + "eval_steps_per_second": 1.443, + "eval_wer": 0.1558500225869598, + "step": 15100 + }, + { + "epoch": 21.71, + "learning_rate": 8.502453385672227e-05, + "loss": 0.0687, + "step": 15110 + }, + { + "epoch": 21.72, + "learning_rate": 8.487733071638861e-05, + "loss": 0.0617, + "step": 15120 + }, + { + "epoch": 21.74, + "learning_rate": 8.473012757605494e-05, + "loss": 0.0851, + "step": 15130 + }, + { + "epoch": 21.75, + "learning_rate": 8.458292443572129e-05, + "loss": 0.0644, + "step": 15140 + }, + { + "epoch": 21.77, + "learning_rate": 8.443572129538762e-05, + "loss": 0.073, + "step": 15150 + }, + { + "epoch": 21.78, + "learning_rate": 8.428851815505397e-05, + "loss": 0.0676, + "step": 15160 + }, + { + "epoch": 21.8, + "learning_rate": 8.41413150147203e-05, + "loss": 0.0772, + "step": 15170 + }, + { + "epoch": 21.81, + "learning_rate": 8.399411187438665e-05, + "loss": 0.0654, + "step": 15180 + }, + { + "epoch": 21.82, + "learning_rate": 8.384690873405298e-05, + "loss": 0.0832, + "step": 15190 + }, + { + "epoch": 21.84, + "learning_rate": 8.369970559371933e-05, + "loss": 0.0764, + "step": 15200 + }, + { + "epoch": 21.84, + "eval_loss": 0.15133680403232574, + "eval_runtime": 40.219, + "eval_samples_per_second": 11.363, + "eval_steps_per_second": 1.442, + "eval_wer": 0.15795813883451287, + "step": 15200 + }, + { + "epoch": 21.85, + "learning_rate": 8.355250245338566e-05, + "loss": 0.0564, + "step": 15210 + }, + { + "epoch": 21.87, + "learning_rate": 8.340529931305201e-05, + "loss": 0.0689, + "step": 15220 + }, + { + "epoch": 21.88, + "learning_rate": 8.325809617271834e-05, + "loss": 0.0747, + "step": 15230 + }, + { + "epoch": 21.9, + "learning_rate": 8.311089303238469e-05, + "loss": 0.0566, + "step": 15240 + }, + { + "epoch": 21.91, + "learning_rate": 8.296368989205102e-05, + "loss": 0.0712, + "step": 15250 + }, + { + "epoch": 21.93, + "learning_rate": 8.281648675171737e-05, + "loss": 0.0637, + "step": 15260 + }, + { + "epoch": 21.94, + "learning_rate": 8.26692836113837e-05, + "loss": 0.0638, + "step": 15270 + }, + { + "epoch": 21.95, + "learning_rate": 8.252208047105004e-05, + "loss": 0.0679, + "step": 15280 + }, + { + "epoch": 21.97, + "learning_rate": 8.237487733071638e-05, + "loss": 0.0616, + "step": 15290 + }, + { + "epoch": 21.98, + "learning_rate": 8.222767419038272e-05, + "loss": 0.0642, + "step": 15300 + }, + { + "epoch": 21.98, + "eval_loss": 0.149861678481102, + "eval_runtime": 40.2796, + "eval_samples_per_second": 11.346, + "eval_steps_per_second": 1.44, + "eval_wer": 0.1552477036590875, + "step": 15300 + }, + { + "epoch": 22.0, + "learning_rate": 8.208047105004906e-05, + "loss": 0.0694, + "step": 15310 + }, + { + "epoch": 22.01, + "learning_rate": 8.19332679097154e-05, + "loss": 0.0605, + "step": 15320 + }, + { + "epoch": 22.03, + "learning_rate": 8.178606476938174e-05, + "loss": 0.0637, + "step": 15330 + }, + { + "epoch": 22.04, + "learning_rate": 8.163886162904808e-05, + "loss": 0.0606, + "step": 15340 + }, + { + "epoch": 22.05, + "learning_rate": 8.149165848871443e-05, + "loss": 0.0583, + "step": 15350 + }, + { + "epoch": 22.07, + "learning_rate": 8.134445534838076e-05, + "loss": 0.0483, + "step": 15360 + }, + { + "epoch": 22.08, + "learning_rate": 8.11972522080471e-05, + "loss": 0.0672, + "step": 15370 + }, + { + "epoch": 22.1, + "learning_rate": 8.105004906771344e-05, + "loss": 0.0558, + "step": 15380 + }, + { + "epoch": 22.11, + "learning_rate": 8.090284592737979e-05, + "loss": 0.0598, + "step": 15390 + }, + { + "epoch": 22.13, + "learning_rate": 8.075564278704612e-05, + "loss": 0.0577, + "step": 15400 + }, + { + "epoch": 22.13, + "eval_loss": 0.15612779557704926, + "eval_runtime": 40.1084, + "eval_samples_per_second": 11.394, + "eval_steps_per_second": 1.446, + "eval_wer": 0.15871103749435325, + "step": 15400 + }, + { + "epoch": 22.14, + "learning_rate": 8.060843964671247e-05, + "loss": 0.0704, + "step": 15410 + }, + { + "epoch": 22.16, + "learning_rate": 8.04612365063788e-05, + "loss": 0.0887, + "step": 15420 + }, + { + "epoch": 22.17, + "learning_rate": 8.031403336604513e-05, + "loss": 0.0569, + "step": 15430 + }, + { + "epoch": 22.18, + "learning_rate": 8.016683022571148e-05, + "loss": 0.0672, + "step": 15440 + }, + { + "epoch": 22.2, + "learning_rate": 8.001962708537781e-05, + "loss": 0.0557, + "step": 15450 + }, + { + "epoch": 22.21, + "learning_rate": 7.987242394504416e-05, + "loss": 0.041, + "step": 15460 + }, + { + "epoch": 22.23, + "learning_rate": 7.97252208047105e-05, + "loss": 0.0759, + "step": 15470 + }, + { + "epoch": 22.24, + "learning_rate": 7.957801766437684e-05, + "loss": 0.0464, + "step": 15480 + }, + { + "epoch": 22.26, + "learning_rate": 7.943081452404317e-05, + "loss": 0.0764, + "step": 15490 + }, + { + "epoch": 22.27, + "learning_rate": 7.928361138370952e-05, + "loss": 0.0551, + "step": 15500 + }, + { + "epoch": 22.27, + "eval_loss": 0.1587643325328827, + "eval_runtime": 40.2333, + "eval_samples_per_second": 11.359, + "eval_steps_per_second": 1.442, + "eval_wer": 0.1570546604427044, + "step": 15500 + }, + { + "epoch": 22.28, + "learning_rate": 7.913640824337585e-05, + "loss": 0.0516, + "step": 15510 + }, + { + "epoch": 22.3, + "learning_rate": 7.89892051030422e-05, + "loss": 0.0619, + "step": 15520 + }, + { + "epoch": 22.31, + "learning_rate": 7.884200196270853e-05, + "loss": 0.0618, + "step": 15530 + }, + { + "epoch": 22.33, + "learning_rate": 7.869479882237488e-05, + "loss": 0.0654, + "step": 15540 + }, + { + "epoch": 22.34, + "learning_rate": 7.854759568204122e-05, + "loss": 0.0652, + "step": 15550 + }, + { + "epoch": 22.36, + "learning_rate": 7.840039254170756e-05, + "loss": 0.0614, + "step": 15560 + }, + { + "epoch": 22.37, + "learning_rate": 7.82531894013739e-05, + "loss": 0.0753, + "step": 15570 + }, + { + "epoch": 22.39, + "learning_rate": 7.810598626104022e-05, + "loss": 0.0618, + "step": 15580 + }, + { + "epoch": 22.4, + "learning_rate": 7.795878312070658e-05, + "loss": 0.0634, + "step": 15590 + }, + { + "epoch": 22.41, + "learning_rate": 7.78115799803729e-05, + "loss": 0.0707, + "step": 15600 + }, + { + "epoch": 22.41, + "eval_loss": 0.1521938592195511, + "eval_runtime": 40.3124, + "eval_samples_per_second": 11.336, + "eval_steps_per_second": 1.439, + "eval_wer": 0.15810871856648095, + "step": 15600 + }, + { + "epoch": 22.43, + "learning_rate": 7.766437684003926e-05, + "loss": 0.0505, + "step": 15610 + }, + { + "epoch": 22.44, + "learning_rate": 7.751717369970558e-05, + "loss": 0.0701, + "step": 15620 + }, + { + "epoch": 22.46, + "learning_rate": 7.736997055937194e-05, + "loss": 0.058, + "step": 15630 + }, + { + "epoch": 22.47, + "learning_rate": 7.722276741903826e-05, + "loss": 0.0668, + "step": 15640 + }, + { + "epoch": 22.49, + "learning_rate": 7.707556427870462e-05, + "loss": 0.0538, + "step": 15650 + }, + { + "epoch": 22.5, + "learning_rate": 7.692836113837094e-05, + "loss": 0.0613, + "step": 15660 + }, + { + "epoch": 22.51, + "learning_rate": 7.67811579980373e-05, + "loss": 0.0562, + "step": 15670 + }, + { + "epoch": 22.53, + "learning_rate": 7.663395485770362e-05, + "loss": 0.0581, + "step": 15680 + }, + { + "epoch": 22.54, + "learning_rate": 7.648675171736998e-05, + "loss": 0.0557, + "step": 15690 + }, + { + "epoch": 22.56, + "learning_rate": 7.63395485770363e-05, + "loss": 0.076, + "step": 15700 + }, + { + "epoch": 22.56, + "eval_loss": 0.14777785539627075, + "eval_runtime": 40.7818, + "eval_samples_per_second": 11.206, + "eval_steps_per_second": 1.422, + "eval_wer": 0.1596145158861617, + "step": 15700 + }, + { + "epoch": 22.57, + "learning_rate": 7.619234543670264e-05, + "loss": 0.0626, + "step": 15710 + }, + { + "epoch": 22.59, + "learning_rate": 7.604514229636898e-05, + "loss": 0.069, + "step": 15720 + }, + { + "epoch": 22.6, + "learning_rate": 7.589793915603531e-05, + "loss": 0.0668, + "step": 15730 + }, + { + "epoch": 22.61, + "learning_rate": 7.575073601570166e-05, + "loss": 0.0886, + "step": 15740 + }, + { + "epoch": 22.63, + "learning_rate": 7.560353287536799e-05, + "loss": 0.0619, + "step": 15750 + }, + { + "epoch": 22.64, + "learning_rate": 7.547105004906771e-05, + "loss": 0.0481, + "step": 15760 + }, + { + "epoch": 22.66, + "learning_rate": 7.532384690873406e-05, + "loss": 0.0674, + "step": 15770 + }, + { + "epoch": 22.67, + "learning_rate": 7.517664376840039e-05, + "loss": 0.073, + "step": 15780 + }, + { + "epoch": 22.69, + "learning_rate": 7.502944062806674e-05, + "loss": 0.057, + "step": 15790 + }, + { + "epoch": 22.7, + "learning_rate": 7.488223748773307e-05, + "loss": 0.0802, + "step": 15800 + }, + { + "epoch": 22.7, + "eval_loss": 0.1453210413455963, + "eval_runtime": 40.4045, + "eval_samples_per_second": 11.311, + "eval_steps_per_second": 1.435, + "eval_wer": 0.15464538473121517, + "step": 15800 + }, + { + "epoch": 22.72, + "learning_rate": 7.47350343473994e-05, + "loss": 0.063, + "step": 15810 + }, + { + "epoch": 22.73, + "learning_rate": 7.458783120706575e-05, + "loss": 0.0889, + "step": 15820 + }, + { + "epoch": 22.74, + "learning_rate": 7.444062806673208e-05, + "loss": 0.0682, + "step": 15830 + }, + { + "epoch": 22.76, + "learning_rate": 7.429342492639843e-05, + "loss": 0.0548, + "step": 15840 + }, + { + "epoch": 22.77, + "learning_rate": 7.414622178606477e-05, + "loss": 0.0677, + "step": 15850 + }, + { + "epoch": 22.79, + "learning_rate": 7.399901864573111e-05, + "loss": 0.0705, + "step": 15860 + }, + { + "epoch": 22.8, + "learning_rate": 7.385181550539743e-05, + "loss": 0.0634, + "step": 15870 + }, + { + "epoch": 22.82, + "learning_rate": 7.370461236506378e-05, + "loss": 0.0574, + "step": 15880 + }, + { + "epoch": 22.83, + "learning_rate": 7.355740922473011e-05, + "loss": 0.0654, + "step": 15890 + }, + { + "epoch": 22.84, + "learning_rate": 7.341020608439646e-05, + "loss": 0.0593, + "step": 15900 + }, + { + "epoch": 22.84, + "eval_loss": 0.14600467681884766, + "eval_runtime": 40.4483, + "eval_samples_per_second": 11.298, + "eval_steps_per_second": 1.434, + "eval_wer": 0.1552477036590875, + "step": 15900 + }, + { + "epoch": 22.86, + "learning_rate": 7.326300294406279e-05, + "loss": 0.0698, + "step": 15910 + }, + { + "epoch": 22.87, + "learning_rate": 7.311579980372914e-05, + "loss": 0.0741, + "step": 15920 + }, + { + "epoch": 22.89, + "learning_rate": 7.296859666339547e-05, + "loss": 0.0498, + "step": 15930 + }, + { + "epoch": 22.9, + "learning_rate": 7.282139352306182e-05, + "loss": 0.0633, + "step": 15940 + }, + { + "epoch": 22.92, + "learning_rate": 7.267419038272815e-05, + "loss": 0.0705, + "step": 15950 + }, + { + "epoch": 22.93, + "learning_rate": 7.25269872423945e-05, + "loss": 0.0648, + "step": 15960 + }, + { + "epoch": 22.95, + "learning_rate": 7.237978410206083e-05, + "loss": 0.0609, + "step": 15970 + }, + { + "epoch": 22.96, + "learning_rate": 7.223258096172718e-05, + "loss": 0.06, + "step": 15980 + }, + { + "epoch": 22.97, + "learning_rate": 7.208537782139351e-05, + "loss": 0.0535, + "step": 15990 + }, + { + "epoch": 22.99, + "learning_rate": 7.193817468105986e-05, + "loss": 0.0609, + "step": 16000 + }, + { + "epoch": 22.99, + "eval_loss": 0.14838065207004547, + "eval_runtime": 40.4523, + "eval_samples_per_second": 11.297, + "eval_steps_per_second": 1.434, + "eval_wer": 0.15675350097876825, + "step": 16000 + }, + { + "epoch": 23.0, + "learning_rate": 7.17909715407262e-05, + "loss": 0.0718, + "step": 16010 + }, + { + "epoch": 23.02, + "learning_rate": 7.164376840039253e-05, + "loss": 0.061, + "step": 16020 + }, + { + "epoch": 23.03, + "learning_rate": 7.149656526005887e-05, + "loss": 0.0591, + "step": 16030 + }, + { + "epoch": 23.05, + "learning_rate": 7.134936211972521e-05, + "loss": 0.0588, + "step": 16040 + }, + { + "epoch": 23.06, + "learning_rate": 7.120215897939155e-05, + "loss": 0.0599, + "step": 16050 + }, + { + "epoch": 23.07, + "learning_rate": 7.105495583905789e-05, + "loss": 0.0639, + "step": 16060 + }, + { + "epoch": 23.09, + "learning_rate": 7.090775269872424e-05, + "loss": 0.0617, + "step": 16070 + }, + { + "epoch": 23.1, + "learning_rate": 7.076054955839057e-05, + "loss": 0.0563, + "step": 16080 + }, + { + "epoch": 23.12, + "learning_rate": 7.061334641805692e-05, + "loss": 0.0638, + "step": 16090 + }, + { + "epoch": 23.13, + "learning_rate": 7.046614327772325e-05, + "loss": 0.0587, + "step": 16100 + }, + { + "epoch": 23.13, + "eval_loss": 0.1451614946126938, + "eval_runtime": 40.4862, + "eval_samples_per_second": 11.288, + "eval_steps_per_second": 1.433, + "eval_wer": 0.15359132660743863, + "step": 16100 + }, + { + "epoch": 23.15, + "learning_rate": 7.03189401373896e-05, + "loss": 0.069, + "step": 16110 + }, + { + "epoch": 23.16, + "learning_rate": 7.017173699705593e-05, + "loss": 0.0651, + "step": 16120 + }, + { + "epoch": 23.18, + "learning_rate": 7.002453385672228e-05, + "loss": 0.0551, + "step": 16130 + }, + { + "epoch": 23.19, + "learning_rate": 6.987733071638861e-05, + "loss": 0.064, + "step": 16140 + }, + { + "epoch": 23.2, + "learning_rate": 6.973012757605496e-05, + "loss": 0.0604, + "step": 16150 + }, + { + "epoch": 23.22, + "learning_rate": 6.958292443572129e-05, + "loss": 0.0697, + "step": 16160 + }, + { + "epoch": 23.23, + "learning_rate": 6.943572129538762e-05, + "loss": 0.0564, + "step": 16170 + }, + { + "epoch": 23.25, + "learning_rate": 6.928851815505397e-05, + "loss": 0.0583, + "step": 16180 + }, + { + "epoch": 23.26, + "learning_rate": 6.91413150147203e-05, + "loss": 0.0566, + "step": 16190 + }, + { + "epoch": 23.28, + "learning_rate": 6.899411187438665e-05, + "loss": 0.0636, + "step": 16200 + }, + { + "epoch": 23.28, + "eval_loss": 0.14748641848564148, + "eval_runtime": 40.5091, + "eval_samples_per_second": 11.281, + "eval_steps_per_second": 1.432, + "eval_wer": 0.15283842794759825, + "step": 16200 + }, + { + "epoch": 23.29, + "learning_rate": 6.884690873405298e-05, + "loss": 0.0613, + "step": 16210 + }, + { + "epoch": 23.3, + "learning_rate": 6.869970559371933e-05, + "loss": 0.0664, + "step": 16220 + }, + { + "epoch": 23.32, + "learning_rate": 6.855250245338566e-05, + "loss": 0.0562, + "step": 16230 + }, + { + "epoch": 23.33, + "learning_rate": 6.840529931305201e-05, + "loss": 0.0588, + "step": 16240 + }, + { + "epoch": 23.35, + "learning_rate": 6.825809617271834e-05, + "loss": 0.0571, + "step": 16250 + }, + { + "epoch": 23.36, + "learning_rate": 6.811089303238469e-05, + "loss": 0.0562, + "step": 16260 + }, + { + "epoch": 23.38, + "learning_rate": 6.796368989205102e-05, + "loss": 0.0643, + "step": 16270 + }, + { + "epoch": 23.39, + "learning_rate": 6.781648675171737e-05, + "loss": 0.0578, + "step": 16280 + }, + { + "epoch": 23.41, + "learning_rate": 6.76692836113837e-05, + "loss": 0.0546, + "step": 16290 + }, + { + "epoch": 23.42, + "learning_rate": 6.752208047105005e-05, + "loss": 0.0506, + "step": 16300 + }, + { + "epoch": 23.42, + "eval_loss": 0.1494196057319641, + "eval_runtime": 40.2779, + "eval_samples_per_second": 11.346, + "eval_steps_per_second": 1.44, + "eval_wer": 0.15449480499924712, + "step": 16300 + }, + { + "epoch": 23.43, + "learning_rate": 6.737487733071637e-05, + "loss": 0.0556, + "step": 16310 + }, + { + "epoch": 23.45, + "learning_rate": 6.722767419038272e-05, + "loss": 0.0671, + "step": 16320 + }, + { + "epoch": 23.46, + "learning_rate": 6.708047105004905e-05, + "loss": 0.0531, + "step": 16330 + }, + { + "epoch": 23.48, + "learning_rate": 6.69332679097154e-05, + "loss": 0.0664, + "step": 16340 + }, + { + "epoch": 23.49, + "learning_rate": 6.678606476938173e-05, + "loss": 0.0583, + "step": 16350 + }, + { + "epoch": 23.51, + "learning_rate": 6.663886162904808e-05, + "loss": 0.0605, + "step": 16360 + }, + { + "epoch": 23.52, + "learning_rate": 6.649165848871441e-05, + "loss": 0.0523, + "step": 16370 + }, + { + "epoch": 23.53, + "learning_rate": 6.634445534838076e-05, + "loss": 0.0456, + "step": 16380 + }, + { + "epoch": 23.55, + "learning_rate": 6.61972522080471e-05, + "loss": 0.0773, + "step": 16390 + }, + { + "epoch": 23.56, + "learning_rate": 6.605004906771344e-05, + "loss": 0.0585, + "step": 16400 + }, + { + "epoch": 23.56, + "eval_loss": 0.15359418094158173, + "eval_runtime": 40.8191, + "eval_samples_per_second": 11.196, + "eval_steps_per_second": 1.421, + "eval_wer": 0.16021683481403404, + "step": 16400 + }, + { + "epoch": 23.58, + "learning_rate": 6.590284592737977e-05, + "loss": 0.0512, + "step": 16410 + }, + { + "epoch": 23.59, + "learning_rate": 6.575564278704612e-05, + "loss": 0.0639, + "step": 16420 + }, + { + "epoch": 23.61, + "learning_rate": 6.560843964671245e-05, + "loss": 0.0606, + "step": 16430 + }, + { + "epoch": 23.62, + "learning_rate": 6.54612365063788e-05, + "loss": 0.0591, + "step": 16440 + }, + { + "epoch": 23.64, + "learning_rate": 6.531403336604513e-05, + "loss": 0.0458, + "step": 16450 + }, + { + "epoch": 23.65, + "learning_rate": 6.516683022571147e-05, + "loss": 0.0609, + "step": 16460 + }, + { + "epoch": 23.66, + "learning_rate": 6.501962708537781e-05, + "loss": 0.0537, + "step": 16470 + }, + { + "epoch": 23.68, + "learning_rate": 6.487242394504415e-05, + "loss": 0.0546, + "step": 16480 + }, + { + "epoch": 23.69, + "learning_rate": 6.47252208047105e-05, + "loss": 0.0694, + "step": 16490 + }, + { + "epoch": 23.71, + "learning_rate": 6.457801766437683e-05, + "loss": 0.0585, + "step": 16500 + }, + { + "epoch": 23.71, + "eval_loss": 0.14631050825119019, + "eval_runtime": 40.2888, + "eval_samples_per_second": 11.343, + "eval_steps_per_second": 1.44, + "eval_wer": 0.15735581990664058, + "step": 16500 + }, + { + "epoch": 23.72, + "learning_rate": 6.443081452404318e-05, + "loss": 0.0717, + "step": 16510 + }, + { + "epoch": 23.74, + "learning_rate": 6.428361138370951e-05, + "loss": 0.0656, + "step": 16520 + }, + { + "epoch": 23.75, + "learning_rate": 6.413640824337586e-05, + "loss": 0.0461, + "step": 16530 + }, + { + "epoch": 23.76, + "learning_rate": 6.398920510304219e-05, + "loss": 0.0743, + "step": 16540 + }, + { + "epoch": 23.78, + "learning_rate": 6.384200196270854e-05, + "loss": 0.0533, + "step": 16550 + }, + { + "epoch": 23.79, + "learning_rate": 6.369479882237487e-05, + "loss": 0.0672, + "step": 16560 + }, + { + "epoch": 23.81, + "learning_rate": 6.354759568204122e-05, + "loss": 0.0631, + "step": 16570 + }, + { + "epoch": 23.82, + "learning_rate": 6.340039254170755e-05, + "loss": 0.0507, + "step": 16580 + }, + { + "epoch": 23.84, + "learning_rate": 6.32531894013739e-05, + "loss": 0.071, + "step": 16590 + }, + { + "epoch": 23.85, + "learning_rate": 6.310598626104023e-05, + "loss": 0.0546, + "step": 16600 + }, + { + "epoch": 23.85, + "eval_loss": 0.14672046899795532, + "eval_runtime": 40.2017, + "eval_samples_per_second": 11.368, + "eval_steps_per_second": 1.443, + "eval_wer": 0.1550971239271194, + "step": 16600 + }, + { + "epoch": 23.86, + "learning_rate": 6.295878312070656e-05, + "loss": 0.049, + "step": 16610 + }, + { + "epoch": 23.88, + "learning_rate": 6.281157998037291e-05, + "loss": 0.0709, + "step": 16620 + }, + { + "epoch": 23.89, + "learning_rate": 6.266437684003924e-05, + "loss": 0.0539, + "step": 16630 + }, + { + "epoch": 23.91, + "learning_rate": 6.251717369970559e-05, + "loss": 0.0669, + "step": 16640 + }, + { + "epoch": 23.92, + "learning_rate": 6.236997055937192e-05, + "loss": 0.0532, + "step": 16650 + }, + { + "epoch": 23.94, + "learning_rate": 6.222276741903827e-05, + "loss": 0.047, + "step": 16660 + }, + { + "epoch": 23.95, + "learning_rate": 6.20755642787046e-05, + "loss": 0.0563, + "step": 16670 + }, + { + "epoch": 23.97, + "learning_rate": 6.192836113837095e-05, + "loss": 0.0506, + "step": 16680 + }, + { + "epoch": 23.98, + "learning_rate": 6.178115799803728e-05, + "loss": 0.0708, + "step": 16690 + }, + { + "epoch": 23.99, + "learning_rate": 6.163395485770363e-05, + "loss": 0.0816, + "step": 16700 + }, + { + "epoch": 23.99, + "eval_loss": 0.15094982087612152, + "eval_runtime": 40.1931, + "eval_samples_per_second": 11.37, + "eval_steps_per_second": 1.443, + "eval_wer": 0.15464538473121517, + "step": 16700 + }, + { + "epoch": 24.01, + "learning_rate": 6.148675171736997e-05, + "loss": 0.0557, + "step": 16710 + }, + { + "epoch": 24.02, + "learning_rate": 6.133954857703631e-05, + "loss": 0.0544, + "step": 16720 + }, + { + "epoch": 24.04, + "learning_rate": 6.119234543670265e-05, + "loss": 0.0681, + "step": 16730 + }, + { + "epoch": 24.05, + "learning_rate": 6.104514229636899e-05, + "loss": 0.0576, + "step": 16740 + }, + { + "epoch": 24.07, + "learning_rate": 6.0897939156035326e-05, + "loss": 0.0663, + "step": 16750 + }, + { + "epoch": 24.08, + "learning_rate": 6.075073601570166e-05, + "loss": 0.0617, + "step": 16760 + }, + { + "epoch": 24.09, + "learning_rate": 6.0603532875368e-05, + "loss": 0.05, + "step": 16770 + }, + { + "epoch": 24.11, + "learning_rate": 6.045632973503434e-05, + "loss": 0.0622, + "step": 16780 + }, + { + "epoch": 24.12, + "learning_rate": 6.030912659470068e-05, + "loss": 0.0681, + "step": 16790 + }, + { + "epoch": 24.14, + "learning_rate": 6.016192345436702e-05, + "loss": 0.0556, + "step": 16800 + }, + { + "epoch": 24.14, + "eval_loss": 0.15066751837730408, + "eval_runtime": 40.0599, + "eval_samples_per_second": 11.408, + "eval_steps_per_second": 1.448, + "eval_wer": 0.15600060231892787, + "step": 16800 + }, + { + "epoch": 24.15, + "learning_rate": 6.001472031403336e-05, + "loss": 0.0585, + "step": 16810 + }, + { + "epoch": 24.17, + "learning_rate": 5.98675171736997e-05, + "loss": 0.0546, + "step": 16820 + }, + { + "epoch": 24.18, + "learning_rate": 5.972031403336604e-05, + "loss": 0.0532, + "step": 16830 + }, + { + "epoch": 24.2, + "learning_rate": 5.957311089303238e-05, + "loss": 0.0664, + "step": 16840 + }, + { + "epoch": 24.21, + "learning_rate": 5.942590775269872e-05, + "loss": 0.0492, + "step": 16850 + }, + { + "epoch": 24.22, + "learning_rate": 5.927870461236506e-05, + "loss": 0.0616, + "step": 16860 + }, + { + "epoch": 24.24, + "learning_rate": 5.91315014720314e-05, + "loss": 0.0582, + "step": 16870 + }, + { + "epoch": 24.25, + "learning_rate": 5.898429833169774e-05, + "loss": 0.0613, + "step": 16880 + }, + { + "epoch": 24.27, + "learning_rate": 5.883709519136408e-05, + "loss": 0.0545, + "step": 16890 + }, + { + "epoch": 24.28, + "learning_rate": 5.8689892051030415e-05, + "loss": 0.056, + "step": 16900 + }, + { + "epoch": 24.28, + "eval_loss": 0.15041780471801758, + "eval_runtime": 40.1424, + "eval_samples_per_second": 11.384, + "eval_steps_per_second": 1.445, + "eval_wer": 0.16051799427797017, + "step": 16900 + }, + { + "epoch": 24.3, + "learning_rate": 5.8542688910696755e-05, + "loss": 0.0638, + "step": 16910 + }, + { + "epoch": 24.31, + "learning_rate": 5.8395485770363095e-05, + "loss": 0.0512, + "step": 16920 + }, + { + "epoch": 24.32, + "learning_rate": 5.8248282630029435e-05, + "loss": 0.0619, + "step": 16930 + }, + { + "epoch": 24.34, + "learning_rate": 5.8101079489695775e-05, + "loss": 0.0641, + "step": 16940 + }, + { + "epoch": 24.35, + "learning_rate": 5.7953876349362116e-05, + "loss": 0.0507, + "step": 16950 + }, + { + "epoch": 24.37, + "learning_rate": 5.7806673209028456e-05, + "loss": 0.0543, + "step": 16960 + }, + { + "epoch": 24.38, + "learning_rate": 5.7659470068694796e-05, + "loss": 0.0493, + "step": 16970 + }, + { + "epoch": 24.4, + "learning_rate": 5.7512266928361136e-05, + "loss": 0.0567, + "step": 16980 + }, + { + "epoch": 24.41, + "learning_rate": 5.7365063788027476e-05, + "loss": 0.0776, + "step": 16990 + }, + { + "epoch": 24.43, + "learning_rate": 5.7217860647693816e-05, + "loss": 0.0621, + "step": 17000 + }, + { + "epoch": 24.43, + "eval_loss": 0.14634354412555695, + "eval_runtime": 40.0304, + "eval_samples_per_second": 11.416, + "eval_steps_per_second": 1.449, + "eval_wer": 0.15825929829844904, + "step": 17000 + }, + { + "epoch": 24.44, + "learning_rate": 5.7070657507360157e-05, + "loss": 0.0731, + "step": 17010 + }, + { + "epoch": 24.45, + "learning_rate": 5.69234543670265e-05, + "loss": 0.0588, + "step": 17020 + }, + { + "epoch": 24.47, + "learning_rate": 5.677625122669284e-05, + "loss": 0.0555, + "step": 17030 + }, + { + "epoch": 24.48, + "learning_rate": 5.662904808635918e-05, + "loss": 0.0633, + "step": 17040 + }, + { + "epoch": 24.5, + "learning_rate": 5.6481844946025504e-05, + "loss": 0.0477, + "step": 17050 + }, + { + "epoch": 24.51, + "learning_rate": 5.6334641805691844e-05, + "loss": 0.0584, + "step": 17060 + }, + { + "epoch": 24.53, + "learning_rate": 5.6187438665358184e-05, + "loss": 0.0594, + "step": 17070 + }, + { + "epoch": 24.54, + "learning_rate": 5.6040235525024524e-05, + "loss": 0.0613, + "step": 17080 + }, + { + "epoch": 24.55, + "learning_rate": 5.5893032384690864e-05, + "loss": 0.0608, + "step": 17090 + }, + { + "epoch": 24.57, + "learning_rate": 5.5745829244357205e-05, + "loss": 0.0514, + "step": 17100 + }, + { + "epoch": 24.57, + "eval_loss": 0.14699435234069824, + "eval_runtime": 40.2333, + "eval_samples_per_second": 11.359, + "eval_steps_per_second": 1.442, + "eval_wer": 0.15856045776238517, + "step": 17100 + }, + { + "epoch": 24.58, + "learning_rate": 5.5598626104023545e-05, + "loss": 0.0718, + "step": 17110 + }, + { + "epoch": 24.6, + "learning_rate": 5.5451422963689885e-05, + "loss": 0.0498, + "step": 17120 + }, + { + "epoch": 24.61, + "learning_rate": 5.5304219823356225e-05, + "loss": 0.0534, + "step": 17130 + }, + { + "epoch": 24.63, + "learning_rate": 5.5157016683022565e-05, + "loss": 0.0606, + "step": 17140 + }, + { + "epoch": 24.64, + "learning_rate": 5.5009813542688905e-05, + "loss": 0.0532, + "step": 17150 + }, + { + "epoch": 24.66, + "learning_rate": 5.4862610402355246e-05, + "loss": 0.062, + "step": 17160 + }, + { + "epoch": 24.67, + "learning_rate": 5.4715407262021586e-05, + "loss": 0.0483, + "step": 17170 + }, + { + "epoch": 24.68, + "learning_rate": 5.4568204121687926e-05, + "loss": 0.0428, + "step": 17180 + }, + { + "epoch": 24.7, + "learning_rate": 5.4421000981354266e-05, + "loss": 0.0725, + "step": 17190 + }, + { + "epoch": 24.71, + "learning_rate": 5.42737978410206e-05, + "loss": 0.0487, + "step": 17200 + }, + { + "epoch": 24.71, + "eval_loss": 0.1460464745759964, + "eval_runtime": 40.1151, + "eval_samples_per_second": 11.392, + "eval_steps_per_second": 1.446, + "eval_wer": 0.1556994428549917, + "step": 17200 + }, + { + "epoch": 24.73, + "learning_rate": 5.412659470068694e-05, + "loss": 0.0566, + "step": 17210 + }, + { + "epoch": 24.74, + "learning_rate": 5.397939156035328e-05, + "loss": 0.056, + "step": 17220 + }, + { + "epoch": 24.76, + "learning_rate": 5.383218842001962e-05, + "loss": 0.0526, + "step": 17230 + }, + { + "epoch": 24.77, + "learning_rate": 5.368498527968596e-05, + "loss": 0.0623, + "step": 17240 + }, + { + "epoch": 24.78, + "learning_rate": 5.35377821393523e-05, + "loss": 0.0532, + "step": 17250 + }, + { + "epoch": 24.8, + "learning_rate": 5.339057899901864e-05, + "loss": 0.0671, + "step": 17260 + }, + { + "epoch": 24.81, + "learning_rate": 5.324337585868498e-05, + "loss": 0.0525, + "step": 17270 + }, + { + "epoch": 24.83, + "learning_rate": 5.309617271835132e-05, + "loss": 0.0492, + "step": 17280 + }, + { + "epoch": 24.84, + "learning_rate": 5.294896957801766e-05, + "loss": 0.0518, + "step": 17290 + }, + { + "epoch": 24.86, + "learning_rate": 5.2801766437684e-05, + "loss": 0.0474, + "step": 17300 + }, + { + "epoch": 24.86, + "eval_loss": 0.1450837403535843, + "eval_runtime": 40.0465, + "eval_samples_per_second": 11.412, + "eval_steps_per_second": 1.448, + "eval_wer": 0.15238668875169403, + "step": 17300 + }, + { + "epoch": 24.87, + "learning_rate": 5.265456329735034e-05, + "loss": 0.0572, + "step": 17310 + }, + { + "epoch": 24.89, + "learning_rate": 5.250736015701668e-05, + "loss": 0.0502, + "step": 17320 + }, + { + "epoch": 24.9, + "learning_rate": 5.236015701668302e-05, + "loss": 0.0592, + "step": 17330 + }, + { + "epoch": 24.91, + "learning_rate": 5.221295387634936e-05, + "loss": 0.0609, + "step": 17340 + }, + { + "epoch": 24.93, + "learning_rate": 5.2065750736015695e-05, + "loss": 0.0617, + "step": 17350 + }, + { + "epoch": 24.94, + "learning_rate": 5.1918547595682035e-05, + "loss": 0.0525, + "step": 17360 + }, + { + "epoch": 24.96, + "learning_rate": 5.1771344455348375e-05, + "loss": 0.0649, + "step": 17370 + }, + { + "epoch": 24.97, + "learning_rate": 5.1624141315014716e-05, + "loss": 0.0487, + "step": 17380 + }, + { + "epoch": 24.99, + "learning_rate": 5.1476938174681056e-05, + "loss": 0.062, + "step": 17390 + }, + { + "epoch": 25.0, + "learning_rate": 5.1329735034347396e-05, + "loss": 0.0402, + "step": 17400 + }, + { + "epoch": 25.0, + "eval_loss": 0.14534904062747955, + "eval_runtime": 40.0375, + "eval_samples_per_second": 11.414, + "eval_steps_per_second": 1.449, + "eval_wer": 0.1513326306279175, + "step": 17400 + }, + { + "epoch": 25.01, + "learning_rate": 5.1182531894013736e-05, + "loss": 0.0566, + "step": 17410 + }, + { + "epoch": 25.03, + "learning_rate": 5.1035328753680076e-05, + "loss": 0.0545, + "step": 17420 + }, + { + "epoch": 25.04, + "learning_rate": 5.0888125613346416e-05, + "loss": 0.0524, + "step": 17430 + }, + { + "epoch": 25.06, + "learning_rate": 5.074092247301276e-05, + "loss": 0.0482, + "step": 17440 + }, + { + "epoch": 25.07, + "learning_rate": 5.05937193326791e-05, + "loss": 0.0479, + "step": 17450 + }, + { + "epoch": 25.09, + "learning_rate": 5.044651619234544e-05, + "loss": 0.0574, + "step": 17460 + }, + { + "epoch": 25.1, + "learning_rate": 5.029931305201178e-05, + "loss": 0.0516, + "step": 17470 + }, + { + "epoch": 25.11, + "learning_rate": 5.015210991167812e-05, + "loss": 0.0564, + "step": 17480 + }, + { + "epoch": 25.13, + "learning_rate": 5.000490677134446e-05, + "loss": 0.0478, + "step": 17490 + }, + { + "epoch": 25.14, + "learning_rate": 4.9857703631010784e-05, + "loss": 0.0754, + "step": 17500 + }, + { + "epoch": 25.14, + "eval_loss": 0.14766934514045715, + "eval_runtime": 39.973, + "eval_samples_per_second": 11.433, + "eval_steps_per_second": 1.451, + "eval_wer": 0.15148321035988557, + "step": 17500 + }, + { + "epoch": 25.16, + "learning_rate": 4.9710500490677124e-05, + "loss": 0.0675, + "step": 17510 + }, + { + "epoch": 25.17, + "learning_rate": 4.9563297350343464e-05, + "loss": 0.0486, + "step": 17520 + }, + { + "epoch": 25.19, + "learning_rate": 4.9416094210009805e-05, + "loss": 0.0603, + "step": 17530 + }, + { + "epoch": 25.2, + "learning_rate": 4.9268891069676145e-05, + "loss": 0.0655, + "step": 17540 + }, + { + "epoch": 25.22, + "learning_rate": 4.9121687929342485e-05, + "loss": 0.0523, + "step": 17550 + }, + { + "epoch": 25.23, + "learning_rate": 4.8974484789008825e-05, + "loss": 0.0565, + "step": 17560 + }, + { + "epoch": 25.24, + "learning_rate": 4.8827281648675165e-05, + "loss": 0.051, + "step": 17570 + }, + { + "epoch": 25.26, + "learning_rate": 4.8680078508341505e-05, + "loss": 0.0615, + "step": 17580 + }, + { + "epoch": 25.27, + "learning_rate": 4.8532875368007846e-05, + "loss": 0.0576, + "step": 17590 + }, + { + "epoch": 25.29, + "learning_rate": 4.8385672227674186e-05, + "loss": 0.0409, + "step": 17600 + }, + { + "epoch": 25.29, + "eval_loss": 0.14516086876392365, + "eval_runtime": 40.1057, + "eval_samples_per_second": 11.395, + "eval_steps_per_second": 1.446, + "eval_wer": 0.14907393464839633, + "step": 17600 + }, + { + "epoch": 25.3, + "learning_rate": 4.8238469087340526e-05, + "loss": 0.0673, + "step": 17610 + }, + { + "epoch": 25.32, + "learning_rate": 4.8091265947006866e-05, + "loss": 0.0686, + "step": 17620 + }, + { + "epoch": 25.33, + "learning_rate": 4.7944062806673206e-05, + "loss": 0.0512, + "step": 17630 + }, + { + "epoch": 25.34, + "learning_rate": 4.779685966633954e-05, + "loss": 0.0556, + "step": 17640 + }, + { + "epoch": 25.36, + "learning_rate": 4.764965652600588e-05, + "loss": 0.0619, + "step": 17650 + }, + { + "epoch": 25.37, + "learning_rate": 4.750245338567222e-05, + "loss": 0.0516, + "step": 17660 + }, + { + "epoch": 25.39, + "learning_rate": 4.735525024533856e-05, + "loss": 0.0491, + "step": 17670 + }, + { + "epoch": 25.4, + "learning_rate": 4.72080471050049e-05, + "loss": 0.0561, + "step": 17680 + }, + { + "epoch": 25.42, + "learning_rate": 4.706084396467124e-05, + "loss": 0.0609, + "step": 17690 + }, + { + "epoch": 25.43, + "learning_rate": 4.691364082433758e-05, + "loss": 0.0414, + "step": 17700 + }, + { + "epoch": 25.43, + "eval_loss": 0.1499926894903183, + "eval_runtime": 39.8722, + "eval_samples_per_second": 11.462, + "eval_steps_per_second": 1.455, + "eval_wer": 0.1511820508959494, + "step": 17700 + }, + { + "epoch": 25.45, + "learning_rate": 4.676643768400392e-05, + "loss": 0.0555, + "step": 17710 + }, + { + "epoch": 25.46, + "learning_rate": 4.661923454367026e-05, + "loss": 0.0568, + "step": 17720 + }, + { + "epoch": 25.47, + "learning_rate": 4.64720314033366e-05, + "loss": 0.0551, + "step": 17730 + }, + { + "epoch": 25.49, + "learning_rate": 4.632482826300294e-05, + "loss": 0.0441, + "step": 17740 + }, + { + "epoch": 25.5, + "learning_rate": 4.617762512266928e-05, + "loss": 0.0469, + "step": 17750 + }, + { + "epoch": 25.52, + "learning_rate": 4.603042198233562e-05, + "loss": 0.0562, + "step": 17760 + }, + { + "epoch": 25.53, + "learning_rate": 4.588321884200196e-05, + "loss": 0.0511, + "step": 17770 + }, + { + "epoch": 25.55, + "learning_rate": 4.57360157016683e-05, + "loss": 0.0456, + "step": 17780 + }, + { + "epoch": 25.56, + "learning_rate": 4.5588812561334635e-05, + "loss": 0.0419, + "step": 17790 + }, + { + "epoch": 25.57, + "learning_rate": 4.5441609421000976e-05, + "loss": 0.0596, + "step": 17800 + }, + { + "epoch": 25.57, + "eval_loss": 0.14854370057582855, + "eval_runtime": 40.2407, + "eval_samples_per_second": 11.357, + "eval_steps_per_second": 1.441, + "eval_wer": 0.1538924860713748, + "step": 17800 + }, + { + "epoch": 25.59, + "learning_rate": 4.5294406280667316e-05, + "loss": 0.0575, + "step": 17810 + }, + { + "epoch": 25.6, + "learning_rate": 4.5147203140333656e-05, + "loss": 0.0565, + "step": 17820 + }, + { + "epoch": 25.62, + "learning_rate": 4.4999999999999996e-05, + "loss": 0.0598, + "step": 17830 + }, + { + "epoch": 25.63, + "learning_rate": 4.4852796859666336e-05, + "loss": 0.0482, + "step": 17840 + }, + { + "epoch": 25.65, + "learning_rate": 4.4705593719332676e-05, + "loss": 0.0505, + "step": 17850 + }, + { + "epoch": 25.66, + "learning_rate": 4.4558390578999017e-05, + "loss": 0.0588, + "step": 17860 + }, + { + "epoch": 25.68, + "learning_rate": 4.441118743866536e-05, + "loss": 0.0481, + "step": 17870 + }, + { + "epoch": 25.69, + "learning_rate": 4.42639842983317e-05, + "loss": 0.05, + "step": 17880 + }, + { + "epoch": 25.7, + "learning_rate": 4.411678115799804e-05, + "loss": 0.0587, + "step": 17890 + }, + { + "epoch": 25.72, + "learning_rate": 4.396957801766438e-05, + "loss": 0.0441, + "step": 17900 + }, + { + "epoch": 25.72, + "eval_loss": 0.14327119290828705, + "eval_runtime": 39.9632, + "eval_samples_per_second": 11.436, + "eval_steps_per_second": 1.451, + "eval_wer": 0.15344074687547057, + "step": 17900 + }, + { + "epoch": 25.73, + "learning_rate": 4.382237487733072e-05, + "loss": 0.0595, + "step": 17910 + }, + { + "epoch": 25.75, + "learning_rate": 4.367517173699706e-05, + "loss": 0.0519, + "step": 17920 + }, + { + "epoch": 25.76, + "learning_rate": 4.35279685966634e-05, + "loss": 0.052, + "step": 17930 + }, + { + "epoch": 25.78, + "learning_rate": 4.3380765456329724e-05, + "loss": 0.0412, + "step": 17940 + }, + { + "epoch": 25.79, + "learning_rate": 4.3233562315996065e-05, + "loss": 0.0462, + "step": 17950 + }, + { + "epoch": 25.8, + "learning_rate": 4.3086359175662405e-05, + "loss": 0.0646, + "step": 17960 + }, + { + "epoch": 25.82, + "learning_rate": 4.2939156035328745e-05, + "loss": 0.0572, + "step": 17970 + }, + { + "epoch": 25.83, + "learning_rate": 4.2791952894995085e-05, + "loss": 0.062, + "step": 17980 + }, + { + "epoch": 25.85, + "learning_rate": 4.2644749754661425e-05, + "loss": 0.0485, + "step": 17990 + }, + { + "epoch": 25.86, + "learning_rate": 4.2497546614327765e-05, + "loss": 0.0517, + "step": 18000 + }, + { + "epoch": 25.86, + "eval_loss": 0.1446276158094406, + "eval_runtime": 40.1161, + "eval_samples_per_second": 11.392, + "eval_steps_per_second": 1.446, + "eval_wer": 0.15238668875169403, + "step": 18000 + }, + { + "epoch": 25.88, + "learning_rate": 4.2350343473994106e-05, + "loss": 0.0556, + "step": 18010 + }, + { + "epoch": 25.89, + "learning_rate": 4.2203140333660446e-05, + "loss": 0.0542, + "step": 18020 + }, + { + "epoch": 25.91, + "learning_rate": 4.2055937193326786e-05, + "loss": 0.0517, + "step": 18030 + }, + { + "epoch": 25.92, + "learning_rate": 4.1908734052993126e-05, + "loss": 0.0483, + "step": 18040 + }, + { + "epoch": 25.93, + "learning_rate": 4.1761530912659466e-05, + "loss": 0.0454, + "step": 18050 + }, + { + "epoch": 25.95, + "learning_rate": 4.1614327772325806e-05, + "loss": 0.0649, + "step": 18060 + }, + { + "epoch": 25.96, + "learning_rate": 4.1467124631992147e-05, + "loss": 0.0449, + "step": 18070 + }, + { + "epoch": 25.98, + "learning_rate": 4.131992149165849e-05, + "loss": 0.0604, + "step": 18080 + }, + { + "epoch": 25.99, + "learning_rate": 4.117271835132482e-05, + "loss": 0.0486, + "step": 18090 + }, + { + "epoch": 26.01, + "learning_rate": 4.102551521099116e-05, + "loss": 0.0752, + "step": 18100 + }, + { + "epoch": 26.01, + "eval_loss": 0.14016593992710114, + "eval_runtime": 40.0408, + "eval_samples_per_second": 11.413, + "eval_steps_per_second": 1.449, + "eval_wer": 0.14967625357626863, + "step": 18100 + }, + { + "epoch": 26.02, + "learning_rate": 4.08783120706575e-05, + "loss": 0.0568, + "step": 18110 + }, + { + "epoch": 26.03, + "learning_rate": 4.073110893032384e-05, + "loss": 0.0504, + "step": 18120 + }, + { + "epoch": 26.05, + "learning_rate": 4.058390578999018e-05, + "loss": 0.0536, + "step": 18130 + }, + { + "epoch": 26.06, + "learning_rate": 4.043670264965652e-05, + "loss": 0.0465, + "step": 18140 + }, + { + "epoch": 26.08, + "learning_rate": 4.028949950932286e-05, + "loss": 0.05, + "step": 18150 + }, + { + "epoch": 26.09, + "learning_rate": 4.01422963689892e-05, + "loss": 0.047, + "step": 18160 + }, + { + "epoch": 26.11, + "learning_rate": 3.999509322865554e-05, + "loss": 0.0545, + "step": 18170 + }, + { + "epoch": 26.12, + "learning_rate": 3.984789008832188e-05, + "loss": 0.0559, + "step": 18180 + }, + { + "epoch": 26.14, + "learning_rate": 3.970068694798822e-05, + "loss": 0.049, + "step": 18190 + }, + { + "epoch": 26.15, + "learning_rate": 3.955348380765456e-05, + "loss": 0.0543, + "step": 18200 + }, + { + "epoch": 26.15, + "eval_loss": 0.14435161650180817, + "eval_runtime": 40.7685, + "eval_samples_per_second": 11.21, + "eval_steps_per_second": 1.423, + "eval_wer": 0.1519349495557898, + "step": 18200 + }, + { + "epoch": 26.16, + "learning_rate": 3.94062806673209e-05, + "loss": 0.058, + "step": 18210 + }, + { + "epoch": 26.18, + "learning_rate": 3.925907752698724e-05, + "loss": 0.0459, + "step": 18220 + }, + { + "epoch": 26.19, + "learning_rate": 3.9111874386653576e-05, + "loss": 0.064, + "step": 18230 + }, + { + "epoch": 26.21, + "learning_rate": 3.8964671246319916e-05, + "loss": 0.0452, + "step": 18240 + }, + { + "epoch": 26.22, + "learning_rate": 3.8817468105986256e-05, + "loss": 0.0497, + "step": 18250 + }, + { + "epoch": 26.24, + "learning_rate": 3.8670264965652596e-05, + "loss": 0.0505, + "step": 18260 + }, + { + "epoch": 26.25, + "learning_rate": 3.8523061825318936e-05, + "loss": 0.0551, + "step": 18270 + }, + { + "epoch": 26.26, + "learning_rate": 3.8375858684985276e-05, + "loss": 0.0565, + "step": 18280 + }, + { + "epoch": 26.28, + "learning_rate": 3.822865554465162e-05, + "loss": 0.0501, + "step": 18290 + }, + { + "epoch": 26.29, + "learning_rate": 3.808145240431796e-05, + "loss": 0.0556, + "step": 18300 + }, + { + "epoch": 26.29, + "eval_loss": 0.1450069099664688, + "eval_runtime": 40.1396, + "eval_samples_per_second": 11.385, + "eval_steps_per_second": 1.445, + "eval_wer": 0.14967625357626863, + "step": 18300 + }, + { + "epoch": 26.31, + "learning_rate": 3.79342492639843e-05, + "loss": 0.0543, + "step": 18310 + }, + { + "epoch": 26.32, + "learning_rate": 3.778704612365064e-05, + "loss": 0.0547, + "step": 18320 + }, + { + "epoch": 26.34, + "learning_rate": 3.763984298331698e-05, + "loss": 0.0608, + "step": 18330 + }, + { + "epoch": 26.35, + "learning_rate": 3.749263984298331e-05, + "loss": 0.0458, + "step": 18340 + }, + { + "epoch": 26.36, + "learning_rate": 3.734543670264965e-05, + "loss": 0.0481, + "step": 18350 + }, + { + "epoch": 26.38, + "learning_rate": 3.719823356231599e-05, + "loss": 0.0601, + "step": 18360 + }, + { + "epoch": 26.39, + "learning_rate": 3.705103042198233e-05, + "loss": 0.0451, + "step": 18370 + }, + { + "epoch": 26.41, + "learning_rate": 3.690382728164867e-05, + "loss": 0.0623, + "step": 18380 + }, + { + "epoch": 26.42, + "learning_rate": 3.675662414131501e-05, + "loss": 0.0396, + "step": 18390 + }, + { + "epoch": 26.44, + "learning_rate": 3.660942100098135e-05, + "loss": 0.0514, + "step": 18400 + }, + { + "epoch": 26.44, + "eval_loss": 0.14546437561511993, + "eval_runtime": 40.3801, + "eval_samples_per_second": 11.317, + "eval_steps_per_second": 1.436, + "eval_wer": 0.15042915223610903, + "step": 18400 + }, + { + "epoch": 26.45, + "learning_rate": 3.646221786064769e-05, + "loss": 0.065, + "step": 18410 + }, + { + "epoch": 26.47, + "learning_rate": 3.6315014720314025e-05, + "loss": 0.0446, + "step": 18420 + }, + { + "epoch": 26.48, + "learning_rate": 3.6167811579980365e-05, + "loss": 0.0568, + "step": 18430 + }, + { + "epoch": 26.49, + "learning_rate": 3.6020608439646706e-05, + "loss": 0.0467, + "step": 18440 + }, + { + "epoch": 26.51, + "learning_rate": 3.5873405299313046e-05, + "loss": 0.0515, + "step": 18450 + }, + { + "epoch": 26.52, + "learning_rate": 3.5726202158979386e-05, + "loss": 0.0528, + "step": 18460 + }, + { + "epoch": 26.54, + "learning_rate": 3.5578999018645726e-05, + "loss": 0.0518, + "step": 18470 + }, + { + "epoch": 26.55, + "learning_rate": 3.5431795878312066e-05, + "loss": 0.0506, + "step": 18480 + }, + { + "epoch": 26.57, + "learning_rate": 3.5284592737978406e-05, + "loss": 0.0501, + "step": 18490 + }, + { + "epoch": 26.58, + "learning_rate": 3.5137389597644747e-05, + "loss": 0.0424, + "step": 18500 + }, + { + "epoch": 26.58, + "eval_loss": 0.14528827369213104, + "eval_runtime": 40.49, + "eval_samples_per_second": 11.287, + "eval_steps_per_second": 1.432, + "eval_wer": 0.15057973196807709, + "step": 18500 + }, + { + "epoch": 26.59, + "learning_rate": 3.499018645731109e-05, + "loss": 0.0556, + "step": 18510 + }, + { + "epoch": 26.61, + "learning_rate": 3.484298331697743e-05, + "loss": 0.0624, + "step": 18520 + }, + { + "epoch": 26.62, + "learning_rate": 3.469578017664377e-05, + "loss": 0.0551, + "step": 18530 + }, + { + "epoch": 26.64, + "learning_rate": 3.454857703631011e-05, + "loss": 0.0548, + "step": 18540 + }, + { + "epoch": 26.65, + "learning_rate": 3.440137389597645e-05, + "loss": 0.0501, + "step": 18550 + }, + { + "epoch": 26.67, + "learning_rate": 3.425417075564279e-05, + "loss": 0.0622, + "step": 18560 + }, + { + "epoch": 26.68, + "learning_rate": 3.410696761530912e-05, + "loss": 0.0475, + "step": 18570 + }, + { + "epoch": 26.7, + "learning_rate": 3.395976447497546e-05, + "loss": 0.0534, + "step": 18580 + }, + { + "epoch": 26.71, + "learning_rate": 3.38125613346418e-05, + "loss": 0.0405, + "step": 18590 + }, + { + "epoch": 26.72, + "learning_rate": 3.366535819430814e-05, + "loss": 0.0689, + "step": 18600 + }, + { + "epoch": 26.72, + "eval_loss": 0.1431579440832138, + "eval_runtime": 39.9989, + "eval_samples_per_second": 11.425, + "eval_steps_per_second": 1.45, + "eval_wer": 0.15088089143201325, + "step": 18600 + }, + { + "epoch": 26.74, + "learning_rate": 3.351815505397448e-05, + "loss": 0.0541, + "step": 18610 + }, + { + "epoch": 26.75, + "learning_rate": 3.337095191364082e-05, + "loss": 0.0604, + "step": 18620 + }, + { + "epoch": 26.77, + "learning_rate": 3.322374877330716e-05, + "loss": 0.0546, + "step": 18630 + }, + { + "epoch": 26.78, + "learning_rate": 3.30765456329735e-05, + "loss": 0.0476, + "step": 18640 + }, + { + "epoch": 26.8, + "learning_rate": 3.2929342492639836e-05, + "loss": 0.0532, + "step": 18650 + }, + { + "epoch": 26.81, + "learning_rate": 3.2782139352306176e-05, + "loss": 0.0361, + "step": 18660 + }, + { + "epoch": 26.82, + "learning_rate": 3.2634936211972516e-05, + "loss": 0.0366, + "step": 18670 + }, + { + "epoch": 26.84, + "learning_rate": 3.2487733071638856e-05, + "loss": 0.0511, + "step": 18680 + }, + { + "epoch": 26.85, + "learning_rate": 3.2340529931305196e-05, + "loss": 0.0484, + "step": 18690 + }, + { + "epoch": 26.87, + "learning_rate": 3.2193326790971536e-05, + "loss": 0.0467, + "step": 18700 + }, + { + "epoch": 26.87, + "eval_loss": 0.1416984647512436, + "eval_runtime": 40.7855, + "eval_samples_per_second": 11.205, + "eval_steps_per_second": 1.422, + "eval_wer": 0.15088089143201325, + "step": 18700 + }, + { + "epoch": 26.88, + "learning_rate": 3.2046123650637877e-05, + "loss": 0.0566, + "step": 18710 + }, + { + "epoch": 26.9, + "learning_rate": 3.189892051030422e-05, + "loss": 0.0387, + "step": 18720 + }, + { + "epoch": 26.91, + "learning_rate": 3.175171736997056e-05, + "loss": 0.0504, + "step": 18730 + }, + { + "epoch": 26.93, + "learning_rate": 3.16045142296369e-05, + "loss": 0.0447, + "step": 18740 + }, + { + "epoch": 26.94, + "learning_rate": 3.145731108930324e-05, + "loss": 0.0454, + "step": 18750 + }, + { + "epoch": 26.95, + "learning_rate": 3.131010794896958e-05, + "loss": 0.0518, + "step": 18760 + }, + { + "epoch": 26.97, + "learning_rate": 3.116290480863592e-05, + "loss": 0.0476, + "step": 18770 + }, + { + "epoch": 26.98, + "learning_rate": 3.101570166830226e-05, + "loss": 0.0463, + "step": 18780 + }, + { + "epoch": 27.0, + "learning_rate": 3.086849852796859e-05, + "loss": 0.0527, + "step": 18790 + }, + { + "epoch": 27.01, + "learning_rate": 3.072129538763493e-05, + "loss": 0.0409, + "step": 18800 + }, + { + "epoch": 27.01, + "eval_loss": 0.14151474833488464, + "eval_runtime": 40.0113, + "eval_samples_per_second": 11.422, + "eval_steps_per_second": 1.45, + "eval_wer": 0.15298900767956633, + "step": 18800 + }, + { + "epoch": 27.03, + "learning_rate": 3.057409224730127e-05, + "loss": 0.047, + "step": 18810 + }, + { + "epoch": 27.04, + "learning_rate": 3.042688910696761e-05, + "loss": 0.0531, + "step": 18820 + }, + { + "epoch": 27.05, + "learning_rate": 3.0279685966633952e-05, + "loss": 0.0498, + "step": 18830 + }, + { + "epoch": 27.07, + "learning_rate": 3.0132482826300292e-05, + "loss": 0.0562, + "step": 18840 + }, + { + "epoch": 27.08, + "learning_rate": 2.9985279685966632e-05, + "loss": 0.0657, + "step": 18850 + }, + { + "epoch": 27.1, + "learning_rate": 2.983807654563297e-05, + "loss": 0.0474, + "step": 18860 + }, + { + "epoch": 27.11, + "learning_rate": 2.969087340529931e-05, + "loss": 0.0656, + "step": 18870 + }, + { + "epoch": 27.13, + "learning_rate": 2.954367026496565e-05, + "loss": 0.0483, + "step": 18880 + }, + { + "epoch": 27.14, + "learning_rate": 2.939646712463199e-05, + "loss": 0.0482, + "step": 18890 + }, + { + "epoch": 27.16, + "learning_rate": 2.924926398429833e-05, + "loss": 0.0612, + "step": 18900 + }, + { + "epoch": 27.16, + "eval_loss": 0.1420021653175354, + "eval_runtime": 40.3238, + "eval_samples_per_second": 11.333, + "eval_steps_per_second": 1.438, + "eval_wer": 0.14952567384430054, + "step": 18900 + }, + { + "epoch": 27.17, + "learning_rate": 2.910206084396467e-05, + "loss": 0.0621, + "step": 18910 + }, + { + "epoch": 27.18, + "learning_rate": 2.895485770363101e-05, + "loss": 0.0583, + "step": 18920 + }, + { + "epoch": 27.2, + "learning_rate": 2.880765456329735e-05, + "loss": 0.0569, + "step": 18930 + }, + { + "epoch": 27.21, + "learning_rate": 2.8660451422963687e-05, + "loss": 0.0529, + "step": 18940 + }, + { + "epoch": 27.23, + "learning_rate": 2.8513248282630027e-05, + "loss": 0.07, + "step": 18950 + }, + { + "epoch": 27.24, + "learning_rate": 2.8366045142296367e-05, + "loss": 0.0585, + "step": 18960 + }, + { + "epoch": 27.26, + "learning_rate": 2.8218842001962707e-05, + "loss": 0.054, + "step": 18970 + }, + { + "epoch": 27.27, + "learning_rate": 2.8071638861629047e-05, + "loss": 0.0523, + "step": 18980 + }, + { + "epoch": 27.28, + "learning_rate": 2.7924435721295388e-05, + "loss": 0.0416, + "step": 18990 + }, + { + "epoch": 27.3, + "learning_rate": 2.7777232580961728e-05, + "loss": 0.0501, + "step": 19000 + }, + { + "epoch": 27.3, + "eval_loss": 0.14232105016708374, + "eval_runtime": 40.1869, + "eval_samples_per_second": 11.372, + "eval_steps_per_second": 1.443, + "eval_wer": 0.14892335491642825, + "step": 19000 + }, + { + "epoch": 27.31, + "learning_rate": 2.763002944062806e-05, + "loss": 0.0531, + "step": 19010 + }, + { + "epoch": 27.33, + "learning_rate": 2.74828263002944e-05, + "loss": 0.0529, + "step": 19020 + }, + { + "epoch": 27.34, + "learning_rate": 2.733562315996074e-05, + "loss": 0.0519, + "step": 19030 + }, + { + "epoch": 27.36, + "learning_rate": 2.718842001962708e-05, + "loss": 0.0456, + "step": 19040 + }, + { + "epoch": 27.37, + "learning_rate": 2.7041216879293422e-05, + "loss": 0.0546, + "step": 19050 + }, + { + "epoch": 27.39, + "learning_rate": 2.6894013738959762e-05, + "loss": 0.0488, + "step": 19060 + }, + { + "epoch": 27.4, + "learning_rate": 2.6746810598626102e-05, + "loss": 0.052, + "step": 19070 + }, + { + "epoch": 27.41, + "learning_rate": 2.659960745829244e-05, + "loss": 0.0537, + "step": 19080 + }, + { + "epoch": 27.43, + "learning_rate": 2.645240431795878e-05, + "loss": 0.0474, + "step": 19090 + }, + { + "epoch": 27.44, + "learning_rate": 2.630520117762512e-05, + "loss": 0.0579, + "step": 19100 + }, + { + "epoch": 27.44, + "eval_loss": 0.14417009055614471, + "eval_runtime": 40.3442, + "eval_samples_per_second": 11.328, + "eval_steps_per_second": 1.438, + "eval_wer": 0.15238668875169403, + "step": 19100 + }, + { + "epoch": 27.46, + "learning_rate": 2.615799803729146e-05, + "loss": 0.0403, + "step": 19110 + }, + { + "epoch": 27.47, + "learning_rate": 2.60107948969578e-05, + "loss": 0.0537, + "step": 19120 + }, + { + "epoch": 27.49, + "learning_rate": 2.586359175662414e-05, + "loss": 0.0529, + "step": 19130 + }, + { + "epoch": 27.5, + "learning_rate": 2.571638861629048e-05, + "loss": 0.0466, + "step": 19140 + }, + { + "epoch": 27.51, + "learning_rate": 2.556918547595682e-05, + "loss": 0.0552, + "step": 19150 + }, + { + "epoch": 27.53, + "learning_rate": 2.5421982335623157e-05, + "loss": 0.0525, + "step": 19160 + }, + { + "epoch": 27.54, + "learning_rate": 2.5274779195289497e-05, + "loss": 0.0508, + "step": 19170 + }, + { + "epoch": 27.56, + "learning_rate": 2.5127576054955837e-05, + "loss": 0.047, + "step": 19180 + }, + { + "epoch": 27.57, + "learning_rate": 2.4980372914622177e-05, + "loss": 0.0459, + "step": 19190 + }, + { + "epoch": 27.59, + "learning_rate": 2.4833169774288518e-05, + "loss": 0.0449, + "step": 19200 + }, + { + "epoch": 27.59, + "eval_loss": 0.142539843916893, + "eval_runtime": 40.2027, + "eval_samples_per_second": 11.367, + "eval_steps_per_second": 1.443, + "eval_wer": 0.1519349495557898, + "step": 19200 + }, + { + "epoch": 27.6, + "learning_rate": 2.4685966633954858e-05, + "loss": 0.0526, + "step": 19210 + }, + { + "epoch": 27.61, + "learning_rate": 2.4538763493621198e-05, + "loss": 0.0453, + "step": 19220 + }, + { + "epoch": 27.63, + "learning_rate": 2.439156035328753e-05, + "loss": 0.0568, + "step": 19230 + }, + { + "epoch": 27.64, + "learning_rate": 2.424435721295387e-05, + "loss": 0.0441, + "step": 19240 + }, + { + "epoch": 27.66, + "learning_rate": 2.409715407262021e-05, + "loss": 0.0516, + "step": 19250 + }, + { + "epoch": 27.67, + "learning_rate": 2.3949950932286552e-05, + "loss": 0.0448, + "step": 19260 + }, + { + "epoch": 27.69, + "learning_rate": 2.3802747791952892e-05, + "loss": 0.0411, + "step": 19270 + }, + { + "epoch": 27.7, + "learning_rate": 2.3655544651619232e-05, + "loss": 0.0495, + "step": 19280 + }, + { + "epoch": 27.72, + "learning_rate": 2.3508341511285572e-05, + "loss": 0.0483, + "step": 19290 + }, + { + "epoch": 27.73, + "learning_rate": 2.336113837095191e-05, + "loss": 0.0615, + "step": 19300 + }, + { + "epoch": 27.73, + "eval_loss": 0.14353878796100616, + "eval_runtime": 40.2924, + "eval_samples_per_second": 11.342, + "eval_steps_per_second": 1.439, + "eval_wer": 0.15148321035988557, + "step": 19300 + }, + { + "epoch": 27.74, + "learning_rate": 2.321393523061825e-05, + "loss": 0.0478, + "step": 19310 + }, + { + "epoch": 27.76, + "learning_rate": 2.306673209028459e-05, + "loss": 0.0515, + "step": 19320 + }, + { + "epoch": 27.77, + "learning_rate": 2.291952894995093e-05, + "loss": 0.0488, + "step": 19330 + }, + { + "epoch": 27.79, + "learning_rate": 2.277232580961727e-05, + "loss": 0.0482, + "step": 19340 + }, + { + "epoch": 27.8, + "learning_rate": 2.262512266928361e-05, + "loss": 0.0503, + "step": 19350 + }, + { + "epoch": 27.82, + "learning_rate": 2.247791952894995e-05, + "loss": 0.0388, + "step": 19360 + }, + { + "epoch": 27.83, + "learning_rate": 2.233071638861629e-05, + "loss": 0.0654, + "step": 19370 + }, + { + "epoch": 27.84, + "learning_rate": 2.2183513248282627e-05, + "loss": 0.0439, + "step": 19380 + }, + { + "epoch": 27.86, + "learning_rate": 2.2036310107948967e-05, + "loss": 0.0409, + "step": 19390 + }, + { + "epoch": 27.87, + "learning_rate": 2.1889106967615307e-05, + "loss": 0.063, + "step": 19400 + }, + { + "epoch": 27.87, + "eval_loss": 0.14183540642261505, + "eval_runtime": 40.2851, + "eval_samples_per_second": 11.344, + "eval_steps_per_second": 1.44, + "eval_wer": 0.1511820508959494, + "step": 19400 + }, + { + "epoch": 27.89, + "learning_rate": 2.1741903827281648e-05, + "loss": 0.0444, + "step": 19410 + }, + { + "epoch": 27.9, + "learning_rate": 2.1594700686947988e-05, + "loss": 0.0494, + "step": 19420 + }, + { + "epoch": 27.92, + "learning_rate": 2.1447497546614328e-05, + "loss": 0.0464, + "step": 19430 + }, + { + "epoch": 27.93, + "learning_rate": 2.1300294406280668e-05, + "loss": 0.0425, + "step": 19440 + }, + { + "epoch": 27.95, + "learning_rate": 2.1153091265947e-05, + "loss": 0.0519, + "step": 19450 + }, + { + "epoch": 27.96, + "learning_rate": 2.100588812561334e-05, + "loss": 0.0466, + "step": 19460 + }, + { + "epoch": 27.97, + "learning_rate": 2.0858684985279682e-05, + "loss": 0.0479, + "step": 19470 + }, + { + "epoch": 27.99, + "learning_rate": 2.0711481844946022e-05, + "loss": 0.0433, + "step": 19480 + }, + { + "epoch": 28.0, + "learning_rate": 2.0564278704612362e-05, + "loss": 0.0472, + "step": 19490 + }, + { + "epoch": 28.02, + "learning_rate": 2.0417075564278702e-05, + "loss": 0.0422, + "step": 19500 + }, + { + "epoch": 28.02, + "eval_loss": 0.14156275987625122, + "eval_runtime": 40.1542, + "eval_samples_per_second": 11.381, + "eval_steps_per_second": 1.444, + "eval_wer": 0.14817045625658787, + "step": 19500 + }, + { + "epoch": 28.03, + "learning_rate": 2.0269872423945042e-05, + "loss": 0.0457, + "step": 19510 + }, + { + "epoch": 28.05, + "learning_rate": 2.0122669283611383e-05, + "loss": 0.051, + "step": 19520 + }, + { + "epoch": 28.06, + "learning_rate": 1.997546614327772e-05, + "loss": 0.0448, + "step": 19530 + }, + { + "epoch": 28.07, + "learning_rate": 1.982826300294406e-05, + "loss": 0.0419, + "step": 19540 + }, + { + "epoch": 28.09, + "learning_rate": 1.96810598626104e-05, + "loss": 0.0488, + "step": 19550 + }, + { + "epoch": 28.1, + "learning_rate": 1.953385672227674e-05, + "loss": 0.0524, + "step": 19560 + }, + { + "epoch": 28.12, + "learning_rate": 1.938665358194308e-05, + "loss": 0.0404, + "step": 19570 + }, + { + "epoch": 28.13, + "learning_rate": 1.923945044160942e-05, + "loss": 0.0431, + "step": 19580 + }, + { + "epoch": 28.15, + "learning_rate": 1.909224730127576e-05, + "loss": 0.0428, + "step": 19590 + }, + { + "epoch": 28.16, + "learning_rate": 1.8945044160942097e-05, + "loss": 0.0468, + "step": 19600 + }, + { + "epoch": 28.16, + "eval_loss": 0.14033865928649902, + "eval_runtime": 40.1669, + "eval_samples_per_second": 11.378, + "eval_steps_per_second": 1.444, + "eval_wer": 0.14952567384430054, + "step": 19600 + }, + { + "epoch": 28.18, + "learning_rate": 1.8797841020608437e-05, + "loss": 0.0554, + "step": 19610 + }, + { + "epoch": 28.19, + "learning_rate": 1.8650637880274777e-05, + "loss": 0.057, + "step": 19620 + }, + { + "epoch": 28.2, + "learning_rate": 1.8503434739941118e-05, + "loss": 0.0387, + "step": 19630 + }, + { + "epoch": 28.22, + "learning_rate": 1.8356231599607458e-05, + "loss": 0.0496, + "step": 19640 + }, + { + "epoch": 28.23, + "learning_rate": 1.8209028459273798e-05, + "loss": 0.0547, + "step": 19650 + }, + { + "epoch": 28.25, + "learning_rate": 1.8061825318940135e-05, + "loss": 0.0383, + "step": 19660 + }, + { + "epoch": 28.26, + "learning_rate": 1.7914622178606475e-05, + "loss": 0.0445, + "step": 19670 + }, + { + "epoch": 28.28, + "learning_rate": 1.7767419038272815e-05, + "loss": 0.0391, + "step": 19680 + }, + { + "epoch": 28.29, + "learning_rate": 1.7620215897939155e-05, + "loss": 0.052, + "step": 19690 + }, + { + "epoch": 28.3, + "learning_rate": 1.7473012757605495e-05, + "loss": 0.0421, + "step": 19700 + }, + { + "epoch": 28.3, + "eval_loss": 0.14019441604614258, + "eval_runtime": 40.1804, + "eval_samples_per_second": 11.374, + "eval_steps_per_second": 1.443, + "eval_wer": 0.1511820508959494, + "step": 19700 + }, + { + "epoch": 28.32, + "learning_rate": 1.7325809617271832e-05, + "loss": 0.0461, + "step": 19710 + }, + { + "epoch": 28.33, + "learning_rate": 1.7178606476938172e-05, + "loss": 0.0495, + "step": 19720 + }, + { + "epoch": 28.35, + "learning_rate": 1.7031403336604513e-05, + "loss": 0.0406, + "step": 19730 + }, + { + "epoch": 28.36, + "learning_rate": 1.6884200196270853e-05, + "loss": 0.0612, + "step": 19740 + }, + { + "epoch": 28.38, + "learning_rate": 1.6736997055937193e-05, + "loss": 0.044, + "step": 19750 + }, + { + "epoch": 28.39, + "learning_rate": 1.6589793915603533e-05, + "loss": 0.0439, + "step": 19760 + }, + { + "epoch": 28.41, + "learning_rate": 1.644259077526987e-05, + "loss": 0.0503, + "step": 19770 + }, + { + "epoch": 28.42, + "learning_rate": 1.629538763493621e-05, + "loss": 0.04, + "step": 19780 + }, + { + "epoch": 28.43, + "learning_rate": 1.614818449460255e-05, + "loss": 0.035, + "step": 19790 + }, + { + "epoch": 28.45, + "learning_rate": 1.600098135426889e-05, + "loss": 0.0446, + "step": 19800 + }, + { + "epoch": 28.45, + "eval_loss": 0.1425383985042572, + "eval_runtime": 40.1802, + "eval_samples_per_second": 11.374, + "eval_steps_per_second": 1.443, + "eval_wer": 0.1493750941123325, + "step": 19800 + }, + { + "epoch": 28.46, + "learning_rate": 1.585377821393523e-05, + "loss": 0.0487, + "step": 19810 + }, + { + "epoch": 28.48, + "learning_rate": 1.570657507360157e-05, + "loss": 0.066, + "step": 19820 + }, + { + "epoch": 28.49, + "learning_rate": 1.555937193326791e-05, + "loss": 0.0541, + "step": 19830 + }, + { + "epoch": 28.51, + "learning_rate": 1.5412168792934248e-05, + "loss": 0.047, + "step": 19840 + }, + { + "epoch": 28.52, + "learning_rate": 1.5264965652600588e-05, + "loss": 0.0415, + "step": 19850 + }, + { + "epoch": 28.53, + "learning_rate": 1.5117762512266928e-05, + "loss": 0.0401, + "step": 19860 + }, + { + "epoch": 28.55, + "learning_rate": 1.4970559371933268e-05, + "loss": 0.0457, + "step": 19870 + }, + { + "epoch": 28.56, + "learning_rate": 1.4823356231599605e-05, + "loss": 0.0445, + "step": 19880 + }, + { + "epoch": 28.58, + "learning_rate": 1.4676153091265945e-05, + "loss": 0.0419, + "step": 19890 + }, + { + "epoch": 28.59, + "learning_rate": 1.4528949950932285e-05, + "loss": 0.048, + "step": 19900 + }, + { + "epoch": 28.59, + "eval_loss": 0.14261671900749207, + "eval_runtime": 39.9856, + "eval_samples_per_second": 11.429, + "eval_steps_per_second": 1.451, + "eval_wer": 0.1474175575967475, + "step": 19900 + }, + { + "epoch": 28.61, + "learning_rate": 1.4381746810598624e-05, + "loss": 0.043, + "step": 19910 + }, + { + "epoch": 28.62, + "learning_rate": 1.4234543670264964e-05, + "loss": 0.0526, + "step": 19920 + }, + { + "epoch": 28.64, + "learning_rate": 1.4087340529931304e-05, + "loss": 0.0433, + "step": 19930 + }, + { + "epoch": 28.65, + "learning_rate": 1.3940137389597644e-05, + "loss": 0.0523, + "step": 19940 + }, + { + "epoch": 28.66, + "learning_rate": 1.3792934249263983e-05, + "loss": 0.0477, + "step": 19950 + }, + { + "epoch": 28.68, + "learning_rate": 1.3645731108930323e-05, + "loss": 0.0438, + "step": 19960 + }, + { + "epoch": 28.69, + "learning_rate": 1.3498527968596663e-05, + "loss": 0.0634, + "step": 19970 + }, + { + "epoch": 28.71, + "learning_rate": 1.3351324828263003e-05, + "loss": 0.0488, + "step": 19980 + }, + { + "epoch": 28.72, + "learning_rate": 1.320412168792934e-05, + "loss": 0.0561, + "step": 19990 + }, + { + "epoch": 28.74, + "learning_rate": 1.305691854759568e-05, + "loss": 0.0429, + "step": 20000 + }, + { + "epoch": 28.74, + "eval_loss": 0.14055244624614716, + "eval_runtime": 40.1463, + "eval_samples_per_second": 11.383, + "eval_steps_per_second": 1.445, + "eval_wer": 0.146514079204939, + "step": 20000 + }, + { + "epoch": 28.75, + "learning_rate": 1.290971540726202e-05, + "loss": 0.0455, + "step": 20010 + }, + { + "epoch": 28.76, + "learning_rate": 1.2762512266928359e-05, + "loss": 0.0559, + "step": 20020 + }, + { + "epoch": 28.78, + "learning_rate": 1.2615309126594699e-05, + "loss": 0.0384, + "step": 20030 + }, + { + "epoch": 28.79, + "learning_rate": 1.2468105986261039e-05, + "loss": 0.0537, + "step": 20040 + }, + { + "epoch": 28.81, + "learning_rate": 1.232090284592738e-05, + "loss": 0.0477, + "step": 20050 + }, + { + "epoch": 28.82, + "learning_rate": 1.2173699705593718e-05, + "loss": 0.0438, + "step": 20060 + }, + { + "epoch": 28.84, + "learning_rate": 1.2026496565260058e-05, + "loss": 0.0424, + "step": 20070 + }, + { + "epoch": 28.85, + "learning_rate": 1.1879293424926398e-05, + "loss": 0.0658, + "step": 20080 + }, + { + "epoch": 28.86, + "learning_rate": 1.1732090284592738e-05, + "loss": 0.0496, + "step": 20090 + }, + { + "epoch": 28.88, + "learning_rate": 1.1584887144259077e-05, + "loss": 0.0457, + "step": 20100 + }, + { + "epoch": 28.88, + "eval_loss": 0.14235013723373413, + "eval_runtime": 40.2402, + "eval_samples_per_second": 11.357, + "eval_steps_per_second": 1.441, + "eval_wer": 0.14606234000903479, + "step": 20100 + }, + { + "epoch": 28.89, + "learning_rate": 1.1437684003925415e-05, + "loss": 0.0438, + "step": 20110 + }, + { + "epoch": 28.91, + "learning_rate": 1.1290480863591755e-05, + "loss": 0.0575, + "step": 20120 + }, + { + "epoch": 28.92, + "learning_rate": 1.1143277723258095e-05, + "loss": 0.048, + "step": 20130 + }, + { + "epoch": 28.94, + "learning_rate": 1.0996074582924434e-05, + "loss": 0.0448, + "step": 20140 + }, + { + "epoch": 28.95, + "learning_rate": 1.0848871442590774e-05, + "loss": 0.0463, + "step": 20150 + }, + { + "epoch": 28.97, + "learning_rate": 1.0701668302257114e-05, + "loss": 0.0513, + "step": 20160 + }, + { + "epoch": 28.98, + "learning_rate": 1.0554465161923453e-05, + "loss": 0.0438, + "step": 20170 + }, + { + "epoch": 28.99, + "learning_rate": 1.0407262021589793e-05, + "loss": 0.0452, + "step": 20180 + }, + { + "epoch": 29.01, + "learning_rate": 1.0260058881256133e-05, + "loss": 0.0487, + "step": 20190 + }, + { + "epoch": 29.02, + "learning_rate": 1.0112855740922473e-05, + "loss": 0.0469, + "step": 20200 + }, + { + "epoch": 29.02, + "eval_loss": 0.14129261672496796, + "eval_runtime": 40.3493, + "eval_samples_per_second": 11.326, + "eval_steps_per_second": 1.437, + "eval_wer": 0.14561060081313054, + "step": 20200 + }, + { + "epoch": 29.04, + "learning_rate": 9.965652600588812e-06, + "loss": 0.0488, + "step": 20210 + }, + { + "epoch": 29.05, + "learning_rate": 9.818449460255152e-06, + "loss": 0.0448, + "step": 20220 + }, + { + "epoch": 29.07, + "learning_rate": 9.671246319921492e-06, + "loss": 0.0451, + "step": 20230 + }, + { + "epoch": 29.08, + "learning_rate": 9.52404317958783e-06, + "loss": 0.0551, + "step": 20240 + }, + { + "epoch": 29.09, + "learning_rate": 9.376840039254169e-06, + "loss": 0.0475, + "step": 20250 + }, + { + "epoch": 29.11, + "learning_rate": 9.22963689892051e-06, + "loss": 0.0424, + "step": 20260 + }, + { + "epoch": 29.12, + "learning_rate": 9.08243375858685e-06, + "loss": 0.0427, + "step": 20270 + }, + { + "epoch": 29.14, + "learning_rate": 8.93523061825319e-06, + "loss": 0.0487, + "step": 20280 + }, + { + "epoch": 29.15, + "learning_rate": 8.788027477919528e-06, + "loss": 0.0553, + "step": 20290 + }, + { + "epoch": 29.17, + "learning_rate": 8.640824337585868e-06, + "loss": 0.0543, + "step": 20300 + }, + { + "epoch": 29.17, + "eval_loss": 0.14143255352973938, + "eval_runtime": 40.1054, + "eval_samples_per_second": 11.395, + "eval_steps_per_second": 1.446, + "eval_wer": 0.146514079204939, + "step": 20300 + }, + { + "epoch": 29.18, + "learning_rate": 8.493621197252207e-06, + "loss": 0.0515, + "step": 20310 + }, + { + "epoch": 29.2, + "learning_rate": 8.346418056918547e-06, + "loss": 0.0423, + "step": 20320 + }, + { + "epoch": 29.21, + "learning_rate": 8.199214916584887e-06, + "loss": 0.0382, + "step": 20330 + }, + { + "epoch": 29.22, + "learning_rate": 8.052011776251227e-06, + "loss": 0.0436, + "step": 20340 + }, + { + "epoch": 29.24, + "learning_rate": 7.904808635917566e-06, + "loss": 0.0447, + "step": 20350 + }, + { + "epoch": 29.25, + "learning_rate": 7.757605495583906e-06, + "loss": 0.0386, + "step": 20360 + }, + { + "epoch": 29.27, + "learning_rate": 7.610402355250245e-06, + "loss": 0.0537, + "step": 20370 + }, + { + "epoch": 29.28, + "learning_rate": 7.4631992149165835e-06, + "loss": 0.0408, + "step": 20380 + }, + { + "epoch": 29.3, + "learning_rate": 7.315996074582924e-06, + "loss": 0.041, + "step": 20390 + }, + { + "epoch": 29.31, + "learning_rate": 7.168792934249263e-06, + "loss": 0.0416, + "step": 20400 + }, + { + "epoch": 29.31, + "eval_loss": 0.14171102643013, + "eval_runtime": 40.0654, + "eval_samples_per_second": 11.406, + "eval_steps_per_second": 1.448, + "eval_wer": 0.14681523866887516, + "step": 20400 + }, + { + "epoch": 29.32, + "learning_rate": 7.021589793915603e-06, + "loss": 0.0445, + "step": 20410 + }, + { + "epoch": 29.34, + "learning_rate": 6.8743866535819425e-06, + "loss": 0.0501, + "step": 20420 + }, + { + "epoch": 29.35, + "learning_rate": 6.741903827281648e-06, + "loss": 0.0454, + "step": 20430 + }, + { + "epoch": 29.37, + "learning_rate": 6.594700686947987e-06, + "loss": 0.0383, + "step": 20440 + }, + { + "epoch": 29.38, + "learning_rate": 6.4474975466143275e-06, + "loss": 0.0403, + "step": 20450 + }, + { + "epoch": 29.4, + "learning_rate": 6.300294406280667e-06, + "loss": 0.0387, + "step": 20460 + }, + { + "epoch": 29.41, + "learning_rate": 6.153091265947007e-06, + "loss": 0.055, + "step": 20470 + }, + { + "epoch": 29.43, + "learning_rate": 6.0058881256133454e-06, + "loss": 0.0377, + "step": 20480 + }, + { + "epoch": 29.44, + "learning_rate": 5.858684985279686e-06, + "loss": 0.0539, + "step": 20490 + }, + { + "epoch": 29.45, + "learning_rate": 5.711481844946025e-06, + "loss": 0.0491, + "step": 20500 + }, + { + "epoch": 29.45, + "eval_loss": 0.1411919742822647, + "eval_runtime": 40.3501, + "eval_samples_per_second": 11.326, + "eval_steps_per_second": 1.437, + "eval_wer": 0.14711639813281133, + "step": 20500 + }, + { + "epoch": 29.47, + "learning_rate": 5.564278704612364e-06, + "loss": 0.0521, + "step": 20510 + }, + { + "epoch": 29.48, + "learning_rate": 5.417075564278704e-06, + "loss": 0.0384, + "step": 20520 + }, + { + "epoch": 29.5, + "learning_rate": 5.269872423945043e-06, + "loss": 0.0496, + "step": 20530 + }, + { + "epoch": 29.51, + "learning_rate": 5.122669283611383e-06, + "loss": 0.0565, + "step": 20540 + }, + { + "epoch": 29.53, + "learning_rate": 4.975466143277722e-06, + "loss": 0.0496, + "step": 20550 + }, + { + "epoch": 29.54, + "learning_rate": 4.8282630029440625e-06, + "loss": 0.0423, + "step": 20560 + }, + { + "epoch": 29.55, + "learning_rate": 4.681059862610402e-06, + "loss": 0.0462, + "step": 20570 + }, + { + "epoch": 29.57, + "learning_rate": 4.533856722276741e-06, + "loss": 0.0471, + "step": 20580 + }, + { + "epoch": 29.58, + "learning_rate": 4.386653581943081e-06, + "loss": 0.0482, + "step": 20590 + }, + { + "epoch": 29.6, + "learning_rate": 4.239450441609421e-06, + "loss": 0.0441, + "step": 20600 + }, + { + "epoch": 29.6, + "eval_loss": 0.14090383052825928, + "eval_runtime": 40.3963, + "eval_samples_per_second": 11.313, + "eval_steps_per_second": 1.436, + "eval_wer": 0.14711639813281133, + "step": 20600 + }, + { + "epoch": 29.61, + "learning_rate": 4.09224730127576e-06, + "loss": 0.05, + "step": 20610 + }, + { + "epoch": 29.63, + "learning_rate": 3.9450441609421e-06, + "loss": 0.0457, + "step": 20620 + }, + { + "epoch": 29.64, + "learning_rate": 3.7978410206084395e-06, + "loss": 0.0535, + "step": 20630 + }, + { + "epoch": 29.66, + "learning_rate": 3.6506378802747788e-06, + "loss": 0.0479, + "step": 20640 + }, + { + "epoch": 29.67, + "learning_rate": 3.5034347399411185e-06, + "loss": 0.0386, + "step": 20650 + }, + { + "epoch": 29.68, + "learning_rate": 3.3562315996074583e-06, + "loss": 0.0382, + "step": 20660 + }, + { + "epoch": 29.7, + "learning_rate": 3.2090284592737976e-06, + "loss": 0.0424, + "step": 20670 + }, + { + "epoch": 29.71, + "learning_rate": 3.0618253189401373e-06, + "loss": 0.0628, + "step": 20680 + }, + { + "epoch": 29.73, + "learning_rate": 2.9146221786064766e-06, + "loss": 0.0585, + "step": 20690 + }, + { + "epoch": 29.74, + "learning_rate": 2.767419038272816e-06, + "loss": 0.0542, + "step": 20700 + }, + { + "epoch": 29.74, + "eval_loss": 0.14069251716136932, + "eval_runtime": 40.3961, + "eval_samples_per_second": 11.313, + "eval_steps_per_second": 1.436, + "eval_wer": 0.14696581840084325, + "step": 20700 + }, + { + "epoch": 29.76, + "learning_rate": 2.6202158979391557e-06, + "loss": 0.0418, + "step": 20710 + }, + { + "epoch": 29.77, + "learning_rate": 2.4730127576054954e-06, + "loss": 0.0415, + "step": 20720 + }, + { + "epoch": 29.78, + "learning_rate": 2.3258096172718348e-06, + "loss": 0.0373, + "step": 20730 + }, + { + "epoch": 29.8, + "learning_rate": 2.1786064769381745e-06, + "loss": 0.0381, + "step": 20740 + }, + { + "epoch": 29.81, + "learning_rate": 2.0314033366045143e-06, + "loss": 0.0445, + "step": 20750 + }, + { + "epoch": 29.83, + "learning_rate": 1.8842001962708538e-06, + "loss": 0.0482, + "step": 20760 + }, + { + "epoch": 29.84, + "learning_rate": 1.7369970559371933e-06, + "loss": 0.0463, + "step": 20770 + }, + { + "epoch": 29.86, + "learning_rate": 1.5897939156035326e-06, + "loss": 0.0402, + "step": 20780 + }, + { + "epoch": 29.87, + "learning_rate": 1.4425907752698722e-06, + "loss": 0.0503, + "step": 20790 + }, + { + "epoch": 29.89, + "learning_rate": 1.295387634936212e-06, + "loss": 0.0471, + "step": 20800 + }, + { + "epoch": 29.89, + "eval_loss": 0.1404000222682953, + "eval_runtime": 41.0194, + "eval_samples_per_second": 11.141, + "eval_steps_per_second": 1.414, + "eval_wer": 0.14711639813281133, + "step": 20800 + } + ], + "max_steps": 20880, + "num_train_epochs": 30, + "total_flos": 1.7201005515836912e+20, + "trial_name": null, + "trial_params": null +}