diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,13222 @@ +{ + "best_metric": 0.10748248671697858, + "best_model_checkpoint": "./wav2vec2-large-xlsr-53-german-cv13-restart/checkpoint-65220", + "epoch": 14.999885017822237, + "eval_steps": 500, + "global_step": 65220, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.01, + "learning_rate": 1.3323124042879019e-05, + "loss": 11.7551, + "step": 30 + }, + { + "epoch": 0.01, + "learning_rate": 2.5267993874425725e-05, + "loss": 13.2463, + "step": 60 + }, + { + "epoch": 0.02, + "learning_rate": 3.9050535987748854e-05, + "loss": 9.3024, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 5.283307810107197e-05, + "loss": 3.9605, + "step": 120 + }, + { + "epoch": 0.03, + "learning_rate": 6.66156202143951e-05, + "loss": 3.1293, + "step": 150 + }, + { + "epoch": 0.04, + "learning_rate": 8.039816232771821e-05, + "loss": 2.9889, + "step": 180 + }, + { + "epoch": 0.05, + "learning_rate": 9.418070444104134e-05, + "loss": 2.9889, + "step": 210 + }, + { + "epoch": 0.06, + "learning_rate": 0.00010796324655436447, + "loss": 2.9568, + "step": 240 + }, + { + "epoch": 0.06, + "learning_rate": 0.00012174578866768757, + "loss": 2.9741, + "step": 270 + }, + { + "epoch": 0.07, + "learning_rate": 0.0001355283307810107, + "loss": 2.9679, + "step": 300 + }, + { + "epoch": 0.08, + "learning_rate": 0.00014931087289433382, + "loss": 2.9437, + "step": 330 + }, + { + "epoch": 0.08, + "learning_rate": 0.00016309341500765696, + "loss": 2.928, + "step": 360 + }, + { + "epoch": 0.09, + "learning_rate": 0.00017687595712098005, + "loss": 2.8874, + "step": 390 + }, + { + "epoch": 0.1, + "learning_rate": 0.0001906584992343032, + "loss": 2.7554, + "step": 420 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002044410413476263, + "loss": 1.6682, + "step": 450 + }, + { + "epoch": 0.11, + "learning_rate": 0.00021822358346094942, + "loss": 0.7836, + "step": 480 + }, + { + "epoch": 0.12, + "learning_rate": 0.00023200612557427257, + "loss": 0.5938, + "step": 510 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002457886676875957, + "loss": 0.4396, + "step": 540 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002595712098009188, + "loss": 0.4354, + "step": 570 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002733537519142419, + "loss": 0.4037, + "step": 600 + }, + { + "epoch": 0.14, + "learning_rate": 0.00028713629402756506, + "loss": 0.3242, + "step": 630 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002999907073272724, + "loss": 0.3401, + "step": 660 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002998513172363591, + "loss": 0.3007, + "step": 690 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002997119271454458, + "loss": 0.3327, + "step": 720 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002995725370545325, + "loss": 0.3167, + "step": 750 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029943314696361916, + "loss": 0.2858, + "step": 780 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029929375687270585, + "loss": 0.2995, + "step": 810 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029915436678179254, + "loss": 0.2682, + "step": 840 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002990149766908792, + "loss": 0.2734, + "step": 870 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002988755865999659, + "loss": 0.2766, + "step": 900 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002987361965090526, + "loss": 0.2312, + "step": 930 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002985968064181393, + "loss": 0.2705, + "step": 960 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029845741632722597, + "loss": 0.2309, + "step": 990 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029831802623631265, + "loss": 0.2391, + "step": 1020 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029817863614539934, + "loss": 0.256, + "step": 1050 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029803924605448603, + "loss": 0.2233, + "step": 1080 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029789985596357266, + "loss": 0.2511, + "step": 1110 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029776046587265935, + "loss": 0.2155, + "step": 1140 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029762107578174603, + "loss": 0.2254, + "step": 1170 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002974816856908327, + "loss": 0.2429, + "step": 1200 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002973422955999194, + "loss": 0.2053, + "step": 1230 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002972029055090061, + "loss": 0.2326, + "step": 1260 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029706351541809283, + "loss": 0.2169, + "step": 1290 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002969241253271795, + "loss": 0.2168, + "step": 1320 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002967847352362662, + "loss": 0.2319, + "step": 1350 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002966453451453529, + "loss": 0.2023, + "step": 1380 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002965059550544396, + "loss": 0.2431, + "step": 1410 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029636656496352627, + "loss": 0.1865, + "step": 1440 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029622717487261295, + "loss": 0.2177, + "step": 1470 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002960877847816996, + "loss": 0.2291, + "step": 1500 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029594839469078627, + "loss": 0.1957, + "step": 1530 + }, + { + "epoch": 0.36, + "learning_rate": 0.00029580900459987296, + "loss": 0.2206, + "step": 1560 + }, + { + "epoch": 0.37, + "learning_rate": 0.00029566961450895965, + "loss": 0.1895, + "step": 1590 + }, + { + "epoch": 0.37, + "learning_rate": 0.00029553022441804633, + "loss": 0.1972, + "step": 1620 + }, + { + "epoch": 0.38, + "learning_rate": 0.000295390834327133, + "loss": 0.2147, + "step": 1650 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002952514442362197, + "loss": 0.183, + "step": 1680 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002951120541453064, + "loss": 0.2228, + "step": 1710 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002949726640543931, + "loss": 0.1752, + "step": 1740 + }, + { + "epoch": 0.41, + "learning_rate": 0.00029483327396347977, + "loss": 0.208, + "step": 1770 + }, + { + "epoch": 0.41, + "learning_rate": 0.00029469388387256645, + "loss": 0.2144, + "step": 1800 + }, + { + "epoch": 0.42, + "learning_rate": 0.00029455449378165314, + "loss": 0.1786, + "step": 1830 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002944151036907398, + "loss": 0.2043, + "step": 1860 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002942757135998265, + "loss": 0.1885, + "step": 1890 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002941363235089132, + "loss": 0.2034, + "step": 1920 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002939969334179999, + "loss": 0.2039, + "step": 1950 + }, + { + "epoch": 0.46, + "learning_rate": 0.00029385754332708657, + "loss": 0.1696, + "step": 1980 + }, + { + "epoch": 0.46, + "learning_rate": 0.00029371815323617326, + "loss": 0.2057, + "step": 2010 + }, + { + "epoch": 0.47, + "learning_rate": 0.00029357876314525994, + "loss": 0.176, + "step": 2040 + }, + { + "epoch": 0.48, + "learning_rate": 0.00029343937305434663, + "loss": 0.1952, + "step": 2070 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002932999829634333, + "loss": 0.2153, + "step": 2100 + }, + { + "epoch": 0.49, + "learning_rate": 0.00029316059287252, + "loss": 0.1689, + "step": 2130 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002930212027816067, + "loss": 0.1963, + "step": 2160 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002928818126906934, + "loss": 0.1792, + "step": 2190 + }, + { + "epoch": 0.51, + "learning_rate": 0.00029274242259978006, + "loss": 0.1861, + "step": 2220 + }, + { + "epoch": 0.52, + "learning_rate": 0.00029260303250886675, + "loss": 0.2035, + "step": 2250 + }, + { + "epoch": 0.52, + "learning_rate": 0.00029246364241795344, + "loss": 0.1723, + "step": 2280 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002923242523270401, + "loss": 0.1972, + "step": 2310 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002921848622361268, + "loss": 0.1818, + "step": 2340 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002920454721452135, + "loss": 0.1833, + "step": 2370 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002919060820543002, + "loss": 0.2019, + "step": 2400 + }, + { + "epoch": 0.56, + "learning_rate": 0.00029176669196338687, + "loss": 0.1673, + "step": 2430 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002916273018724735, + "loss": 0.1957, + "step": 2460 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002914879117815602, + "loss": 0.1636, + "step": 2490 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002913485216906469, + "loss": 0.1752, + "step": 2520 + }, + { + "epoch": 0.59, + "learning_rate": 0.00029120913159973356, + "loss": 0.1973, + "step": 2550 + }, + { + "epoch": 0.59, + "learning_rate": 0.00029106974150882025, + "loss": 0.1656, + "step": 2580 + }, + { + "epoch": 0.6, + "learning_rate": 0.00029093035141790693, + "loss": 0.1951, + "step": 2610 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002907909613269936, + "loss": 0.1662, + "step": 2640 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002906515712360803, + "loss": 0.1873, + "step": 2670 + }, + { + "epoch": 0.62, + "learning_rate": 0.000290512181145167, + "loss": 0.2026, + "step": 2700 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002903727910542537, + "loss": 0.1645, + "step": 2730 + }, + { + "epoch": 0.63, + "learning_rate": 0.00029023340096334037, + "loss": 0.1876, + "step": 2760 + }, + { + "epoch": 0.64, + "learning_rate": 0.00029009401087242705, + "loss": 0.172, + "step": 2790 + }, + { + "epoch": 0.65, + "learning_rate": 0.00028995462078151374, + "loss": 0.1864, + "step": 2820 + }, + { + "epoch": 0.66, + "learning_rate": 0.00028981523069060043, + "loss": 0.1838, + "step": 2850 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002896758405996871, + "loss": 0.162, + "step": 2880 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002895364505087738, + "loss": 0.1918, + "step": 2910 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002893970604178605, + "loss": 0.1659, + "step": 2940 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002892576703269472, + "loss": 0.1753, + "step": 2970 + }, + { + "epoch": 0.69, + "learning_rate": 0.00028911828023603386, + "loss": 0.1857, + "step": 3000 + }, + { + "epoch": 0.7, + "learning_rate": 0.00028897889014512055, + "loss": 0.1521, + "step": 3030 + }, + { + "epoch": 0.7, + "learning_rate": 0.00028883950005420723, + "loss": 0.1838, + "step": 3060 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002887001099632939, + "loss": 0.1675, + "step": 3090 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002885607198723806, + "loss": 0.1819, + "step": 3120 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002884213297814673, + "loss": 0.1906, + "step": 3150 + }, + { + "epoch": 0.73, + "learning_rate": 0.000288281939690554, + "loss": 0.1581, + "step": 3180 + }, + { + "epoch": 0.74, + "learning_rate": 0.00028814254959964067, + "loss": 0.1801, + "step": 3210 + }, + { + "epoch": 0.75, + "learning_rate": 0.00028800315950872735, + "loss": 0.1604, + "step": 3240 + }, + { + "epoch": 0.75, + "learning_rate": 0.00028786376941781404, + "loss": 0.1771, + "step": 3270 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002877243793269007, + "loss": 0.1866, + "step": 3300 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002875849892359874, + "loss": 0.1572, + "step": 3330 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002874455991450741, + "loss": 0.1898, + "step": 3360 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002873062090541608, + "loss": 0.1613, + "step": 3390 + }, + { + "epoch": 0.79, + "learning_rate": 0.00028716681896324747, + "loss": 0.175, + "step": 3420 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002870274288723341, + "loss": 0.1856, + "step": 3450 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002868880387814208, + "loss": 0.1499, + "step": 3480 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002867486486905075, + "loss": 0.1753, + "step": 3510 + }, + { + "epoch": 0.81, + "learning_rate": 0.00028660925859959416, + "loss": 0.1561, + "step": 3540 + }, + { + "epoch": 0.82, + "learning_rate": 0.00028646986850868085, + "loss": 0.1789, + "step": 3570 + }, + { + "epoch": 0.83, + "learning_rate": 0.00028633047841776754, + "loss": 0.1867, + "step": 3600 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002861910883268542, + "loss": 0.1538, + "step": 3630 + }, + { + "epoch": 0.84, + "learning_rate": 0.00028605169823594097, + "loss": 0.1819, + "step": 3660 + }, + { + "epoch": 0.85, + "learning_rate": 0.00028591230814502765, + "loss": 0.1655, + "step": 3690 + }, + { + "epoch": 0.86, + "learning_rate": 0.00028577291805411434, + "loss": 0.1677, + "step": 3720 + }, + { + "epoch": 0.86, + "learning_rate": 0.000285633527963201, + "loss": 0.1787, + "step": 3750 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002854941378722877, + "loss": 0.1477, + "step": 3780 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002853547477813744, + "loss": 0.1796, + "step": 3810 + }, + { + "epoch": 0.88, + "learning_rate": 0.00028521535769046103, + "loss": 0.1561, + "step": 3840 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002850759675995477, + "loss": 0.1713, + "step": 3870 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002849365775086344, + "loss": 0.1924, + "step": 3900 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002847971874177211, + "loss": 0.1541, + "step": 3930 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002846577973268078, + "loss": 0.1799, + "step": 3960 + }, + { + "epoch": 0.92, + "learning_rate": 0.00028451840723589446, + "loss": 0.1572, + "step": 3990 + }, + { + "epoch": 0.92, + "learning_rate": 0.00028437901714498115, + "loss": 0.166, + "step": 4020 + }, + { + "epoch": 0.93, + "learning_rate": 0.00028423962705406784, + "loss": 0.1849, + "step": 4050 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002841002369631545, + "loss": 0.1518, + "step": 4080 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002839608468722412, + "loss": 0.1801, + "step": 4110 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002838214567813279, + "loss": 0.1619, + "step": 4140 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002836820666904146, + "loss": 0.171, + "step": 4170 + }, + { + "epoch": 0.97, + "learning_rate": 0.00028354267659950127, + "loss": 0.1812, + "step": 4200 + }, + { + "epoch": 0.97, + "learning_rate": 0.00028340328650858796, + "loss": 0.1522, + "step": 4230 + }, + { + "epoch": 0.98, + "learning_rate": 0.00028326389641767464, + "loss": 0.1817, + "step": 4260 + }, + { + "epoch": 0.99, + "learning_rate": 0.00028312450632676133, + "loss": 0.1521, + "step": 4290 + }, + { + "epoch": 0.99, + "learning_rate": 0.000282985116235848, + "loss": 0.1679, + "step": 4320 + }, + { + "epoch": 1.0, + "eval_cer": 0.04590986454861357, + "eval_loss": 0.16172531247138977, + "eval_runtime": 407.0434, + "eval_samples_per_second": 39.659, + "eval_steps_per_second": 2.479, + "eval_wer": 0.17069274763951403, + "step": 4348 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002828457261449347, + "loss": 0.1773, + "step": 4350 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002827063360540214, + "loss": 0.1418, + "step": 4380 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002825669459631081, + "loss": 0.1615, + "step": 4410 + }, + { + "epoch": 1.02, + "learning_rate": 0.00028242755587219476, + "loss": 0.1501, + "step": 4440 + }, + { + "epoch": 1.03, + "learning_rate": 0.00028228816578128145, + "loss": 0.1594, + "step": 4470 + }, + { + "epoch": 1.03, + "learning_rate": 0.00028214877569036814, + "loss": 0.1696, + "step": 4500 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002820093855994548, + "loss": 0.1389, + "step": 4530 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002818699955085415, + "loss": 0.1649, + "step": 4560 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002817306054176282, + "loss": 0.1521, + "step": 4590 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002815912153267149, + "loss": 0.1489, + "step": 4620 + }, + { + "epoch": 1.07, + "learning_rate": 0.00028145182523580157, + "loss": 0.1678, + "step": 4650 + }, + { + "epoch": 1.08, + "learning_rate": 0.00028131243514488825, + "loss": 0.1357, + "step": 4680 + }, + { + "epoch": 1.08, + "learning_rate": 0.00028117304505397494, + "loss": 0.1749, + "step": 4710 + }, + { + "epoch": 1.09, + "learning_rate": 0.00028103365496306163, + "loss": 0.155, + "step": 4740 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002808942648721483, + "loss": 0.1549, + "step": 4770 + }, + { + "epoch": 1.1, + "learning_rate": 0.00028075487478123495, + "loss": 0.1729, + "step": 4800 + }, + { + "epoch": 1.11, + "learning_rate": 0.00028061548469032163, + "loss": 0.14, + "step": 4830 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002804760945994083, + "loss": 0.1599, + "step": 4860 + }, + { + "epoch": 1.12, + "learning_rate": 0.000280336704508495, + "loss": 0.1453, + "step": 4890 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002801973144175817, + "loss": 0.1556, + "step": 4920 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002800579243266684, + "loss": 0.169, + "step": 4950 + }, + { + "epoch": 1.15, + "learning_rate": 0.00027991853423575507, + "loss": 0.141, + "step": 4980 + }, + { + "epoch": 1.15, + "learning_rate": 0.00027977914414484175, + "loss": 0.1719, + "step": 5010 + }, + { + "epoch": 1.16, + "learning_rate": 0.00027963975405392844, + "loss": 0.15, + "step": 5040 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002795003639630151, + "loss": 0.1633, + "step": 5070 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002793609738721018, + "loss": 0.1665, + "step": 5100 + }, + { + "epoch": 1.18, + "learning_rate": 0.0002792215837811885, + "loss": 0.139, + "step": 5130 + }, + { + "epoch": 1.19, + "learning_rate": 0.0002790821936902752, + "loss": 0.1681, + "step": 5160 + }, + { + "epoch": 1.19, + "learning_rate": 0.00027894280359936187, + "loss": 0.14, + "step": 5190 + }, + { + "epoch": 1.2, + "learning_rate": 0.00027880341350844856, + "loss": 0.1487, + "step": 5220 + }, + { + "epoch": 1.21, + "learning_rate": 0.00027866402341753525, + "loss": 0.1599, + "step": 5250 + }, + { + "epoch": 1.21, + "learning_rate": 0.00027852463332662193, + "loss": 0.1386, + "step": 5280 + }, + { + "epoch": 1.22, + "learning_rate": 0.0002783852432357086, + "loss": 0.163, + "step": 5310 + }, + { + "epoch": 1.23, + "learning_rate": 0.0002782458531447953, + "loss": 0.1486, + "step": 5340 + }, + { + "epoch": 1.23, + "learning_rate": 0.000278106463053882, + "loss": 0.16, + "step": 5370 + }, + { + "epoch": 1.24, + "learning_rate": 0.0002779670729629687, + "loss": 0.165, + "step": 5400 + }, + { + "epoch": 1.25, + "learning_rate": 0.00027782768287205536, + "loss": 0.1346, + "step": 5430 + }, + { + "epoch": 1.26, + "learning_rate": 0.00027768829278114205, + "loss": 0.1565, + "step": 5460 + }, + { + "epoch": 1.26, + "learning_rate": 0.00027754890269022874, + "loss": 0.1506, + "step": 5490 + }, + { + "epoch": 1.27, + "learning_rate": 0.0002774095125993154, + "loss": 0.1577, + "step": 5520 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002772701225084021, + "loss": 0.1642, + "step": 5550 + }, + { + "epoch": 1.28, + "learning_rate": 0.0002771307324174888, + "loss": 0.1281, + "step": 5580 + }, + { + "epoch": 1.29, + "learning_rate": 0.0002769913423265755, + "loss": 0.1668, + "step": 5610 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027685195223566217, + "loss": 0.1422, + "step": 5640 + }, + { + "epoch": 1.3, + "learning_rate": 0.00027671256214474886, + "loss": 0.1474, + "step": 5670 + }, + { + "epoch": 1.31, + "learning_rate": 0.00027657317205383554, + "loss": 0.1613, + "step": 5700 + }, + { + "epoch": 1.32, + "learning_rate": 0.00027643378196292223, + "loss": 0.1326, + "step": 5730 + }, + { + "epoch": 1.32, + "learning_rate": 0.0002762943918720089, + "loss": 0.1601, + "step": 5760 + }, + { + "epoch": 1.33, + "learning_rate": 0.00027615500178109555, + "loss": 0.1441, + "step": 5790 + }, + { + "epoch": 1.34, + "learning_rate": 0.00027601561169018224, + "loss": 0.1467, + "step": 5820 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002758762215992689, + "loss": 0.1771, + "step": 5850 + }, + { + "epoch": 1.35, + "learning_rate": 0.0002757368315083556, + "loss": 0.1377, + "step": 5880 + }, + { + "epoch": 1.36, + "learning_rate": 0.0002755974414174423, + "loss": 0.1598, + "step": 5910 + }, + { + "epoch": 1.37, + "learning_rate": 0.000275458051326529, + "loss": 0.1478, + "step": 5940 + }, + { + "epoch": 1.37, + "learning_rate": 0.00027531866123561567, + "loss": 0.1617, + "step": 5970 + }, + { + "epoch": 1.38, + "learning_rate": 0.00027517927114470236, + "loss": 0.166, + "step": 6000 + }, + { + "epoch": 1.39, + "learning_rate": 0.0002750398810537891, + "loss": 0.1406, + "step": 6030 + }, + { + "epoch": 1.39, + "learning_rate": 0.0002749004909628758, + "loss": 0.1657, + "step": 6060 + }, + { + "epoch": 1.4, + "learning_rate": 0.00027476110087196247, + "loss": 0.1458, + "step": 6090 + }, + { + "epoch": 1.41, + "learning_rate": 0.00027462171078104916, + "loss": 0.1534, + "step": 6120 + }, + { + "epoch": 1.41, + "learning_rate": 0.0002744823206901358, + "loss": 0.1643, + "step": 6150 + }, + { + "epoch": 1.42, + "learning_rate": 0.0002743429305992225, + "loss": 0.1355, + "step": 6180 + }, + { + "epoch": 1.43, + "learning_rate": 0.00027420354050830916, + "loss": 0.1602, + "step": 6210 + }, + { + "epoch": 1.43, + "learning_rate": 0.00027406415041739585, + "loss": 0.1492, + "step": 6240 + }, + { + "epoch": 1.44, + "learning_rate": 0.00027392476032648253, + "loss": 0.1487, + "step": 6270 + }, + { + "epoch": 1.45, + "learning_rate": 0.0002737853702355692, + "loss": 0.174, + "step": 6300 + }, + { + "epoch": 1.46, + "learning_rate": 0.0002736459801446559, + "loss": 0.1297, + "step": 6330 + }, + { + "epoch": 1.46, + "learning_rate": 0.0002735065900537426, + "loss": 0.1561, + "step": 6360 + }, + { + "epoch": 1.47, + "learning_rate": 0.0002733671999628293, + "loss": 0.147, + "step": 6390 + }, + { + "epoch": 1.48, + "learning_rate": 0.00027322780987191597, + "loss": 0.1556, + "step": 6420 + }, + { + "epoch": 1.48, + "learning_rate": 0.00027308841978100265, + "loss": 0.1579, + "step": 6450 + }, + { + "epoch": 1.49, + "learning_rate": 0.00027294902969008934, + "loss": 0.1379, + "step": 6480 + }, + { + "epoch": 1.5, + "learning_rate": 0.00027280963959917603, + "loss": 0.1619, + "step": 6510 + }, + { + "epoch": 1.5, + "learning_rate": 0.0002726702495082627, + "loss": 0.1448, + "step": 6540 + }, + { + "epoch": 1.51, + "learning_rate": 0.0002725308594173494, + "loss": 0.152, + "step": 6570 + }, + { + "epoch": 1.52, + "learning_rate": 0.0002723914693264361, + "loss": 0.1583, + "step": 6600 + }, + { + "epoch": 1.52, + "learning_rate": 0.0002722520792355228, + "loss": 0.1336, + "step": 6630 + }, + { + "epoch": 1.53, + "learning_rate": 0.00027211268914460946, + "loss": 0.1543, + "step": 6660 + }, + { + "epoch": 1.54, + "learning_rate": 0.00027197329905369615, + "loss": 0.1439, + "step": 6690 + }, + { + "epoch": 1.55, + "learning_rate": 0.00027183390896278283, + "loss": 0.1503, + "step": 6720 + }, + { + "epoch": 1.55, + "learning_rate": 0.0002716945188718695, + "loss": 0.1705, + "step": 6750 + }, + { + "epoch": 1.56, + "learning_rate": 0.00027155512878095615, + "loss": 0.1433, + "step": 6780 + }, + { + "epoch": 1.57, + "learning_rate": 0.00027141573869004284, + "loss": 0.1651, + "step": 6810 + }, + { + "epoch": 1.57, + "learning_rate": 0.0002712763485991296, + "loss": 0.144, + "step": 6840 + }, + { + "epoch": 1.58, + "learning_rate": 0.00027113695850821627, + "loss": 0.1622, + "step": 6870 + }, + { + "epoch": 1.59, + "learning_rate": 0.00027099756841730295, + "loss": 0.1592, + "step": 6900 + }, + { + "epoch": 1.59, + "learning_rate": 0.00027085817832638964, + "loss": 0.1318, + "step": 6930 + }, + { + "epoch": 1.6, + "learning_rate": 0.0002707187882354763, + "loss": 0.1598, + "step": 6960 + }, + { + "epoch": 1.61, + "learning_rate": 0.000270579398144563, + "loss": 0.1384, + "step": 6990 + }, + { + "epoch": 1.61, + "learning_rate": 0.0002704400080536497, + "loss": 0.154, + "step": 7020 + }, + { + "epoch": 1.62, + "learning_rate": 0.0002703006179627364, + "loss": 0.1596, + "step": 7050 + }, + { + "epoch": 1.63, + "learning_rate": 0.00027016122787182307, + "loss": 0.1306, + "step": 7080 + }, + { + "epoch": 1.64, + "learning_rate": 0.00027002183778090976, + "loss": 0.1588, + "step": 7110 + }, + { + "epoch": 1.64, + "learning_rate": 0.0002698824476899964, + "loss": 0.1342, + "step": 7140 + }, + { + "epoch": 1.65, + "learning_rate": 0.0002697430575990831, + "loss": 0.147, + "step": 7170 + }, + { + "epoch": 1.66, + "learning_rate": 0.00026960366750816976, + "loss": 0.1626, + "step": 7200 + }, + { + "epoch": 1.66, + "learning_rate": 0.00026946427741725645, + "loss": 0.1314, + "step": 7230 + }, + { + "epoch": 1.67, + "learning_rate": 0.00026932488732634314, + "loss": 0.1739, + "step": 7260 + }, + { + "epoch": 1.68, + "learning_rate": 0.0002691854972354298, + "loss": 0.142, + "step": 7290 + }, + { + "epoch": 1.68, + "learning_rate": 0.0002690461071445165, + "loss": 0.1623, + "step": 7320 + }, + { + "epoch": 1.69, + "learning_rate": 0.0002689067170536032, + "loss": 0.1606, + "step": 7350 + }, + { + "epoch": 1.7, + "learning_rate": 0.0002687673269626899, + "loss": 0.1391, + "step": 7380 + }, + { + "epoch": 1.7, + "learning_rate": 0.00026862793687177657, + "loss": 0.1631, + "step": 7410 + }, + { + "epoch": 1.71, + "learning_rate": 0.00026848854678086326, + "loss": 0.1428, + "step": 7440 + }, + { + "epoch": 1.72, + "learning_rate": 0.00026834915668994994, + "loss": 0.1546, + "step": 7470 + }, + { + "epoch": 1.72, + "learning_rate": 0.00026820976659903663, + "loss": 0.1639, + "step": 7500 + }, + { + "epoch": 1.73, + "learning_rate": 0.0002680703765081233, + "loss": 0.1296, + "step": 7530 + }, + { + "epoch": 1.74, + "learning_rate": 0.00026793098641721, + "loss": 0.1643, + "step": 7560 + }, + { + "epoch": 1.75, + "learning_rate": 0.0002677915963262967, + "loss": 0.141, + "step": 7590 + }, + { + "epoch": 1.75, + "learning_rate": 0.0002676522062353834, + "loss": 0.1596, + "step": 7620 + }, + { + "epoch": 1.76, + "learning_rate": 0.00026751281614447006, + "loss": 0.1555, + "step": 7650 + }, + { + "epoch": 1.77, + "learning_rate": 0.00026737342605355675, + "loss": 0.1275, + "step": 7680 + }, + { + "epoch": 1.77, + "learning_rate": 0.00026723403596264344, + "loss": 0.159, + "step": 7710 + }, + { + "epoch": 1.78, + "learning_rate": 0.0002670946458717301, + "loss": 0.1444, + "step": 7740 + }, + { + "epoch": 1.79, + "learning_rate": 0.0002669552557808168, + "loss": 0.145, + "step": 7770 + }, + { + "epoch": 1.79, + "learning_rate": 0.0002668158656899035, + "loss": 0.1585, + "step": 7800 + }, + { + "epoch": 1.8, + "learning_rate": 0.0002666764755989902, + "loss": 0.1342, + "step": 7830 + }, + { + "epoch": 1.81, + "learning_rate": 0.00026653708550807687, + "loss": 0.1548, + "step": 7860 + }, + { + "epoch": 1.81, + "learning_rate": 0.00026639769541716356, + "loss": 0.1427, + "step": 7890 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026625830532625024, + "loss": 0.1545, + "step": 7920 + }, + { + "epoch": 1.83, + "learning_rate": 0.00026611891523533693, + "loss": 0.1659, + "step": 7950 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002659795251444236, + "loss": 0.1376, + "step": 7980 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002658401350535103, + "loss": 0.1627, + "step": 8010 + }, + { + "epoch": 1.85, + "learning_rate": 0.000265700744962597, + "loss": 0.1384, + "step": 8040 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002655613548716837, + "loss": 0.1481, + "step": 8070 + }, + { + "epoch": 1.86, + "learning_rate": 0.00026542196478077036, + "loss": 0.1622, + "step": 8100 + }, + { + "epoch": 1.87, + "learning_rate": 0.000265282574689857, + "loss": 0.1408, + "step": 8130 + }, + { + "epoch": 1.88, + "learning_rate": 0.0002651431845989437, + "loss": 0.1654, + "step": 8160 + }, + { + "epoch": 1.88, + "learning_rate": 0.00026500379450803037, + "loss": 0.141, + "step": 8190 + }, + { + "epoch": 1.89, + "learning_rate": 0.00026486440441711705, + "loss": 0.1518, + "step": 8220 + }, + { + "epoch": 1.9, + "learning_rate": 0.00026472501432620374, + "loss": 0.176, + "step": 8250 + }, + { + "epoch": 1.9, + "learning_rate": 0.0002645856242352904, + "loss": 0.14, + "step": 8280 + }, + { + "epoch": 1.91, + "learning_rate": 0.0002644462341443771, + "loss": 0.171, + "step": 8310 + }, + { + "epoch": 1.92, + "learning_rate": 0.0002643068440534638, + "loss": 0.1492, + "step": 8340 + }, + { + "epoch": 1.92, + "learning_rate": 0.0002641674539625505, + "loss": 0.1592, + "step": 8370 + }, + { + "epoch": 1.93, + "learning_rate": 0.0002640280638716372, + "loss": 0.1694, + "step": 8400 + }, + { + "epoch": 1.94, + "learning_rate": 0.0002638886737807239, + "loss": 0.1356, + "step": 8430 + }, + { + "epoch": 1.95, + "learning_rate": 0.0002637492836898106, + "loss": 0.1622, + "step": 8460 + }, + { + "epoch": 1.95, + "learning_rate": 0.00026360989359889723, + "loss": 0.1416, + "step": 8490 + }, + { + "epoch": 1.96, + "learning_rate": 0.0002634705035079839, + "loss": 0.1523, + "step": 8520 + }, + { + "epoch": 1.97, + "learning_rate": 0.0002633311134170706, + "loss": 0.1546, + "step": 8550 + }, + { + "epoch": 1.97, + "learning_rate": 0.0002631917233261573, + "loss": 0.1366, + "step": 8580 + }, + { + "epoch": 1.98, + "learning_rate": 0.000263052333235244, + "loss": 0.1535, + "step": 8610 + }, + { + "epoch": 1.99, + "learning_rate": 0.00026291294314433067, + "loss": 0.1446, + "step": 8640 + }, + { + "epoch": 1.99, + "learning_rate": 0.00026277355305341735, + "loss": 0.1597, + "step": 8670 + }, + { + "epoch": 2.0, + "eval_cer": 0.0479201632665926, + "eval_loss": 0.15922409296035767, + "eval_runtime": 417.0022, + "eval_samples_per_second": 38.712, + "eval_steps_per_second": 2.42, + "eval_wer": 0.1717350840976006, + "step": 8697 + }, + { + "epoch": 2.0, + "learning_rate": 0.00026263416296250404, + "loss": 0.1696, + "step": 8700 + }, + { + "epoch": 2.01, + "learning_rate": 0.0002624947728715907, + "loss": 0.1347, + "step": 8730 + }, + { + "epoch": 2.01, + "learning_rate": 0.0002623553827806774, + "loss": 0.1478, + "step": 8760 + }, + { + "epoch": 2.02, + "learning_rate": 0.0002622159926897641, + "loss": 0.1478, + "step": 8790 + }, + { + "epoch": 2.03, + "learning_rate": 0.0002620766025988508, + "loss": 0.1405, + "step": 8820 + }, + { + "epoch": 2.04, + "learning_rate": 0.00026193721250793747, + "loss": 0.1594, + "step": 8850 + }, + { + "epoch": 2.04, + "learning_rate": 0.00026179782241702416, + "loss": 0.1238, + "step": 8880 + }, + { + "epoch": 2.05, + "learning_rate": 0.00026165843232611085, + "loss": 0.1452, + "step": 8910 + }, + { + "epoch": 2.06, + "learning_rate": 0.00026151904223519753, + "loss": 0.135, + "step": 8940 + }, + { + "epoch": 2.06, + "learning_rate": 0.0002613796521442842, + "loss": 0.1339, + "step": 8970 + }, + { + "epoch": 2.07, + "learning_rate": 0.0002612402620533709, + "loss": 0.1497, + "step": 9000 + }, + { + "epoch": 2.08, + "learning_rate": 0.0002611008719624576, + "loss": 0.1253, + "step": 9030 + }, + { + "epoch": 2.08, + "learning_rate": 0.0002609614818715443, + "loss": 0.1525, + "step": 9060 + }, + { + "epoch": 2.09, + "learning_rate": 0.0002608220917806309, + "loss": 0.1339, + "step": 9090 + }, + { + "epoch": 2.1, + "learning_rate": 0.0002606827016897176, + "loss": 0.1482, + "step": 9120 + }, + { + "epoch": 2.1, + "learning_rate": 0.0002605433115988043, + "loss": 0.1467, + "step": 9150 + }, + { + "epoch": 2.11, + "learning_rate": 0.00026040392150789097, + "loss": 0.1234, + "step": 9180 + }, + { + "epoch": 2.12, + "learning_rate": 0.0002602645314169777, + "loss": 0.1478, + "step": 9210 + }, + { + "epoch": 2.12, + "learning_rate": 0.0002601251413260644, + "loss": 0.1393, + "step": 9240 + }, + { + "epoch": 2.13, + "learning_rate": 0.0002599857512351511, + "loss": 0.1405, + "step": 9270 + }, + { + "epoch": 2.14, + "learning_rate": 0.00025984636114423777, + "loss": 0.1591, + "step": 9300 + }, + { + "epoch": 2.15, + "learning_rate": 0.00025970697105332446, + "loss": 0.1247, + "step": 9330 + }, + { + "epoch": 2.15, + "learning_rate": 0.00025956758096241114, + "loss": 0.1448, + "step": 9360 + }, + { + "epoch": 2.16, + "learning_rate": 0.00025942819087149783, + "loss": 0.1393, + "step": 9390 + }, + { + "epoch": 2.17, + "learning_rate": 0.0002592888007805845, + "loss": 0.1469, + "step": 9420 + }, + { + "epoch": 2.17, + "learning_rate": 0.0002591494106896712, + "loss": 0.1552, + "step": 9450 + }, + { + "epoch": 2.18, + "learning_rate": 0.00025901002059875784, + "loss": 0.1268, + "step": 9480 + }, + { + "epoch": 2.19, + "learning_rate": 0.0002588706305078445, + "loss": 0.1569, + "step": 9510 + }, + { + "epoch": 2.19, + "learning_rate": 0.0002587312404169312, + "loss": 0.1395, + "step": 9540 + }, + { + "epoch": 2.2, + "learning_rate": 0.0002585918503260179, + "loss": 0.1458, + "step": 9570 + }, + { + "epoch": 2.21, + "learning_rate": 0.0002584524602351046, + "loss": 0.1538, + "step": 9600 + }, + { + "epoch": 2.21, + "learning_rate": 0.00025831307014419127, + "loss": 0.1304, + "step": 9630 + }, + { + "epoch": 2.22, + "learning_rate": 0.00025817368005327796, + "loss": 0.1497, + "step": 9660 + }, + { + "epoch": 2.23, + "learning_rate": 0.00025803428996236464, + "loss": 0.1443, + "step": 9690 + }, + { + "epoch": 2.24, + "learning_rate": 0.00025789489987145133, + "loss": 0.1477, + "step": 9720 + }, + { + "epoch": 2.24, + "learning_rate": 0.000257755509780538, + "loss": 0.1605, + "step": 9750 + }, + { + "epoch": 2.25, + "learning_rate": 0.0002576161196896247, + "loss": 0.1327, + "step": 9780 + }, + { + "epoch": 2.26, + "learning_rate": 0.0002574767295987114, + "loss": 0.1493, + "step": 9810 + }, + { + "epoch": 2.26, + "learning_rate": 0.0002573373395077981, + "loss": 0.1435, + "step": 9840 + }, + { + "epoch": 2.27, + "learning_rate": 0.00025719794941688476, + "loss": 0.1436, + "step": 9870 + }, + { + "epoch": 2.28, + "learning_rate": 0.00025705855932597145, + "loss": 0.1518, + "step": 9900 + }, + { + "epoch": 2.28, + "learning_rate": 0.00025691916923505813, + "loss": 0.126, + "step": 9930 + }, + { + "epoch": 2.29, + "learning_rate": 0.0002567797791441448, + "loss": 0.1492, + "step": 9960 + }, + { + "epoch": 2.3, + "learning_rate": 0.0002566403890532315, + "loss": 0.1344, + "step": 9990 + }, + { + "epoch": 2.3, + "learning_rate": 0.0002565009989623182, + "loss": 0.1413, + "step": 10020 + }, + { + "epoch": 2.31, + "learning_rate": 0.0002563616088714049, + "loss": 0.1554, + "step": 10050 + }, + { + "epoch": 2.32, + "learning_rate": 0.00025622221878049157, + "loss": 0.13, + "step": 10080 + }, + { + "epoch": 2.32, + "learning_rate": 0.00025608282868957825, + "loss": 0.1501, + "step": 10110 + }, + { + "epoch": 2.33, + "learning_rate": 0.00025594343859866494, + "loss": 0.143, + "step": 10140 + }, + { + "epoch": 2.34, + "learning_rate": 0.00025580404850775163, + "loss": 0.1468, + "step": 10170 + }, + { + "epoch": 2.35, + "learning_rate": 0.0002556646584168383, + "loss": 0.1568, + "step": 10200 + }, + { + "epoch": 2.35, + "learning_rate": 0.000255525268325925, + "loss": 0.1253, + "step": 10230 + }, + { + "epoch": 2.36, + "learning_rate": 0.0002553858782350117, + "loss": 0.1488, + "step": 10260 + }, + { + "epoch": 2.37, + "learning_rate": 0.0002552464881440984, + "loss": 0.1333, + "step": 10290 + }, + { + "epoch": 2.37, + "learning_rate": 0.00025510709805318506, + "loss": 0.135, + "step": 10320 + }, + { + "epoch": 2.38, + "learning_rate": 0.00025496770796227175, + "loss": 0.1518, + "step": 10350 + }, + { + "epoch": 2.39, + "learning_rate": 0.00025482831787135843, + "loss": 0.1169, + "step": 10380 + }, + { + "epoch": 2.39, + "learning_rate": 0.0002546889277804451, + "loss": 0.1492, + "step": 10410 + }, + { + "epoch": 2.4, + "learning_rate": 0.0002545495376895318, + "loss": 0.1319, + "step": 10440 + }, + { + "epoch": 2.41, + "learning_rate": 0.00025441014759861844, + "loss": 0.1432, + "step": 10470 + }, + { + "epoch": 2.41, + "learning_rate": 0.0002542707575077051, + "loss": 0.1455, + "step": 10500 + }, + { + "epoch": 2.42, + "learning_rate": 0.0002541313674167918, + "loss": 0.1298, + "step": 10530 + }, + { + "epoch": 2.43, + "learning_rate": 0.0002539919773258785, + "loss": 0.1493, + "step": 10560 + }, + { + "epoch": 2.44, + "learning_rate": 0.0002538525872349652, + "loss": 0.136, + "step": 10590 + }, + { + "epoch": 2.44, + "learning_rate": 0.00025371319714405187, + "loss": 0.14, + "step": 10620 + }, + { + "epoch": 2.45, + "learning_rate": 0.00025357380705313856, + "loss": 0.1489, + "step": 10650 + }, + { + "epoch": 2.46, + "learning_rate": 0.00025343441696222524, + "loss": 0.1253, + "step": 10680 + }, + { + "epoch": 2.46, + "learning_rate": 0.00025329502687131193, + "loss": 0.1498, + "step": 10710 + }, + { + "epoch": 2.47, + "learning_rate": 0.0002531556367803986, + "loss": 0.141, + "step": 10740 + }, + { + "epoch": 2.48, + "learning_rate": 0.0002530162466894853, + "loss": 0.1389, + "step": 10770 + }, + { + "epoch": 2.48, + "learning_rate": 0.00025287685659857205, + "loss": 0.1601, + "step": 10800 + }, + { + "epoch": 2.49, + "learning_rate": 0.0002527374665076587, + "loss": 0.1304, + "step": 10830 + }, + { + "epoch": 2.5, + "learning_rate": 0.00025259807641674536, + "loss": 0.1467, + "step": 10860 + }, + { + "epoch": 2.5, + "learning_rate": 0.00025245868632583205, + "loss": 0.1435, + "step": 10890 + }, + { + "epoch": 2.51, + "learning_rate": 0.00025231929623491874, + "loss": 0.1401, + "step": 10920 + }, + { + "epoch": 2.52, + "learning_rate": 0.0002521799061440054, + "loss": 0.1479, + "step": 10950 + }, + { + "epoch": 2.53, + "learning_rate": 0.0002520405160530921, + "loss": 0.1267, + "step": 10980 + }, + { + "epoch": 2.53, + "learning_rate": 0.0002519011259621788, + "loss": 0.1487, + "step": 11010 + }, + { + "epoch": 2.54, + "learning_rate": 0.0002517617358712655, + "loss": 0.1344, + "step": 11040 + }, + { + "epoch": 2.55, + "learning_rate": 0.00025162234578035217, + "loss": 0.1386, + "step": 11070 + }, + { + "epoch": 2.55, + "learning_rate": 0.00025148295568943886, + "loss": 0.16, + "step": 11100 + }, + { + "epoch": 2.56, + "learning_rate": 0.00025134356559852554, + "loss": 0.1285, + "step": 11130 + }, + { + "epoch": 2.57, + "learning_rate": 0.00025120417550761223, + "loss": 0.1546, + "step": 11160 + }, + { + "epoch": 2.57, + "learning_rate": 0.0002510647854166989, + "loss": 0.1356, + "step": 11190 + }, + { + "epoch": 2.58, + "learning_rate": 0.0002509253953257856, + "loss": 0.1437, + "step": 11220 + }, + { + "epoch": 2.59, + "learning_rate": 0.0002507860052348723, + "loss": 0.1533, + "step": 11250 + }, + { + "epoch": 2.59, + "learning_rate": 0.000250646615143959, + "loss": 0.1282, + "step": 11280 + }, + { + "epoch": 2.6, + "learning_rate": 0.00025050722505304566, + "loss": 0.1442, + "step": 11310 + }, + { + "epoch": 2.61, + "learning_rate": 0.00025036783496213235, + "loss": 0.1316, + "step": 11340 + }, + { + "epoch": 2.61, + "learning_rate": 0.00025022844487121904, + "loss": 0.1356, + "step": 11370 + }, + { + "epoch": 2.62, + "learning_rate": 0.0002500890547803057, + "loss": 0.1512, + "step": 11400 + }, + { + "epoch": 2.63, + "learning_rate": 0.00024994966468939236, + "loss": 0.1246, + "step": 11430 + }, + { + "epoch": 2.64, + "learning_rate": 0.00024981027459847904, + "loss": 0.1367, + "step": 11460 + }, + { + "epoch": 2.64, + "learning_rate": 0.00024967088450756573, + "loss": 0.1235, + "step": 11490 + }, + { + "epoch": 2.65, + "learning_rate": 0.0002495314944166524, + "loss": 0.1304, + "step": 11520 + }, + { + "epoch": 2.66, + "learning_rate": 0.0002493921043257391, + "loss": 0.144, + "step": 11550 + }, + { + "epoch": 2.66, + "learning_rate": 0.00024925271423482584, + "loss": 0.1213, + "step": 11580 + }, + { + "epoch": 2.67, + "learning_rate": 0.00024911332414391253, + "loss": 0.1453, + "step": 11610 + }, + { + "epoch": 2.68, + "learning_rate": 0.0002489739340529992, + "loss": 0.1363, + "step": 11640 + }, + { + "epoch": 2.68, + "learning_rate": 0.0002488345439620859, + "loss": 0.142, + "step": 11670 + }, + { + "epoch": 2.69, + "learning_rate": 0.0002486951538711726, + "loss": 0.1441, + "step": 11700 + }, + { + "epoch": 2.7, + "learning_rate": 0.0002485557637802593, + "loss": 0.1215, + "step": 11730 + }, + { + "epoch": 2.7, + "learning_rate": 0.00024841637368934596, + "loss": 0.1424, + "step": 11760 + }, + { + "epoch": 2.71, + "learning_rate": 0.00024827698359843265, + "loss": 0.133, + "step": 11790 + }, + { + "epoch": 2.72, + "learning_rate": 0.0002481375935075193, + "loss": 0.1354, + "step": 11820 + }, + { + "epoch": 2.73, + "learning_rate": 0.00024799820341660597, + "loss": 0.1427, + "step": 11850 + }, + { + "epoch": 2.73, + "learning_rate": 0.00024785881332569265, + "loss": 0.1196, + "step": 11880 + }, + { + "epoch": 2.74, + "learning_rate": 0.00024771942323477934, + "loss": 0.1464, + "step": 11910 + }, + { + "epoch": 2.75, + "learning_rate": 0.000247580033143866, + "loss": 0.1277, + "step": 11940 + }, + { + "epoch": 2.75, + "learning_rate": 0.0002474406430529527, + "loss": 0.1343, + "step": 11970 + }, + { + "epoch": 2.76, + "learning_rate": 0.0002473012529620394, + "loss": 0.145, + "step": 12000 + }, + { + "epoch": 2.77, + "learning_rate": 0.0002471618628711261, + "loss": 0.1128, + "step": 12030 + }, + { + "epoch": 2.77, + "learning_rate": 0.0002470224727802128, + "loss": 0.1388, + "step": 12060 + }, + { + "epoch": 2.78, + "learning_rate": 0.00024688308268929946, + "loss": 0.1298, + "step": 12090 + }, + { + "epoch": 2.79, + "learning_rate": 0.00024674369259838615, + "loss": 0.1363, + "step": 12120 + }, + { + "epoch": 2.79, + "learning_rate": 0.00024660430250747283, + "loss": 0.1423, + "step": 12150 + }, + { + "epoch": 2.8, + "learning_rate": 0.0002464649124165595, + "loss": 0.1247, + "step": 12180 + }, + { + "epoch": 2.81, + "learning_rate": 0.0002463255223256462, + "loss": 0.1384, + "step": 12210 + }, + { + "epoch": 2.81, + "learning_rate": 0.0002461861322347329, + "loss": 0.1302, + "step": 12240 + }, + { + "epoch": 2.82, + "learning_rate": 0.0002460467421438196, + "loss": 0.1391, + "step": 12270 + }, + { + "epoch": 2.83, + "learning_rate": 0.00024590735205290627, + "loss": 0.148, + "step": 12300 + }, + { + "epoch": 2.84, + "learning_rate": 0.00024576796196199295, + "loss": 0.1214, + "step": 12330 + }, + { + "epoch": 2.84, + "learning_rate": 0.00024562857187107964, + "loss": 0.1391, + "step": 12360 + }, + { + "epoch": 2.85, + "learning_rate": 0.0002454891817801663, + "loss": 0.136, + "step": 12390 + }, + { + "epoch": 2.86, + "learning_rate": 0.000245349791689253, + "loss": 0.1336, + "step": 12420 + }, + { + "epoch": 2.86, + "learning_rate": 0.0002452104015983397, + "loss": 0.1418, + "step": 12450 + }, + { + "epoch": 2.87, + "learning_rate": 0.0002450710115074264, + "loss": 0.1181, + "step": 12480 + }, + { + "epoch": 2.88, + "learning_rate": 0.00024493162141651307, + "loss": 0.1403, + "step": 12510 + }, + { + "epoch": 2.88, + "learning_rate": 0.00024479223132559976, + "loss": 0.1335, + "step": 12540 + }, + { + "epoch": 2.89, + "learning_rate": 0.00024465284123468644, + "loss": 0.1325, + "step": 12570 + }, + { + "epoch": 2.9, + "learning_rate": 0.00024451345114377313, + "loss": 0.1511, + "step": 12600 + }, + { + "epoch": 2.9, + "learning_rate": 0.0002443740610528598, + "loss": 0.1149, + "step": 12630 + }, + { + "epoch": 2.91, + "learning_rate": 0.0002442346709619465, + "loss": 0.1513, + "step": 12660 + }, + { + "epoch": 2.92, + "learning_rate": 0.00024409528087103316, + "loss": 0.1323, + "step": 12690 + }, + { + "epoch": 2.93, + "learning_rate": 0.00024395589078011985, + "loss": 0.138, + "step": 12720 + }, + { + "epoch": 2.93, + "learning_rate": 0.00024381650068920654, + "loss": 0.1476, + "step": 12750 + }, + { + "epoch": 2.94, + "learning_rate": 0.00024367711059829322, + "loss": 0.1201, + "step": 12780 + }, + { + "epoch": 2.95, + "learning_rate": 0.0002435377205073799, + "loss": 0.1428, + "step": 12810 + }, + { + "epoch": 2.95, + "learning_rate": 0.0002433983304164666, + "loss": 0.1328, + "step": 12840 + }, + { + "epoch": 2.96, + "learning_rate": 0.00024325894032555328, + "loss": 0.1406, + "step": 12870 + }, + { + "epoch": 2.97, + "learning_rate": 0.00024311955023463997, + "loss": 0.1499, + "step": 12900 + }, + { + "epoch": 2.97, + "learning_rate": 0.00024298016014372663, + "loss": 0.1254, + "step": 12930 + }, + { + "epoch": 2.98, + "learning_rate": 0.00024284077005281332, + "loss": 0.1372, + "step": 12960 + }, + { + "epoch": 2.99, + "learning_rate": 0.0002427013799619, + "loss": 0.1315, + "step": 12990 + }, + { + "epoch": 2.99, + "learning_rate": 0.0002425619898709867, + "loss": 0.1364, + "step": 13020 + }, + { + "epoch": 3.0, + "eval_cer": 0.04246546738213996, + "eval_loss": 0.15239985287189484, + "eval_runtime": 415.2353, + "eval_samples_per_second": 38.877, + "eval_steps_per_second": 2.43, + "eval_wer": 0.1563369318758672, + "step": 13045 + }, + { + "epoch": 3.0, + "learning_rate": 0.00024242259978007338, + "loss": 0.1401, + "step": 13050 + }, + { + "epoch": 3.01, + "learning_rate": 0.00024228320968916006, + "loss": 0.1182, + "step": 13080 + }, + { + "epoch": 3.01, + "learning_rate": 0.00024214381959824675, + "loss": 0.1359, + "step": 13110 + }, + { + "epoch": 3.02, + "learning_rate": 0.00024200442950733344, + "loss": 0.1334, + "step": 13140 + }, + { + "epoch": 3.03, + "learning_rate": 0.00024186503941642015, + "loss": 0.1301, + "step": 13170 + }, + { + "epoch": 3.04, + "learning_rate": 0.00024172564932550684, + "loss": 0.141, + "step": 13200 + }, + { + "epoch": 3.04, + "learning_rate": 0.00024158625923459352, + "loss": 0.1143, + "step": 13230 + }, + { + "epoch": 3.05, + "learning_rate": 0.0002414468691436802, + "loss": 0.1405, + "step": 13260 + }, + { + "epoch": 3.06, + "learning_rate": 0.0002413074790527669, + "loss": 0.1268, + "step": 13290 + }, + { + "epoch": 3.06, + "learning_rate": 0.00024116808896185356, + "loss": 0.1315, + "step": 13320 + }, + { + "epoch": 3.07, + "learning_rate": 0.00024102869887094024, + "loss": 0.1412, + "step": 13350 + }, + { + "epoch": 3.08, + "learning_rate": 0.00024088930878002693, + "loss": 0.121, + "step": 13380 + }, + { + "epoch": 3.08, + "learning_rate": 0.00024074991868911361, + "loss": 0.1433, + "step": 13410 + }, + { + "epoch": 3.09, + "learning_rate": 0.0002406105285982003, + "loss": 0.1275, + "step": 13440 + }, + { + "epoch": 3.1, + "learning_rate": 0.000240471138507287, + "loss": 0.1317, + "step": 13470 + }, + { + "epoch": 3.1, + "learning_rate": 0.00024033174841637367, + "loss": 0.1392, + "step": 13500 + }, + { + "epoch": 3.11, + "learning_rate": 0.00024019235832546036, + "loss": 0.1188, + "step": 13530 + }, + { + "epoch": 3.12, + "learning_rate": 0.00024005296823454705, + "loss": 0.14, + "step": 13560 + }, + { + "epoch": 3.13, + "learning_rate": 0.00023991357814363373, + "loss": 0.1277, + "step": 13590 + }, + { + "epoch": 3.13, + "learning_rate": 0.0002397741880527204, + "loss": 0.1286, + "step": 13620 + }, + { + "epoch": 3.14, + "learning_rate": 0.00023963479796180708, + "loss": 0.1408, + "step": 13650 + }, + { + "epoch": 3.15, + "learning_rate": 0.00023949540787089377, + "loss": 0.1223, + "step": 13680 + }, + { + "epoch": 3.15, + "learning_rate": 0.00023935601777998045, + "loss": 0.1416, + "step": 13710 + }, + { + "epoch": 3.16, + "learning_rate": 0.00023921662768906714, + "loss": 0.1316, + "step": 13740 + }, + { + "epoch": 3.17, + "learning_rate": 0.00023907723759815383, + "loss": 0.1291, + "step": 13770 + }, + { + "epoch": 3.17, + "learning_rate": 0.0002389378475072405, + "loss": 0.1517, + "step": 13800 + }, + { + "epoch": 3.18, + "learning_rate": 0.0002387984574163272, + "loss": 0.1158, + "step": 13830 + }, + { + "epoch": 3.19, + "learning_rate": 0.0002386590673254139, + "loss": 0.135, + "step": 13860 + }, + { + "epoch": 3.19, + "learning_rate": 0.00023851967723450057, + "loss": 0.1312, + "step": 13890 + }, + { + "epoch": 3.2, + "learning_rate": 0.00023838028714358723, + "loss": 0.1295, + "step": 13920 + }, + { + "epoch": 3.21, + "learning_rate": 0.00023824089705267392, + "loss": 0.137, + "step": 13950 + }, + { + "epoch": 3.21, + "learning_rate": 0.00023810150696176063, + "loss": 0.1141, + "step": 13980 + }, + { + "epoch": 3.22, + "learning_rate": 0.00023796211687084732, + "loss": 0.1356, + "step": 14010 + }, + { + "epoch": 3.23, + "learning_rate": 0.000237822726779934, + "loss": 0.1314, + "step": 14040 + }, + { + "epoch": 3.24, + "learning_rate": 0.0002376833366890207, + "loss": 0.1332, + "step": 14070 + }, + { + "epoch": 3.24, + "learning_rate": 0.00023754394659810738, + "loss": 0.1464, + "step": 14100 + }, + { + "epoch": 3.25, + "learning_rate": 0.00023740455650719407, + "loss": 0.1175, + "step": 14130 + }, + { + "epoch": 3.26, + "learning_rate": 0.00023726516641628075, + "loss": 0.1396, + "step": 14160 + }, + { + "epoch": 3.26, + "learning_rate": 0.00023712577632536744, + "loss": 0.131, + "step": 14190 + }, + { + "epoch": 3.27, + "learning_rate": 0.00023698638623445413, + "loss": 0.1272, + "step": 14220 + }, + { + "epoch": 3.28, + "learning_rate": 0.0002368516424799046, + "loss": 0.1469, + "step": 14250 + }, + { + "epoch": 3.28, + "learning_rate": 0.00023671225238899128, + "loss": 0.1162, + "step": 14280 + }, + { + "epoch": 3.29, + "learning_rate": 0.00023657286229807796, + "loss": 0.1367, + "step": 14310 + }, + { + "epoch": 3.3, + "learning_rate": 0.00023643347220716465, + "loss": 0.1282, + "step": 14340 + }, + { + "epoch": 3.3, + "learning_rate": 0.00023629408211625134, + "loss": 0.1297, + "step": 14370 + }, + { + "epoch": 3.31, + "learning_rate": 0.00023615469202533802, + "loss": 0.1379, + "step": 14400 + }, + { + "epoch": 3.32, + "learning_rate": 0.00023601530193442468, + "loss": 0.1248, + "step": 14430 + }, + { + "epoch": 3.33, + "learning_rate": 0.00023587591184351137, + "loss": 0.1333, + "step": 14460 + }, + { + "epoch": 3.33, + "learning_rate": 0.00023573652175259806, + "loss": 0.1252, + "step": 14490 + }, + { + "epoch": 3.34, + "learning_rate": 0.00023559713166168474, + "loss": 0.1234, + "step": 14520 + }, + { + "epoch": 3.35, + "learning_rate": 0.00023545774157077143, + "loss": 0.1423, + "step": 14550 + }, + { + "epoch": 3.35, + "learning_rate": 0.00023531835147985812, + "loss": 0.1199, + "step": 14580 + }, + { + "epoch": 3.36, + "learning_rate": 0.0002351789613889448, + "loss": 0.1241, + "step": 14610 + }, + { + "epoch": 3.37, + "learning_rate": 0.0002350395712980315, + "loss": 0.126, + "step": 14640 + }, + { + "epoch": 3.37, + "learning_rate": 0.00023490018120711818, + "loss": 0.1266, + "step": 14670 + }, + { + "epoch": 3.38, + "learning_rate": 0.00023476079111620486, + "loss": 0.1396, + "step": 14700 + }, + { + "epoch": 3.39, + "learning_rate": 0.00023462140102529152, + "loss": 0.1134, + "step": 14730 + }, + { + "epoch": 3.39, + "learning_rate": 0.0002344820109343782, + "loss": 0.1371, + "step": 14760 + }, + { + "epoch": 3.4, + "learning_rate": 0.0002343426208434649, + "loss": 0.1279, + "step": 14790 + }, + { + "epoch": 3.41, + "learning_rate": 0.00023420323075255158, + "loss": 0.124, + "step": 14820 + }, + { + "epoch": 3.41, + "learning_rate": 0.00023406384066163827, + "loss": 0.1378, + "step": 14850 + }, + { + "epoch": 3.42, + "learning_rate": 0.00023392445057072495, + "loss": 0.1153, + "step": 14880 + }, + { + "epoch": 3.43, + "learning_rate": 0.00023378506047981164, + "loss": 0.1244, + "step": 14910 + }, + { + "epoch": 3.44, + "learning_rate": 0.00023364567038889833, + "loss": 0.1187, + "step": 14940 + }, + { + "epoch": 3.44, + "learning_rate": 0.00023350628029798501, + "loss": 0.1292, + "step": 14970 + }, + { + "epoch": 3.45, + "learning_rate": 0.0002333668902070717, + "loss": 0.1472, + "step": 15000 + }, + { + "epoch": 3.46, + "learning_rate": 0.00023322750011615836, + "loss": 0.113, + "step": 15030 + }, + { + "epoch": 3.46, + "learning_rate": 0.0002330881100252451, + "loss": 0.1365, + "step": 15060 + }, + { + "epoch": 3.47, + "learning_rate": 0.00023294871993433176, + "loss": 0.1259, + "step": 15090 + }, + { + "epoch": 3.48, + "learning_rate": 0.00023280932984341845, + "loss": 0.128, + "step": 15120 + }, + { + "epoch": 3.48, + "learning_rate": 0.00023266993975250513, + "loss": 0.1419, + "step": 15150 + }, + { + "epoch": 3.49, + "learning_rate": 0.00023253054966159182, + "loss": 0.1215, + "step": 15180 + }, + { + "epoch": 3.5, + "learning_rate": 0.0002323911595706785, + "loss": 0.1433, + "step": 15210 + }, + { + "epoch": 3.5, + "learning_rate": 0.0002322517694797652, + "loss": 0.1261, + "step": 15240 + }, + { + "epoch": 3.51, + "learning_rate": 0.00023211237938885188, + "loss": 0.1267, + "step": 15270 + }, + { + "epoch": 3.52, + "learning_rate": 0.00023197298929793857, + "loss": 0.1418, + "step": 15300 + }, + { + "epoch": 3.53, + "learning_rate": 0.00023183359920702525, + "loss": 0.116, + "step": 15330 + }, + { + "epoch": 3.53, + "learning_rate": 0.00023169420911611194, + "loss": 0.1403, + "step": 15360 + }, + { + "epoch": 3.54, + "learning_rate": 0.0002315548190251986, + "loss": 0.1251, + "step": 15390 + }, + { + "epoch": 3.55, + "learning_rate": 0.00023141542893428529, + "loss": 0.1289, + "step": 15420 + }, + { + "epoch": 3.55, + "learning_rate": 0.00023127603884337197, + "loss": 0.1389, + "step": 15450 + }, + { + "epoch": 3.56, + "learning_rate": 0.00023113664875245866, + "loss": 0.1165, + "step": 15480 + }, + { + "epoch": 3.57, + "learning_rate": 0.00023099725866154535, + "loss": 0.1322, + "step": 15510 + }, + { + "epoch": 3.57, + "learning_rate": 0.00023085786857063203, + "loss": 0.1234, + "step": 15540 + }, + { + "epoch": 3.58, + "learning_rate": 0.00023071847847971872, + "loss": 0.1283, + "step": 15570 + }, + { + "epoch": 3.59, + "learning_rate": 0.0002305790883888054, + "loss": 0.1435, + "step": 15600 + }, + { + "epoch": 3.59, + "learning_rate": 0.0002304396982978921, + "loss": 0.119, + "step": 15630 + }, + { + "epoch": 3.6, + "learning_rate": 0.00023030030820697878, + "loss": 0.1331, + "step": 15660 + }, + { + "epoch": 3.61, + "learning_rate": 0.00023016091811606544, + "loss": 0.1262, + "step": 15690 + }, + { + "epoch": 3.62, + "learning_rate": 0.00023002152802515212, + "loss": 0.1242, + "step": 15720 + }, + { + "epoch": 3.62, + "learning_rate": 0.0002298821379342388, + "loss": 0.1339, + "step": 15750 + }, + { + "epoch": 3.63, + "learning_rate": 0.0002297427478433255, + "loss": 0.1178, + "step": 15780 + }, + { + "epoch": 3.64, + "learning_rate": 0.00022960335775241218, + "loss": 0.1434, + "step": 15810 + }, + { + "epoch": 3.64, + "learning_rate": 0.0002294639676614989, + "loss": 0.1305, + "step": 15840 + }, + { + "epoch": 3.65, + "learning_rate": 0.00022932457757058558, + "loss": 0.1279, + "step": 15870 + }, + { + "epoch": 3.66, + "learning_rate": 0.00022918518747967227, + "loss": 0.1472, + "step": 15900 + }, + { + "epoch": 3.66, + "learning_rate": 0.00022904579738875896, + "loss": 0.119, + "step": 15930 + }, + { + "epoch": 3.67, + "learning_rate": 0.00022890640729784564, + "loss": 0.1355, + "step": 15960 + }, + { + "epoch": 3.68, + "learning_rate": 0.00022876701720693233, + "loss": 0.1335, + "step": 15990 + }, + { + "epoch": 3.68, + "learning_rate": 0.00022862762711601902, + "loss": 0.1299, + "step": 16020 + }, + { + "epoch": 3.69, + "learning_rate": 0.0002284882370251057, + "loss": 0.1372, + "step": 16050 + }, + { + "epoch": 3.7, + "learning_rate": 0.00022834884693419236, + "loss": 0.1139, + "step": 16080 + }, + { + "epoch": 3.7, + "learning_rate": 0.00022820945684327905, + "loss": 0.127, + "step": 16110 + }, + { + "epoch": 3.71, + "learning_rate": 0.00022807006675236574, + "loss": 0.1217, + "step": 16140 + }, + { + "epoch": 3.72, + "learning_rate": 0.00022793067666145242, + "loss": 0.132, + "step": 16170 + }, + { + "epoch": 3.73, + "learning_rate": 0.0002277912865705391, + "loss": 0.1415, + "step": 16200 + }, + { + "epoch": 3.73, + "learning_rate": 0.0002276518964796258, + "loss": 0.1189, + "step": 16230 + }, + { + "epoch": 3.74, + "learning_rate": 0.00022751250638871248, + "loss": 0.1346, + "step": 16260 + }, + { + "epoch": 3.75, + "learning_rate": 0.00022737311629779917, + "loss": 0.1292, + "step": 16290 + }, + { + "epoch": 3.75, + "learning_rate": 0.00022723372620688586, + "loss": 0.1269, + "step": 16320 + }, + { + "epoch": 3.76, + "learning_rate": 0.00022709433611597254, + "loss": 0.1464, + "step": 16350 + }, + { + "epoch": 3.77, + "learning_rate": 0.0002269549460250592, + "loss": 0.1196, + "step": 16380 + }, + { + "epoch": 3.77, + "learning_rate": 0.0002268155559341459, + "loss": 0.1329, + "step": 16410 + }, + { + "epoch": 3.78, + "learning_rate": 0.00022667616584323258, + "loss": 0.1295, + "step": 16440 + }, + { + "epoch": 3.79, + "learning_rate": 0.00022653677575231926, + "loss": 0.1242, + "step": 16470 + }, + { + "epoch": 3.79, + "learning_rate": 0.00022639738566140595, + "loss": 0.1306, + "step": 16500 + }, + { + "epoch": 3.8, + "learning_rate": 0.00022625799557049264, + "loss": 0.1126, + "step": 16530 + }, + { + "epoch": 3.81, + "learning_rate": 0.0002261232518159431, + "loss": 0.1289, + "step": 16560 + }, + { + "epoch": 3.82, + "learning_rate": 0.0002259838617250298, + "loss": 0.1219, + "step": 16590 + }, + { + "epoch": 3.82, + "learning_rate": 0.00022584447163411647, + "loss": 0.1237, + "step": 16620 + }, + { + "epoch": 3.83, + "learning_rate": 0.00022570508154320316, + "loss": 0.1354, + "step": 16650 + }, + { + "epoch": 3.84, + "learning_rate": 0.00022556569145228985, + "loss": 0.1135, + "step": 16680 + }, + { + "epoch": 3.84, + "learning_rate": 0.00022542630136137653, + "loss": 0.1326, + "step": 16710 + }, + { + "epoch": 3.85, + "learning_rate": 0.00022528691127046322, + "loss": 0.1247, + "step": 16740 + }, + { + "epoch": 3.86, + "learning_rate": 0.0002251475211795499, + "loss": 0.1265, + "step": 16770 + }, + { + "epoch": 3.86, + "learning_rate": 0.00022500813108863657, + "loss": 0.1404, + "step": 16800 + }, + { + "epoch": 3.87, + "learning_rate": 0.00022486874099772325, + "loss": 0.1173, + "step": 16830 + }, + { + "epoch": 3.88, + "learning_rate": 0.00022472935090680994, + "loss": 0.1317, + "step": 16860 + }, + { + "epoch": 3.88, + "learning_rate": 0.00022458996081589663, + "loss": 0.1232, + "step": 16890 + }, + { + "epoch": 3.89, + "learning_rate": 0.00022445057072498334, + "loss": 0.1222, + "step": 16920 + }, + { + "epoch": 3.9, + "learning_rate": 0.00022431118063407003, + "loss": 0.136, + "step": 16950 + }, + { + "epoch": 3.9, + "learning_rate": 0.0002241717905431567, + "loss": 0.1209, + "step": 16980 + }, + { + "epoch": 3.91, + "learning_rate": 0.0002240324004522434, + "loss": 0.1253, + "step": 17010 + }, + { + "epoch": 3.92, + "learning_rate": 0.00022389301036133009, + "loss": 0.1225, + "step": 17040 + }, + { + "epoch": 3.93, + "learning_rate": 0.00022375362027041677, + "loss": 0.1303, + "step": 17070 + }, + { + "epoch": 3.93, + "learning_rate": 0.00022361423017950346, + "loss": 0.1331, + "step": 17100 + }, + { + "epoch": 3.94, + "learning_rate": 0.00022347484008859015, + "loss": 0.1112, + "step": 17130 + }, + { + "epoch": 3.95, + "learning_rate": 0.0002233354499976768, + "loss": 0.1386, + "step": 17160 + }, + { + "epoch": 3.95, + "learning_rate": 0.0002231960599067635, + "loss": 0.1247, + "step": 17190 + }, + { + "epoch": 3.96, + "learning_rate": 0.00022305666981585018, + "loss": 0.1258, + "step": 17220 + }, + { + "epoch": 3.97, + "learning_rate": 0.00022291727972493686, + "loss": 0.1306, + "step": 17250 + }, + { + "epoch": 3.97, + "learning_rate": 0.00022277788963402355, + "loss": 0.1122, + "step": 17280 + }, + { + "epoch": 3.98, + "learning_rate": 0.00022263849954311024, + "loss": 0.1407, + "step": 17310 + }, + { + "epoch": 3.99, + "learning_rate": 0.00022249910945219692, + "loss": 0.1175, + "step": 17340 + }, + { + "epoch": 3.99, + "learning_rate": 0.0002223597193612836, + "loss": 0.1311, + "step": 17370 + }, + { + "epoch": 4.0, + "eval_cer": 0.04056548392942975, + "eval_loss": 0.144550621509552, + "eval_runtime": 417.81, + "eval_samples_per_second": 38.637, + "eval_steps_per_second": 2.415, + "eval_wer": 0.15149074418762057, + "step": 17394 + }, + { + "epoch": 4.0, + "learning_rate": 0.0002222203292703703, + "loss": 0.1378, + "step": 17400 + }, + { + "epoch": 4.01, + "learning_rate": 0.00022208093917945698, + "loss": 0.1161, + "step": 17430 + }, + { + "epoch": 4.02, + "learning_rate": 0.00022194154908854367, + "loss": 0.1229, + "step": 17460 + }, + { + "epoch": 4.02, + "learning_rate": 0.00022180215899763033, + "loss": 0.1221, + "step": 17490 + }, + { + "epoch": 4.03, + "learning_rate": 0.00022166276890671702, + "loss": 0.1179, + "step": 17520 + }, + { + "epoch": 4.04, + "learning_rate": 0.0002215233788158037, + "loss": 0.1366, + "step": 17550 + }, + { + "epoch": 4.04, + "learning_rate": 0.0002213839887248904, + "loss": 0.1104, + "step": 17580 + }, + { + "epoch": 4.05, + "learning_rate": 0.00022124459863397708, + "loss": 0.1265, + "step": 17610 + }, + { + "epoch": 4.06, + "learning_rate": 0.00022110520854306376, + "loss": 0.1179, + "step": 17640 + }, + { + "epoch": 4.06, + "learning_rate": 0.00022096581845215045, + "loss": 0.1217, + "step": 17670 + }, + { + "epoch": 4.07, + "learning_rate": 0.00022082642836123714, + "loss": 0.1307, + "step": 17700 + }, + { + "epoch": 4.08, + "learning_rate": 0.00022068703827032385, + "loss": 0.1138, + "step": 17730 + }, + { + "epoch": 4.08, + "learning_rate": 0.00022054764817941054, + "loss": 0.126, + "step": 17760 + }, + { + "epoch": 4.09, + "learning_rate": 0.00022040825808849722, + "loss": 0.1174, + "step": 17790 + }, + { + "epoch": 4.1, + "learning_rate": 0.0002202688679975839, + "loss": 0.1164, + "step": 17820 + }, + { + "epoch": 4.1, + "learning_rate": 0.00022012947790667057, + "loss": 0.1311, + "step": 17850 + }, + { + "epoch": 4.11, + "learning_rate": 0.00021999008781575726, + "loss": 0.1077, + "step": 17880 + }, + { + "epoch": 4.12, + "learning_rate": 0.00021985069772484394, + "loss": 0.1234, + "step": 17910 + }, + { + "epoch": 4.13, + "learning_rate": 0.00021971130763393063, + "loss": 0.1216, + "step": 17940 + }, + { + "epoch": 4.13, + "learning_rate": 0.00021957191754301732, + "loss": 0.1198, + "step": 17970 + }, + { + "epoch": 4.14, + "learning_rate": 0.000219432527452104, + "loss": 0.1324, + "step": 18000 + }, + { + "epoch": 4.15, + "learning_rate": 0.0002192931373611907, + "loss": 0.1134, + "step": 18030 + }, + { + "epoch": 4.15, + "learning_rate": 0.00021915374727027738, + "loss": 0.1303, + "step": 18060 + }, + { + "epoch": 4.16, + "learning_rate": 0.00021901435717936406, + "loss": 0.1159, + "step": 18090 + }, + { + "epoch": 4.17, + "learning_rate": 0.00021887496708845075, + "loss": 0.1201, + "step": 18120 + }, + { + "epoch": 4.17, + "learning_rate": 0.0002187355769975374, + "loss": 0.1307, + "step": 18150 + }, + { + "epoch": 4.18, + "learning_rate": 0.0002185961869066241, + "loss": 0.1079, + "step": 18180 + }, + { + "epoch": 4.19, + "learning_rate": 0.00021845679681571078, + "loss": 0.1207, + "step": 18210 + }, + { + "epoch": 4.19, + "learning_rate": 0.00021831740672479747, + "loss": 0.1206, + "step": 18240 + }, + { + "epoch": 4.2, + "learning_rate": 0.00021817801663388415, + "loss": 0.1226, + "step": 18270 + }, + { + "epoch": 4.21, + "learning_rate": 0.00021803862654297084, + "loss": 0.1314, + "step": 18300 + }, + { + "epoch": 4.22, + "learning_rate": 0.00021789923645205753, + "loss": 0.1107, + "step": 18330 + }, + { + "epoch": 4.22, + "learning_rate": 0.00021775984636114421, + "loss": 0.135, + "step": 18360 + }, + { + "epoch": 4.23, + "learning_rate": 0.0002176204562702309, + "loss": 0.1237, + "step": 18390 + }, + { + "epoch": 4.24, + "learning_rate": 0.0002174810661793176, + "loss": 0.1199, + "step": 18420 + }, + { + "epoch": 4.24, + "learning_rate": 0.00021734167608840425, + "loss": 0.1296, + "step": 18450 + }, + { + "epoch": 4.25, + "learning_rate": 0.00021720228599749093, + "loss": 0.1058, + "step": 18480 + }, + { + "epoch": 4.26, + "learning_rate": 0.00021706289590657767, + "loss": 0.1248, + "step": 18510 + }, + { + "epoch": 4.26, + "learning_rate": 0.00021692350581566433, + "loss": 0.1192, + "step": 18540 + }, + { + "epoch": 4.27, + "learning_rate": 0.00021678411572475102, + "loss": 0.1193, + "step": 18570 + }, + { + "epoch": 4.28, + "learning_rate": 0.0002166447256338377, + "loss": 0.1393, + "step": 18600 + }, + { + "epoch": 4.28, + "learning_rate": 0.0002165053355429244, + "loss": 0.1102, + "step": 18630 + }, + { + "epoch": 4.29, + "learning_rate": 0.00021636594545201108, + "loss": 0.127, + "step": 18660 + }, + { + "epoch": 4.3, + "learning_rate": 0.00021622655536109777, + "loss": 0.1206, + "step": 18690 + }, + { + "epoch": 4.3, + "learning_rate": 0.00021608716527018445, + "loss": 0.1198, + "step": 18720 + }, + { + "epoch": 4.31, + "learning_rate": 0.00021594777517927114, + "loss": 0.1378, + "step": 18750 + }, + { + "epoch": 4.32, + "learning_rate": 0.00021580838508835783, + "loss": 0.114, + "step": 18780 + }, + { + "epoch": 4.33, + "learning_rate": 0.0002156689949974445, + "loss": 0.1261, + "step": 18810 + }, + { + "epoch": 4.33, + "learning_rate": 0.00021552960490653117, + "loss": 0.123, + "step": 18840 + }, + { + "epoch": 4.34, + "learning_rate": 0.00021539021481561786, + "loss": 0.1231, + "step": 18870 + }, + { + "epoch": 4.35, + "learning_rate": 0.00021525082472470455, + "loss": 0.1389, + "step": 18900 + }, + { + "epoch": 4.35, + "learning_rate": 0.00021511143463379123, + "loss": 0.1046, + "step": 18930 + }, + { + "epoch": 4.36, + "learning_rate": 0.00021497204454287792, + "loss": 0.133, + "step": 18960 + }, + { + "epoch": 4.37, + "learning_rate": 0.0002148326544519646, + "loss": 0.1258, + "step": 18990 + }, + { + "epoch": 4.37, + "learning_rate": 0.0002146932643610513, + "loss": 0.1243, + "step": 19020 + }, + { + "epoch": 4.38, + "learning_rate": 0.00021455387427013798, + "loss": 0.1287, + "step": 19050 + }, + { + "epoch": 4.39, + "learning_rate": 0.00021441448417922466, + "loss": 0.1201, + "step": 19080 + }, + { + "epoch": 4.39, + "learning_rate": 0.00021427509408831135, + "loss": 0.1277, + "step": 19110 + }, + { + "epoch": 4.4, + "learning_rate": 0.000214135703997398, + "loss": 0.1235, + "step": 19140 + }, + { + "epoch": 4.41, + "learning_rate": 0.0002139963139064847, + "loss": 0.1226, + "step": 19170 + }, + { + "epoch": 4.42, + "learning_rate": 0.00021385692381557138, + "loss": 0.1324, + "step": 19200 + }, + { + "epoch": 4.42, + "learning_rate": 0.00021371753372465807, + "loss": 0.1052, + "step": 19230 + }, + { + "epoch": 4.43, + "learning_rate": 0.00021357814363374476, + "loss": 0.1242, + "step": 19260 + }, + { + "epoch": 4.44, + "learning_rate": 0.00021343875354283144, + "loss": 0.1275, + "step": 19290 + }, + { + "epoch": 4.44, + "learning_rate": 0.00021329936345191816, + "loss": 0.1154, + "step": 19320 + }, + { + "epoch": 4.45, + "learning_rate": 0.00021315997336100484, + "loss": 0.1291, + "step": 19350 + }, + { + "epoch": 4.46, + "learning_rate": 0.00021302058327009153, + "loss": 0.1101, + "step": 19380 + }, + { + "epoch": 4.46, + "learning_rate": 0.00021288119317917822, + "loss": 0.1186, + "step": 19410 + }, + { + "epoch": 4.47, + "learning_rate": 0.0002127418030882649, + "loss": 0.1228, + "step": 19440 + }, + { + "epoch": 4.48, + "learning_rate": 0.0002126024129973516, + "loss": 0.1159, + "step": 19470 + }, + { + "epoch": 4.48, + "learning_rate": 0.00021246302290643825, + "loss": 0.1331, + "step": 19500 + }, + { + "epoch": 4.49, + "learning_rate": 0.00021232363281552494, + "loss": 0.1102, + "step": 19530 + }, + { + "epoch": 4.5, + "learning_rate": 0.00021218424272461162, + "loss": 0.1276, + "step": 19560 + }, + { + "epoch": 4.51, + "learning_rate": 0.0002120448526336983, + "loss": 0.1269, + "step": 19590 + }, + { + "epoch": 4.51, + "learning_rate": 0.000211905462542785, + "loss": 0.1195, + "step": 19620 + }, + { + "epoch": 4.52, + "learning_rate": 0.00021176607245187168, + "loss": 0.1333, + "step": 19650 + }, + { + "epoch": 4.53, + "learning_rate": 0.00021163132869732215, + "loss": 0.1119, + "step": 19680 + }, + { + "epoch": 4.53, + "learning_rate": 0.00021149193860640883, + "loss": 0.1229, + "step": 19710 + }, + { + "epoch": 4.54, + "learning_rate": 0.00021135254851549552, + "loss": 0.1171, + "step": 19740 + }, + { + "epoch": 4.55, + "learning_rate": 0.0002112131584245822, + "loss": 0.123, + "step": 19770 + }, + { + "epoch": 4.55, + "learning_rate": 0.0002110737683336689, + "loss": 0.1378, + "step": 19800 + }, + { + "epoch": 4.56, + "learning_rate": 0.00021093437824275558, + "loss": 0.1194, + "step": 19830 + }, + { + "epoch": 4.57, + "learning_rate": 0.00021079498815184227, + "loss": 0.125, + "step": 19860 + }, + { + "epoch": 4.57, + "learning_rate": 0.00021065559806092895, + "loss": 0.1193, + "step": 19890 + }, + { + "epoch": 4.58, + "learning_rate": 0.00021051620797001561, + "loss": 0.116, + "step": 19920 + }, + { + "epoch": 4.59, + "learning_rate": 0.0002103768178791023, + "loss": 0.1403, + "step": 19950 + }, + { + "epoch": 4.59, + "learning_rate": 0.000210237427788189, + "loss": 0.1137, + "step": 19980 + }, + { + "epoch": 4.6, + "learning_rate": 0.00021009803769727567, + "loss": 0.1233, + "step": 20010 + }, + { + "epoch": 4.61, + "learning_rate": 0.00020995864760636236, + "loss": 0.1245, + "step": 20040 + }, + { + "epoch": 4.62, + "learning_rate": 0.00020981925751544905, + "loss": 0.1193, + "step": 20070 + }, + { + "epoch": 4.62, + "learning_rate": 0.00020967986742453573, + "loss": 0.133, + "step": 20100 + }, + { + "epoch": 4.63, + "learning_rate": 0.00020954047733362242, + "loss": 0.1064, + "step": 20130 + }, + { + "epoch": 4.64, + "learning_rate": 0.0002094010872427091, + "loss": 0.1308, + "step": 20160 + }, + { + "epoch": 4.64, + "learning_rate": 0.0002092616971517958, + "loss": 0.1235, + "step": 20190 + }, + { + "epoch": 4.65, + "learning_rate": 0.00020912230706088245, + "loss": 0.1199, + "step": 20220 + }, + { + "epoch": 4.66, + "learning_rate": 0.00020898291696996914, + "loss": 0.1324, + "step": 20250 + }, + { + "epoch": 4.66, + "learning_rate": 0.00020884352687905583, + "loss": 0.1099, + "step": 20280 + }, + { + "epoch": 4.67, + "learning_rate": 0.0002087041367881425, + "loss": 0.1308, + "step": 20310 + }, + { + "epoch": 4.68, + "learning_rate": 0.0002085647466972292, + "loss": 0.1231, + "step": 20340 + }, + { + "epoch": 4.68, + "learning_rate": 0.00020842535660631589, + "loss": 0.1178, + "step": 20370 + }, + { + "epoch": 4.69, + "learning_rate": 0.0002082859665154026, + "loss": 0.1284, + "step": 20400 + }, + { + "epoch": 4.7, + "learning_rate": 0.00020814657642448929, + "loss": 0.113, + "step": 20430 + }, + { + "epoch": 4.71, + "learning_rate": 0.00020800718633357597, + "loss": 0.128, + "step": 20460 + }, + { + "epoch": 4.71, + "learning_rate": 0.00020786779624266266, + "loss": 0.1196, + "step": 20490 + }, + { + "epoch": 4.72, + "learning_rate": 0.00020772840615174935, + "loss": 0.1152, + "step": 20520 + }, + { + "epoch": 4.73, + "learning_rate": 0.00020758901606083603, + "loss": 0.1266, + "step": 20550 + }, + { + "epoch": 4.73, + "learning_rate": 0.00020744962596992272, + "loss": 0.1102, + "step": 20580 + }, + { + "epoch": 4.74, + "learning_rate": 0.00020731023587900938, + "loss": 0.1217, + "step": 20610 + }, + { + "epoch": 4.75, + "learning_rate": 0.00020717084578809606, + "loss": 0.1181, + "step": 20640 + }, + { + "epoch": 4.75, + "learning_rate": 0.00020703145569718275, + "loss": 0.1145, + "step": 20670 + }, + { + "epoch": 4.76, + "learning_rate": 0.00020689206560626944, + "loss": 0.1319, + "step": 20700 + }, + { + "epoch": 4.77, + "learning_rate": 0.00020675267551535612, + "loss": 0.1082, + "step": 20730 + }, + { + "epoch": 4.77, + "learning_rate": 0.0002066132854244428, + "loss": 0.1303, + "step": 20760 + }, + { + "epoch": 4.78, + "learning_rate": 0.0002064738953335295, + "loss": 0.124, + "step": 20790 + }, + { + "epoch": 4.79, + "learning_rate": 0.00020633450524261618, + "loss": 0.1183, + "step": 20820 + }, + { + "epoch": 4.79, + "learning_rate": 0.00020619511515170287, + "loss": 0.1279, + "step": 20850 + }, + { + "epoch": 4.8, + "learning_rate": 0.00020605572506078956, + "loss": 0.1067, + "step": 20880 + }, + { + "epoch": 4.81, + "learning_rate": 0.00020591633496987622, + "loss": 0.1296, + "step": 20910 + }, + { + "epoch": 4.82, + "learning_rate": 0.0002057769448789629, + "loss": 0.1205, + "step": 20940 + }, + { + "epoch": 4.82, + "learning_rate": 0.0002056375547880496, + "loss": 0.1133, + "step": 20970 + }, + { + "epoch": 4.83, + "learning_rate": 0.00020549816469713628, + "loss": 0.1297, + "step": 21000 + }, + { + "epoch": 4.84, + "learning_rate": 0.00020535877460622296, + "loss": 0.1088, + "step": 21030 + }, + { + "epoch": 4.84, + "learning_rate": 0.00020521938451530965, + "loss": 0.1254, + "step": 21060 + }, + { + "epoch": 4.85, + "learning_rate": 0.00020507999442439634, + "loss": 0.1203, + "step": 21090 + }, + { + "epoch": 4.86, + "learning_rate": 0.00020494060433348302, + "loss": 0.1231, + "step": 21120 + }, + { + "epoch": 4.86, + "learning_rate": 0.0002048012142425697, + "loss": 0.1274, + "step": 21150 + }, + { + "epoch": 4.87, + "learning_rate": 0.00020466182415165642, + "loss": 0.1091, + "step": 21180 + }, + { + "epoch": 4.88, + "learning_rate": 0.0002045224340607431, + "loss": 0.1293, + "step": 21210 + }, + { + "epoch": 4.88, + "learning_rate": 0.0002043830439698298, + "loss": 0.1231, + "step": 21240 + }, + { + "epoch": 4.89, + "learning_rate": 0.00020424365387891646, + "loss": 0.1163, + "step": 21270 + }, + { + "epoch": 4.9, + "learning_rate": 0.00020410426378800314, + "loss": 0.1321, + "step": 21300 + }, + { + "epoch": 4.91, + "learning_rate": 0.00020396487369708983, + "loss": 0.1071, + "step": 21330 + }, + { + "epoch": 4.91, + "learning_rate": 0.00020382548360617652, + "loss": 0.1283, + "step": 21360 + }, + { + "epoch": 4.92, + "learning_rate": 0.0002036860935152632, + "loss": 0.1218, + "step": 21390 + }, + { + "epoch": 4.93, + "learning_rate": 0.0002035467034243499, + "loss": 0.1223, + "step": 21420 + }, + { + "epoch": 4.93, + "learning_rate": 0.00020340731333343657, + "loss": 0.1278, + "step": 21450 + }, + { + "epoch": 4.94, + "learning_rate": 0.00020326792324252326, + "loss": 0.1089, + "step": 21480 + }, + { + "epoch": 4.95, + "learning_rate": 0.00020312853315160995, + "loss": 0.1259, + "step": 21510 + }, + { + "epoch": 4.95, + "learning_rate": 0.00020298914306069663, + "loss": 0.1253, + "step": 21540 + }, + { + "epoch": 4.96, + "learning_rate": 0.00020284975296978332, + "loss": 0.1202, + "step": 21570 + }, + { + "epoch": 4.97, + "learning_rate": 0.00020271036287886998, + "loss": 0.1369, + "step": 21600 + }, + { + "epoch": 4.97, + "learning_rate": 0.00020257097278795667, + "loss": 0.1133, + "step": 21630 + }, + { + "epoch": 4.98, + "learning_rate": 0.00020243158269704335, + "loss": 0.1348, + "step": 21660 + }, + { + "epoch": 4.99, + "learning_rate": 0.00020229219260613004, + "loss": 0.1202, + "step": 21690 + }, + { + "epoch": 4.99, + "learning_rate": 0.00020215280251521673, + "loss": 0.1152, + "step": 21720 + }, + { + "epoch": 5.0, + "eval_cer": 0.03967212727229747, + "eval_loss": 0.14306801557540894, + "eval_runtime": 415.6676, + "eval_samples_per_second": 38.836, + "eval_steps_per_second": 2.427, + "eval_wer": 0.1469965142644421, + "step": 21742 + }, + { + "epoch": 5.0, + "learning_rate": 0.00020201341242430341, + "loss": 0.1215, + "step": 21750 + }, + { + "epoch": 5.01, + "learning_rate": 0.0002018740223333901, + "loss": 0.106, + "step": 21780 + }, + { + "epoch": 5.02, + "learning_rate": 0.0002017346322424768, + "loss": 0.1171, + "step": 21810 + }, + { + "epoch": 5.02, + "learning_rate": 0.00020159524215156347, + "loss": 0.1183, + "step": 21840 + }, + { + "epoch": 5.03, + "learning_rate": 0.00020145585206065016, + "loss": 0.1141, + "step": 21870 + }, + { + "epoch": 5.04, + "learning_rate": 0.00020131646196973682, + "loss": 0.1218, + "step": 21900 + }, + { + "epoch": 5.04, + "learning_rate": 0.0002011770718788235, + "loss": 0.1063, + "step": 21930 + }, + { + "epoch": 5.05, + "learning_rate": 0.0002010376817879102, + "loss": 0.1163, + "step": 21960 + }, + { + "epoch": 5.06, + "learning_rate": 0.0002008982916969969, + "loss": 0.1185, + "step": 21990 + }, + { + "epoch": 5.06, + "learning_rate": 0.0002007589016060836, + "loss": 0.1095, + "step": 22020 + }, + { + "epoch": 5.07, + "learning_rate": 0.00020061951151517028, + "loss": 0.1189, + "step": 22050 + }, + { + "epoch": 5.08, + "learning_rate": 0.00020048476776062072, + "loss": 0.1139, + "step": 22080 + }, + { + "epoch": 5.08, + "learning_rate": 0.0002003500240060712, + "loss": 0.1253, + "step": 22110 + }, + { + "epoch": 5.09, + "learning_rate": 0.00020021063391515787, + "loss": 0.1167, + "step": 22140 + }, + { + "epoch": 5.1, + "learning_rate": 0.00020007124382424456, + "loss": 0.113, + "step": 22170 + }, + { + "epoch": 5.11, + "learning_rate": 0.00019993185373333124, + "loss": 0.1288, + "step": 22200 + }, + { + "epoch": 5.11, + "learning_rate": 0.00019979246364241793, + "loss": 0.1054, + "step": 22230 + }, + { + "epoch": 5.12, + "learning_rate": 0.0001996577198878684, + "loss": 0.1226, + "step": 22260 + }, + { + "epoch": 5.13, + "learning_rate": 0.00019952297613331883, + "loss": 0.1236, + "step": 22290 + }, + { + "epoch": 5.13, + "learning_rate": 0.00019938358604240552, + "loss": 0.1246, + "step": 22320 + }, + { + "epoch": 5.14, + "learning_rate": 0.00019924419595149223, + "loss": 0.1315, + "step": 22350 + }, + { + "epoch": 5.15, + "learning_rate": 0.00019910480586057892, + "loss": 0.1182, + "step": 22380 + }, + { + "epoch": 5.15, + "learning_rate": 0.0001989654157696656, + "loss": 0.1283, + "step": 22410 + }, + { + "epoch": 5.16, + "learning_rate": 0.0001988260256787523, + "loss": 0.1193, + "step": 22440 + }, + { + "epoch": 5.17, + "learning_rate": 0.00019868663558783898, + "loss": 0.1194, + "step": 22470 + }, + { + "epoch": 5.17, + "learning_rate": 0.00019854724549692567, + "loss": 0.1309, + "step": 22500 + }, + { + "epoch": 5.18, + "learning_rate": 0.00019840785540601235, + "loss": 0.1083, + "step": 22530 + }, + { + "epoch": 5.19, + "learning_rate": 0.00019826846531509904, + "loss": 0.119, + "step": 22560 + }, + { + "epoch": 5.19, + "learning_rate": 0.00019812907522418573, + "loss": 0.1192, + "step": 22590 + }, + { + "epoch": 5.2, + "learning_rate": 0.0001979896851332724, + "loss": 0.1103, + "step": 22620 + }, + { + "epoch": 5.21, + "learning_rate": 0.0001978502950423591, + "loss": 0.1289, + "step": 22650 + }, + { + "epoch": 5.22, + "learning_rate": 0.00019771090495144576, + "loss": 0.1088, + "step": 22680 + }, + { + "epoch": 5.22, + "learning_rate": 0.00019757151486053245, + "loss": 0.1238, + "step": 22710 + }, + { + "epoch": 5.23, + "learning_rate": 0.00019743212476961913, + "loss": 0.1187, + "step": 22740 + }, + { + "epoch": 5.24, + "learning_rate": 0.00019729273467870582, + "loss": 0.1138, + "step": 22770 + }, + { + "epoch": 5.24, + "learning_rate": 0.0001971533445877925, + "loss": 0.1232, + "step": 22800 + }, + { + "epoch": 5.25, + "learning_rate": 0.0001970139544968792, + "loss": 0.109, + "step": 22830 + }, + { + "epoch": 5.26, + "learning_rate": 0.00019687456440596588, + "loss": 0.1138, + "step": 22860 + }, + { + "epoch": 5.26, + "learning_rate": 0.00019673517431505257, + "loss": 0.1179, + "step": 22890 + }, + { + "epoch": 5.27, + "learning_rate": 0.00019659578422413925, + "loss": 0.1153, + "step": 22920 + }, + { + "epoch": 5.28, + "learning_rate": 0.00019645639413322594, + "loss": 0.125, + "step": 22950 + }, + { + "epoch": 5.28, + "learning_rate": 0.0001963170040423126, + "loss": 0.102, + "step": 22980 + }, + { + "epoch": 5.29, + "learning_rate": 0.00019617761395139928, + "loss": 0.1099, + "step": 23010 + }, + { + "epoch": 5.3, + "learning_rate": 0.00019603822386048597, + "loss": 0.1169, + "step": 23040 + }, + { + "epoch": 5.31, + "learning_rate": 0.00019589883376957266, + "loss": 0.1023, + "step": 23070 + }, + { + "epoch": 5.31, + "learning_rate": 0.00019575944367865934, + "loss": 0.1172, + "step": 23100 + }, + { + "epoch": 5.32, + "learning_rate": 0.00019562005358774606, + "loss": 0.1049, + "step": 23130 + }, + { + "epoch": 5.33, + "learning_rate": 0.00019548066349683274, + "loss": 0.1216, + "step": 23160 + }, + { + "epoch": 5.33, + "learning_rate": 0.00019534127340591943, + "loss": 0.1192, + "step": 23190 + }, + { + "epoch": 5.34, + "learning_rate": 0.00019520188331500612, + "loss": 0.1139, + "step": 23220 + }, + { + "epoch": 5.35, + "learning_rate": 0.0001950624932240928, + "loss": 0.1211, + "step": 23250 + }, + { + "epoch": 5.35, + "learning_rate": 0.0001949231031331795, + "loss": 0.1089, + "step": 23280 + }, + { + "epoch": 5.36, + "learning_rate": 0.00019478371304226618, + "loss": 0.1188, + "step": 23310 + }, + { + "epoch": 5.37, + "learning_rate": 0.00019464432295135284, + "loss": 0.1123, + "step": 23340 + }, + { + "epoch": 5.37, + "learning_rate": 0.00019450493286043952, + "loss": 0.1089, + "step": 23370 + }, + { + "epoch": 5.38, + "learning_rate": 0.0001943655427695262, + "loss": 0.1172, + "step": 23400 + }, + { + "epoch": 5.39, + "learning_rate": 0.0001942261526786129, + "loss": 0.1004, + "step": 23430 + }, + { + "epoch": 5.39, + "learning_rate": 0.00019408676258769958, + "loss": 0.1174, + "step": 23460 + }, + { + "epoch": 5.4, + "learning_rate": 0.00019394737249678627, + "loss": 0.1116, + "step": 23490 + }, + { + "epoch": 5.41, + "learning_rate": 0.00019380798240587296, + "loss": 0.1053, + "step": 23520 + }, + { + "epoch": 5.42, + "learning_rate": 0.00019366859231495964, + "loss": 0.1283, + "step": 23550 + }, + { + "epoch": 5.42, + "learning_rate": 0.00019352920222404633, + "loss": 0.1037, + "step": 23580 + }, + { + "epoch": 5.43, + "learning_rate": 0.00019338981213313302, + "loss": 0.1129, + "step": 23610 + }, + { + "epoch": 5.44, + "learning_rate": 0.00019325042204221968, + "loss": 0.1112, + "step": 23640 + }, + { + "epoch": 5.44, + "learning_rate": 0.00019311103195130636, + "loss": 0.1059, + "step": 23670 + }, + { + "epoch": 5.45, + "learning_rate": 0.00019297164186039305, + "loss": 0.1163, + "step": 23700 + }, + { + "epoch": 5.46, + "learning_rate": 0.00019283225176947974, + "loss": 0.1039, + "step": 23730 + }, + { + "epoch": 5.46, + "learning_rate": 0.00019269286167856642, + "loss": 0.1195, + "step": 23760 + }, + { + "epoch": 5.47, + "learning_rate": 0.0001925534715876531, + "loss": 0.1136, + "step": 23790 + }, + { + "epoch": 5.48, + "learning_rate": 0.0001924140814967398, + "loss": 0.1184, + "step": 23820 + }, + { + "epoch": 5.48, + "learning_rate": 0.00019227469140582648, + "loss": 0.1206, + "step": 23850 + }, + { + "epoch": 5.49, + "learning_rate": 0.00019213530131491317, + "loss": 0.102, + "step": 23880 + }, + { + "epoch": 5.5, + "learning_rate": 0.00019199591122399985, + "loss": 0.1191, + "step": 23910 + }, + { + "epoch": 5.51, + "learning_rate": 0.00019185652113308657, + "loss": 0.1185, + "step": 23940 + }, + { + "epoch": 5.51, + "learning_rate": 0.00019171713104217325, + "loss": 0.1138, + "step": 23970 + }, + { + "epoch": 5.52, + "learning_rate": 0.00019157774095125994, + "loss": 0.1251, + "step": 24000 + }, + { + "epoch": 5.53, + "learning_rate": 0.0001914383508603466, + "loss": 0.1097, + "step": 24030 + }, + { + "epoch": 5.53, + "learning_rate": 0.0001912989607694333, + "loss": 0.1133, + "step": 24060 + }, + { + "epoch": 5.54, + "learning_rate": 0.00019115957067851997, + "loss": 0.1238, + "step": 24090 + }, + { + "epoch": 5.55, + "learning_rate": 0.00019102018058760666, + "loss": 0.1066, + "step": 24120 + }, + { + "epoch": 5.55, + "learning_rate": 0.00019088079049669335, + "loss": 0.1299, + "step": 24150 + }, + { + "epoch": 5.56, + "learning_rate": 0.00019074140040578003, + "loss": 0.1042, + "step": 24180 + }, + { + "epoch": 5.57, + "learning_rate": 0.00019060201031486672, + "loss": 0.1225, + "step": 24210 + }, + { + "epoch": 5.57, + "learning_rate": 0.0001904626202239534, + "loss": 0.1186, + "step": 24240 + }, + { + "epoch": 5.58, + "learning_rate": 0.0001903232301330401, + "loss": 0.1108, + "step": 24270 + }, + { + "epoch": 5.59, + "learning_rate": 0.00019018384004212678, + "loss": 0.1259, + "step": 24300 + }, + { + "epoch": 5.6, + "learning_rate": 0.00019004444995121344, + "loss": 0.1055, + "step": 24330 + }, + { + "epoch": 5.6, + "learning_rate": 0.00018990505986030013, + "loss": 0.1204, + "step": 24360 + }, + { + "epoch": 5.61, + "learning_rate": 0.0001897656697693868, + "loss": 0.1145, + "step": 24390 + }, + { + "epoch": 5.62, + "learning_rate": 0.0001896262796784735, + "loss": 0.1123, + "step": 24420 + }, + { + "epoch": 5.62, + "learning_rate": 0.00018948688958756019, + "loss": 0.1226, + "step": 24450 + }, + { + "epoch": 5.63, + "learning_rate": 0.00018934749949664687, + "loss": 0.1059, + "step": 24480 + }, + { + "epoch": 5.64, + "learning_rate": 0.00018920810940573356, + "loss": 0.1222, + "step": 24510 + }, + { + "epoch": 5.64, + "learning_rate": 0.00018906871931482025, + "loss": 0.1154, + "step": 24540 + }, + { + "epoch": 5.65, + "learning_rate": 0.00018892932922390693, + "loss": 0.1074, + "step": 24570 + }, + { + "epoch": 5.66, + "learning_rate": 0.00018878993913299362, + "loss": 0.1255, + "step": 24600 + }, + { + "epoch": 5.66, + "learning_rate": 0.00018865054904208028, + "loss": 0.1101, + "step": 24630 + }, + { + "epoch": 5.67, + "learning_rate": 0.00018851115895116696, + "loss": 0.1254, + "step": 24660 + }, + { + "epoch": 5.68, + "learning_rate": 0.00018837176886025365, + "loss": 0.1189, + "step": 24690 + }, + { + "epoch": 5.68, + "learning_rate": 0.00018823237876934036, + "loss": 0.1076, + "step": 24720 + }, + { + "epoch": 5.69, + "learning_rate": 0.00018809298867842705, + "loss": 0.1204, + "step": 24750 + }, + { + "epoch": 5.7, + "learning_rate": 0.00018795359858751374, + "loss": 0.1064, + "step": 24780 + }, + { + "epoch": 5.71, + "learning_rate": 0.00018781420849660042, + "loss": 0.1164, + "step": 24810 + }, + { + "epoch": 5.71, + "learning_rate": 0.0001876748184056871, + "loss": 0.1057, + "step": 24840 + }, + { + "epoch": 5.72, + "learning_rate": 0.0001875354283147738, + "loss": 0.1091, + "step": 24870 + }, + { + "epoch": 5.73, + "learning_rate": 0.00018739603822386048, + "loss": 0.1205, + "step": 24900 + }, + { + "epoch": 5.73, + "learning_rate": 0.00018725664813294717, + "loss": 0.1029, + "step": 24930 + }, + { + "epoch": 5.74, + "learning_rate": 0.00018711725804203386, + "loss": 0.1187, + "step": 24960 + }, + { + "epoch": 5.75, + "learning_rate": 0.00018697786795112052, + "loss": 0.1175, + "step": 24990 + }, + { + "epoch": 5.75, + "learning_rate": 0.0001868384778602072, + "loss": 0.1155, + "step": 25020 + }, + { + "epoch": 5.76, + "learning_rate": 0.0001866990877692939, + "loss": 0.1368, + "step": 25050 + }, + { + "epoch": 5.77, + "learning_rate": 0.00018655969767838058, + "loss": 0.1072, + "step": 25080 + }, + { + "epoch": 5.77, + "learning_rate": 0.00018642030758746726, + "loss": 0.1255, + "step": 25110 + }, + { + "epoch": 5.78, + "learning_rate": 0.00018628091749655395, + "loss": 0.1129, + "step": 25140 + }, + { + "epoch": 5.79, + "learning_rate": 0.00018614152740564064, + "loss": 0.1113, + "step": 25170 + }, + { + "epoch": 5.8, + "learning_rate": 0.00018600213731472732, + "loss": 0.1236, + "step": 25200 + }, + { + "epoch": 5.8, + "learning_rate": 0.000185862747223814, + "loss": 0.1061, + "step": 25230 + }, + { + "epoch": 5.81, + "learning_rate": 0.0001857233571329007, + "loss": 0.1178, + "step": 25260 + }, + { + "epoch": 5.82, + "learning_rate": 0.00018558396704198736, + "loss": 0.1099, + "step": 25290 + }, + { + "epoch": 5.82, + "learning_rate": 0.00018544457695107404, + "loss": 0.1125, + "step": 25320 + }, + { + "epoch": 5.83, + "learning_rate": 0.00018530518686016073, + "loss": 0.115, + "step": 25350 + }, + { + "epoch": 5.84, + "learning_rate": 0.00018516579676924742, + "loss": 0.1042, + "step": 25380 + }, + { + "epoch": 5.84, + "learning_rate": 0.0001850264066783341, + "loss": 0.1229, + "step": 25410 + }, + { + "epoch": 5.85, + "learning_rate": 0.0001848870165874208, + "loss": 0.1143, + "step": 25440 + }, + { + "epoch": 5.86, + "learning_rate": 0.00018474762649650748, + "loss": 0.1032, + "step": 25470 + }, + { + "epoch": 5.86, + "learning_rate": 0.00018460823640559416, + "loss": 0.12, + "step": 25500 + }, + { + "epoch": 5.87, + "learning_rate": 0.00018446884631468088, + "loss": 0.1029, + "step": 25530 + }, + { + "epoch": 5.88, + "learning_rate": 0.00018432945622376756, + "loss": 0.1131, + "step": 25560 + }, + { + "epoch": 5.88, + "learning_rate": 0.00018419006613285425, + "loss": 0.1155, + "step": 25590 + }, + { + "epoch": 5.89, + "learning_rate": 0.00018405067604194094, + "loss": 0.105, + "step": 25620 + }, + { + "epoch": 5.9, + "learning_rate": 0.00018391128595102762, + "loss": 0.1186, + "step": 25650 + }, + { + "epoch": 5.91, + "learning_rate": 0.00018377189586011428, + "loss": 0.1041, + "step": 25680 + }, + { + "epoch": 5.91, + "learning_rate": 0.00018363250576920097, + "loss": 0.1131, + "step": 25710 + }, + { + "epoch": 5.92, + "learning_rate": 0.00018349311567828765, + "loss": 0.1092, + "step": 25740 + }, + { + "epoch": 5.93, + "learning_rate": 0.00018335372558737434, + "loss": 0.1008, + "step": 25770 + }, + { + "epoch": 5.93, + "learning_rate": 0.00018321433549646103, + "loss": 0.1176, + "step": 25800 + }, + { + "epoch": 5.94, + "learning_rate": 0.00018307494540554771, + "loss": 0.1009, + "step": 25830 + }, + { + "epoch": 5.95, + "learning_rate": 0.0001829355553146344, + "loss": 0.1117, + "step": 25860 + }, + { + "epoch": 5.95, + "learning_rate": 0.0001827961652237211, + "loss": 0.1167, + "step": 25890 + }, + { + "epoch": 5.96, + "learning_rate": 0.00018265677513280777, + "loss": 0.1082, + "step": 25920 + }, + { + "epoch": 5.97, + "learning_rate": 0.00018251738504189446, + "loss": 0.1219, + "step": 25950 + }, + { + "epoch": 5.97, + "learning_rate": 0.00018237799495098112, + "loss": 0.1021, + "step": 25980 + }, + { + "epoch": 5.98, + "learning_rate": 0.0001822386048600678, + "loss": 0.1167, + "step": 26010 + }, + { + "epoch": 5.99, + "learning_rate": 0.0001820992147691545, + "loss": 0.1164, + "step": 26040 + }, + { + "epoch": 6.0, + "learning_rate": 0.00018195982467824118, + "loss": 0.107, + "step": 26070 + }, + { + "epoch": 6.0, + "eval_cer": 0.03686302783884516, + "eval_loss": 0.13820330798625946, + "eval_runtime": 418.9086, + "eval_samples_per_second": 38.536, + "eval_steps_per_second": 2.409, + "eval_wer": 0.13769670716437105, + "step": 26091 + }, + { + "epoch": 6.0, + "learning_rate": 0.00018182043458732787, + "loss": 0.1163, + "step": 26100 + }, + { + "epoch": 6.01, + "learning_rate": 0.00018168104449641455, + "loss": 0.0979, + "step": 26130 + }, + { + "epoch": 6.02, + "learning_rate": 0.00018154165440550124, + "loss": 0.1163, + "step": 26160 + }, + { + "epoch": 6.02, + "learning_rate": 0.00018140226431458793, + "loss": 0.115, + "step": 26190 + }, + { + "epoch": 6.03, + "learning_rate": 0.0001812628742236746, + "loss": 0.0988, + "step": 26220 + }, + { + "epoch": 6.04, + "learning_rate": 0.0001811234841327613, + "loss": 0.1155, + "step": 26250 + }, + { + "epoch": 6.04, + "learning_rate": 0.00018098409404184796, + "loss": 0.1081, + "step": 26280 + }, + { + "epoch": 6.05, + "learning_rate": 0.0001808447039509347, + "loss": 0.118, + "step": 26310 + }, + { + "epoch": 6.06, + "learning_rate": 0.00018070531386002136, + "loss": 0.1111, + "step": 26340 + }, + { + "epoch": 6.06, + "learning_rate": 0.00018056592376910805, + "loss": 0.1026, + "step": 26370 + }, + { + "epoch": 6.07, + "learning_rate": 0.00018042653367819473, + "loss": 0.1213, + "step": 26400 + }, + { + "epoch": 6.08, + "learning_rate": 0.00018028714358728142, + "loss": 0.1023, + "step": 26430 + }, + { + "epoch": 6.08, + "learning_rate": 0.0001801477534963681, + "loss": 0.1238, + "step": 26460 + }, + { + "epoch": 6.09, + "learning_rate": 0.0001800083634054548, + "loss": 0.1175, + "step": 26490 + }, + { + "epoch": 6.1, + "learning_rate": 0.00017986897331454148, + "loss": 0.1048, + "step": 26520 + }, + { + "epoch": 6.11, + "learning_rate": 0.00017972958322362816, + "loss": 0.1179, + "step": 26550 + }, + { + "epoch": 6.11, + "learning_rate": 0.00017959019313271485, + "loss": 0.1061, + "step": 26580 + }, + { + "epoch": 6.12, + "learning_rate": 0.00017945080304180154, + "loss": 0.1116, + "step": 26610 + }, + { + "epoch": 6.13, + "learning_rate": 0.00017931141295088822, + "loss": 0.1128, + "step": 26640 + }, + { + "epoch": 6.13, + "learning_rate": 0.00017917202285997488, + "loss": 0.1058, + "step": 26670 + }, + { + "epoch": 6.14, + "learning_rate": 0.00017903263276906157, + "loss": 0.1177, + "step": 26700 + }, + { + "epoch": 6.15, + "learning_rate": 0.00017889324267814826, + "loss": 0.1032, + "step": 26730 + }, + { + "epoch": 6.15, + "learning_rate": 0.00017875849892359875, + "loss": 0.1171, + "step": 26760 + }, + { + "epoch": 6.16, + "learning_rate": 0.0001786191088326854, + "loss": 0.1169, + "step": 26790 + }, + { + "epoch": 6.17, + "learning_rate": 0.0001784797187417721, + "loss": 0.1027, + "step": 26820 + }, + { + "epoch": 6.17, + "learning_rate": 0.00017834032865085878, + "loss": 0.1149, + "step": 26850 + }, + { + "epoch": 6.18, + "learning_rate": 0.00017820093855994547, + "loss": 0.1007, + "step": 26880 + }, + { + "epoch": 6.19, + "learning_rate": 0.00017806154846903216, + "loss": 0.1197, + "step": 26910 + }, + { + "epoch": 6.2, + "learning_rate": 0.00017792215837811884, + "loss": 0.1162, + "step": 26940 + }, + { + "epoch": 6.2, + "learning_rate": 0.00017778276828720553, + "loss": 0.1022, + "step": 26970 + }, + { + "epoch": 6.21, + "learning_rate": 0.00017764337819629222, + "loss": 0.1165, + "step": 27000 + }, + { + "epoch": 6.22, + "learning_rate": 0.0001775039881053789, + "loss": 0.104, + "step": 27030 + }, + { + "epoch": 6.22, + "learning_rate": 0.0001773645980144656, + "loss": 0.1142, + "step": 27060 + }, + { + "epoch": 6.23, + "learning_rate": 0.00017722520792355225, + "loss": 0.1213, + "step": 27090 + }, + { + "epoch": 6.24, + "learning_rate": 0.00017708581783263893, + "loss": 0.1095, + "step": 27120 + }, + { + "epoch": 6.24, + "learning_rate": 0.00017694642774172562, + "loss": 0.1238, + "step": 27150 + }, + { + "epoch": 6.25, + "learning_rate": 0.0001768070376508123, + "loss": 0.1054, + "step": 27180 + }, + { + "epoch": 6.26, + "learning_rate": 0.000176667647559899, + "loss": 0.1112, + "step": 27210 + }, + { + "epoch": 6.26, + "learning_rate": 0.00017652825746898568, + "loss": 0.1122, + "step": 27240 + }, + { + "epoch": 6.27, + "learning_rate": 0.00017638886737807237, + "loss": 0.1025, + "step": 27270 + }, + { + "epoch": 6.28, + "learning_rate": 0.00017624947728715905, + "loss": 0.1159, + "step": 27300 + }, + { + "epoch": 6.28, + "learning_rate": 0.00017611008719624574, + "loss": 0.1029, + "step": 27330 + }, + { + "epoch": 6.29, + "learning_rate": 0.00017597069710533243, + "loss": 0.1158, + "step": 27360 + }, + { + "epoch": 6.3, + "learning_rate": 0.00017583130701441914, + "loss": 0.1142, + "step": 27390 + }, + { + "epoch": 6.31, + "learning_rate": 0.00017569191692350583, + "loss": 0.1077, + "step": 27420 + }, + { + "epoch": 6.31, + "learning_rate": 0.0001755525268325925, + "loss": 0.1213, + "step": 27450 + }, + { + "epoch": 6.32, + "learning_rate": 0.00017541313674167917, + "loss": 0.0984, + "step": 27480 + }, + { + "epoch": 6.33, + "learning_rate": 0.00017527374665076586, + "loss": 0.1164, + "step": 27510 + }, + { + "epoch": 6.33, + "learning_rate": 0.00017513435655985255, + "loss": 0.1172, + "step": 27540 + }, + { + "epoch": 6.34, + "learning_rate": 0.00017499496646893923, + "loss": 0.1099, + "step": 27570 + }, + { + "epoch": 6.35, + "learning_rate": 0.00017485557637802592, + "loss": 0.1166, + "step": 27600 + }, + { + "epoch": 6.35, + "learning_rate": 0.0001747161862871126, + "loss": 0.1022, + "step": 27630 + }, + { + "epoch": 6.36, + "learning_rate": 0.0001745767961961993, + "loss": 0.1182, + "step": 27660 + }, + { + "epoch": 6.37, + "learning_rate": 0.00017443740610528598, + "loss": 0.1177, + "step": 27690 + }, + { + "epoch": 6.37, + "learning_rate": 0.00017429801601437267, + "loss": 0.0977, + "step": 27720 + }, + { + "epoch": 6.38, + "learning_rate": 0.00017415862592345933, + "loss": 0.1141, + "step": 27750 + }, + { + "epoch": 6.39, + "learning_rate": 0.000174019235832546, + "loss": 0.1025, + "step": 27780 + }, + { + "epoch": 6.4, + "learning_rate": 0.0001738798457416327, + "loss": 0.1111, + "step": 27810 + }, + { + "epoch": 6.4, + "learning_rate": 0.00017374045565071939, + "loss": 0.1134, + "step": 27840 + }, + { + "epoch": 6.41, + "learning_rate": 0.00017360106555980607, + "loss": 0.1013, + "step": 27870 + }, + { + "epoch": 6.42, + "learning_rate": 0.00017346167546889276, + "loss": 0.1179, + "step": 27900 + }, + { + "epoch": 6.42, + "learning_rate": 0.00017332228537797945, + "loss": 0.1017, + "step": 27930 + }, + { + "epoch": 6.43, + "learning_rate": 0.00017318289528706613, + "loss": 0.1121, + "step": 27960 + }, + { + "epoch": 6.44, + "learning_rate": 0.00017304350519615282, + "loss": 0.1105, + "step": 27990 + }, + { + "epoch": 6.44, + "learning_rate": 0.0001729041151052395, + "loss": 0.106, + "step": 28020 + }, + { + "epoch": 6.45, + "learning_rate": 0.00017276472501432616, + "loss": 0.1303, + "step": 28050 + }, + { + "epoch": 6.46, + "learning_rate": 0.00017262533492341285, + "loss": 0.1033, + "step": 28080 + }, + { + "epoch": 6.46, + "learning_rate": 0.00017248594483249954, + "loss": 0.1137, + "step": 28110 + }, + { + "epoch": 6.47, + "learning_rate": 0.00017234655474158622, + "loss": 0.1183, + "step": 28140 + }, + { + "epoch": 6.48, + "learning_rate": 0.0001722071646506729, + "loss": 0.1071, + "step": 28170 + }, + { + "epoch": 6.48, + "learning_rate": 0.00017206777455975962, + "loss": 0.1228, + "step": 28200 + }, + { + "epoch": 6.49, + "learning_rate": 0.0001719283844688463, + "loss": 0.11, + "step": 28230 + }, + { + "epoch": 6.5, + "learning_rate": 0.000171788994377933, + "loss": 0.1161, + "step": 28260 + }, + { + "epoch": 6.51, + "learning_rate": 0.00017164960428701968, + "loss": 0.1245, + "step": 28290 + }, + { + "epoch": 6.51, + "learning_rate": 0.00017151021419610637, + "loss": 0.1054, + "step": 28320 + }, + { + "epoch": 6.52, + "learning_rate": 0.00017137082410519306, + "loss": 0.1243, + "step": 28350 + }, + { + "epoch": 6.53, + "learning_rate": 0.00017123143401427974, + "loss": 0.113, + "step": 28380 + }, + { + "epoch": 6.53, + "learning_rate": 0.00017109204392336643, + "loss": 0.1238, + "step": 28410 + }, + { + "epoch": 6.54, + "learning_rate": 0.00017095730016881687, + "loss": 0.1194, + "step": 28440 + }, + { + "epoch": 6.55, + "learning_rate": 0.00017081791007790353, + "loss": 0.1077, + "step": 28470 + }, + { + "epoch": 6.55, + "learning_rate": 0.00017067851998699027, + "loss": 0.1179, + "step": 28500 + }, + { + "epoch": 6.56, + "learning_rate": 0.00017053912989607696, + "loss": 0.1052, + "step": 28530 + }, + { + "epoch": 6.57, + "learning_rate": 0.00017039973980516361, + "loss": 0.1158, + "step": 28560 + }, + { + "epoch": 6.57, + "learning_rate": 0.0001702603497142503, + "loss": 0.121, + "step": 28590 + }, + { + "epoch": 6.58, + "learning_rate": 0.000170120959623337, + "loss": 0.1078, + "step": 28620 + }, + { + "epoch": 6.59, + "learning_rate": 0.00016998156953242367, + "loss": 0.1236, + "step": 28650 + }, + { + "epoch": 6.6, + "learning_rate": 0.00016984217944151036, + "loss": 0.1057, + "step": 28680 + }, + { + "epoch": 6.6, + "learning_rate": 0.00016970278935059705, + "loss": 0.1224, + "step": 28710 + }, + { + "epoch": 6.61, + "learning_rate": 0.00016956339925968373, + "loss": 0.1185, + "step": 28740 + }, + { + "epoch": 6.62, + "learning_rate": 0.00016942400916877042, + "loss": 0.1023, + "step": 28770 + }, + { + "epoch": 6.62, + "learning_rate": 0.0001692846190778571, + "loss": 0.1288, + "step": 28800 + }, + { + "epoch": 6.63, + "learning_rate": 0.0001691452289869438, + "loss": 0.1062, + "step": 28830 + }, + { + "epoch": 6.64, + "learning_rate": 0.00016900583889603045, + "loss": 0.1174, + "step": 28860 + }, + { + "epoch": 6.64, + "learning_rate": 0.00016886644880511714, + "loss": 0.1233, + "step": 28890 + }, + { + "epoch": 6.65, + "learning_rate": 0.00016872705871420383, + "loss": 0.1062, + "step": 28920 + }, + { + "epoch": 6.66, + "learning_rate": 0.0001685876686232905, + "loss": 0.1173, + "step": 28950 + }, + { + "epoch": 6.66, + "learning_rate": 0.0001684482785323772, + "loss": 0.1045, + "step": 28980 + }, + { + "epoch": 6.67, + "learning_rate": 0.0001683088884414639, + "loss": 0.1213, + "step": 29010 + }, + { + "epoch": 6.68, + "learning_rate": 0.00016816949835055057, + "loss": 0.1168, + "step": 29040 + }, + { + "epoch": 6.69, + "learning_rate": 0.00016803010825963726, + "loss": 0.1033, + "step": 29070 + }, + { + "epoch": 6.69, + "learning_rate": 0.00016789071816872395, + "loss": 0.1235, + "step": 29100 + }, + { + "epoch": 6.7, + "learning_rate": 0.00016775132807781063, + "loss": 0.1026, + "step": 29130 + }, + { + "epoch": 6.71, + "learning_rate": 0.0001676119379868973, + "loss": 0.1084, + "step": 29160 + }, + { + "epoch": 6.71, + "learning_rate": 0.00016747254789598398, + "loss": 0.1125, + "step": 29190 + }, + { + "epoch": 6.72, + "learning_rate": 0.00016733315780507067, + "loss": 0.107, + "step": 29220 + }, + { + "epoch": 6.73, + "learning_rate": 0.00016719376771415735, + "loss": 0.1208, + "step": 29250 + }, + { + "epoch": 6.73, + "learning_rate": 0.00016705437762324407, + "loss": 0.1032, + "step": 29280 + }, + { + "epoch": 6.74, + "learning_rate": 0.00016691498753233075, + "loss": 0.1143, + "step": 29310 + }, + { + "epoch": 6.75, + "learning_rate": 0.00016677559744141744, + "loss": 0.1193, + "step": 29340 + }, + { + "epoch": 6.75, + "learning_rate": 0.00016663620735050413, + "loss": 0.1032, + "step": 29370 + }, + { + "epoch": 6.76, + "learning_rate": 0.0001664968172595908, + "loss": 0.1146, + "step": 29400 + }, + { + "epoch": 6.77, + "learning_rate": 0.0001663574271686775, + "loss": 0.1019, + "step": 29430 + }, + { + "epoch": 6.77, + "learning_rate": 0.00016621803707776419, + "loss": 0.1154, + "step": 29460 + }, + { + "epoch": 6.78, + "learning_rate": 0.00016607864698685087, + "loss": 0.111, + "step": 29490 + }, + { + "epoch": 6.79, + "learning_rate": 0.00016593925689593753, + "loss": 0.0978, + "step": 29520 + }, + { + "epoch": 6.8, + "learning_rate": 0.00016579986680502422, + "loss": 0.1228, + "step": 29550 + }, + { + "epoch": 6.8, + "learning_rate": 0.0001656604767141109, + "loss": 0.1014, + "step": 29580 + }, + { + "epoch": 6.81, + "learning_rate": 0.0001655210866231976, + "loss": 0.1128, + "step": 29610 + }, + { + "epoch": 6.82, + "learning_rate": 0.00016538169653228428, + "loss": 0.11, + "step": 29640 + }, + { + "epoch": 6.82, + "learning_rate": 0.00016524230644137096, + "loss": 0.0952, + "step": 29670 + }, + { + "epoch": 6.83, + "learning_rate": 0.00016510291635045765, + "loss": 0.1115, + "step": 29700 + }, + { + "epoch": 6.84, + "learning_rate": 0.00016496352625954434, + "loss": 0.0954, + "step": 29730 + }, + { + "epoch": 6.84, + "learning_rate": 0.00016482413616863102, + "loss": 0.0998, + "step": 29760 + }, + { + "epoch": 6.85, + "learning_rate": 0.0001646847460777177, + "loss": 0.1062, + "step": 29790 + }, + { + "epoch": 6.86, + "learning_rate": 0.0001645453559868044, + "loss": 0.0992, + "step": 29820 + }, + { + "epoch": 6.86, + "learning_rate": 0.00016440596589589106, + "loss": 0.1108, + "step": 29850 + }, + { + "epoch": 6.87, + "learning_rate": 0.00016426657580497774, + "loss": 0.098, + "step": 29880 + }, + { + "epoch": 6.88, + "learning_rate": 0.00016412718571406443, + "loss": 0.1033, + "step": 29910 + }, + { + "epoch": 6.89, + "learning_rate": 0.00016398779562315112, + "loss": 0.1092, + "step": 29940 + }, + { + "epoch": 6.89, + "learning_rate": 0.0001638484055322378, + "loss": 0.0938, + "step": 29970 + }, + { + "epoch": 6.9, + "learning_rate": 0.0001637090154413245, + "loss": 0.1158, + "step": 30000 + }, + { + "epoch": 6.91, + "learning_rate": 0.00016356962535041118, + "loss": 0.0972, + "step": 30030 + }, + { + "epoch": 6.91, + "learning_rate": 0.0001634302352594979, + "loss": 0.1072, + "step": 30060 + }, + { + "epoch": 6.92, + "learning_rate": 0.00016329084516858458, + "loss": 0.1147, + "step": 30090 + }, + { + "epoch": 6.93, + "learning_rate": 0.00016315145507767126, + "loss": 0.0986, + "step": 30120 + }, + { + "epoch": 6.93, + "learning_rate": 0.00016301206498675795, + "loss": 0.1107, + "step": 30150 + }, + { + "epoch": 6.94, + "learning_rate": 0.00016287267489584464, + "loss": 0.1041, + "step": 30180 + }, + { + "epoch": 6.95, + "learning_rate": 0.0001627332848049313, + "loss": 0.1082, + "step": 30210 + }, + { + "epoch": 6.95, + "learning_rate": 0.00016259389471401798, + "loss": 0.1117, + "step": 30240 + }, + { + "epoch": 6.96, + "learning_rate": 0.00016245450462310467, + "loss": 0.1029, + "step": 30270 + }, + { + "epoch": 6.97, + "learning_rate": 0.00016231511453219136, + "loss": 0.1105, + "step": 30300 + }, + { + "epoch": 6.97, + "learning_rate": 0.00016217572444127804, + "loss": 0.0949, + "step": 30330 + }, + { + "epoch": 6.98, + "learning_rate": 0.00016203633435036473, + "loss": 0.107, + "step": 30360 + }, + { + "epoch": 6.99, + "learning_rate": 0.00016189694425945141, + "loss": 0.1078, + "step": 30390 + }, + { + "epoch": 7.0, + "learning_rate": 0.0001617575541685381, + "loss": 0.0957, + "step": 30420 + }, + { + "epoch": 7.0, + "eval_cer": 0.03725208614046285, + "eval_loss": 0.1343260109424591, + "eval_runtime": 417.5587, + "eval_samples_per_second": 38.66, + "eval_steps_per_second": 2.416, + "eval_wer": 0.13718230735388676, + "step": 30439 + }, + { + "epoch": 7.0, + "learning_rate": 0.0001616181640776248, + "loss": 0.1111, + "step": 30450 + }, + { + "epoch": 7.01, + "learning_rate": 0.00016147877398671147, + "loss": 0.1017, + "step": 30480 + }, + { + "epoch": 7.02, + "learning_rate": 0.00016133938389579813, + "loss": 0.0991, + "step": 30510 + }, + { + "epoch": 7.02, + "learning_rate": 0.00016119999380488482, + "loss": 0.112, + "step": 30540 + }, + { + "epoch": 7.03, + "learning_rate": 0.0001610606037139715, + "loss": 0.0916, + "step": 30570 + }, + { + "epoch": 7.04, + "learning_rate": 0.0001609212136230582, + "loss": 0.1086, + "step": 30600 + }, + { + "epoch": 7.04, + "learning_rate": 0.00016078182353214488, + "loss": 0.0994, + "step": 30630 + }, + { + "epoch": 7.05, + "learning_rate": 0.00016064243344123157, + "loss": 0.1117, + "step": 30660 + }, + { + "epoch": 7.06, + "learning_rate": 0.00016050304335031825, + "loss": 0.1151, + "step": 30690 + }, + { + "epoch": 7.06, + "learning_rate": 0.00016036365325940494, + "loss": 0.0941, + "step": 30720 + }, + { + "epoch": 7.07, + "learning_rate": 0.00016022426316849163, + "loss": 0.1159, + "step": 30750 + }, + { + "epoch": 7.08, + "learning_rate": 0.0001600848730775783, + "loss": 0.1002, + "step": 30780 + }, + { + "epoch": 7.09, + "learning_rate": 0.00015994548298666497, + "loss": 0.1088, + "step": 30810 + }, + { + "epoch": 7.09, + "learning_rate": 0.00015980609289575166, + "loss": 0.1133, + "step": 30840 + }, + { + "epoch": 7.1, + "learning_rate": 0.0001596667028048384, + "loss": 0.0936, + "step": 30870 + }, + { + "epoch": 7.11, + "learning_rate": 0.00015952731271392506, + "loss": 0.1099, + "step": 30900 + }, + { + "epoch": 7.11, + "learning_rate": 0.00015938792262301175, + "loss": 0.1003, + "step": 30930 + }, + { + "epoch": 7.12, + "learning_rate": 0.00015924853253209843, + "loss": 0.111, + "step": 30960 + }, + { + "epoch": 7.13, + "learning_rate": 0.00015910914244118512, + "loss": 0.1125, + "step": 30990 + }, + { + "epoch": 7.13, + "learning_rate": 0.0001589697523502718, + "loss": 0.0987, + "step": 31020 + }, + { + "epoch": 7.14, + "learning_rate": 0.0001588303622593585, + "loss": 0.1114, + "step": 31050 + }, + { + "epoch": 7.15, + "learning_rate": 0.00015869097216844518, + "loss": 0.0998, + "step": 31080 + }, + { + "epoch": 7.15, + "learning_rate": 0.00015855158207753187, + "loss": 0.1044, + "step": 31110 + }, + { + "epoch": 7.16, + "learning_rate": 0.00015841219198661855, + "loss": 0.1145, + "step": 31140 + }, + { + "epoch": 7.17, + "learning_rate": 0.00015827280189570524, + "loss": 0.0915, + "step": 31170 + }, + { + "epoch": 7.17, + "learning_rate": 0.0001581334118047919, + "loss": 0.1114, + "step": 31200 + }, + { + "epoch": 7.18, + "learning_rate": 0.00015799402171387858, + "loss": 0.0957, + "step": 31230 + }, + { + "epoch": 7.19, + "learning_rate": 0.00015785463162296527, + "loss": 0.1057, + "step": 31260 + }, + { + "epoch": 7.2, + "learning_rate": 0.00015771524153205196, + "loss": 0.1129, + "step": 31290 + }, + { + "epoch": 7.2, + "learning_rate": 0.00015757585144113864, + "loss": 0.0906, + "step": 31320 + }, + { + "epoch": 7.21, + "learning_rate": 0.00015743646135022533, + "loss": 0.1068, + "step": 31350 + }, + { + "epoch": 7.22, + "learning_rate": 0.00015729707125931202, + "loss": 0.0992, + "step": 31380 + }, + { + "epoch": 7.22, + "learning_rate": 0.0001571576811683987, + "loss": 0.1034, + "step": 31410 + }, + { + "epoch": 7.23, + "learning_rate": 0.0001570182910774854, + "loss": 0.1105, + "step": 31440 + }, + { + "epoch": 7.24, + "learning_rate": 0.00015687890098657208, + "loss": 0.0911, + "step": 31470 + }, + { + "epoch": 7.24, + "learning_rate": 0.00015673951089565874, + "loss": 0.1089, + "step": 31500 + }, + { + "epoch": 7.25, + "learning_rate": 0.00015660012080474542, + "loss": 0.0933, + "step": 31530 + }, + { + "epoch": 7.26, + "learning_rate": 0.0001564607307138321, + "loss": 0.108, + "step": 31560 + }, + { + "epoch": 7.26, + "learning_rate": 0.0001563213406229188, + "loss": 0.1101, + "step": 31590 + }, + { + "epoch": 7.27, + "learning_rate": 0.00015618195053200548, + "loss": 0.0945, + "step": 31620 + }, + { + "epoch": 7.28, + "learning_rate": 0.0001560425604410922, + "loss": 0.1037, + "step": 31650 + }, + { + "epoch": 7.29, + "learning_rate": 0.00015590317035017888, + "loss": 0.0973, + "step": 31680 + }, + { + "epoch": 7.29, + "learning_rate": 0.00015576378025926557, + "loss": 0.1068, + "step": 31710 + }, + { + "epoch": 7.3, + "learning_rate": 0.00015562439016835226, + "loss": 0.1131, + "step": 31740 + }, + { + "epoch": 7.31, + "learning_rate": 0.00015548500007743894, + "loss": 0.0841, + "step": 31770 + }, + { + "epoch": 7.31, + "learning_rate": 0.00015534560998652563, + "loss": 0.1081, + "step": 31800 + }, + { + "epoch": 7.32, + "learning_rate": 0.00015520621989561232, + "loss": 0.0989, + "step": 31830 + }, + { + "epoch": 7.33, + "learning_rate": 0.00015506682980469898, + "loss": 0.1006, + "step": 31860 + }, + { + "epoch": 7.33, + "learning_rate": 0.00015492743971378566, + "loss": 0.1049, + "step": 31890 + }, + { + "epoch": 7.34, + "learning_rate": 0.00015478804962287235, + "loss": 0.0871, + "step": 31920 + }, + { + "epoch": 7.35, + "learning_rate": 0.00015464865953195904, + "loss": 0.1031, + "step": 31950 + }, + { + "epoch": 7.35, + "learning_rate": 0.00015450926944104572, + "loss": 0.0962, + "step": 31980 + }, + { + "epoch": 7.36, + "learning_rate": 0.0001543698793501324, + "loss": 0.1047, + "step": 32010 + }, + { + "epoch": 7.37, + "learning_rate": 0.0001542304892592191, + "loss": 0.1098, + "step": 32040 + }, + { + "epoch": 7.37, + "learning_rate": 0.00015409109916830578, + "loss": 0.0904, + "step": 32070 + }, + { + "epoch": 7.38, + "learning_rate": 0.00015395170907739247, + "loss": 0.1052, + "step": 32100 + }, + { + "epoch": 7.39, + "learning_rate": 0.00015381231898647916, + "loss": 0.093, + "step": 32130 + }, + { + "epoch": 7.4, + "learning_rate": 0.00015367292889556581, + "loss": 0.1045, + "step": 32160 + }, + { + "epoch": 7.4, + "learning_rate": 0.0001535335388046525, + "loss": 0.1134, + "step": 32190 + }, + { + "epoch": 7.41, + "learning_rate": 0.0001533941487137392, + "loss": 0.0932, + "step": 32220 + }, + { + "epoch": 7.42, + "learning_rate": 0.00015325475862282587, + "loss": 0.1057, + "step": 32250 + }, + { + "epoch": 7.42, + "learning_rate": 0.00015311536853191256, + "loss": 0.0964, + "step": 32280 + }, + { + "epoch": 7.43, + "learning_rate": 0.00015297597844099925, + "loss": 0.1018, + "step": 32310 + }, + { + "epoch": 7.44, + "learning_rate": 0.00015283658835008593, + "loss": 0.1051, + "step": 32340 + }, + { + "epoch": 7.44, + "learning_rate": 0.00015269719825917262, + "loss": 0.0871, + "step": 32370 + }, + { + "epoch": 7.45, + "learning_rate": 0.0001525578081682593, + "loss": 0.1047, + "step": 32400 + }, + { + "epoch": 7.46, + "learning_rate": 0.000152418418077346, + "loss": 0.0962, + "step": 32430 + }, + { + "epoch": 7.46, + "learning_rate": 0.0001522790279864327, + "loss": 0.1053, + "step": 32460 + }, + { + "epoch": 7.47, + "learning_rate": 0.0001521396378955194, + "loss": 0.1062, + "step": 32490 + }, + { + "epoch": 7.48, + "learning_rate": 0.00015200024780460608, + "loss": 0.0886, + "step": 32520 + }, + { + "epoch": 7.49, + "learning_rate": 0.00015186085771369274, + "loss": 0.1059, + "step": 32550 + }, + { + "epoch": 7.49, + "learning_rate": 0.00015172146762277943, + "loss": 0.0954, + "step": 32580 + }, + { + "epoch": 7.5, + "learning_rate": 0.0001515820775318661, + "loss": 0.1018, + "step": 32610 + }, + { + "epoch": 7.51, + "learning_rate": 0.0001514426874409528, + "loss": 0.1059, + "step": 32640 + }, + { + "epoch": 7.51, + "learning_rate": 0.00015130329735003949, + "loss": 0.0874, + "step": 32670 + }, + { + "epoch": 7.52, + "learning_rate": 0.00015116390725912617, + "loss": 0.1055, + "step": 32700 + }, + { + "epoch": 7.53, + "learning_rate": 0.00015102451716821286, + "loss": 0.0934, + "step": 32730 + }, + { + "epoch": 7.53, + "learning_rate": 0.00015088512707729955, + "loss": 0.1005, + "step": 32760 + }, + { + "epoch": 7.54, + "learning_rate": 0.00015074573698638623, + "loss": 0.1111, + "step": 32790 + }, + { + "epoch": 7.55, + "learning_rate": 0.00015060634689547292, + "loss": 0.0878, + "step": 32820 + }, + { + "epoch": 7.55, + "learning_rate": 0.00015046695680455958, + "loss": 0.1033, + "step": 32850 + }, + { + "epoch": 7.56, + "learning_rate": 0.00015032756671364627, + "loss": 0.0893, + "step": 32880 + }, + { + "epoch": 7.57, + "learning_rate": 0.00015018817662273295, + "loss": 0.1015, + "step": 32910 + }, + { + "epoch": 7.58, + "learning_rate": 0.00015004878653181964, + "loss": 0.1094, + "step": 32940 + }, + { + "epoch": 7.58, + "learning_rate": 0.00014990939644090633, + "loss": 0.0877, + "step": 32970 + }, + { + "epoch": 7.59, + "learning_rate": 0.000149770006349993, + "loss": 0.1065, + "step": 33000 + }, + { + "epoch": 7.6, + "learning_rate": 0.0001496306162590797, + "loss": 0.0917, + "step": 33030 + }, + { + "epoch": 7.6, + "learning_rate": 0.00014949122616816638, + "loss": 0.1007, + "step": 33060 + }, + { + "epoch": 7.61, + "learning_rate": 0.00014935183607725307, + "loss": 0.1127, + "step": 33090 + }, + { + "epoch": 7.62, + "learning_rate": 0.00014921244598633976, + "loss": 0.0895, + "step": 33120 + }, + { + "epoch": 7.62, + "learning_rate": 0.00014907305589542644, + "loss": 0.1098, + "step": 33150 + }, + { + "epoch": 7.63, + "learning_rate": 0.00014893366580451313, + "loss": 0.0989, + "step": 33180 + }, + { + "epoch": 7.64, + "learning_rate": 0.00014879427571359982, + "loss": 0.1048, + "step": 33210 + }, + { + "epoch": 7.64, + "learning_rate": 0.0001486548856226865, + "loss": 0.1102, + "step": 33240 + }, + { + "epoch": 7.65, + "learning_rate": 0.0001485154955317732, + "loss": 0.0865, + "step": 33270 + }, + { + "epoch": 7.66, + "learning_rate": 0.00014837610544085988, + "loss": 0.1074, + "step": 33300 + }, + { + "epoch": 7.66, + "learning_rate": 0.00014823671534994654, + "loss": 0.0912, + "step": 33330 + }, + { + "epoch": 7.67, + "learning_rate": 0.00014809732525903322, + "loss": 0.1061, + "step": 33360 + }, + { + "epoch": 7.68, + "learning_rate": 0.0001479579351681199, + "loss": 0.1029, + "step": 33390 + }, + { + "epoch": 7.69, + "learning_rate": 0.0001478185450772066, + "loss": 0.093, + "step": 33420 + }, + { + "epoch": 7.69, + "learning_rate": 0.0001476791549862933, + "loss": 0.1068, + "step": 33450 + }, + { + "epoch": 7.7, + "learning_rate": 0.00014753976489538, + "loss": 0.096, + "step": 33480 + }, + { + "epoch": 7.71, + "learning_rate": 0.00014740037480446668, + "loss": 0.1056, + "step": 33510 + }, + { + "epoch": 7.71, + "learning_rate": 0.00014726098471355334, + "loss": 0.1061, + "step": 33540 + }, + { + "epoch": 7.72, + "learning_rate": 0.00014712159462264003, + "loss": 0.0887, + "step": 33570 + }, + { + "epoch": 7.73, + "learning_rate": 0.00014698220453172672, + "loss": 0.1091, + "step": 33600 + }, + { + "epoch": 7.73, + "learning_rate": 0.0001468428144408134, + "loss": 0.094, + "step": 33630 + }, + { + "epoch": 7.74, + "learning_rate": 0.0001467034243499001, + "loss": 0.1038, + "step": 33660 + }, + { + "epoch": 7.75, + "learning_rate": 0.00014656403425898678, + "loss": 0.1078, + "step": 33690 + }, + { + "epoch": 7.75, + "learning_rate": 0.00014642464416807346, + "loss": 0.0924, + "step": 33720 + }, + { + "epoch": 7.76, + "learning_rate": 0.00014628525407716015, + "loss": 0.1082, + "step": 33750 + }, + { + "epoch": 7.77, + "learning_rate": 0.00014614586398624684, + "loss": 0.0953, + "step": 33780 + }, + { + "epoch": 7.78, + "learning_rate": 0.00014600647389533352, + "loss": 0.0993, + "step": 33810 + }, + { + "epoch": 7.78, + "learning_rate": 0.0001458670838044202, + "loss": 0.106, + "step": 33840 + }, + { + "epoch": 7.79, + "learning_rate": 0.0001457276937135069, + "loss": 0.0892, + "step": 33870 + }, + { + "epoch": 7.8, + "learning_rate": 0.00014558830362259358, + "loss": 0.1088, + "step": 33900 + }, + { + "epoch": 7.8, + "learning_rate": 0.00014544891353168027, + "loss": 0.0932, + "step": 33930 + }, + { + "epoch": 7.81, + "learning_rate": 0.00014530952344076695, + "loss": 0.1034, + "step": 33960 + }, + { + "epoch": 7.82, + "learning_rate": 0.00014517013334985364, + "loss": 0.1179, + "step": 33990 + }, + { + "epoch": 7.82, + "learning_rate": 0.0001450307432589403, + "loss": 0.0968, + "step": 34020 + }, + { + "epoch": 7.83, + "learning_rate": 0.000144891353168027, + "loss": 0.1089, + "step": 34050 + }, + { + "epoch": 7.84, + "learning_rate": 0.00014475196307711367, + "loss": 0.0918, + "step": 34080 + }, + { + "epoch": 7.84, + "learning_rate": 0.00014461257298620036, + "loss": 0.1034, + "step": 34110 + }, + { + "epoch": 7.85, + "learning_rate": 0.00014447318289528705, + "loss": 0.1141, + "step": 34140 + }, + { + "epoch": 7.86, + "learning_rate": 0.00014433379280437373, + "loss": 0.085, + "step": 34170 + }, + { + "epoch": 7.86, + "learning_rate": 0.00014419440271346042, + "loss": 0.1063, + "step": 34200 + }, + { + "epoch": 7.87, + "learning_rate": 0.0001440550126225471, + "loss": 0.0956, + "step": 34230 + }, + { + "epoch": 7.88, + "learning_rate": 0.0001439156225316338, + "loss": 0.1042, + "step": 34260 + }, + { + "epoch": 7.89, + "learning_rate": 0.00014377623244072048, + "loss": 0.1145, + "step": 34290 + }, + { + "epoch": 7.89, + "learning_rate": 0.00014363684234980717, + "loss": 0.0916, + "step": 34320 + }, + { + "epoch": 7.9, + "learning_rate": 0.00014349745225889385, + "loss": 0.0978, + "step": 34350 + }, + { + "epoch": 7.91, + "learning_rate": 0.00014335806216798054, + "loss": 0.0932, + "step": 34380 + }, + { + "epoch": 7.91, + "learning_rate": 0.00014321867207706723, + "loss": 0.0997, + "step": 34410 + }, + { + "epoch": 7.92, + "learning_rate": 0.0001430792819861539, + "loss": 0.1126, + "step": 34440 + }, + { + "epoch": 7.93, + "learning_rate": 0.0001429398918952406, + "loss": 0.0943, + "step": 34470 + }, + { + "epoch": 7.93, + "learning_rate": 0.00014280050180432726, + "loss": 0.1053, + "step": 34500 + }, + { + "epoch": 7.94, + "learning_rate": 0.00014266111171341395, + "loss": 0.091, + "step": 34530 + }, + { + "epoch": 7.95, + "learning_rate": 0.00014252172162250063, + "loss": 0.0986, + "step": 34560 + }, + { + "epoch": 7.95, + "learning_rate": 0.00014238233153158732, + "loss": 0.1093, + "step": 34590 + }, + { + "epoch": 7.96, + "learning_rate": 0.00014224294144067403, + "loss": 0.0883, + "step": 34620 + }, + { + "epoch": 7.97, + "learning_rate": 0.00014210355134976072, + "loss": 0.1042, + "step": 34650 + }, + { + "epoch": 7.98, + "learning_rate": 0.00014196416125884738, + "loss": 0.0913, + "step": 34680 + }, + { + "epoch": 7.98, + "learning_rate": 0.00014182477116793407, + "loss": 0.1039, + "step": 34710 + }, + { + "epoch": 7.99, + "learning_rate": 0.00014168538107702075, + "loss": 0.1078, + "step": 34740 + }, + { + "epoch": 8.0, + "learning_rate": 0.00014154599098610744, + "loss": 0.0924, + "step": 34770 + }, + { + "epoch": 8.0, + "eval_cer": 0.03551954550110709, + "eval_loss": 0.1335287243127823, + "eval_runtime": 421.8608, + "eval_samples_per_second": 38.266, + "eval_steps_per_second": 2.392, + "eval_wer": 0.13151037260144166, + "step": 34788 + }, + { + "epoch": 8.0, + "learning_rate": 0.00014140660089519412, + "loss": 0.1036, + "step": 34800 + }, + { + "epoch": 8.01, + "learning_rate": 0.0001412672108042808, + "loss": 0.0932, + "step": 34830 + }, + { + "epoch": 8.02, + "learning_rate": 0.0001411278207133675, + "loss": 0.0995, + "step": 34860 + }, + { + "epoch": 8.02, + "learning_rate": 0.00014098843062245418, + "loss": 0.1045, + "step": 34890 + }, + { + "epoch": 8.03, + "learning_rate": 0.00014084904053154087, + "loss": 0.0845, + "step": 34920 + }, + { + "epoch": 8.04, + "learning_rate": 0.00014070965044062756, + "loss": 0.0967, + "step": 34950 + }, + { + "epoch": 8.04, + "learning_rate": 0.00014057026034971424, + "loss": 0.0932, + "step": 34980 + }, + { + "epoch": 8.05, + "learning_rate": 0.0001404308702588009, + "loss": 0.098, + "step": 35010 + }, + { + "epoch": 8.06, + "learning_rate": 0.00014029148016788762, + "loss": 0.106, + "step": 35040 + }, + { + "epoch": 8.06, + "learning_rate": 0.0001401520900769743, + "loss": 0.0891, + "step": 35070 + }, + { + "epoch": 8.07, + "learning_rate": 0.000140012699986061, + "loss": 0.1053, + "step": 35100 + }, + { + "epoch": 8.08, + "learning_rate": 0.00013987330989514768, + "loss": 0.0898, + "step": 35130 + }, + { + "epoch": 8.09, + "learning_rate": 0.00013973391980423436, + "loss": 0.0967, + "step": 35160 + }, + { + "epoch": 8.09, + "learning_rate": 0.00013959452971332102, + "loss": 0.0991, + "step": 35190 + }, + { + "epoch": 8.1, + "learning_rate": 0.0001394551396224077, + "loss": 0.0853, + "step": 35220 + }, + { + "epoch": 8.11, + "learning_rate": 0.0001393157495314944, + "loss": 0.0999, + "step": 35250 + }, + { + "epoch": 8.11, + "learning_rate": 0.00013918100577694486, + "loss": 0.0977, + "step": 35280 + }, + { + "epoch": 8.12, + "learning_rate": 0.00013904161568603155, + "loss": 0.1027, + "step": 35310 + }, + { + "epoch": 8.13, + "learning_rate": 0.00013890222559511824, + "loss": 0.1099, + "step": 35340 + }, + { + "epoch": 8.13, + "learning_rate": 0.00013876283550420492, + "loss": 0.0861, + "step": 35370 + }, + { + "epoch": 8.14, + "learning_rate": 0.0001386234454132916, + "loss": 0.1048, + "step": 35400 + }, + { + "epoch": 8.15, + "learning_rate": 0.0001384840553223783, + "loss": 0.0947, + "step": 35430 + }, + { + "epoch": 8.15, + "learning_rate": 0.00013834466523146498, + "loss": 0.0964, + "step": 35460 + }, + { + "epoch": 8.16, + "learning_rate": 0.00013820527514055167, + "loss": 0.1025, + "step": 35490 + }, + { + "epoch": 8.17, + "learning_rate": 0.00013806588504963835, + "loss": 0.0839, + "step": 35520 + }, + { + "epoch": 8.18, + "learning_rate": 0.00013792649495872504, + "loss": 0.1016, + "step": 35550 + }, + { + "epoch": 8.18, + "learning_rate": 0.00013778710486781173, + "loss": 0.0896, + "step": 35580 + }, + { + "epoch": 8.19, + "learning_rate": 0.0001376477147768984, + "loss": 0.0954, + "step": 35610 + }, + { + "epoch": 8.2, + "learning_rate": 0.00013750832468598507, + "loss": 0.1006, + "step": 35640 + }, + { + "epoch": 8.2, + "learning_rate": 0.00013736893459507176, + "loss": 0.0892, + "step": 35670 + }, + { + "epoch": 8.21, + "learning_rate": 0.00013722954450415845, + "loss": 0.1059, + "step": 35700 + }, + { + "epoch": 8.22, + "learning_rate": 0.00013709015441324516, + "loss": 0.0888, + "step": 35730 + }, + { + "epoch": 8.22, + "learning_rate": 0.00013695076432233185, + "loss": 0.0946, + "step": 35760 + }, + { + "epoch": 8.23, + "learning_rate": 0.0001368113742314185, + "loss": 0.1051, + "step": 35790 + }, + { + "epoch": 8.24, + "learning_rate": 0.0001366719841405052, + "loss": 0.0884, + "step": 35820 + }, + { + "epoch": 8.24, + "learning_rate": 0.00013653259404959188, + "loss": 0.1018, + "step": 35850 + }, + { + "epoch": 8.25, + "learning_rate": 0.00013639320395867857, + "loss": 0.0902, + "step": 35880 + }, + { + "epoch": 8.26, + "learning_rate": 0.00013625381386776525, + "loss": 0.0906, + "step": 35910 + }, + { + "epoch": 8.26, + "learning_rate": 0.00013611442377685194, + "loss": 0.1045, + "step": 35940 + }, + { + "epoch": 8.27, + "learning_rate": 0.00013597503368593863, + "loss": 0.0839, + "step": 35970 + }, + { + "epoch": 8.28, + "learning_rate": 0.0001358356435950253, + "loss": 0.094, + "step": 36000 + }, + { + "epoch": 8.29, + "learning_rate": 0.000135696253504112, + "loss": 0.0937, + "step": 36030 + }, + { + "epoch": 8.29, + "learning_rate": 0.00013555686341319869, + "loss": 0.0973, + "step": 36060 + }, + { + "epoch": 8.3, + "learning_rate": 0.00013541747332228535, + "loss": 0.1019, + "step": 36090 + }, + { + "epoch": 8.31, + "learning_rate": 0.00013527808323137206, + "loss": 0.086, + "step": 36120 + }, + { + "epoch": 8.31, + "learning_rate": 0.00013513869314045875, + "loss": 0.1026, + "step": 36150 + }, + { + "epoch": 8.32, + "learning_rate": 0.00013499930304954543, + "loss": 0.0922, + "step": 36180 + }, + { + "epoch": 8.33, + "learning_rate": 0.00013485991295863212, + "loss": 0.0994, + "step": 36210 + }, + { + "epoch": 8.33, + "learning_rate": 0.0001347205228677188, + "loss": 0.1057, + "step": 36240 + }, + { + "epoch": 8.34, + "learning_rate": 0.00013458113277680546, + "loss": 0.0842, + "step": 36270 + }, + { + "epoch": 8.35, + "learning_rate": 0.00013444174268589215, + "loss": 0.0973, + "step": 36300 + }, + { + "epoch": 8.35, + "learning_rate": 0.00013430235259497884, + "loss": 0.0907, + "step": 36330 + }, + { + "epoch": 8.36, + "learning_rate": 0.00013416296250406552, + "loss": 0.0967, + "step": 36360 + }, + { + "epoch": 8.37, + "learning_rate": 0.0001340235724131522, + "loss": 0.1056, + "step": 36390 + }, + { + "epoch": 8.38, + "learning_rate": 0.0001338841823222389, + "loss": 0.0879, + "step": 36420 + }, + { + "epoch": 8.38, + "learning_rate": 0.00013374479223132558, + "loss": 0.1004, + "step": 36450 + }, + { + "epoch": 8.39, + "learning_rate": 0.00013360540214041227, + "loss": 0.0931, + "step": 36480 + }, + { + "epoch": 8.4, + "learning_rate": 0.00013346601204949896, + "loss": 0.0998, + "step": 36510 + }, + { + "epoch": 8.4, + "learning_rate": 0.00013332662195858564, + "loss": 0.1044, + "step": 36540 + }, + { + "epoch": 8.41, + "learning_rate": 0.00013318723186767233, + "loss": 0.0884, + "step": 36570 + }, + { + "epoch": 8.42, + "learning_rate": 0.00013304784177675902, + "loss": 0.105, + "step": 36600 + }, + { + "epoch": 8.42, + "learning_rate": 0.0001329084516858457, + "loss": 0.0915, + "step": 36630 + }, + { + "epoch": 8.43, + "learning_rate": 0.0001327690615949324, + "loss": 0.0934, + "step": 36660 + }, + { + "epoch": 8.44, + "learning_rate": 0.00013262967150401908, + "loss": 0.1034, + "step": 36690 + }, + { + "epoch": 8.44, + "learning_rate": 0.00013249028141310576, + "loss": 0.0819, + "step": 36720 + }, + { + "epoch": 8.45, + "learning_rate": 0.00013235089132219245, + "loss": 0.0968, + "step": 36750 + }, + { + "epoch": 8.46, + "learning_rate": 0.0001322115012312791, + "loss": 0.091, + "step": 36780 + }, + { + "epoch": 8.46, + "learning_rate": 0.0001320721111403658, + "loss": 0.1009, + "step": 36810 + }, + { + "epoch": 8.47, + "learning_rate": 0.00013193272104945248, + "loss": 0.1069, + "step": 36840 + }, + { + "epoch": 8.48, + "learning_rate": 0.00013179333095853917, + "loss": 0.0871, + "step": 36870 + }, + { + "epoch": 8.49, + "learning_rate": 0.00013165394086762588, + "loss": 0.0968, + "step": 36900 + }, + { + "epoch": 8.49, + "learning_rate": 0.00013151455077671257, + "loss": 0.0917, + "step": 36930 + }, + { + "epoch": 8.5, + "learning_rate": 0.00013137516068579923, + "loss": 0.0961, + "step": 36960 + }, + { + "epoch": 8.51, + "learning_rate": 0.00013123577059488592, + "loss": 0.1048, + "step": 36990 + }, + { + "epoch": 8.51, + "learning_rate": 0.0001310963805039726, + "loss": 0.081, + "step": 37020 + }, + { + "epoch": 8.52, + "learning_rate": 0.0001309569904130593, + "loss": 0.1008, + "step": 37050 + }, + { + "epoch": 8.53, + "learning_rate": 0.00013081760032214598, + "loss": 0.0923, + "step": 37080 + }, + { + "epoch": 8.53, + "learning_rate": 0.00013067821023123266, + "loss": 0.0939, + "step": 37110 + }, + { + "epoch": 8.54, + "learning_rate": 0.00013053882014031935, + "loss": 0.1002, + "step": 37140 + }, + { + "epoch": 8.55, + "learning_rate": 0.00013039943004940604, + "loss": 0.0845, + "step": 37170 + }, + { + "epoch": 8.55, + "learning_rate": 0.00013026003995849272, + "loss": 0.0937, + "step": 37200 + }, + { + "epoch": 8.56, + "learning_rate": 0.0001301206498675794, + "loss": 0.0882, + "step": 37230 + }, + { + "epoch": 8.57, + "learning_rate": 0.00012998125977666607, + "loss": 0.0935, + "step": 37260 + }, + { + "epoch": 8.58, + "learning_rate": 0.00012984186968575278, + "loss": 0.1046, + "step": 37290 + }, + { + "epoch": 8.58, + "learning_rate": 0.00012970247959483947, + "loss": 0.0817, + "step": 37320 + }, + { + "epoch": 8.59, + "learning_rate": 0.00012956308950392615, + "loss": 0.1012, + "step": 37350 + }, + { + "epoch": 8.6, + "learning_rate": 0.00012942369941301284, + "loss": 0.0899, + "step": 37380 + }, + { + "epoch": 8.6, + "learning_rate": 0.00012928430932209953, + "loss": 0.0924, + "step": 37410 + }, + { + "epoch": 8.61, + "learning_rate": 0.0001291449192311862, + "loss": 0.1039, + "step": 37440 + }, + { + "epoch": 8.62, + "learning_rate": 0.00012900552914027287, + "loss": 0.0879, + "step": 37470 + }, + { + "epoch": 8.62, + "learning_rate": 0.00012886613904935956, + "loss": 0.098, + "step": 37500 + }, + { + "epoch": 8.63, + "learning_rate": 0.00012872674895844625, + "loss": 0.0888, + "step": 37530 + }, + { + "epoch": 8.64, + "learning_rate": 0.00012858735886753293, + "loss": 0.0886, + "step": 37560 + }, + { + "epoch": 8.64, + "learning_rate": 0.0001284526151129834, + "loss": 0.1049, + "step": 37590 + }, + { + "epoch": 8.65, + "learning_rate": 0.00012831322502207009, + "loss": 0.0822, + "step": 37620 + }, + { + "epoch": 8.66, + "learning_rate": 0.00012817383493115677, + "loss": 0.1014, + "step": 37650 + }, + { + "epoch": 8.67, + "learning_rate": 0.00012803444484024346, + "loss": 0.0866, + "step": 37680 + }, + { + "epoch": 8.67, + "learning_rate": 0.00012789970108569392, + "loss": 0.0923, + "step": 37710 + }, + { + "epoch": 8.68, + "learning_rate": 0.0001277603109947806, + "loss": 0.1016, + "step": 37740 + }, + { + "epoch": 8.69, + "learning_rate": 0.0001276209209038673, + "loss": 0.0839, + "step": 37770 + }, + { + "epoch": 8.69, + "learning_rate": 0.00012748617714931776, + "loss": 0.1052, + "step": 37800 + }, + { + "epoch": 8.7, + "learning_rate": 0.00012734678705840445, + "loss": 0.0901, + "step": 37830 + }, + { + "epoch": 8.71, + "learning_rate": 0.00012720739696749114, + "loss": 0.0943, + "step": 37860 + }, + { + "epoch": 8.71, + "learning_rate": 0.00012706800687657782, + "loss": 0.1123, + "step": 37890 + }, + { + "epoch": 8.72, + "learning_rate": 0.00012692861678566448, + "loss": 0.0836, + "step": 37920 + }, + { + "epoch": 8.73, + "learning_rate": 0.00012678922669475117, + "loss": 0.0985, + "step": 37950 + }, + { + "epoch": 8.73, + "learning_rate": 0.00012664983660383786, + "loss": 0.0895, + "step": 37980 + }, + { + "epoch": 8.74, + "learning_rate": 0.00012651044651292454, + "loss": 0.0918, + "step": 38010 + }, + { + "epoch": 8.75, + "learning_rate": 0.00012637105642201123, + "loss": 0.0962, + "step": 38040 + }, + { + "epoch": 8.75, + "learning_rate": 0.00012623166633109791, + "loss": 0.0852, + "step": 38070 + }, + { + "epoch": 8.76, + "learning_rate": 0.0001260922762401846, + "loss": 0.1046, + "step": 38100 + }, + { + "epoch": 8.77, + "learning_rate": 0.0001259528861492713, + "loss": 0.0877, + "step": 38130 + }, + { + "epoch": 8.78, + "learning_rate": 0.00012581349605835797, + "loss": 0.095, + "step": 38160 + }, + { + "epoch": 8.78, + "learning_rate": 0.00012567410596744466, + "loss": 0.0976, + "step": 38190 + }, + { + "epoch": 8.79, + "learning_rate": 0.00012553471587653135, + "loss": 0.0835, + "step": 38220 + }, + { + "epoch": 8.8, + "learning_rate": 0.00012539532578561803, + "loss": 0.0975, + "step": 38250 + }, + { + "epoch": 8.8, + "learning_rate": 0.00012525593569470472, + "loss": 0.0857, + "step": 38280 + }, + { + "epoch": 8.81, + "learning_rate": 0.0001251165456037914, + "loss": 0.0941, + "step": 38310 + }, + { + "epoch": 8.82, + "learning_rate": 0.0001249771555128781, + "loss": 0.1039, + "step": 38340 + }, + { + "epoch": 8.82, + "learning_rate": 0.00012483776542196478, + "loss": 0.085, + "step": 38370 + }, + { + "epoch": 8.83, + "learning_rate": 0.00012469837533105144, + "loss": 0.1022, + "step": 38400 + }, + { + "epoch": 8.84, + "learning_rate": 0.00012455898524013813, + "loss": 0.0894, + "step": 38430 + }, + { + "epoch": 8.84, + "learning_rate": 0.0001244195951492248, + "loss": 0.0935, + "step": 38460 + }, + { + "epoch": 8.85, + "learning_rate": 0.0001242802050583115, + "loss": 0.1008, + "step": 38490 + }, + { + "epoch": 8.86, + "learning_rate": 0.0001241408149673982, + "loss": 0.0745, + "step": 38520 + }, + { + "epoch": 8.87, + "learning_rate": 0.00012400142487648487, + "loss": 0.0978, + "step": 38550 + }, + { + "epoch": 8.87, + "learning_rate": 0.0001238620347855716, + "loss": 0.0877, + "step": 38580 + }, + { + "epoch": 8.88, + "learning_rate": 0.00012372264469465825, + "loss": 0.0916, + "step": 38610 + }, + { + "epoch": 8.89, + "learning_rate": 0.00012358325460374493, + "loss": 0.0998, + "step": 38640 + }, + { + "epoch": 8.89, + "learning_rate": 0.00012344386451283162, + "loss": 0.0861, + "step": 38670 + }, + { + "epoch": 8.9, + "learning_rate": 0.0001233044744219183, + "loss": 0.0977, + "step": 38700 + }, + { + "epoch": 8.91, + "learning_rate": 0.000123165084331005, + "loss": 0.094, + "step": 38730 + }, + { + "epoch": 8.91, + "learning_rate": 0.00012302569424009168, + "loss": 0.0949, + "step": 38760 + }, + { + "epoch": 8.92, + "learning_rate": 0.00012288630414917837, + "loss": 0.0994, + "step": 38790 + }, + { + "epoch": 8.93, + "learning_rate": 0.00012274691405826505, + "loss": 0.0842, + "step": 38820 + }, + { + "epoch": 8.93, + "learning_rate": 0.00012260752396735174, + "loss": 0.0933, + "step": 38850 + }, + { + "epoch": 8.94, + "learning_rate": 0.00012246813387643843, + "loss": 0.0891, + "step": 38880 + }, + { + "epoch": 8.95, + "learning_rate": 0.00012232874378552508, + "loss": 0.0931, + "step": 38910 + }, + { + "epoch": 8.95, + "learning_rate": 0.00012218935369461177, + "loss": 0.1044, + "step": 38940 + }, + { + "epoch": 8.96, + "learning_rate": 0.00012204996360369849, + "loss": 0.0814, + "step": 38970 + }, + { + "epoch": 8.97, + "learning_rate": 0.00012191057351278516, + "loss": 0.0934, + "step": 39000 + }, + { + "epoch": 8.98, + "learning_rate": 0.00012177118342187184, + "loss": 0.0832, + "step": 39030 + }, + { + "epoch": 8.98, + "learning_rate": 0.00012163179333095853, + "loss": 0.0923, + "step": 39060 + }, + { + "epoch": 8.99, + "learning_rate": 0.00012149240324004522, + "loss": 0.1046, + "step": 39090 + }, + { + "epoch": 9.0, + "learning_rate": 0.0001213530131491319, + "loss": 0.0835, + "step": 39120 + }, + { + "epoch": 9.0, + "eval_cer": 0.03841335129896225, + "eval_loss": 0.13283832371234894, + "eval_runtime": 421.3766, + "eval_samples_per_second": 38.31, + "eval_steps_per_second": 2.395, + "eval_wer": 0.1379877491624082, + "step": 39136 + }, + { + "epoch": 9.0, + "learning_rate": 0.00012121362305821858, + "loss": 0.1075, + "step": 39150 + }, + { + "epoch": 9.01, + "learning_rate": 0.00012107423296730526, + "loss": 0.0862, + "step": 39180 + }, + { + "epoch": 9.02, + "learning_rate": 0.00012093484287639195, + "loss": 0.0911, + "step": 39210 + }, + { + "epoch": 9.02, + "learning_rate": 0.00012079545278547864, + "loss": 0.0885, + "step": 39240 + }, + { + "epoch": 9.03, + "learning_rate": 0.00012065606269456532, + "loss": 0.0863, + "step": 39270 + }, + { + "epoch": 9.04, + "learning_rate": 0.00012051667260365201, + "loss": 0.0928, + "step": 39300 + }, + { + "epoch": 9.04, + "learning_rate": 0.00012037728251273868, + "loss": 0.091, + "step": 39330 + }, + { + "epoch": 9.05, + "learning_rate": 0.00012023789242182538, + "loss": 0.0878, + "step": 39360 + }, + { + "epoch": 9.06, + "learning_rate": 0.00012009850233091207, + "loss": 0.0918, + "step": 39390 + }, + { + "epoch": 9.07, + "learning_rate": 0.00011995911223999876, + "loss": 0.0784, + "step": 39420 + }, + { + "epoch": 9.07, + "learning_rate": 0.00011981972214908544, + "loss": 0.0982, + "step": 39450 + }, + { + "epoch": 9.08, + "learning_rate": 0.00011968033205817213, + "loss": 0.0849, + "step": 39480 + }, + { + "epoch": 9.09, + "learning_rate": 0.0001195409419672588, + "loss": 0.0878, + "step": 39510 + }, + { + "epoch": 9.09, + "learning_rate": 0.00011940155187634549, + "loss": 0.1017, + "step": 39540 + }, + { + "epoch": 9.1, + "learning_rate": 0.00011926216178543218, + "loss": 0.0822, + "step": 39570 + }, + { + "epoch": 9.11, + "learning_rate": 0.00011912277169451886, + "loss": 0.0951, + "step": 39600 + }, + { + "epoch": 9.11, + "learning_rate": 0.00011898338160360555, + "loss": 0.0921, + "step": 39630 + }, + { + "epoch": 9.12, + "learning_rate": 0.00011884399151269222, + "loss": 0.0913, + "step": 39660 + }, + { + "epoch": 9.13, + "learning_rate": 0.00011870460142177891, + "loss": 0.0959, + "step": 39690 + }, + { + "epoch": 9.13, + "learning_rate": 0.0001185652113308656, + "loss": 0.0786, + "step": 39720 + }, + { + "epoch": 9.14, + "learning_rate": 0.0001184258212399523, + "loss": 0.0947, + "step": 39750 + }, + { + "epoch": 9.15, + "learning_rate": 0.00011828643114903898, + "loss": 0.09, + "step": 39780 + }, + { + "epoch": 9.15, + "learning_rate": 0.00011814704105812567, + "loss": 0.0959, + "step": 39810 + }, + { + "epoch": 9.16, + "learning_rate": 0.00011800765096721234, + "loss": 0.0958, + "step": 39840 + }, + { + "epoch": 9.17, + "learning_rate": 0.00011786826087629903, + "loss": 0.0802, + "step": 39870 + }, + { + "epoch": 9.18, + "learning_rate": 0.00011772887078538571, + "loss": 0.0956, + "step": 39900 + }, + { + "epoch": 9.18, + "learning_rate": 0.0001175894806944724, + "loss": 0.0841, + "step": 39930 + }, + { + "epoch": 9.19, + "learning_rate": 0.00011745009060355909, + "loss": 0.0869, + "step": 39960 + }, + { + "epoch": 9.2, + "learning_rate": 0.00011731070051264576, + "loss": 0.0951, + "step": 39990 + }, + { + "epoch": 9.2, + "learning_rate": 0.00011717131042173245, + "loss": 0.0794, + "step": 40020 + }, + { + "epoch": 9.21, + "learning_rate": 0.00011703192033081913, + "loss": 0.097, + "step": 40050 + }, + { + "epoch": 9.22, + "learning_rate": 0.00011689253023990582, + "loss": 0.0963, + "step": 40080 + }, + { + "epoch": 9.22, + "learning_rate": 0.00011675314014899251, + "loss": 0.0905, + "step": 40110 + }, + { + "epoch": 9.23, + "learning_rate": 0.00011661375005807918, + "loss": 0.0991, + "step": 40140 + }, + { + "epoch": 9.24, + "learning_rate": 0.00011647435996716588, + "loss": 0.0828, + "step": 40170 + }, + { + "epoch": 9.24, + "learning_rate": 0.00011633496987625257, + "loss": 0.0973, + "step": 40200 + }, + { + "epoch": 9.25, + "learning_rate": 0.00011619557978533925, + "loss": 0.0916, + "step": 40230 + }, + { + "epoch": 9.26, + "learning_rate": 0.00011605618969442594, + "loss": 0.0923, + "step": 40260 + }, + { + "epoch": 9.27, + "learning_rate": 0.00011591679960351263, + "loss": 0.0964, + "step": 40290 + }, + { + "epoch": 9.27, + "learning_rate": 0.0001157774095125993, + "loss": 0.0823, + "step": 40320 + }, + { + "epoch": 9.28, + "learning_rate": 0.00011563801942168599, + "loss": 0.0919, + "step": 40350 + }, + { + "epoch": 9.29, + "learning_rate": 0.00011549862933077267, + "loss": 0.0884, + "step": 40380 + }, + { + "epoch": 9.29, + "learning_rate": 0.00011535923923985936, + "loss": 0.0943, + "step": 40410 + }, + { + "epoch": 9.3, + "learning_rate": 0.00011521984914894605, + "loss": 0.1047, + "step": 40440 + }, + { + "epoch": 9.31, + "learning_rate": 0.00011508045905803272, + "loss": 0.088, + "step": 40470 + }, + { + "epoch": 9.31, + "learning_rate": 0.0001149410689671194, + "loss": 0.0904, + "step": 40500 + }, + { + "epoch": 9.32, + "learning_rate": 0.00011480167887620609, + "loss": 0.0844, + "step": 40530 + }, + { + "epoch": 9.33, + "learning_rate": 0.00011466228878529279, + "loss": 0.0859, + "step": 40560 + }, + { + "epoch": 9.33, + "learning_rate": 0.00011452289869437948, + "loss": 0.0973, + "step": 40590 + }, + { + "epoch": 9.34, + "learning_rate": 0.00011438350860346617, + "loss": 0.0857, + "step": 40620 + }, + { + "epoch": 9.35, + "learning_rate": 0.00011424411851255285, + "loss": 0.0939, + "step": 40650 + }, + { + "epoch": 9.35, + "learning_rate": 0.00011410472842163953, + "loss": 0.0877, + "step": 40680 + }, + { + "epoch": 9.36, + "learning_rate": 0.00011396533833072621, + "loss": 0.0898, + "step": 40710 + }, + { + "epoch": 9.37, + "learning_rate": 0.0001138259482398129, + "loss": 0.1002, + "step": 40740 + }, + { + "epoch": 9.38, + "learning_rate": 0.00011368655814889958, + "loss": 0.085, + "step": 40770 + }, + { + "epoch": 9.38, + "learning_rate": 0.00011354716805798627, + "loss": 0.0958, + "step": 40800 + }, + { + "epoch": 9.39, + "learning_rate": 0.00011340777796707294, + "loss": 0.0823, + "step": 40830 + }, + { + "epoch": 9.4, + "learning_rate": 0.00011326838787615963, + "loss": 0.0916, + "step": 40860 + }, + { + "epoch": 9.4, + "learning_rate": 0.00011312899778524632, + "loss": 0.095, + "step": 40890 + }, + { + "epoch": 9.41, + "learning_rate": 0.000112989607694333, + "loss": 0.0798, + "step": 40920 + }, + { + "epoch": 9.42, + "learning_rate": 0.0001128502176034197, + "loss": 0.0978, + "step": 40950 + }, + { + "epoch": 9.42, + "learning_rate": 0.00011271082751250639, + "loss": 0.087, + "step": 40980 + }, + { + "epoch": 9.43, + "learning_rate": 0.00011257143742159306, + "loss": 0.092, + "step": 41010 + }, + { + "epoch": 9.44, + "learning_rate": 0.00011243204733067975, + "loss": 0.0992, + "step": 41040 + }, + { + "epoch": 9.44, + "learning_rate": 0.00011229265723976644, + "loss": 0.0798, + "step": 41070 + }, + { + "epoch": 9.45, + "learning_rate": 0.00011215326714885312, + "loss": 0.0947, + "step": 41100 + }, + { + "epoch": 9.46, + "learning_rate": 0.00011201387705793981, + "loss": 0.0919, + "step": 41130 + }, + { + "epoch": 9.47, + "learning_rate": 0.00011187448696702648, + "loss": 0.0901, + "step": 41160 + }, + { + "epoch": 9.47, + "learning_rate": 0.00011173509687611317, + "loss": 0.0969, + "step": 41190 + }, + { + "epoch": 9.48, + "learning_rate": 0.00011159570678519986, + "loss": 0.0821, + "step": 41220 + }, + { + "epoch": 9.49, + "learning_rate": 0.00011145631669428654, + "loss": 0.0937, + "step": 41250 + }, + { + "epoch": 9.49, + "learning_rate": 0.00011131692660337323, + "loss": 0.0849, + "step": 41280 + }, + { + "epoch": 9.5, + "learning_rate": 0.0001111775365124599, + "loss": 0.0917, + "step": 41310 + }, + { + "epoch": 9.51, + "learning_rate": 0.0001110381464215466, + "loss": 0.098, + "step": 41340 + }, + { + "epoch": 9.51, + "learning_rate": 0.00011089875633063329, + "loss": 0.0836, + "step": 41370 + }, + { + "epoch": 9.52, + "learning_rate": 0.00011075936623971998, + "loss": 0.0929, + "step": 41400 + }, + { + "epoch": 9.53, + "learning_rate": 0.00011061997614880666, + "loss": 0.0887, + "step": 41430 + }, + { + "epoch": 9.53, + "learning_rate": 0.00011048058605789335, + "loss": 0.0902, + "step": 41460 + }, + { + "epoch": 9.54, + "learning_rate": 0.00011034119596698002, + "loss": 0.1007, + "step": 41490 + }, + { + "epoch": 9.55, + "learning_rate": 0.00011020180587606671, + "loss": 0.0825, + "step": 41520 + }, + { + "epoch": 9.56, + "learning_rate": 0.0001100624157851534, + "loss": 0.0951, + "step": 41550 + }, + { + "epoch": 9.56, + "learning_rate": 0.00010992302569424008, + "loss": 0.0837, + "step": 41580 + }, + { + "epoch": 9.57, + "learning_rate": 0.00010978363560332677, + "loss": 0.0878, + "step": 41610 + }, + { + "epoch": 9.58, + "learning_rate": 0.00010964424551241344, + "loss": 0.1012, + "step": 41640 + }, + { + "epoch": 9.58, + "learning_rate": 0.00010950485542150013, + "loss": 0.0766, + "step": 41670 + }, + { + "epoch": 9.59, + "learning_rate": 0.00010936546533058681, + "loss": 0.0928, + "step": 41700 + }, + { + "epoch": 9.6, + "learning_rate": 0.00010922607523967351, + "loss": 0.0833, + "step": 41730 + }, + { + "epoch": 9.6, + "learning_rate": 0.0001090866851487602, + "loss": 0.0872, + "step": 41760 + }, + { + "epoch": 9.61, + "learning_rate": 0.00010894729505784689, + "loss": 0.1, + "step": 41790 + }, + { + "epoch": 9.62, + "learning_rate": 0.00010881255130329734, + "loss": 0.0814, + "step": 41820 + }, + { + "epoch": 9.62, + "learning_rate": 0.00010867316121238403, + "loss": 0.0883, + "step": 41850 + }, + { + "epoch": 9.63, + "learning_rate": 0.00010853377112147071, + "loss": 0.0872, + "step": 41880 + }, + { + "epoch": 9.64, + "learning_rate": 0.00010839438103055739, + "loss": 0.0906, + "step": 41910 + }, + { + "epoch": 9.64, + "learning_rate": 0.00010825499093964407, + "loss": 0.0993, + "step": 41940 + }, + { + "epoch": 9.65, + "learning_rate": 0.00010811560084873076, + "loss": 0.0814, + "step": 41970 + }, + { + "epoch": 9.66, + "learning_rate": 0.00010797621075781745, + "loss": 0.0956, + "step": 42000 + }, + { + "epoch": 9.67, + "learning_rate": 0.00010783682066690415, + "loss": 0.0893, + "step": 42030 + }, + { + "epoch": 9.67, + "learning_rate": 0.00010769743057599083, + "loss": 0.0898, + "step": 42060 + }, + { + "epoch": 9.68, + "learning_rate": 0.00010755804048507752, + "loss": 0.0943, + "step": 42090 + }, + { + "epoch": 9.69, + "learning_rate": 0.00010741865039416419, + "loss": 0.0815, + "step": 42120 + }, + { + "epoch": 9.69, + "learning_rate": 0.00010727926030325088, + "loss": 0.1163, + "step": 42150 + }, + { + "epoch": 9.7, + "learning_rate": 0.00010713987021233757, + "loss": 0.0932, + "step": 42180 + }, + { + "epoch": 9.71, + "learning_rate": 0.00010700048012142425, + "loss": 0.092, + "step": 42210 + }, + { + "epoch": 9.71, + "learning_rate": 0.00010686109003051094, + "loss": 0.1005, + "step": 42240 + }, + { + "epoch": 9.72, + "learning_rate": 0.00010672169993959761, + "loss": 0.0836, + "step": 42270 + }, + { + "epoch": 9.73, + "learning_rate": 0.0001065823098486843, + "loss": 0.098, + "step": 42300 + }, + { + "epoch": 9.73, + "learning_rate": 0.00010644291975777098, + "loss": 0.0877, + "step": 42330 + }, + { + "epoch": 9.74, + "learning_rate": 0.00010630352966685767, + "loss": 0.0917, + "step": 42360 + }, + { + "epoch": 9.75, + "learning_rate": 0.00010616413957594436, + "loss": 0.1019, + "step": 42390 + }, + { + "epoch": 9.76, + "learning_rate": 0.00010602474948503106, + "loss": 0.0855, + "step": 42420 + }, + { + "epoch": 9.76, + "learning_rate": 0.00010588535939411773, + "loss": 0.0911, + "step": 42450 + }, + { + "epoch": 9.77, + "learning_rate": 0.00010574596930320442, + "loss": 0.0856, + "step": 42480 + }, + { + "epoch": 9.78, + "learning_rate": 0.0001056065792122911, + "loss": 0.0878, + "step": 42510 + }, + { + "epoch": 9.78, + "learning_rate": 0.00010546718912137779, + "loss": 0.0996, + "step": 42540 + }, + { + "epoch": 9.79, + "learning_rate": 0.00010532779903046448, + "loss": 0.0845, + "step": 42570 + }, + { + "epoch": 9.8, + "learning_rate": 0.00010518840893955115, + "loss": 0.0914, + "step": 42600 + }, + { + "epoch": 9.8, + "learning_rate": 0.00010504901884863784, + "loss": 0.0888, + "step": 42630 + }, + { + "epoch": 9.81, + "learning_rate": 0.00010490962875772452, + "loss": 0.0901, + "step": 42660 + }, + { + "epoch": 9.82, + "learning_rate": 0.00010477023866681121, + "loss": 0.0987, + "step": 42690 + }, + { + "epoch": 9.82, + "learning_rate": 0.0001046308485758979, + "loss": 0.0761, + "step": 42720 + }, + { + "epoch": 9.83, + "learning_rate": 0.00010449145848498457, + "loss": 0.0926, + "step": 42750 + }, + { + "epoch": 9.84, + "learning_rate": 0.00010435206839407126, + "loss": 0.0904, + "step": 42780 + }, + { + "epoch": 9.84, + "learning_rate": 0.00010421267830315794, + "loss": 0.0877, + "step": 42810 + }, + { + "epoch": 9.85, + "learning_rate": 0.00010407328821224464, + "loss": 0.1015, + "step": 42840 + }, + { + "epoch": 9.86, + "learning_rate": 0.00010393389812133133, + "loss": 0.0811, + "step": 42870 + }, + { + "epoch": 9.87, + "learning_rate": 0.00010379450803041802, + "loss": 0.1015, + "step": 42900 + }, + { + "epoch": 9.87, + "learning_rate": 0.00010365511793950469, + "loss": 0.0822, + "step": 42930 + }, + { + "epoch": 9.88, + "learning_rate": 0.00010351572784859138, + "loss": 0.0925, + "step": 42960 + }, + { + "epoch": 9.89, + "learning_rate": 0.00010337633775767806, + "loss": 0.1004, + "step": 42990 + }, + { + "epoch": 9.89, + "learning_rate": 0.00010323694766676475, + "loss": 0.0792, + "step": 43020 + }, + { + "epoch": 9.9, + "learning_rate": 0.00010309755757585144, + "loss": 0.0937, + "step": 43050 + }, + { + "epoch": 9.91, + "learning_rate": 0.00010295816748493811, + "loss": 0.0852, + "step": 43080 + }, + { + "epoch": 9.91, + "learning_rate": 0.0001028187773940248, + "loss": 0.0859, + "step": 43110 + }, + { + "epoch": 9.92, + "learning_rate": 0.00010267938730311148, + "loss": 0.0942, + "step": 43140 + }, + { + "epoch": 9.93, + "learning_rate": 0.00010253999721219817, + "loss": 0.0817, + "step": 43170 + }, + { + "epoch": 9.93, + "learning_rate": 0.00010240060712128485, + "loss": 0.0911, + "step": 43200 + }, + { + "epoch": 9.94, + "learning_rate": 0.00010226121703037155, + "loss": 0.0852, + "step": 43230 + }, + { + "epoch": 9.95, + "learning_rate": 0.00010212182693945823, + "loss": 0.0871, + "step": 43260 + }, + { + "epoch": 9.96, + "learning_rate": 0.00010198243684854491, + "loss": 0.0982, + "step": 43290 + }, + { + "epoch": 9.96, + "learning_rate": 0.0001018430467576316, + "loss": 0.0759, + "step": 43320 + }, + { + "epoch": 9.97, + "learning_rate": 0.00010170365666671829, + "loss": 0.0915, + "step": 43350 + }, + { + "epoch": 9.98, + "learning_rate": 0.00010156426657580497, + "loss": 0.0824, + "step": 43380 + }, + { + "epoch": 9.98, + "learning_rate": 0.00010142487648489166, + "loss": 0.0844, + "step": 43410 + }, + { + "epoch": 9.99, + "learning_rate": 0.00010128548639397833, + "loss": 0.0942, + "step": 43440 + }, + { + "epoch": 10.0, + "learning_rate": 0.00010114609630306502, + "loss": 0.0775, + "step": 43470 + }, + { + "epoch": 10.0, + "eval_cer": 0.03279810730523446, + "eval_loss": 0.1231892928481102, + "eval_runtime": 422.7073, + "eval_samples_per_second": 38.19, + "eval_steps_per_second": 2.387, + "eval_wer": 0.122921249450066, + "step": 43485 + }, + { + "epoch": 10.0, + "learning_rate": 0.00010100670621215171, + "loss": 0.0946, + "step": 43500 + }, + { + "epoch": 10.01, + "learning_rate": 0.0001008673161212384, + "loss": 0.0801, + "step": 43530 + }, + { + "epoch": 10.02, + "learning_rate": 0.00010072792603032508, + "loss": 0.0845, + "step": 43560 + }, + { + "epoch": 10.02, + "learning_rate": 0.00010058853593941175, + "loss": 0.097, + "step": 43590 + }, + { + "epoch": 10.03, + "learning_rate": 0.00010044914584849845, + "loss": 0.0771, + "step": 43620 + }, + { + "epoch": 10.04, + "learning_rate": 0.00010030975575758514, + "loss": 0.0906, + "step": 43650 + }, + { + "epoch": 10.04, + "learning_rate": 0.00010017036566667183, + "loss": 0.0877, + "step": 43680 + }, + { + "epoch": 10.05, + "learning_rate": 0.00010003097557575851, + "loss": 0.0816, + "step": 43710 + }, + { + "epoch": 10.06, + "learning_rate": 9.98915854848452e-05, + "loss": 0.0962, + "step": 43740 + }, + { + "epoch": 10.07, + "learning_rate": 9.975219539393187e-05, + "loss": 0.0791, + "step": 43770 + }, + { + "epoch": 10.07, + "learning_rate": 9.961280530301856e-05, + "loss": 0.0894, + "step": 43800 + }, + { + "epoch": 10.08, + "learning_rate": 9.947341521210525e-05, + "loss": 0.085, + "step": 43830 + }, + { + "epoch": 10.09, + "learning_rate": 9.933402512119193e-05, + "loss": 0.0863, + "step": 43860 + }, + { + "epoch": 10.09, + "learning_rate": 9.919463503027862e-05, + "loss": 0.0919, + "step": 43890 + }, + { + "epoch": 10.1, + "learning_rate": 9.905524493936529e-05, + "loss": 0.076, + "step": 43920 + }, + { + "epoch": 10.11, + "learning_rate": 9.891585484845198e-05, + "loss": 0.083, + "step": 43950 + }, + { + "epoch": 10.11, + "learning_rate": 9.877646475753866e-05, + "loss": 0.0826, + "step": 43980 + }, + { + "epoch": 10.12, + "learning_rate": 9.863707466662537e-05, + "loss": 0.0808, + "step": 44010 + }, + { + "epoch": 10.13, + "learning_rate": 9.849768457571205e-05, + "loss": 0.0938, + "step": 44040 + }, + { + "epoch": 10.13, + "learning_rate": 9.835829448479874e-05, + "loss": 0.0765, + "step": 44070 + }, + { + "epoch": 10.14, + "learning_rate": 9.821890439388541e-05, + "loss": 0.092, + "step": 44100 + }, + { + "epoch": 10.15, + "learning_rate": 9.80795143029721e-05, + "loss": 0.0835, + "step": 44130 + }, + { + "epoch": 10.16, + "learning_rate": 9.794012421205878e-05, + "loss": 0.085, + "step": 44160 + }, + { + "epoch": 10.16, + "learning_rate": 9.780073412114547e-05, + "loss": 0.0937, + "step": 44190 + }, + { + "epoch": 10.17, + "learning_rate": 9.766134403023216e-05, + "loss": 0.0774, + "step": 44220 + }, + { + "epoch": 10.18, + "learning_rate": 9.752195393931883e-05, + "loss": 0.0912, + "step": 44250 + }, + { + "epoch": 10.18, + "learning_rate": 9.738256384840552e-05, + "loss": 0.0862, + "step": 44280 + }, + { + "epoch": 10.19, + "learning_rate": 9.72431737574922e-05, + "loss": 0.0867, + "step": 44310 + }, + { + "epoch": 10.2, + "learning_rate": 9.710378366657889e-05, + "loss": 0.0882, + "step": 44340 + }, + { + "epoch": 10.2, + "learning_rate": 9.696439357566558e-05, + "loss": 0.0782, + "step": 44370 + }, + { + "epoch": 10.21, + "learning_rate": 9.682500348475228e-05, + "loss": 0.0874, + "step": 44400 + }, + { + "epoch": 10.22, + "learning_rate": 9.668561339383895e-05, + "loss": 0.0817, + "step": 44430 + }, + { + "epoch": 10.22, + "learning_rate": 9.654622330292564e-05, + "loss": 0.0845, + "step": 44460 + }, + { + "epoch": 10.23, + "learning_rate": 9.640683321201232e-05, + "loss": 0.0949, + "step": 44490 + }, + { + "epoch": 10.24, + "learning_rate": 9.626744312109901e-05, + "loss": 0.0776, + "step": 44520 + }, + { + "epoch": 10.24, + "learning_rate": 9.61280530301857e-05, + "loss": 0.0851, + "step": 44550 + }, + { + "epoch": 10.25, + "learning_rate": 9.599330927563615e-05, + "loss": 0.0821, + "step": 44580 + }, + { + "epoch": 10.26, + "learning_rate": 9.585391918472283e-05, + "loss": 0.0812, + "step": 44610 + }, + { + "epoch": 10.27, + "learning_rate": 9.571452909380952e-05, + "loss": 0.0909, + "step": 44640 + }, + { + "epoch": 10.27, + "learning_rate": 9.55751390028962e-05, + "loss": 0.0771, + "step": 44670 + }, + { + "epoch": 10.28, + "learning_rate": 9.54357489119829e-05, + "loss": 0.0865, + "step": 44700 + }, + { + "epoch": 10.29, + "learning_rate": 9.529635882106958e-05, + "loss": 0.0815, + "step": 44730 + }, + { + "epoch": 10.29, + "learning_rate": 9.515696873015627e-05, + "loss": 0.0859, + "step": 44760 + }, + { + "epoch": 10.3, + "learning_rate": 9.501757863924295e-05, + "loss": 0.0913, + "step": 44790 + }, + { + "epoch": 10.31, + "learning_rate": 9.487818854832964e-05, + "loss": 0.0747, + "step": 44820 + }, + { + "epoch": 10.31, + "learning_rate": 9.473879845741631e-05, + "loss": 0.086, + "step": 44850 + }, + { + "epoch": 10.32, + "learning_rate": 9.4599408366503e-05, + "loss": 0.0891, + "step": 44880 + }, + { + "epoch": 10.33, + "learning_rate": 9.446001827558969e-05, + "loss": 0.0846, + "step": 44910 + }, + { + "epoch": 10.33, + "learning_rate": 9.432062818467637e-05, + "loss": 0.0941, + "step": 44940 + }, + { + "epoch": 10.34, + "learning_rate": 9.418123809376306e-05, + "loss": 0.0736, + "step": 44970 + }, + { + "epoch": 10.35, + "learning_rate": 9.404184800284975e-05, + "loss": 0.0868, + "step": 45000 + }, + { + "epoch": 10.36, + "learning_rate": 9.390245791193642e-05, + "loss": 0.0852, + "step": 45030 + }, + { + "epoch": 10.36, + "learning_rate": 9.37630678210231e-05, + "loss": 0.0795, + "step": 45060 + }, + { + "epoch": 10.37, + "learning_rate": 9.36236777301098e-05, + "loss": 0.0967, + "step": 45090 + }, + { + "epoch": 10.38, + "learning_rate": 9.348428763919649e-05, + "loss": 0.0789, + "step": 45120 + }, + { + "epoch": 10.38, + "learning_rate": 9.334489754828318e-05, + "loss": 0.0891, + "step": 45150 + }, + { + "epoch": 10.39, + "learning_rate": 9.320550745736987e-05, + "loss": 0.0804, + "step": 45180 + }, + { + "epoch": 10.4, + "learning_rate": 9.306611736645654e-05, + "loss": 0.0873, + "step": 45210 + }, + { + "epoch": 10.4, + "learning_rate": 9.292672727554323e-05, + "loss": 0.0901, + "step": 45240 + }, + { + "epoch": 10.41, + "learning_rate": 9.278733718462991e-05, + "loss": 0.0757, + "step": 45270 + }, + { + "epoch": 10.42, + "learning_rate": 9.26479470937166e-05, + "loss": 0.0934, + "step": 45300 + }, + { + "epoch": 10.42, + "learning_rate": 9.250855700280329e-05, + "loss": 0.0832, + "step": 45330 + }, + { + "epoch": 10.43, + "learning_rate": 9.236916691188996e-05, + "loss": 0.0863, + "step": 45360 + }, + { + "epoch": 10.44, + "learning_rate": 9.222977682097665e-05, + "loss": 0.0926, + "step": 45390 + }, + { + "epoch": 10.44, + "learning_rate": 9.209038673006333e-05, + "loss": 0.0784, + "step": 45420 + }, + { + "epoch": 10.45, + "learning_rate": 9.195099663915002e-05, + "loss": 0.0869, + "step": 45450 + }, + { + "epoch": 10.46, + "learning_rate": 9.18116065482367e-05, + "loss": 0.0869, + "step": 45480 + }, + { + "epoch": 10.47, + "learning_rate": 9.16722164573234e-05, + "loss": 0.0816, + "step": 45510 + }, + { + "epoch": 10.47, + "learning_rate": 9.153282636641008e-05, + "loss": 0.0915, + "step": 45540 + }, + { + "epoch": 10.48, + "learning_rate": 9.139343627549676e-05, + "loss": 0.0758, + "step": 45570 + }, + { + "epoch": 10.49, + "learning_rate": 9.125404618458345e-05, + "loss": 0.0874, + "step": 45600 + }, + { + "epoch": 10.49, + "learning_rate": 9.111465609367014e-05, + "loss": 0.0836, + "step": 45630 + }, + { + "epoch": 10.5, + "learning_rate": 9.097526600275682e-05, + "loss": 0.0789, + "step": 45660 + }, + { + "epoch": 10.51, + "learning_rate": 9.08358759118435e-05, + "loss": 0.09, + "step": 45690 + }, + { + "epoch": 10.51, + "learning_rate": 9.069648582093018e-05, + "loss": 0.0752, + "step": 45720 + }, + { + "epoch": 10.52, + "learning_rate": 9.055709573001687e-05, + "loss": 0.085, + "step": 45750 + }, + { + "epoch": 10.53, + "learning_rate": 9.041770563910356e-05, + "loss": 0.08, + "step": 45780 + }, + { + "epoch": 10.53, + "learning_rate": 9.027831554819024e-05, + "loss": 0.0804, + "step": 45810 + }, + { + "epoch": 10.54, + "learning_rate": 9.013892545727692e-05, + "loss": 0.095, + "step": 45840 + }, + { + "epoch": 10.55, + "learning_rate": 8.99995353663636e-05, + "loss": 0.0761, + "step": 45870 + }, + { + "epoch": 10.56, + "learning_rate": 8.98601452754503e-05, + "loss": 0.0869, + "step": 45900 + }, + { + "epoch": 10.56, + "learning_rate": 8.972075518453699e-05, + "loss": 0.081, + "step": 45930 + }, + { + "epoch": 10.57, + "learning_rate": 8.958136509362368e-05, + "loss": 0.0831, + "step": 45960 + }, + { + "epoch": 10.58, + "learning_rate": 8.944197500271036e-05, + "loss": 0.0929, + "step": 45990 + }, + { + "epoch": 10.58, + "learning_rate": 8.930258491179704e-05, + "loss": 0.0774, + "step": 46020 + }, + { + "epoch": 10.59, + "learning_rate": 8.916319482088372e-05, + "loss": 0.0874, + "step": 46050 + }, + { + "epoch": 10.6, + "learning_rate": 8.902380472997041e-05, + "loss": 0.0843, + "step": 46080 + }, + { + "epoch": 10.6, + "learning_rate": 8.88844146390571e-05, + "loss": 0.0829, + "step": 46110 + }, + { + "epoch": 10.61, + "learning_rate": 8.874502454814378e-05, + "loss": 0.0923, + "step": 46140 + }, + { + "epoch": 10.62, + "learning_rate": 8.860563445723046e-05, + "loss": 0.0798, + "step": 46170 + }, + { + "epoch": 10.62, + "learning_rate": 8.846624436631714e-05, + "loss": 0.0899, + "step": 46200 + }, + { + "epoch": 10.63, + "learning_rate": 8.832685427540383e-05, + "loss": 0.0872, + "step": 46230 + }, + { + "epoch": 10.64, + "learning_rate": 8.818746418449052e-05, + "loss": 0.0808, + "step": 46260 + }, + { + "epoch": 10.65, + "learning_rate": 8.804807409357722e-05, + "loss": 0.0891, + "step": 46290 + }, + { + "epoch": 10.65, + "learning_rate": 8.79086840026639e-05, + "loss": 0.076, + "step": 46320 + }, + { + "epoch": 10.66, + "learning_rate": 8.776929391175059e-05, + "loss": 0.0887, + "step": 46350 + }, + { + "epoch": 10.67, + "learning_rate": 8.762990382083726e-05, + "loss": 0.0812, + "step": 46380 + }, + { + "epoch": 10.67, + "learning_rate": 8.749051372992395e-05, + "loss": 0.0833, + "step": 46410 + }, + { + "epoch": 10.68, + "learning_rate": 8.735112363901063e-05, + "loss": 0.0908, + "step": 46440 + }, + { + "epoch": 10.69, + "learning_rate": 8.721173354809732e-05, + "loss": 0.0744, + "step": 46470 + }, + { + "epoch": 10.69, + "learning_rate": 8.707234345718401e-05, + "loss": 0.0896, + "step": 46500 + }, + { + "epoch": 10.7, + "learning_rate": 8.693295336627068e-05, + "loss": 0.0833, + "step": 46530 + }, + { + "epoch": 10.71, + "learning_rate": 8.679356327535737e-05, + "loss": 0.0796, + "step": 46560 + }, + { + "epoch": 10.71, + "learning_rate": 8.665417318444405e-05, + "loss": 0.0907, + "step": 46590 + }, + { + "epoch": 10.72, + "learning_rate": 8.651478309353074e-05, + "loss": 0.0735, + "step": 46620 + }, + { + "epoch": 10.73, + "learning_rate": 8.637539300261743e-05, + "loss": 0.0851, + "step": 46650 + }, + { + "epoch": 10.73, + "learning_rate": 8.623600291170413e-05, + "loss": 0.0805, + "step": 46680 + }, + { + "epoch": 10.74, + "learning_rate": 8.60966128207908e-05, + "loss": 0.0818, + "step": 46710 + }, + { + "epoch": 10.75, + "learning_rate": 8.595722272987749e-05, + "loss": 0.0887, + "step": 46740 + }, + { + "epoch": 10.76, + "learning_rate": 8.581783263896417e-05, + "loss": 0.0771, + "step": 46770 + }, + { + "epoch": 10.76, + "learning_rate": 8.567844254805086e-05, + "loss": 0.0893, + "step": 46800 + }, + { + "epoch": 10.77, + "learning_rate": 8.553905245713755e-05, + "loss": 0.0786, + "step": 46830 + }, + { + "epoch": 10.78, + "learning_rate": 8.539966236622422e-05, + "loss": 0.0799, + "step": 46860 + }, + { + "epoch": 10.78, + "learning_rate": 8.52602722753109e-05, + "loss": 0.093, + "step": 46890 + }, + { + "epoch": 10.79, + "learning_rate": 8.512088218439759e-05, + "loss": 0.074, + "step": 46920 + }, + { + "epoch": 10.8, + "learning_rate": 8.498149209348428e-05, + "loss": 0.0812, + "step": 46950 + }, + { + "epoch": 10.8, + "learning_rate": 8.484210200257097e-05, + "loss": 0.0786, + "step": 46980 + }, + { + "epoch": 10.81, + "learning_rate": 8.470271191165764e-05, + "loss": 0.0775, + "step": 47010 + }, + { + "epoch": 10.82, + "learning_rate": 8.456332182074433e-05, + "loss": 0.0903, + "step": 47040 + }, + { + "epoch": 10.82, + "learning_rate": 8.442393172983103e-05, + "loss": 0.0725, + "step": 47070 + }, + { + "epoch": 10.83, + "learning_rate": 8.428454163891771e-05, + "loss": 0.081, + "step": 47100 + }, + { + "epoch": 10.84, + "learning_rate": 8.41451515480044e-05, + "loss": 0.0829, + "step": 47130 + }, + { + "epoch": 10.85, + "learning_rate": 8.400576145709109e-05, + "loss": 0.0781, + "step": 47160 + }, + { + "epoch": 10.85, + "learning_rate": 8.386637136617776e-05, + "loss": 0.0822, + "step": 47190 + }, + { + "epoch": 10.86, + "learning_rate": 8.372698127526445e-05, + "loss": 0.0815, + "step": 47220 + }, + { + "epoch": 10.87, + "learning_rate": 8.358759118435113e-05, + "loss": 0.0867, + "step": 47250 + }, + { + "epoch": 10.87, + "learning_rate": 8.344820109343782e-05, + "loss": 0.0807, + "step": 47280 + }, + { + "epoch": 10.88, + "learning_rate": 8.33088110025245e-05, + "loss": 0.0843, + "step": 47310 + }, + { + "epoch": 10.89, + "learning_rate": 8.316942091161118e-05, + "loss": 0.0879, + "step": 47340 + }, + { + "epoch": 10.89, + "learning_rate": 8.303003082069786e-05, + "loss": 0.0745, + "step": 47370 + }, + { + "epoch": 10.9, + "learning_rate": 8.289064072978455e-05, + "loss": 0.0905, + "step": 47400 + }, + { + "epoch": 10.91, + "learning_rate": 8.275125063887124e-05, + "loss": 0.076, + "step": 47430 + }, + { + "epoch": 10.91, + "learning_rate": 8.261186054795792e-05, + "loss": 0.079, + "step": 47460 + }, + { + "epoch": 10.92, + "learning_rate": 8.247247045704462e-05, + "loss": 0.087, + "step": 47490 + }, + { + "epoch": 10.93, + "learning_rate": 8.233308036613131e-05, + "loss": 0.0745, + "step": 47520 + }, + { + "epoch": 10.93, + "learning_rate": 8.219369027521798e-05, + "loss": 0.0855, + "step": 47550 + }, + { + "epoch": 10.94, + "learning_rate": 8.205430018430467e-05, + "loss": 0.0774, + "step": 47580 + }, + { + "epoch": 10.95, + "learning_rate": 8.191491009339136e-05, + "loss": 0.083, + "step": 47610 + }, + { + "epoch": 10.96, + "learning_rate": 8.177552000247804e-05, + "loss": 0.0888, + "step": 47640 + }, + { + "epoch": 10.96, + "learning_rate": 8.163612991156473e-05, + "loss": 0.0767, + "step": 47670 + }, + { + "epoch": 10.97, + "learning_rate": 8.14967398206514e-05, + "loss": 0.084, + "step": 47700 + }, + { + "epoch": 10.98, + "learning_rate": 8.135734972973809e-05, + "loss": 0.0802, + "step": 47730 + }, + { + "epoch": 10.98, + "learning_rate": 8.121795963882478e-05, + "loss": 0.0825, + "step": 47760 + }, + { + "epoch": 10.99, + "learning_rate": 8.107856954791146e-05, + "loss": 0.096, + "step": 47790 + }, + { + "epoch": 11.0, + "learning_rate": 8.093917945699815e-05, + "loss": 0.0752, + "step": 47820 + }, + { + "epoch": 11.0, + "eval_cer": 0.030907973429780394, + "eval_loss": 0.12198271602392197, + "eval_runtime": 425.2535, + "eval_samples_per_second": 37.961, + "eval_steps_per_second": 2.373, + "eval_wer": 0.11740498832447799, + "step": 47833 + }, + { + "epoch": 11.0, + "learning_rate": 8.079978936608482e-05, + "loss": 0.0844, + "step": 47850 + }, + { + "epoch": 11.01, + "learning_rate": 8.066039927517152e-05, + "loss": 0.082, + "step": 47880 + }, + { + "epoch": 11.02, + "learning_rate": 8.052100918425821e-05, + "loss": 0.0763, + "step": 47910 + }, + { + "epoch": 11.02, + "learning_rate": 8.03816190933449e-05, + "loss": 0.082, + "step": 47940 + }, + { + "epoch": 11.03, + "learning_rate": 8.024222900243158e-05, + "loss": 0.0735, + "step": 47970 + }, + { + "epoch": 11.04, + "learning_rate": 8.010283891151827e-05, + "loss": 0.0882, + "step": 48000 + }, + { + "epoch": 11.05, + "learning_rate": 7.996344882060494e-05, + "loss": 0.0814, + "step": 48030 + }, + { + "epoch": 11.05, + "learning_rate": 7.982405872969163e-05, + "loss": 0.0771, + "step": 48060 + }, + { + "epoch": 11.06, + "learning_rate": 7.968466863877832e-05, + "loss": 0.0844, + "step": 48090 + }, + { + "epoch": 11.07, + "learning_rate": 7.9545278547865e-05, + "loss": 0.0721, + "step": 48120 + }, + { + "epoch": 11.07, + "learning_rate": 7.940588845695169e-05, + "loss": 0.0869, + "step": 48150 + }, + { + "epoch": 11.08, + "learning_rate": 7.926649836603836e-05, + "loss": 0.0809, + "step": 48180 + }, + { + "epoch": 11.09, + "learning_rate": 7.912710827512505e-05, + "loss": 0.0771, + "step": 48210 + }, + { + "epoch": 11.09, + "learning_rate": 7.898771818421173e-05, + "loss": 0.0812, + "step": 48240 + }, + { + "epoch": 11.1, + "learning_rate": 7.884832809329843e-05, + "loss": 0.0702, + "step": 48270 + }, + { + "epoch": 11.11, + "learning_rate": 7.870893800238512e-05, + "loss": 0.0827, + "step": 48300 + }, + { + "epoch": 11.11, + "learning_rate": 7.856954791147181e-05, + "loss": 0.0796, + "step": 48330 + }, + { + "epoch": 11.12, + "learning_rate": 7.843015782055848e-05, + "loss": 0.0746, + "step": 48360 + }, + { + "epoch": 11.13, + "learning_rate": 7.829076772964517e-05, + "loss": 0.0898, + "step": 48390 + }, + { + "epoch": 11.13, + "learning_rate": 7.815137763873185e-05, + "loss": 0.0707, + "step": 48420 + }, + { + "epoch": 11.14, + "learning_rate": 7.801198754781854e-05, + "loss": 0.0847, + "step": 48450 + }, + { + "epoch": 11.15, + "learning_rate": 7.787259745690523e-05, + "loss": 0.0761, + "step": 48480 + }, + { + "epoch": 11.16, + "learning_rate": 7.77332073659919e-05, + "loss": 0.0781, + "step": 48510 + }, + { + "epoch": 11.16, + "learning_rate": 7.759381727507859e-05, + "loss": 0.0865, + "step": 48540 + }, + { + "epoch": 11.17, + "learning_rate": 7.745442718416527e-05, + "loss": 0.0728, + "step": 48570 + }, + { + "epoch": 11.18, + "learning_rate": 7.731503709325196e-05, + "loss": 0.0816, + "step": 48600 + }, + { + "epoch": 11.18, + "learning_rate": 7.717564700233865e-05, + "loss": 0.0755, + "step": 48630 + }, + { + "epoch": 11.19, + "learning_rate": 7.703625691142535e-05, + "loss": 0.082, + "step": 48660 + }, + { + "epoch": 11.2, + "learning_rate": 7.689686682051202e-05, + "loss": 0.0799, + "step": 48690 + }, + { + "epoch": 11.2, + "learning_rate": 7.67574767295987e-05, + "loss": 0.0714, + "step": 48720 + }, + { + "epoch": 11.21, + "learning_rate": 7.661808663868539e-05, + "loss": 0.0811, + "step": 48750 + }, + { + "epoch": 11.22, + "learning_rate": 7.647869654777208e-05, + "loss": 0.0788, + "step": 48780 + }, + { + "epoch": 11.22, + "learning_rate": 7.633930645685877e-05, + "loss": 0.0824, + "step": 48810 + }, + { + "epoch": 11.23, + "learning_rate": 7.619991636594545e-05, + "loss": 0.0888, + "step": 48840 + }, + { + "epoch": 11.24, + "learning_rate": 7.606052627503213e-05, + "loss": 0.073, + "step": 48870 + }, + { + "epoch": 11.25, + "learning_rate": 7.592113618411881e-05, + "loss": 0.0849, + "step": 48900 + }, + { + "epoch": 11.25, + "learning_rate": 7.57817460932055e-05, + "loss": 0.0797, + "step": 48930 + }, + { + "epoch": 11.26, + "learning_rate": 7.564235600229219e-05, + "loss": 0.0801, + "step": 48960 + }, + { + "epoch": 11.27, + "learning_rate": 7.550296591137887e-05, + "loss": 0.0895, + "step": 48990 + }, + { + "epoch": 11.27, + "learning_rate": 7.536357582046554e-05, + "loss": 0.0754, + "step": 49020 + }, + { + "epoch": 11.28, + "learning_rate": 7.522418572955223e-05, + "loss": 0.0823, + "step": 49050 + }, + { + "epoch": 11.29, + "learning_rate": 7.508479563863893e-05, + "loss": 0.0776, + "step": 49080 + }, + { + "epoch": 11.29, + "learning_rate": 7.49454055477256e-05, + "loss": 0.0756, + "step": 49110 + }, + { + "epoch": 11.3, + "learning_rate": 7.480601545681229e-05, + "loss": 0.0833, + "step": 49140 + }, + { + "epoch": 11.31, + "learning_rate": 7.466662536589899e-05, + "loss": 0.0734, + "step": 49170 + }, + { + "epoch": 11.31, + "learning_rate": 7.452723527498566e-05, + "loss": 0.0809, + "step": 49200 + }, + { + "epoch": 11.32, + "learning_rate": 7.438784518407235e-05, + "loss": 0.083, + "step": 49230 + }, + { + "epoch": 11.33, + "learning_rate": 7.424845509315904e-05, + "loss": 0.0784, + "step": 49260 + }, + { + "epoch": 11.33, + "learning_rate": 7.410906500224572e-05, + "loss": 0.0866, + "step": 49290 + }, + { + "epoch": 11.34, + "learning_rate": 7.396967491133241e-05, + "loss": 0.0755, + "step": 49320 + }, + { + "epoch": 11.35, + "learning_rate": 7.38302848204191e-05, + "loss": 0.0809, + "step": 49350 + }, + { + "epoch": 11.36, + "learning_rate": 7.369089472950578e-05, + "loss": 0.0811, + "step": 49380 + }, + { + "epoch": 11.36, + "learning_rate": 7.355150463859247e-05, + "loss": 0.0772, + "step": 49410 + }, + { + "epoch": 11.37, + "learning_rate": 7.341211454767914e-05, + "loss": 0.0856, + "step": 49440 + }, + { + "epoch": 11.38, + "learning_rate": 7.327272445676583e-05, + "loss": 0.0737, + "step": 49470 + }, + { + "epoch": 11.38, + "learning_rate": 7.313333436585252e-05, + "loss": 0.0818, + "step": 49500 + }, + { + "epoch": 11.39, + "learning_rate": 7.29939442749392e-05, + "loss": 0.0772, + "step": 49530 + }, + { + "epoch": 11.4, + "learning_rate": 7.285455418402589e-05, + "loss": 0.0785, + "step": 49560 + }, + { + "epoch": 11.4, + "learning_rate": 7.271516409311258e-05, + "loss": 0.0889, + "step": 49590 + }, + { + "epoch": 11.41, + "learning_rate": 7.257577400219926e-05, + "loss": 0.0716, + "step": 49620 + }, + { + "epoch": 11.42, + "learning_rate": 7.243638391128595e-05, + "loss": 0.0782, + "step": 49650 + }, + { + "epoch": 11.42, + "learning_rate": 7.229699382037262e-05, + "loss": 0.0828, + "step": 49680 + }, + { + "epoch": 11.43, + "learning_rate": 7.215760372945931e-05, + "loss": 0.0759, + "step": 49710 + }, + { + "epoch": 11.44, + "learning_rate": 7.2018213638546e-05, + "loss": 0.0854, + "step": 49740 + }, + { + "epoch": 11.45, + "learning_rate": 7.188346988399646e-05, + "loss": 0.075, + "step": 49770 + }, + { + "epoch": 11.45, + "learning_rate": 7.174407979308315e-05, + "loss": 0.0831, + "step": 49800 + }, + { + "epoch": 11.46, + "learning_rate": 7.160933603853361e-05, + "loss": 0.0769, + "step": 49830 + }, + { + "epoch": 11.47, + "learning_rate": 7.14699459476203e-05, + "loss": 0.0793, + "step": 49860 + }, + { + "epoch": 11.47, + "learning_rate": 7.133055585670697e-05, + "loss": 0.0858, + "step": 49890 + }, + { + "epoch": 11.48, + "learning_rate": 7.119116576579366e-05, + "loss": 0.0724, + "step": 49920 + }, + { + "epoch": 11.49, + "learning_rate": 7.105177567488036e-05, + "loss": 0.0783, + "step": 49950 + }, + { + "epoch": 11.49, + "learning_rate": 7.091238558396703e-05, + "loss": 0.0819, + "step": 49980 + }, + { + "epoch": 11.5, + "learning_rate": 7.077299549305372e-05, + "loss": 0.0776, + "step": 50010 + }, + { + "epoch": 11.51, + "learning_rate": 7.06336054021404e-05, + "loss": 0.0808, + "step": 50040 + }, + { + "epoch": 11.51, + "learning_rate": 7.049421531122709e-05, + "loss": 0.0772, + "step": 50070 + }, + { + "epoch": 11.52, + "learning_rate": 7.035482522031378e-05, + "loss": 0.079, + "step": 50100 + }, + { + "epoch": 11.53, + "learning_rate": 7.021543512940045e-05, + "loss": 0.0717, + "step": 50130 + }, + { + "epoch": 11.54, + "learning_rate": 7.007604503848715e-05, + "loss": 0.0791, + "step": 50160 + }, + { + "epoch": 11.54, + "learning_rate": 6.993665494757384e-05, + "loss": 0.0865, + "step": 50190 + }, + { + "epoch": 11.55, + "learning_rate": 6.979726485666051e-05, + "loss": 0.0747, + "step": 50220 + }, + { + "epoch": 11.56, + "learning_rate": 6.96578747657472e-05, + "loss": 0.0816, + "step": 50250 + }, + { + "epoch": 11.56, + "learning_rate": 6.951848467483388e-05, + "loss": 0.0796, + "step": 50280 + }, + { + "epoch": 11.57, + "learning_rate": 6.937909458392057e-05, + "loss": 0.0727, + "step": 50310 + }, + { + "epoch": 11.58, + "learning_rate": 6.923970449300726e-05, + "loss": 0.0828, + "step": 50340 + }, + { + "epoch": 11.58, + "learning_rate": 6.910031440209394e-05, + "loss": 0.0712, + "step": 50370 + }, + { + "epoch": 11.59, + "learning_rate": 6.896092431118063e-05, + "loss": 0.0813, + "step": 50400 + }, + { + "epoch": 11.6, + "learning_rate": 6.882153422026732e-05, + "loss": 0.0785, + "step": 50430 + }, + { + "epoch": 11.6, + "learning_rate": 6.868214412935399e-05, + "loss": 0.0743, + "step": 50460 + }, + { + "epoch": 11.61, + "learning_rate": 6.854275403844068e-05, + "loss": 0.0834, + "step": 50490 + }, + { + "epoch": 11.62, + "learning_rate": 6.840336394752736e-05, + "loss": 0.0725, + "step": 50520 + }, + { + "epoch": 11.62, + "learning_rate": 6.826397385661405e-05, + "loss": 0.0804, + "step": 50550 + }, + { + "epoch": 11.63, + "learning_rate": 6.812458376570074e-05, + "loss": 0.0752, + "step": 50580 + }, + { + "epoch": 11.64, + "learning_rate": 6.798519367478742e-05, + "loss": 0.0828, + "step": 50610 + }, + { + "epoch": 11.65, + "learning_rate": 6.784580358387411e-05, + "loss": 0.0843, + "step": 50640 + }, + { + "epoch": 11.65, + "learning_rate": 6.77064134929608e-05, + "loss": 0.0766, + "step": 50670 + }, + { + "epoch": 11.66, + "learning_rate": 6.756702340204747e-05, + "loss": 0.0763, + "step": 50700 + }, + { + "epoch": 11.67, + "learning_rate": 6.742763331113417e-05, + "loss": 0.0782, + "step": 50730 + }, + { + "epoch": 11.67, + "learning_rate": 6.728824322022086e-05, + "loss": 0.0776, + "step": 50760 + }, + { + "epoch": 11.68, + "learning_rate": 6.714885312930754e-05, + "loss": 0.0832, + "step": 50790 + }, + { + "epoch": 11.69, + "learning_rate": 6.700946303839422e-05, + "loss": 0.0724, + "step": 50820 + }, + { + "epoch": 11.69, + "learning_rate": 6.68700729474809e-05, + "loss": 0.0825, + "step": 50850 + }, + { + "epoch": 11.7, + "learning_rate": 6.673068285656759e-05, + "loss": 0.078, + "step": 50880 + }, + { + "epoch": 11.71, + "learning_rate": 6.659129276565428e-05, + "loss": 0.075, + "step": 50910 + }, + { + "epoch": 11.71, + "learning_rate": 6.645190267474096e-05, + "loss": 0.0866, + "step": 50940 + }, + { + "epoch": 11.72, + "learning_rate": 6.631251258382765e-05, + "loss": 0.0705, + "step": 50970 + }, + { + "epoch": 11.73, + "learning_rate": 6.617312249291434e-05, + "loss": 0.0778, + "step": 51000 + }, + { + "epoch": 11.74, + "learning_rate": 6.603373240200102e-05, + "loss": 0.0775, + "step": 51030 + }, + { + "epoch": 11.74, + "learning_rate": 6.58943423110877e-05, + "loss": 0.0724, + "step": 51060 + }, + { + "epoch": 11.75, + "learning_rate": 6.575495222017438e-05, + "loss": 0.0886, + "step": 51090 + }, + { + "epoch": 11.76, + "learning_rate": 6.561556212926107e-05, + "loss": 0.0676, + "step": 51120 + }, + { + "epoch": 11.76, + "learning_rate": 6.547617203834775e-05, + "loss": 0.077, + "step": 51150 + }, + { + "epoch": 11.77, + "learning_rate": 6.533678194743444e-05, + "loss": 0.0782, + "step": 51180 + }, + { + "epoch": 11.78, + "learning_rate": 6.519739185652113e-05, + "loss": 0.0745, + "step": 51210 + }, + { + "epoch": 11.78, + "learning_rate": 6.505800176560781e-05, + "loss": 0.0839, + "step": 51240 + }, + { + "epoch": 11.79, + "learning_rate": 6.49186116746945e-05, + "loss": 0.0752, + "step": 51270 + }, + { + "epoch": 11.8, + "learning_rate": 6.477922158378117e-05, + "loss": 0.0874, + "step": 51300 + }, + { + "epoch": 11.8, + "learning_rate": 6.463983149286787e-05, + "loss": 0.0789, + "step": 51330 + }, + { + "epoch": 11.81, + "learning_rate": 6.450044140195456e-05, + "loss": 0.0782, + "step": 51360 + }, + { + "epoch": 11.82, + "learning_rate": 6.436105131104123e-05, + "loss": 0.0807, + "step": 51390 + }, + { + "epoch": 11.82, + "learning_rate": 6.422166122012792e-05, + "loss": 0.0717, + "step": 51420 + }, + { + "epoch": 11.83, + "learning_rate": 6.408227112921461e-05, + "loss": 0.0817, + "step": 51450 + }, + { + "epoch": 11.84, + "learning_rate": 6.39428810383013e-05, + "loss": 0.0814, + "step": 51480 + }, + { + "epoch": 11.85, + "learning_rate": 6.380349094738798e-05, + "loss": 0.0735, + "step": 51510 + }, + { + "epoch": 11.85, + "learning_rate": 6.366410085647467e-05, + "loss": 0.0863, + "step": 51540 + }, + { + "epoch": 11.86, + "learning_rate": 6.352471076556135e-05, + "loss": 0.068, + "step": 51570 + }, + { + "epoch": 11.87, + "learning_rate": 6.338532067464804e-05, + "loss": 0.0823, + "step": 51600 + }, + { + "epoch": 11.87, + "learning_rate": 6.324593058373471e-05, + "loss": 0.0776, + "step": 51630 + }, + { + "epoch": 11.88, + "learning_rate": 6.31065404928214e-05, + "loss": 0.0773, + "step": 51660 + }, + { + "epoch": 11.89, + "learning_rate": 6.296715040190809e-05, + "loss": 0.0827, + "step": 51690 + }, + { + "epoch": 11.89, + "learning_rate": 6.282776031099477e-05, + "loss": 0.0727, + "step": 51720 + }, + { + "epoch": 11.9, + "learning_rate": 6.268837022008146e-05, + "loss": 0.0812, + "step": 51750 + }, + { + "epoch": 11.91, + "learning_rate": 6.254898012916815e-05, + "loss": 0.0827, + "step": 51780 + }, + { + "epoch": 11.91, + "learning_rate": 6.240959003825483e-05, + "loss": 0.0739, + "step": 51810 + }, + { + "epoch": 11.92, + "learning_rate": 6.227019994734152e-05, + "loss": 0.0832, + "step": 51840 + }, + { + "epoch": 11.93, + "learning_rate": 6.213080985642819e-05, + "loss": 0.0719, + "step": 51870 + }, + { + "epoch": 11.94, + "learning_rate": 6.199141976551488e-05, + "loss": 0.0866, + "step": 51900 + }, + { + "epoch": 11.94, + "learning_rate": 6.185202967460158e-05, + "loss": 0.0805, + "step": 51930 + }, + { + "epoch": 11.95, + "learning_rate": 6.171263958368827e-05, + "loss": 0.0808, + "step": 51960 + }, + { + "epoch": 11.96, + "learning_rate": 6.157324949277494e-05, + "loss": 0.0898, + "step": 51990 + }, + { + "epoch": 11.96, + "learning_rate": 6.143385940186162e-05, + "loss": 0.0738, + "step": 52020 + }, + { + "epoch": 11.97, + "learning_rate": 6.129446931094831e-05, + "loss": 0.0808, + "step": 52050 + }, + { + "epoch": 11.98, + "learning_rate": 6.1155079220035e-05, + "loss": 0.0791, + "step": 52080 + }, + { + "epoch": 11.98, + "learning_rate": 6.101568912912168e-05, + "loss": 0.0771, + "step": 52110 + }, + { + "epoch": 11.99, + "learning_rate": 6.087629903820837e-05, + "loss": 0.0831, + "step": 52140 + }, + { + "epoch": 12.0, + "learning_rate": 6.073690894729505e-05, + "loss": 0.0691, + "step": 52170 + }, + { + "epoch": 12.0, + "eval_cer": 0.03268286725133757, + "eval_loss": 0.11820375919342041, + "eval_runtime": 427.5396, + "eval_samples_per_second": 37.758, + "eval_steps_per_second": 2.36, + "eval_wer": 0.11974686114589327, + "step": 52182 + }, + { + "epoch": 12.0, + "learning_rate": 6.059751885638174e-05, + "loss": 0.0879, + "step": 52200 + }, + { + "epoch": 12.01, + "learning_rate": 6.0458128765468424e-05, + "loss": 0.0754, + "step": 52230 + }, + { + "epoch": 12.02, + "learning_rate": 6.0318738674555104e-05, + "loss": 0.0723, + "step": 52260 + }, + { + "epoch": 12.02, + "learning_rate": 6.017934858364179e-05, + "loss": 0.0813, + "step": 52290 + }, + { + "epoch": 12.03, + "learning_rate": 6.0039958492728484e-05, + "loss": 0.0723, + "step": 52320 + }, + { + "epoch": 12.04, + "learning_rate": 5.9900568401815164e-05, + "loss": 0.0789, + "step": 52350 + }, + { + "epoch": 12.05, + "learning_rate": 5.976117831090185e-05, + "loss": 0.0741, + "step": 52380 + }, + { + "epoch": 12.05, + "learning_rate": 5.962178821998854e-05, + "loss": 0.0686, + "step": 52410 + }, + { + "epoch": 12.06, + "learning_rate": 5.9487044465438996e-05, + "loss": 0.0797, + "step": 52440 + }, + { + "epoch": 12.07, + "learning_rate": 5.934765437452568e-05, + "loss": 0.0692, + "step": 52470 + }, + { + "epoch": 12.07, + "learning_rate": 5.920826428361237e-05, + "loss": 0.0777, + "step": 52500 + }, + { + "epoch": 12.08, + "learning_rate": 5.906887419269905e-05, + "loss": 0.0778, + "step": 52530 + }, + { + "epoch": 12.09, + "learning_rate": 5.8929484101785735e-05, + "loss": 0.0725, + "step": 52560 + }, + { + "epoch": 12.09, + "learning_rate": 5.8790094010872415e-05, + "loss": 0.0851, + "step": 52590 + }, + { + "epoch": 12.1, + "learning_rate": 5.865070391995911e-05, + "loss": 0.0744, + "step": 52620 + }, + { + "epoch": 12.11, + "learning_rate": 5.8511313829045795e-05, + "loss": 0.0843, + "step": 52650 + }, + { + "epoch": 12.11, + "learning_rate": 5.837192373813248e-05, + "loss": 0.0784, + "step": 52680 + }, + { + "epoch": 12.12, + "learning_rate": 5.823253364721916e-05, + "loss": 0.0762, + "step": 52710 + }, + { + "epoch": 12.13, + "learning_rate": 5.809314355630585e-05, + "loss": 0.0805, + "step": 52740 + }, + { + "epoch": 12.14, + "learning_rate": 5.795839980175631e-05, + "loss": 0.078, + "step": 52770 + }, + { + "epoch": 12.14, + "learning_rate": 5.781900971084299e-05, + "loss": 0.0759, + "step": 52800 + }, + { + "epoch": 12.15, + "learning_rate": 5.767961961992968e-05, + "loss": 0.0802, + "step": 52830 + }, + { + "epoch": 12.16, + "learning_rate": 5.754022952901636e-05, + "loss": 0.0748, + "step": 52860 + }, + { + "epoch": 12.16, + "learning_rate": 5.7400839438103046e-05, + "loss": 0.0796, + "step": 52890 + }, + { + "epoch": 12.17, + "learning_rate": 5.726144934718974e-05, + "loss": 0.071, + "step": 52920 + }, + { + "epoch": 12.18, + "learning_rate": 5.7122059256276426e-05, + "loss": 0.0781, + "step": 52950 + }, + { + "epoch": 12.18, + "learning_rate": 5.6982669165363106e-05, + "loss": 0.0778, + "step": 52980 + }, + { + "epoch": 12.19, + "learning_rate": 5.684327907444979e-05, + "loss": 0.0702, + "step": 53010 + }, + { + "epoch": 12.2, + "learning_rate": 5.670388898353647e-05, + "loss": 0.0807, + "step": 53040 + }, + { + "epoch": 12.2, + "learning_rate": 5.656914522898694e-05, + "loss": 0.0717, + "step": 53070 + }, + { + "epoch": 12.21, + "learning_rate": 5.6429755138073624e-05, + "loss": 0.0808, + "step": 53100 + }, + { + "epoch": 12.22, + "learning_rate": 5.6290365047160304e-05, + "loss": 0.0738, + "step": 53130 + }, + { + "epoch": 12.22, + "learning_rate": 5.615097495624699e-05, + "loss": 0.0786, + "step": 53160 + }, + { + "epoch": 12.23, + "learning_rate": 5.6011584865333684e-05, + "loss": 0.0804, + "step": 53190 + }, + { + "epoch": 12.24, + "learning_rate": 5.587219477442037e-05, + "loss": 0.0725, + "step": 53220 + }, + { + "epoch": 12.25, + "learning_rate": 5.573280468350705e-05, + "loss": 0.0807, + "step": 53250 + }, + { + "epoch": 12.25, + "learning_rate": 5.559341459259374e-05, + "loss": 0.0832, + "step": 53280 + }, + { + "epoch": 12.26, + "learning_rate": 5.545402450168042e-05, + "loss": 0.0741, + "step": 53310 + }, + { + "epoch": 12.27, + "learning_rate": 5.53146344107671e-05, + "loss": 0.0822, + "step": 53340 + }, + { + "epoch": 12.27, + "learning_rate": 5.517524431985379e-05, + "loss": 0.073, + "step": 53370 + }, + { + "epoch": 12.28, + "learning_rate": 5.5035854228940477e-05, + "loss": 0.0781, + "step": 53400 + }, + { + "epoch": 12.29, + "learning_rate": 5.489646413802716e-05, + "loss": 0.0792, + "step": 53430 + }, + { + "epoch": 12.29, + "learning_rate": 5.475707404711385e-05, + "loss": 0.0782, + "step": 53460 + }, + { + "epoch": 12.3, + "learning_rate": 5.461768395620053e-05, + "loss": 0.0847, + "step": 53490 + }, + { + "epoch": 12.31, + "learning_rate": 5.4478293865287216e-05, + "loss": 0.0723, + "step": 53520 + }, + { + "epoch": 12.31, + "learning_rate": 5.4338903774373896e-05, + "loss": 0.0782, + "step": 53550 + }, + { + "epoch": 12.32, + "learning_rate": 5.419951368346058e-05, + "loss": 0.0757, + "step": 53580 + }, + { + "epoch": 12.33, + "learning_rate": 5.4060123592547276e-05, + "loss": 0.0733, + "step": 53610 + }, + { + "epoch": 12.34, + "learning_rate": 5.3920733501633956e-05, + "loss": 0.0818, + "step": 53640 + }, + { + "epoch": 12.34, + "learning_rate": 5.378134341072064e-05, + "loss": 0.0713, + "step": 53670 + }, + { + "epoch": 12.35, + "learning_rate": 5.364195331980733e-05, + "loss": 0.0758, + "step": 53700 + }, + { + "epoch": 12.36, + "learning_rate": 5.350256322889401e-05, + "loss": 0.0765, + "step": 53730 + }, + { + "epoch": 12.36, + "learning_rate": 5.3363173137980695e-05, + "loss": 0.074, + "step": 53760 + }, + { + "epoch": 12.37, + "learning_rate": 5.322378304706739e-05, + "loss": 0.0856, + "step": 53790 + }, + { + "epoch": 12.38, + "learning_rate": 5.308439295615407e-05, + "loss": 0.0718, + "step": 53820 + }, + { + "epoch": 12.38, + "learning_rate": 5.2945002865240755e-05, + "loss": 0.0807, + "step": 53850 + }, + { + "epoch": 12.39, + "learning_rate": 5.280561277432744e-05, + "loss": 0.0759, + "step": 53880 + }, + { + "epoch": 12.4, + "learning_rate": 5.266622268341412e-05, + "loss": 0.0727, + "step": 53910 + }, + { + "epoch": 12.4, + "learning_rate": 5.252683259250081e-05, + "loss": 0.0809, + "step": 53940 + }, + { + "epoch": 12.41, + "learning_rate": 5.238744250158749e-05, + "loss": 0.0697, + "step": 53970 + }, + { + "epoch": 12.42, + "learning_rate": 5.224805241067418e-05, + "loss": 0.0769, + "step": 54000 + }, + { + "epoch": 12.42, + "learning_rate": 5.210866231976087e-05, + "loss": 0.0765, + "step": 54030 + }, + { + "epoch": 12.43, + "learning_rate": 5.196927222884755e-05, + "loss": 0.0717, + "step": 54060 + }, + { + "epoch": 12.44, + "learning_rate": 5.1829882137934234e-05, + "loss": 0.0848, + "step": 54090 + }, + { + "epoch": 12.45, + "learning_rate": 5.169049204702092e-05, + "loss": 0.0711, + "step": 54120 + }, + { + "epoch": 12.45, + "learning_rate": 5.15511019561076e-05, + "loss": 0.08, + "step": 54150 + }, + { + "epoch": 12.46, + "learning_rate": 5.1411711865194294e-05, + "loss": 0.0801, + "step": 54180 + }, + { + "epoch": 12.47, + "learning_rate": 5.127232177428098e-05, + "loss": 0.0746, + "step": 54210 + }, + { + "epoch": 12.47, + "learning_rate": 5.113293168336766e-05, + "loss": 0.0823, + "step": 54240 + }, + { + "epoch": 12.48, + "learning_rate": 5.099354159245435e-05, + "loss": 0.0699, + "step": 54270 + }, + { + "epoch": 12.49, + "learning_rate": 5.0854151501541026e-05, + "loss": 0.0789, + "step": 54300 + }, + { + "epoch": 12.49, + "learning_rate": 5.071476141062771e-05, + "loss": 0.0789, + "step": 54330 + }, + { + "epoch": 12.5, + "learning_rate": 5.05753713197144e-05, + "loss": 0.0758, + "step": 54360 + }, + { + "epoch": 12.51, + "learning_rate": 5.0435981228801086e-05, + "loss": 0.0838, + "step": 54390 + }, + { + "epoch": 12.51, + "learning_rate": 5.029659113788777e-05, + "loss": 0.0717, + "step": 54420 + }, + { + "epoch": 12.52, + "learning_rate": 5.015720104697446e-05, + "loss": 0.0821, + "step": 54450 + }, + { + "epoch": 12.53, + "learning_rate": 5.001781095606114e-05, + "loss": 0.0819, + "step": 54480 + }, + { + "epoch": 12.54, + "learning_rate": 4.9878420865147826e-05, + "loss": 0.0749, + "step": 54510 + }, + { + "epoch": 12.54, + "learning_rate": 4.973903077423451e-05, + "loss": 0.0823, + "step": 54540 + }, + { + "epoch": 12.55, + "learning_rate": 4.959964068332119e-05, + "loss": 0.0733, + "step": 54570 + }, + { + "epoch": 12.56, + "learning_rate": 4.9460250592407885e-05, + "loss": 0.0791, + "step": 54600 + }, + { + "epoch": 12.56, + "learning_rate": 4.932086050149457e-05, + "loss": 0.0734, + "step": 54630 + }, + { + "epoch": 12.57, + "learning_rate": 4.918147041058125e-05, + "loss": 0.0738, + "step": 54660 + }, + { + "epoch": 12.58, + "learning_rate": 4.904208031966794e-05, + "loss": 0.084, + "step": 54690 + }, + { + "epoch": 12.58, + "learning_rate": 4.890269022875462e-05, + "loss": 0.0712, + "step": 54720 + }, + { + "epoch": 12.59, + "learning_rate": 4.8763300137841305e-05, + "loss": 0.0821, + "step": 54750 + }, + { + "epoch": 12.6, + "learning_rate": 4.8623910046928e-05, + "loss": 0.0775, + "step": 54780 + }, + { + "epoch": 12.6, + "learning_rate": 4.848451995601468e-05, + "loss": 0.0736, + "step": 54810 + }, + { + "epoch": 12.61, + "learning_rate": 4.8345129865101364e-05, + "loss": 0.0844, + "step": 54840 + }, + { + "epoch": 12.62, + "learning_rate": 4.821038611055183e-05, + "loss": 0.0715, + "step": 54870 + }, + { + "epoch": 12.63, + "learning_rate": 4.8070996019638517e-05, + "loss": 0.0759, + "step": 54900 + }, + { + "epoch": 12.63, + "learning_rate": 4.7931605928725196e-05, + "loss": 0.0798, + "step": 54930 + }, + { + "epoch": 12.64, + "learning_rate": 4.779221583781188e-05, + "loss": 0.0732, + "step": 54960 + }, + { + "epoch": 12.65, + "learning_rate": 4.765282574689856e-05, + "loss": 0.087, + "step": 54990 + }, + { + "epoch": 12.65, + "learning_rate": 4.751343565598525e-05, + "loss": 0.0673, + "step": 55020 + }, + { + "epoch": 12.66, + "learning_rate": 4.7374045565071936e-05, + "loss": 0.0821, + "step": 55050 + }, + { + "epoch": 12.67, + "learning_rate": 4.723465547415862e-05, + "loss": 0.0847, + "step": 55080 + }, + { + "epoch": 12.67, + "learning_rate": 4.709526538324531e-05, + "loss": 0.0746, + "step": 55110 + }, + { + "epoch": 12.68, + "learning_rate": 4.6955875292331996e-05, + "loss": 0.0853, + "step": 55140 + }, + { + "epoch": 12.69, + "learning_rate": 4.6816485201418675e-05, + "loss": 0.0699, + "step": 55170 + }, + { + "epoch": 12.69, + "learning_rate": 4.667709511050536e-05, + "loss": 0.08, + "step": 55200 + }, + { + "epoch": 12.7, + "learning_rate": 4.653770501959204e-05, + "loss": 0.0765, + "step": 55230 + }, + { + "epoch": 12.71, + "learning_rate": 4.639831492867873e-05, + "loss": 0.0732, + "step": 55260 + }, + { + "epoch": 12.71, + "learning_rate": 4.625892483776542e-05, + "loss": 0.0833, + "step": 55290 + }, + { + "epoch": 12.72, + "learning_rate": 4.61195347468521e-05, + "loss": 0.0731, + "step": 55320 + }, + { + "epoch": 12.73, + "learning_rate": 4.598014465593879e-05, + "loss": 0.079, + "step": 55350 + }, + { + "epoch": 12.74, + "learning_rate": 4.5840754565025475e-05, + "loss": 0.0831, + "step": 55380 + }, + { + "epoch": 12.74, + "learning_rate": 4.5701364474112155e-05, + "loss": 0.0722, + "step": 55410 + }, + { + "epoch": 12.75, + "learning_rate": 4.556197438319884e-05, + "loss": 0.0886, + "step": 55440 + }, + { + "epoch": 12.76, + "learning_rate": 4.5422584292285534e-05, + "loss": 0.0694, + "step": 55470 + }, + { + "epoch": 12.76, + "learning_rate": 4.5283194201372214e-05, + "loss": 0.0755, + "step": 55500 + }, + { + "epoch": 12.77, + "learning_rate": 4.51438041104589e-05, + "loss": 0.0788, + "step": 55530 + }, + { + "epoch": 12.78, + "learning_rate": 4.500441401954559e-05, + "loss": 0.0767, + "step": 55560 + }, + { + "epoch": 12.78, + "learning_rate": 4.486502392863227e-05, + "loss": 0.0791, + "step": 55590 + }, + { + "epoch": 12.79, + "learning_rate": 4.4725633837718954e-05, + "loss": 0.0651, + "step": 55620 + }, + { + "epoch": 12.8, + "learning_rate": 4.4586243746805634e-05, + "loss": 0.077, + "step": 55650 + }, + { + "epoch": 12.8, + "learning_rate": 4.444685365589233e-05, + "loss": 0.0821, + "step": 55680 + }, + { + "epoch": 12.81, + "learning_rate": 4.4307463564979013e-05, + "loss": 0.0717, + "step": 55710 + }, + { + "epoch": 12.82, + "learning_rate": 4.416807347406569e-05, + "loss": 0.0846, + "step": 55740 + }, + { + "epoch": 12.83, + "learning_rate": 4.402868338315238e-05, + "loss": 0.0701, + "step": 55770 + }, + { + "epoch": 12.83, + "learning_rate": 4.3889293292239066e-05, + "loss": 0.0813, + "step": 55800 + }, + { + "epoch": 12.84, + "learning_rate": 4.3749903201325746e-05, + "loss": 0.0857, + "step": 55830 + }, + { + "epoch": 12.85, + "learning_rate": 4.361051311041244e-05, + "loss": 0.0717, + "step": 55860 + }, + { + "epoch": 12.85, + "learning_rate": 4.3471123019499126e-05, + "loss": 0.0793, + "step": 55890 + }, + { + "epoch": 12.86, + "learning_rate": 4.3331732928585806e-05, + "loss": 0.0686, + "step": 55920 + }, + { + "epoch": 12.87, + "learning_rate": 4.319234283767249e-05, + "loss": 0.0763, + "step": 55950 + }, + { + "epoch": 12.87, + "learning_rate": 4.305295274675917e-05, + "loss": 0.0815, + "step": 55980 + }, + { + "epoch": 12.88, + "learning_rate": 4.291356265584586e-05, + "loss": 0.0728, + "step": 56010 + }, + { + "epoch": 12.89, + "learning_rate": 4.2774172564932546e-05, + "loss": 0.0795, + "step": 56040 + }, + { + "epoch": 12.89, + "learning_rate": 4.263478247401924e-05, + "loss": 0.0737, + "step": 56070 + }, + { + "epoch": 12.9, + "learning_rate": 4.249539238310592e-05, + "loss": 0.0712, + "step": 56100 + }, + { + "epoch": 12.91, + "learning_rate": 4.2356002292192605e-05, + "loss": 0.0709, + "step": 56130 + }, + { + "epoch": 12.91, + "learning_rate": 4.2216612201279285e-05, + "loss": 0.0728, + "step": 56160 + }, + { + "epoch": 12.92, + "learning_rate": 4.207722211036597e-05, + "loss": 0.0825, + "step": 56190 + }, + { + "epoch": 12.93, + "learning_rate": 4.193783201945266e-05, + "loss": 0.0688, + "step": 56220 + }, + { + "epoch": 12.94, + "learning_rate": 4.179844192853934e-05, + "loss": 0.0764, + "step": 56250 + }, + { + "epoch": 12.94, + "learning_rate": 4.165905183762603e-05, + "loss": 0.077, + "step": 56280 + }, + { + "epoch": 12.95, + "learning_rate": 4.151966174671272e-05, + "loss": 0.0718, + "step": 56310 + }, + { + "epoch": 12.96, + "learning_rate": 4.13802716557994e-05, + "loss": 0.0811, + "step": 56340 + }, + { + "epoch": 12.96, + "learning_rate": 4.1240881564886084e-05, + "loss": 0.0691, + "step": 56370 + }, + { + "epoch": 12.97, + "learning_rate": 4.1101491473972764e-05, + "loss": 0.0732, + "step": 56400 + }, + { + "epoch": 12.98, + "learning_rate": 4.096210138305945e-05, + "loss": 0.0753, + "step": 56430 + }, + { + "epoch": 12.98, + "learning_rate": 4.0822711292146144e-05, + "loss": 0.0731, + "step": 56460 + }, + { + "epoch": 12.99, + "learning_rate": 4.0683321201232824e-05, + "loss": 0.0806, + "step": 56490 + }, + { + "epoch": 13.0, + "learning_rate": 4.054393111031951e-05, + "loss": 0.0689, + "step": 56520 + }, + { + "epoch": 13.0, + "eval_cer": 0.030687342899242763, + "eval_loss": 0.11627411097288132, + "eval_runtime": 429.9895, + "eval_samples_per_second": 37.543, + "eval_steps_per_second": 2.347, + "eval_wer": 0.11497512606179566, + "step": 56530 + }, + { + "epoch": 13.0, + "learning_rate": 4.04045410194062e-05, + "loss": 0.0828, + "step": 56550 + }, + { + "epoch": 13.01, + "learning_rate": 4.026515092849288e-05, + "loss": 0.0787, + "step": 56580 + }, + { + "epoch": 13.02, + "learning_rate": 4.012576083757956e-05, + "loss": 0.0725, + "step": 56610 + }, + { + "epoch": 13.03, + "learning_rate": 3.998637074666624e-05, + "loss": 0.0788, + "step": 56640 + }, + { + "epoch": 13.03, + "learning_rate": 3.9846980655752937e-05, + "loss": 0.0696, + "step": 56670 + }, + { + "epoch": 13.04, + "learning_rate": 3.970759056483962e-05, + "loss": 0.0758, + "step": 56700 + }, + { + "epoch": 13.05, + "learning_rate": 3.956820047392631e-05, + "loss": 0.0743, + "step": 56730 + }, + { + "epoch": 13.05, + "learning_rate": 3.942881038301299e-05, + "loss": 0.0651, + "step": 56760 + }, + { + "epoch": 13.06, + "learning_rate": 3.9289420292099676e-05, + "loss": 0.076, + "step": 56790 + }, + { + "epoch": 13.07, + "learning_rate": 3.9150030201186356e-05, + "loss": 0.0695, + "step": 56820 + }, + { + "epoch": 13.07, + "learning_rate": 3.901064011027305e-05, + "loss": 0.0733, + "step": 56850 + }, + { + "epoch": 13.08, + "learning_rate": 3.8871250019359736e-05, + "loss": 0.0751, + "step": 56880 + }, + { + "epoch": 13.09, + "learning_rate": 3.8731859928446416e-05, + "loss": 0.0687, + "step": 56910 + }, + { + "epoch": 13.09, + "learning_rate": 3.85924698375331e-05, + "loss": 0.0745, + "step": 56940 + }, + { + "epoch": 13.1, + "learning_rate": 3.845307974661979e-05, + "loss": 0.0704, + "step": 56970 + }, + { + "epoch": 13.11, + "learning_rate": 3.831368965570647e-05, + "loss": 0.0736, + "step": 57000 + }, + { + "epoch": 13.11, + "learning_rate": 3.8174299564793155e-05, + "loss": 0.0808, + "step": 57030 + }, + { + "epoch": 13.12, + "learning_rate": 3.803490947387985e-05, + "loss": 0.0689, + "step": 57060 + }, + { + "epoch": 13.13, + "learning_rate": 3.789551938296653e-05, + "loss": 0.0802, + "step": 57090 + }, + { + "epoch": 13.14, + "learning_rate": 3.7756129292053215e-05, + "loss": 0.0672, + "step": 57120 + }, + { + "epoch": 13.14, + "learning_rate": 3.7616739201139895e-05, + "loss": 0.0752, + "step": 57150 + }, + { + "epoch": 13.15, + "learning_rate": 3.747734911022658e-05, + "loss": 0.0731, + "step": 57180 + }, + { + "epoch": 13.16, + "learning_rate": 3.733795901931327e-05, + "loss": 0.0653, + "step": 57210 + }, + { + "epoch": 13.16, + "learning_rate": 3.7198568928399954e-05, + "loss": 0.0803, + "step": 57240 + }, + { + "epoch": 13.17, + "learning_rate": 3.7059178837486634e-05, + "loss": 0.0684, + "step": 57270 + }, + { + "epoch": 13.18, + "learning_rate": 3.691978874657333e-05, + "loss": 0.0754, + "step": 57300 + }, + { + "epoch": 13.18, + "learning_rate": 3.678039865566001e-05, + "loss": 0.0786, + "step": 57330 + }, + { + "epoch": 13.19, + "learning_rate": 3.6641008564746694e-05, + "loss": 0.0673, + "step": 57360 + }, + { + "epoch": 13.2, + "learning_rate": 3.650161847383338e-05, + "loss": 0.0744, + "step": 57390 + }, + { + "epoch": 13.2, + "learning_rate": 3.636222838292007e-05, + "loss": 0.0664, + "step": 57420 + }, + { + "epoch": 13.21, + "learning_rate": 3.622283829200675e-05, + "loss": 0.0724, + "step": 57450 + }, + { + "epoch": 13.22, + "learning_rate": 3.6083448201093433e-05, + "loss": 0.0746, + "step": 57480 + }, + { + "epoch": 13.23, + "learning_rate": 3.594405811018012e-05, + "loss": 0.0672, + "step": 57510 + }, + { + "epoch": 13.23, + "learning_rate": 3.580466801926681e-05, + "loss": 0.0789, + "step": 57540 + }, + { + "epoch": 13.24, + "learning_rate": 3.5665277928353486e-05, + "loss": 0.0701, + "step": 57570 + }, + { + "epoch": 13.25, + "learning_rate": 3.552588783744018e-05, + "loss": 0.0735, + "step": 57600 + }, + { + "epoch": 13.25, + "learning_rate": 3.538649774652686e-05, + "loss": 0.0787, + "step": 57630 + }, + { + "epoch": 13.26, + "learning_rate": 3.5247107655613546e-05, + "loss": 0.0669, + "step": 57660 + }, + { + "epoch": 13.27, + "learning_rate": 3.5107717564700226e-05, + "loss": 0.0805, + "step": 57690 + }, + { + "epoch": 13.27, + "learning_rate": 3.496832747378692e-05, + "loss": 0.0679, + "step": 57720 + }, + { + "epoch": 13.28, + "learning_rate": 3.48289373828736e-05, + "loss": 0.0745, + "step": 57750 + }, + { + "epoch": 13.29, + "learning_rate": 3.4689547291960286e-05, + "loss": 0.0742, + "step": 57780 + }, + { + "epoch": 13.29, + "learning_rate": 3.455015720104697e-05, + "loss": 0.0661, + "step": 57810 + }, + { + "epoch": 13.3, + "learning_rate": 3.441076711013366e-05, + "loss": 0.0761, + "step": 57840 + }, + { + "epoch": 13.31, + "learning_rate": 3.427137701922034e-05, + "loss": 0.0646, + "step": 57870 + }, + { + "epoch": 13.31, + "learning_rate": 3.4131986928307025e-05, + "loss": 0.0716, + "step": 57900 + }, + { + "epoch": 13.32, + "learning_rate": 3.399259683739371e-05, + "loss": 0.0729, + "step": 57930 + }, + { + "epoch": 13.33, + "learning_rate": 3.38532067464804e-05, + "loss": 0.0678, + "step": 57960 + }, + { + "epoch": 13.34, + "learning_rate": 3.3713816655567085e-05, + "loss": 0.0763, + "step": 57990 + }, + { + "epoch": 13.34, + "learning_rate": 3.357442656465377e-05, + "loss": 0.0697, + "step": 58020 + }, + { + "epoch": 13.35, + "learning_rate": 3.343503647374045e-05, + "loss": 0.0707, + "step": 58050 + }, + { + "epoch": 13.36, + "learning_rate": 3.329564638282714e-05, + "loss": 0.0781, + "step": 58080 + }, + { + "epoch": 13.36, + "learning_rate": 3.3156256291913824e-05, + "loss": 0.0666, + "step": 58110 + }, + { + "epoch": 13.37, + "learning_rate": 3.301686620100051e-05, + "loss": 0.0768, + "step": 58140 + }, + { + "epoch": 13.38, + "learning_rate": 3.287747611008719e-05, + "loss": 0.0691, + "step": 58170 + }, + { + "epoch": 13.38, + "learning_rate": 3.273808601917388e-05, + "loss": 0.0779, + "step": 58200 + }, + { + "epoch": 13.39, + "learning_rate": 3.2598695928260564e-05, + "loss": 0.0749, + "step": 58230 + }, + { + "epoch": 13.4, + "learning_rate": 3.245930583734725e-05, + "loss": 0.0656, + "step": 58260 + }, + { + "epoch": 13.4, + "learning_rate": 3.231991574643394e-05, + "loss": 0.0748, + "step": 58290 + }, + { + "epoch": 13.41, + "learning_rate": 3.218052565552062e-05, + "loss": 0.0717, + "step": 58320 + }, + { + "epoch": 13.42, + "learning_rate": 3.2041135564607304e-05, + "loss": 0.075, + "step": 58350 + }, + { + "epoch": 13.43, + "learning_rate": 3.190174547369399e-05, + "loss": 0.0765, + "step": 58380 + }, + { + "epoch": 13.43, + "learning_rate": 3.176235538278068e-05, + "loss": 0.065, + "step": 58410 + }, + { + "epoch": 13.44, + "learning_rate": 3.1622965291867357e-05, + "loss": 0.0762, + "step": 58440 + }, + { + "epoch": 13.45, + "learning_rate": 3.148357520095404e-05, + "loss": 0.0647, + "step": 58470 + }, + { + "epoch": 13.45, + "learning_rate": 3.134418511004073e-05, + "loss": 0.0719, + "step": 58500 + }, + { + "epoch": 13.46, + "learning_rate": 3.1204795019127416e-05, + "loss": 0.0737, + "step": 58530 + }, + { + "epoch": 13.47, + "learning_rate": 3.1065404928214096e-05, + "loss": 0.0637, + "step": 58560 + }, + { + "epoch": 13.47, + "learning_rate": 3.092601483730079e-05, + "loss": 0.0752, + "step": 58590 + }, + { + "epoch": 13.48, + "learning_rate": 3.078662474638747e-05, + "loss": 0.0631, + "step": 58620 + }, + { + "epoch": 13.49, + "learning_rate": 3.0647234655474156e-05, + "loss": 0.0749, + "step": 58650 + }, + { + "epoch": 13.49, + "learning_rate": 3.050784456456084e-05, + "loss": 0.0769, + "step": 58680 + }, + { + "epoch": 13.5, + "learning_rate": 3.0368454473647526e-05, + "loss": 0.0655, + "step": 58710 + }, + { + "epoch": 13.51, + "learning_rate": 3.0229064382734212e-05, + "loss": 0.0724, + "step": 58740 + }, + { + "epoch": 13.52, + "learning_rate": 3.0089674291820895e-05, + "loss": 0.0677, + "step": 58770 + }, + { + "epoch": 13.52, + "learning_rate": 2.9950284200907582e-05, + "loss": 0.0759, + "step": 58800 + }, + { + "epoch": 13.53, + "learning_rate": 2.981089410999427e-05, + "loss": 0.0763, + "step": 58830 + }, + { + "epoch": 13.54, + "learning_rate": 2.967150401908095e-05, + "loss": 0.0665, + "step": 58860 + }, + { + "epoch": 13.54, + "learning_rate": 2.9532113928167638e-05, + "loss": 0.0768, + "step": 58890 + }, + { + "epoch": 13.55, + "learning_rate": 2.939272383725432e-05, + "loss": 0.0623, + "step": 58920 + }, + { + "epoch": 13.56, + "learning_rate": 2.9253333746341008e-05, + "loss": 0.0736, + "step": 58950 + }, + { + "epoch": 13.56, + "learning_rate": 2.9113943655427695e-05, + "loss": 0.0782, + "step": 58980 + }, + { + "epoch": 13.57, + "learning_rate": 2.8974553564514378e-05, + "loss": 0.0645, + "step": 59010 + }, + { + "epoch": 13.58, + "learning_rate": 2.883516347360106e-05, + "loss": 0.0771, + "step": 59040 + }, + { + "epoch": 13.58, + "learning_rate": 2.8695773382687748e-05, + "loss": 0.0627, + "step": 59070 + }, + { + "epoch": 13.59, + "learning_rate": 2.8556383291774434e-05, + "loss": 0.0707, + "step": 59100 + }, + { + "epoch": 13.6, + "learning_rate": 2.8416993200861117e-05, + "loss": 0.0727, + "step": 59130 + }, + { + "epoch": 13.6, + "learning_rate": 2.8277603109947804e-05, + "loss": 0.064, + "step": 59160 + }, + { + "epoch": 13.61, + "learning_rate": 2.813821301903449e-05, + "loss": 0.0728, + "step": 59190 + }, + { + "epoch": 13.62, + "learning_rate": 2.7998822928121174e-05, + "loss": 0.0659, + "step": 59220 + }, + { + "epoch": 13.63, + "learning_rate": 2.7859432837207857e-05, + "loss": 0.0747, + "step": 59250 + }, + { + "epoch": 13.63, + "learning_rate": 2.7720042746294547e-05, + "loss": 0.072, + "step": 59280 + }, + { + "epoch": 13.64, + "learning_rate": 2.758065265538123e-05, + "loss": 0.0658, + "step": 59310 + }, + { + "epoch": 13.65, + "learning_rate": 2.7441262564467913e-05, + "loss": 0.0744, + "step": 59340 + }, + { + "epoch": 13.65, + "learning_rate": 2.7301872473554596e-05, + "loss": 0.0679, + "step": 59370 + }, + { + "epoch": 13.66, + "learning_rate": 2.7162482382641286e-05, + "loss": 0.0765, + "step": 59400 + }, + { + "epoch": 13.67, + "learning_rate": 2.702773862809175e-05, + "loss": 0.0725, + "step": 59430 + }, + { + "epoch": 13.67, + "learning_rate": 2.688834853717843e-05, + "loss": 0.0657, + "step": 59460 + }, + { + "epoch": 13.68, + "learning_rate": 2.6748958446265118e-05, + "loss": 0.0731, + "step": 59490 + }, + { + "epoch": 13.69, + "learning_rate": 2.66095683553518e-05, + "loss": 0.0654, + "step": 59520 + }, + { + "epoch": 13.69, + "learning_rate": 2.6470178264438488e-05, + "loss": 0.0727, + "step": 59550 + }, + { + "epoch": 13.7, + "learning_rate": 2.6330788173525175e-05, + "loss": 0.0726, + "step": 59580 + }, + { + "epoch": 13.71, + "learning_rate": 2.6191398082611858e-05, + "loss": 0.0676, + "step": 59610 + }, + { + "epoch": 13.72, + "learning_rate": 2.605200799169854e-05, + "loss": 0.0756, + "step": 59640 + }, + { + "epoch": 13.72, + "learning_rate": 2.591261790078523e-05, + "loss": 0.0641, + "step": 59670 + }, + { + "epoch": 13.73, + "learning_rate": 2.5773227809871914e-05, + "loss": 0.0697, + "step": 59700 + }, + { + "epoch": 13.74, + "learning_rate": 2.5633837718958597e-05, + "loss": 0.0756, + "step": 59730 + }, + { + "epoch": 13.74, + "learning_rate": 2.5494447628045284e-05, + "loss": 0.065, + "step": 59760 + }, + { + "epoch": 13.75, + "learning_rate": 2.535505753713197e-05, + "loss": 0.0747, + "step": 59790 + }, + { + "epoch": 13.76, + "learning_rate": 2.5215667446218654e-05, + "loss": 0.0647, + "step": 59820 + }, + { + "epoch": 13.76, + "learning_rate": 2.5076277355305337e-05, + "loss": 0.0705, + "step": 59850 + }, + { + "epoch": 13.77, + "learning_rate": 2.4936887264392027e-05, + "loss": 0.08, + "step": 59880 + }, + { + "epoch": 13.78, + "learning_rate": 2.479749717347871e-05, + "loss": 0.063, + "step": 59910 + }, + { + "epoch": 13.78, + "learning_rate": 2.4658107082565393e-05, + "loss": 0.0756, + "step": 59940 + }, + { + "epoch": 13.79, + "learning_rate": 2.4518716991652083e-05, + "loss": 0.0671, + "step": 59970 + }, + { + "epoch": 13.8, + "learning_rate": 2.4379326900738766e-05, + "loss": 0.0692, + "step": 60000 + }, + { + "epoch": 13.8, + "learning_rate": 2.423993680982545e-05, + "loss": 0.0747, + "step": 60030 + }, + { + "epoch": 13.81, + "learning_rate": 2.4100546718912133e-05, + "loss": 0.0604, + "step": 60060 + }, + { + "epoch": 13.82, + "learning_rate": 2.3961156627998823e-05, + "loss": 0.0736, + "step": 60090 + }, + { + "epoch": 13.83, + "learning_rate": 2.3821766537085506e-05, + "loss": 0.0637, + "step": 60120 + }, + { + "epoch": 13.83, + "learning_rate": 2.368237644617219e-05, + "loss": 0.0712, + "step": 60150 + }, + { + "epoch": 13.84, + "learning_rate": 2.354298635525888e-05, + "loss": 0.0699, + "step": 60180 + }, + { + "epoch": 13.85, + "learning_rate": 2.3403596264345562e-05, + "loss": 0.0613, + "step": 60210 + }, + { + "epoch": 13.85, + "learning_rate": 2.3264206173432245e-05, + "loss": 0.0777, + "step": 60240 + }, + { + "epoch": 13.86, + "learning_rate": 2.3124816082518932e-05, + "loss": 0.0623, + "step": 60270 + }, + { + "epoch": 13.87, + "learning_rate": 2.298542599160562e-05, + "loss": 0.071, + "step": 60300 + }, + { + "epoch": 13.87, + "learning_rate": 2.2846035900692302e-05, + "loss": 0.0758, + "step": 60330 + }, + { + "epoch": 13.88, + "learning_rate": 2.2706645809778985e-05, + "loss": 0.0623, + "step": 60360 + }, + { + "epoch": 13.89, + "learning_rate": 2.2567255718865675e-05, + "loss": 0.0778, + "step": 60390 + }, + { + "epoch": 13.89, + "learning_rate": 2.2427865627952358e-05, + "loss": 0.0677, + "step": 60420 + }, + { + "epoch": 13.9, + "learning_rate": 2.228847553703904e-05, + "loss": 0.0702, + "step": 60450 + }, + { + "epoch": 13.91, + "learning_rate": 2.2149085446125728e-05, + "loss": 0.0732, + "step": 60480 + }, + { + "epoch": 13.92, + "learning_rate": 2.2009695355212414e-05, + "loss": 0.0612, + "step": 60510 + }, + { + "epoch": 13.92, + "learning_rate": 2.1870305264299098e-05, + "loss": 0.0763, + "step": 60540 + }, + { + "epoch": 13.93, + "learning_rate": 2.1730915173385784e-05, + "loss": 0.0629, + "step": 60570 + }, + { + "epoch": 13.94, + "learning_rate": 2.1591525082472467e-05, + "loss": 0.075, + "step": 60600 + }, + { + "epoch": 13.94, + "learning_rate": 2.1452134991559154e-05, + "loss": 0.074, + "step": 60630 + }, + { + "epoch": 13.95, + "learning_rate": 2.131274490064584e-05, + "loss": 0.0627, + "step": 60660 + }, + { + "epoch": 13.96, + "learning_rate": 2.1173354809732524e-05, + "loss": 0.0721, + "step": 60690 + }, + { + "epoch": 13.96, + "learning_rate": 2.103396471881921e-05, + "loss": 0.0678, + "step": 60720 + }, + { + "epoch": 13.97, + "learning_rate": 2.0894574627905893e-05, + "loss": 0.0692, + "step": 60750 + }, + { + "epoch": 13.98, + "learning_rate": 2.075518453699258e-05, + "loss": 0.0731, + "step": 60780 + }, + { + "epoch": 13.98, + "learning_rate": 2.0615794446079263e-05, + "loss": 0.064, + "step": 60810 + }, + { + "epoch": 13.99, + "learning_rate": 2.047640435516595e-05, + "loss": 0.0776, + "step": 60840 + }, + { + "epoch": 14.0, + "learning_rate": 2.0337014264252636e-05, + "loss": 0.0653, + "step": 60870 + }, + { + "epoch": 14.0, + "eval_cer": 0.030403675074265814, + "eval_loss": 0.11410792917013168, + "eval_runtime": 434.2474, + "eval_samples_per_second": 37.175, + "eval_steps_per_second": 2.324, + "eval_wer": 0.11264002165893938, + "step": 60879 + }, + { + "epoch": 14.01, + "learning_rate": 2.019762417333932e-05, + "loss": 0.0676, + "step": 60900 + }, + { + "epoch": 14.01, + "learning_rate": 2.0058234082426003e-05, + "loss": 0.0733, + "step": 60930 + }, + { + "epoch": 14.02, + "learning_rate": 1.9918843991512693e-05, + "loss": 0.0639, + "step": 60960 + }, + { + "epoch": 14.03, + "learning_rate": 1.9779453900599376e-05, + "loss": 0.0712, + "step": 60990 + }, + { + "epoch": 14.03, + "learning_rate": 1.964006380968606e-05, + "loss": 0.0683, + "step": 61020 + }, + { + "epoch": 14.04, + "learning_rate": 1.9500673718772746e-05, + "loss": 0.0671, + "step": 61050 + }, + { + "epoch": 14.05, + "learning_rate": 1.9361283627859432e-05, + "loss": 0.0722, + "step": 61080 + }, + { + "epoch": 14.05, + "learning_rate": 1.9221893536946115e-05, + "loss": 0.0619, + "step": 61110 + }, + { + "epoch": 14.06, + "learning_rate": 1.90825034460328e-05, + "loss": 0.0665, + "step": 61140 + }, + { + "epoch": 14.07, + "learning_rate": 1.894311335511949e-05, + "loss": 0.0681, + "step": 61170 + }, + { + "epoch": 14.08, + "learning_rate": 1.8803723264206172e-05, + "loss": 0.0669, + "step": 61200 + }, + { + "epoch": 14.08, + "learning_rate": 1.866433317329286e-05, + "loss": 0.0761, + "step": 61230 + }, + { + "epoch": 14.09, + "learning_rate": 1.8529589418743317e-05, + "loss": 0.0644, + "step": 61260 + }, + { + "epoch": 14.1, + "learning_rate": 1.8390199327830004e-05, + "loss": 0.0678, + "step": 61290 + }, + { + "epoch": 14.1, + "learning_rate": 1.825080923691669e-05, + "loss": 0.0714, + "step": 61320 + }, + { + "epoch": 14.11, + "learning_rate": 1.8111419146003373e-05, + "loss": 0.0666, + "step": 61350 + }, + { + "epoch": 14.12, + "learning_rate": 1.797202905509006e-05, + "loss": 0.0744, + "step": 61380 + }, + { + "epoch": 14.12, + "learning_rate": 1.7832638964176743e-05, + "loss": 0.0671, + "step": 61410 + }, + { + "epoch": 14.13, + "learning_rate": 1.769324887326343e-05, + "loss": 0.0723, + "step": 61440 + }, + { + "epoch": 14.14, + "learning_rate": 1.7553858782350113e-05, + "loss": 0.0696, + "step": 61470 + }, + { + "epoch": 14.14, + "learning_rate": 1.74144686914368e-05, + "loss": 0.0668, + "step": 61500 + }, + { + "epoch": 14.15, + "learning_rate": 1.7275078600523486e-05, + "loss": 0.0743, + "step": 61530 + }, + { + "epoch": 14.16, + "learning_rate": 1.713568850961017e-05, + "loss": 0.0636, + "step": 61560 + }, + { + "epoch": 14.17, + "learning_rate": 1.6996298418696856e-05, + "loss": 0.0722, + "step": 61590 + }, + { + "epoch": 14.17, + "learning_rate": 1.6856908327783542e-05, + "loss": 0.065, + "step": 61620 + }, + { + "epoch": 14.18, + "learning_rate": 1.6717518236870226e-05, + "loss": 0.0691, + "step": 61650 + }, + { + "epoch": 14.19, + "learning_rate": 1.6578128145956912e-05, + "loss": 0.0776, + "step": 61680 + }, + { + "epoch": 14.19, + "learning_rate": 1.6438738055043595e-05, + "loss": 0.0639, + "step": 61710 + }, + { + "epoch": 14.2, + "learning_rate": 1.6299347964130282e-05, + "loss": 0.0736, + "step": 61740 + }, + { + "epoch": 14.21, + "learning_rate": 1.615995787321697e-05, + "loss": 0.07, + "step": 61770 + }, + { + "epoch": 14.21, + "learning_rate": 1.6020567782303652e-05, + "loss": 0.0623, + "step": 61800 + }, + { + "epoch": 14.22, + "learning_rate": 1.588117769139034e-05, + "loss": 0.0733, + "step": 61830 + }, + { + "epoch": 14.23, + "learning_rate": 1.574178760047702e-05, + "loss": 0.0614, + "step": 61860 + }, + { + "epoch": 14.23, + "learning_rate": 1.5602397509563708e-05, + "loss": 0.0723, + "step": 61890 + }, + { + "epoch": 14.24, + "learning_rate": 1.5463007418650395e-05, + "loss": 0.0696, + "step": 61920 + }, + { + "epoch": 14.25, + "learning_rate": 1.5323617327737078e-05, + "loss": 0.068, + "step": 61950 + }, + { + "epoch": 14.25, + "learning_rate": 1.5184227236823763e-05, + "loss": 0.0712, + "step": 61980 + }, + { + "epoch": 14.26, + "learning_rate": 1.5044837145910448e-05, + "loss": 0.0633, + "step": 62010 + }, + { + "epoch": 14.27, + "learning_rate": 1.4905447054997134e-05, + "loss": 0.0774, + "step": 62040 + }, + { + "epoch": 14.28, + "learning_rate": 1.4766056964083819e-05, + "loss": 0.07, + "step": 62070 + }, + { + "epoch": 14.28, + "learning_rate": 1.4626666873170504e-05, + "loss": 0.0633, + "step": 62100 + }, + { + "epoch": 14.29, + "learning_rate": 1.4487276782257189e-05, + "loss": 0.0724, + "step": 62130 + }, + { + "epoch": 14.3, + "learning_rate": 1.4347886691343874e-05, + "loss": 0.0622, + "step": 62160 + }, + { + "epoch": 14.3, + "learning_rate": 1.4208496600430559e-05, + "loss": 0.0684, + "step": 62190 + }, + { + "epoch": 14.31, + "learning_rate": 1.4069106509517245e-05, + "loss": 0.0734, + "step": 62220 + }, + { + "epoch": 14.32, + "learning_rate": 1.3929716418603928e-05, + "loss": 0.064, + "step": 62250 + }, + { + "epoch": 14.32, + "learning_rate": 1.3790326327690615e-05, + "loss": 0.0705, + "step": 62280 + }, + { + "epoch": 14.33, + "learning_rate": 1.3650936236777298e-05, + "loss": 0.0649, + "step": 62310 + }, + { + "epoch": 14.34, + "learning_rate": 1.3511546145863985e-05, + "loss": 0.0678, + "step": 62340 + }, + { + "epoch": 14.34, + "learning_rate": 1.3372156054950671e-05, + "loss": 0.0735, + "step": 62370 + }, + { + "epoch": 14.35, + "learning_rate": 1.3232765964037355e-05, + "loss": 0.0613, + "step": 62400 + }, + { + "epoch": 14.36, + "learning_rate": 1.3093375873124041e-05, + "loss": 0.0742, + "step": 62430 + }, + { + "epoch": 14.37, + "learning_rate": 1.2953985782210724e-05, + "loss": 0.0633, + "step": 62460 + }, + { + "epoch": 14.37, + "learning_rate": 1.2814595691297411e-05, + "loss": 0.0695, + "step": 62490 + }, + { + "epoch": 14.38, + "learning_rate": 1.2675205600384097e-05, + "loss": 0.0706, + "step": 62520 + }, + { + "epoch": 14.39, + "learning_rate": 1.253581550947078e-05, + "loss": 0.0652, + "step": 62550 + }, + { + "epoch": 14.39, + "learning_rate": 1.2396425418557467e-05, + "loss": 0.0736, + "step": 62580 + }, + { + "epoch": 14.4, + "learning_rate": 1.225703532764415e-05, + "loss": 0.0666, + "step": 62610 + }, + { + "epoch": 14.41, + "learning_rate": 1.2117645236730837e-05, + "loss": 0.0668, + "step": 62640 + }, + { + "epoch": 14.41, + "learning_rate": 1.1978255145817522e-05, + "loss": 0.0711, + "step": 62670 + }, + { + "epoch": 14.42, + "learning_rate": 1.1838865054904207e-05, + "loss": 0.0642, + "step": 62700 + }, + { + "epoch": 14.43, + "learning_rate": 1.1699474963990892e-05, + "loss": 0.0746, + "step": 62730 + }, + { + "epoch": 14.43, + "learning_rate": 1.1560084873077578e-05, + "loss": 0.0628, + "step": 62760 + }, + { + "epoch": 14.44, + "learning_rate": 1.1420694782164261e-05, + "loss": 0.0699, + "step": 62790 + }, + { + "epoch": 14.45, + "learning_rate": 1.1281304691250948e-05, + "loss": 0.0709, + "step": 62820 + }, + { + "epoch": 14.45, + "learning_rate": 1.1141914600337633e-05, + "loss": 0.0676, + "step": 62850 + }, + { + "epoch": 14.46, + "learning_rate": 1.1002524509424318e-05, + "loss": 0.0756, + "step": 62880 + }, + { + "epoch": 14.47, + "learning_rate": 1.0863134418511004e-05, + "loss": 0.0616, + "step": 62910 + }, + { + "epoch": 14.48, + "learning_rate": 1.0723744327597688e-05, + "loss": 0.0744, + "step": 62940 + }, + { + "epoch": 14.48, + "learning_rate": 1.0584354236684374e-05, + "loss": 0.0701, + "step": 62970 + }, + { + "epoch": 14.49, + "learning_rate": 1.0444964145771057e-05, + "loss": 0.0611, + "step": 63000 + }, + { + "epoch": 14.5, + "learning_rate": 1.0305574054857744e-05, + "loss": 0.0705, + "step": 63030 + }, + { + "epoch": 14.5, + "learning_rate": 1.016618396394443e-05, + "loss": 0.0638, + "step": 63060 + }, + { + "epoch": 14.51, + "learning_rate": 1.0026793873031114e-05, + "loss": 0.0675, + "step": 63090 + }, + { + "epoch": 14.52, + "learning_rate": 9.8874037821178e-06, + "loss": 0.0672, + "step": 63120 + }, + { + "epoch": 14.52, + "learning_rate": 9.748013691204483e-06, + "loss": 0.065, + "step": 63150 + }, + { + "epoch": 14.53, + "learning_rate": 9.60862360029117e-06, + "loss": 0.071, + "step": 63180 + }, + { + "epoch": 14.54, + "learning_rate": 9.469233509377855e-06, + "loss": 0.0613, + "step": 63210 + }, + { + "epoch": 14.54, + "learning_rate": 9.32984341846454e-06, + "loss": 0.0723, + "step": 63240 + }, + { + "epoch": 14.55, + "learning_rate": 9.190453327551225e-06, + "loss": 0.0732, + "step": 63270 + }, + { + "epoch": 14.56, + "learning_rate": 9.051063236637911e-06, + "loss": 0.0671, + "step": 63300 + }, + { + "epoch": 14.57, + "learning_rate": 8.911673145724596e-06, + "loss": 0.073, + "step": 63330 + }, + { + "epoch": 14.57, + "learning_rate": 8.772283054811281e-06, + "loss": 0.0606, + "step": 63360 + }, + { + "epoch": 14.58, + "learning_rate": 8.632892963897966e-06, + "loss": 0.0676, + "step": 63390 + }, + { + "epoch": 14.59, + "learning_rate": 8.49350287298465e-06, + "loss": 0.0721, + "step": 63420 + }, + { + "epoch": 14.59, + "learning_rate": 8.354112782071336e-06, + "loss": 0.0646, + "step": 63450 + }, + { + "epoch": 14.6, + "learning_rate": 8.21472269115802e-06, + "loss": 0.0723, + "step": 63480 + }, + { + "epoch": 14.61, + "learning_rate": 8.075332600244705e-06, + "loss": 0.0653, + "step": 63510 + }, + { + "epoch": 14.61, + "learning_rate": 7.935942509331392e-06, + "loss": 0.0685, + "step": 63540 + }, + { + "epoch": 14.62, + "learning_rate": 7.796552418418077e-06, + "loss": 0.0728, + "step": 63570 + }, + { + "epoch": 14.63, + "learning_rate": 7.657162327504762e-06, + "loss": 0.0639, + "step": 63600 + }, + { + "epoch": 14.63, + "learning_rate": 7.517772236591447e-06, + "loss": 0.0749, + "step": 63630 + }, + { + "epoch": 14.64, + "learning_rate": 7.3830284820419096e-06, + "loss": 0.0629, + "step": 63660 + }, + { + "epoch": 14.65, + "learning_rate": 7.2436383911285944e-06, + "loss": 0.0677, + "step": 63690 + }, + { + "epoch": 14.65, + "learning_rate": 7.104248300215279e-06, + "loss": 0.0699, + "step": 63720 + }, + { + "epoch": 14.66, + "learning_rate": 6.964858209301964e-06, + "loss": 0.0596, + "step": 63750 + }, + { + "epoch": 14.67, + "learning_rate": 6.825468118388649e-06, + "loss": 0.0692, + "step": 63780 + }, + { + "epoch": 14.68, + "learning_rate": 6.686078027475336e-06, + "loss": 0.0593, + "step": 63810 + }, + { + "epoch": 14.68, + "learning_rate": 6.5466879365620206e-06, + "loss": 0.0655, + "step": 63840 + }, + { + "epoch": 14.69, + "learning_rate": 6.4072978456487054e-06, + "loss": 0.0687, + "step": 63870 + }, + { + "epoch": 14.7, + "learning_rate": 6.26790775473539e-06, + "loss": 0.0652, + "step": 63900 + }, + { + "epoch": 14.7, + "learning_rate": 6.133164000185853e-06, + "loss": 0.0699, + "step": 63930 + }, + { + "epoch": 14.71, + "learning_rate": 5.993773909272538e-06, + "loss": 0.0628, + "step": 63960 + }, + { + "epoch": 14.72, + "learning_rate": 5.854383818359223e-06, + "loss": 0.0672, + "step": 63990 + }, + { + "epoch": 14.72, + "learning_rate": 5.714993727445908e-06, + "loss": 0.0673, + "step": 64020 + }, + { + "epoch": 14.73, + "learning_rate": 5.575603636532594e-06, + "loss": 0.0665, + "step": 64050 + }, + { + "epoch": 14.74, + "learning_rate": 5.4362135456192785e-06, + "loss": 0.072, + "step": 64080 + }, + { + "epoch": 14.74, + "learning_rate": 5.296823454705964e-06, + "loss": 0.0616, + "step": 64110 + }, + { + "epoch": 14.75, + "learning_rate": 5.157433363792649e-06, + "loss": 0.0678, + "step": 64140 + }, + { + "epoch": 14.76, + "learning_rate": 5.018043272879334e-06, + "loss": 0.0681, + "step": 64170 + }, + { + "epoch": 14.77, + "learning_rate": 4.87865318196602e-06, + "loss": 0.0621, + "step": 64200 + }, + { + "epoch": 14.77, + "learning_rate": 4.739263091052705e-06, + "loss": 0.0733, + "step": 64230 + }, + { + "epoch": 14.78, + "learning_rate": 4.5998730001393895e-06, + "loss": 0.0604, + "step": 64260 + }, + { + "epoch": 14.79, + "learning_rate": 4.460482909226075e-06, + "loss": 0.0658, + "step": 64290 + }, + { + "epoch": 14.79, + "learning_rate": 4.32109281831276e-06, + "loss": 0.0689, + "step": 64320 + }, + { + "epoch": 14.8, + "learning_rate": 4.181702727399445e-06, + "loss": 0.0632, + "step": 64350 + }, + { + "epoch": 14.81, + "learning_rate": 4.042312636486131e-06, + "loss": 0.0699, + "step": 64380 + }, + { + "epoch": 14.81, + "learning_rate": 3.902922545572816e-06, + "loss": 0.0652, + "step": 64410 + }, + { + "epoch": 14.82, + "learning_rate": 3.763532454659501e-06, + "loss": 0.0711, + "step": 64440 + }, + { + "epoch": 14.83, + "learning_rate": 3.624142363746186e-06, + "loss": 0.0634, + "step": 64470 + }, + { + "epoch": 14.83, + "learning_rate": 3.4847522728328707e-06, + "loss": 0.0588, + "step": 64500 + }, + { + "epoch": 14.84, + "learning_rate": 3.345362181919556e-06, + "loss": 0.0694, + "step": 64530 + }, + { + "epoch": 14.85, + "learning_rate": 3.2059720910062413e-06, + "loss": 0.06, + "step": 64560 + }, + { + "epoch": 14.86, + "learning_rate": 3.0665820000929266e-06, + "loss": 0.0665, + "step": 64590 + }, + { + "epoch": 14.86, + "learning_rate": 2.9271919091796115e-06, + "loss": 0.0668, + "step": 64620 + }, + { + "epoch": 14.87, + "learning_rate": 2.787801818266297e-06, + "loss": 0.0634, + "step": 64650 + }, + { + "epoch": 14.88, + "learning_rate": 2.648411727352982e-06, + "loss": 0.0719, + "step": 64680 + }, + { + "epoch": 14.88, + "learning_rate": 2.509021636439667e-06, + "loss": 0.0619, + "step": 64710 + }, + { + "epoch": 14.89, + "learning_rate": 2.3696315455263523e-06, + "loss": 0.0707, + "step": 64740 + }, + { + "epoch": 14.9, + "learning_rate": 2.2302414546130376e-06, + "loss": 0.0651, + "step": 64770 + }, + { + "epoch": 14.9, + "learning_rate": 2.0908513636997225e-06, + "loss": 0.0644, + "step": 64800 + }, + { + "epoch": 14.91, + "learning_rate": 1.951461272786408e-06, + "loss": 0.0668, + "step": 64830 + }, + { + "epoch": 14.92, + "learning_rate": 1.812071181873093e-06, + "loss": 0.0624, + "step": 64860 + }, + { + "epoch": 14.92, + "learning_rate": 1.672681090959778e-06, + "loss": 0.0698, + "step": 64890 + }, + { + "epoch": 14.93, + "learning_rate": 1.5332910000464633e-06, + "loss": 0.0677, + "step": 64920 + }, + { + "epoch": 14.94, + "learning_rate": 1.3939009091331484e-06, + "loss": 0.0624, + "step": 64950 + }, + { + "epoch": 14.94, + "learning_rate": 1.2545108182198335e-06, + "loss": 0.0685, + "step": 64980 + }, + { + "epoch": 14.95, + "learning_rate": 1.1151207273065188e-06, + "loss": 0.0614, + "step": 65010 + }, + { + "epoch": 14.96, + "learning_rate": 9.75730636393204e-07, + "loss": 0.0689, + "step": 65040 + }, + { + "epoch": 14.97, + "learning_rate": 8.36340545479889e-07, + "loss": 0.0702, + "step": 65070 + }, + { + "epoch": 14.97, + "learning_rate": 6.969504545665742e-07, + "loss": 0.0671, + "step": 65100 + }, + { + "epoch": 14.98, + "learning_rate": 5.575603636532594e-07, + "loss": 0.0703, + "step": 65130 + }, + { + "epoch": 14.99, + "learning_rate": 4.181702727399445e-07, + "loss": 0.0568, + "step": 65160 + }, + { + "epoch": 14.99, + "learning_rate": 2.787801818266297e-07, + "loss": 0.0676, + "step": 65190 + }, + { + "epoch": 15.0, + "learning_rate": 1.3939009091331485e-07, + "loss": 0.0717, + "step": 65220 + }, + { + "epoch": 15.0, + "eval_cer": 0.028607112182745118, + "eval_loss": 0.11205731332302094, + "eval_runtime": 421.0619, + "eval_samples_per_second": 38.339, + "eval_steps_per_second": 2.396, + "eval_wer": 0.10748248671697858, + "step": 65220 + }, + { + "epoch": 15.0, + "step": 65220, + "total_flos": 1.4555161313987618e+21, + "train_loss": 0.0045058862668025425, + "train_runtime": 16814.3798, + "train_samples_per_second": 496.52, + "train_steps_per_second": 3.879 + } + ], + "logging_steps": 30, + "max_steps": 65220, + "num_train_epochs": 15, + "save_steps": 500, + "total_flos": 1.4555161313987618e+21, + "trial_name": null, + "trial_params": null +}