diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,1501 +1,54751 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 35.73957158962796, - "global_step": 39600, + "epoch": 180.0, + "global_step": 222660, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { - "epoch": 0.36, - "learning_rate": 0.0002388, - "loss": 5.1061, + "epoch": 0.01, + "learning_rate": 2.3e-05, + "loss": 12.7521, + "step": 25 + }, + { + "epoch": 0.01, + "learning_rate": 4.7000000000000004e-05, + "loss": 8.8854, + "step": 50 + }, + { + "epoch": 0.02, + "learning_rate": 7.2e-05, + "loss": 4.0895, + "step": 75 + }, + { + "epoch": 0.02, + "learning_rate": 9.7e-05, + "loss": 3.5682, + "step": 100 + }, + { + "epoch": 0.03, + "learning_rate": 0.000122, + "loss": 3.2477, + "step": 125 + }, + { + "epoch": 0.04, + "learning_rate": 0.000147, + "loss": 3.2236, + "step": 150 + }, + { + "epoch": 0.04, + "learning_rate": 0.00017199999999999998, + "loss": 3.1948, + "step": 175 + }, + { + "epoch": 0.05, + "learning_rate": 0.00019700000000000002, + "loss": 3.115, + "step": 200 + }, + { + "epoch": 0.05, + "learning_rate": 0.000222, + "loss": 3.1549, + "step": 225 + }, + { + "epoch": 0.06, + "learning_rate": 0.000247, + "loss": 3.1232, + "step": 250 + }, + { + "epoch": 0.07, + "learning_rate": 0.00027200000000000005, + "loss": 3.1312, + "step": 275 + }, + { + "epoch": 0.07, + "learning_rate": 0.000297, + "loss": 3.0763, + "step": 300 + }, + { + "epoch": 0.08, + "learning_rate": 0.000322, + "loss": 3.1158, + "step": 325 + }, + { + "epoch": 0.09, + "learning_rate": 0.000347, + "loss": 3.0469, + "step": 350 + }, + { + "epoch": 0.09, + "learning_rate": 0.000372, + "loss": 3.0859, + "step": 375 + }, + { + "epoch": 0.1, + "learning_rate": 0.00039700000000000005, + "loss": 3.0238, "step": 400 }, { - "epoch": 0.36, - "eval_loss": 3.2615509033203125, - "eval_runtime": 209.4571, - "eval_samples_per_second": 18.892, - "eval_steps_per_second": 2.363, + "epoch": 0.1, + "learning_rate": 0.000422, + "loss": 3.1055, + "step": 425 + }, + { + "epoch": 0.11, + "learning_rate": 0.000447, + "loss": 3.0302, + "step": 450 + }, + { + "epoch": 0.12, + "learning_rate": 0.000472, + "loss": 3.0974, + "step": 475 + }, + { + "epoch": 0.12, + "learning_rate": 0.000497, + "loss": 3.0162, + "step": 500 + }, + { + "epoch": 0.12, + "eval_cer": 1.0, + "eval_loss": 3.1486001014709473, + "eval_runtime": 147.8787, + "eval_samples_per_second": 28.354, + "eval_steps_per_second": 7.094, "eval_wer": 1.0, - "step": 400 + "step": 500 }, { - "epoch": 0.72, - "learning_rate": 0.0002990989719814553, - "loss": 1.8298, - "step": 800 + "epoch": 0.13, + "learning_rate": 0.0004999731248473003, + "loss": 3.0909, + "step": 525 }, { - "epoch": 0.72, - "eval_loss": 0.5897451639175415, - "eval_runtime": 208.9676, - "eval_samples_per_second": 18.936, - "eval_steps_per_second": 2.369, - "eval_wer": 0.7382658232272045, - "step": 800 + "epoch": 0.13, + "learning_rate": 0.0004999425849010506, + "loss": 2.9905, + "step": 550 }, { - "epoch": 1.08, - "learning_rate": 0.0002978895383995162, - "loss": 0.7312, - "step": 1200 + "epoch": 0.14, + "learning_rate": 0.0004999120449548009, + "loss": 3.0408, + "step": 575 }, { - "epoch": 1.08, - "eval_loss": 0.38931864500045776, - "eval_runtime": 205.7748, - "eval_samples_per_second": 19.23, - "eval_steps_per_second": 2.406, - "eval_wer": 0.5565651976374375, - "step": 1200 + "epoch": 0.15, + "learning_rate": 0.0004998815050085511, + "loss": 2.9567, + "step": 600 }, { - "epoch": 1.44, - "learning_rate": 0.0002966801048175771, - "loss": 0.5859, - "step": 1600 + "epoch": 0.15, + "learning_rate": 0.0004998509650623015, + "loss": 2.9644, + "step": 625 }, { - "epoch": 1.44, - "eval_loss": 0.3028641939163208, - "eval_runtime": 210.4962, - "eval_samples_per_second": 18.798, - "eval_steps_per_second": 2.352, - "eval_wer": 0.43102785447174363, - "step": 1600 + "epoch": 0.16, + "learning_rate": 0.0004998204251160518, + "loss": 2.7935, + "step": 650 }, { - "epoch": 1.8, - "learning_rate": 0.00029547067123563797, - "loss": 0.5272, - "step": 2000 + "epoch": 0.16, + "learning_rate": 0.0004997898851698021, + "loss": 2.6574, + "step": 675 }, { - "epoch": 1.8, - "eval_loss": 0.2646712362766266, - "eval_runtime": 208.1951, - "eval_samples_per_second": 19.006, - "eval_steps_per_second": 2.378, - "eval_wer": 0.3874462656834306, - "step": 2000 + "epoch": 0.17, + "learning_rate": 0.0004997593452235524, + "loss": 2.4471, + "step": 700 }, { - "epoch": 2.17, - "learning_rate": 0.00029426123765369884, - "loss": 0.4691, - "step": 2400 + "epoch": 0.18, + "learning_rate": 0.0004997288052773027, + "loss": 2.2672, + "step": 725 }, { - "epoch": 2.17, - "eval_loss": 0.25143691897392273, - "eval_runtime": 208.3951, - "eval_samples_per_second": 18.988, - "eval_steps_per_second": 2.375, - "eval_wer": 0.3728025722573655, - "step": 2400 + "epoch": 0.18, + "learning_rate": 0.000499698265331053, + "loss": 2.1358, + "step": 750 }, { - "epoch": 2.53, - "learning_rate": 0.0002930518040717597, - "loss": 0.4313, - "step": 2800 + "epoch": 0.19, + "learning_rate": 0.0004996677253848033, + "loss": 2.0581, + "step": 775 }, { - "epoch": 2.53, - "eval_loss": 0.23935846984386444, - "eval_runtime": 208.5439, - "eval_samples_per_second": 18.974, - "eval_steps_per_second": 2.374, - "eval_wer": 0.33872715199384895, - "step": 2800 + "epoch": 0.2, + "learning_rate": 0.0004996371854385537, + "loss": 1.9562, + "step": 800 }, { - "epoch": 2.89, - "learning_rate": 0.0002918423704898206, - "loss": 0.4157, - "step": 3200 + "epoch": 0.2, + "learning_rate": 0.0004996066454923039, + "loss": 1.9131, + "step": 825 }, { - "epoch": 2.89, - "eval_loss": 0.22154289484024048, - "eval_runtime": 207.5705, - "eval_samples_per_second": 19.063, - "eval_steps_per_second": 2.385, - "eval_wer": 0.3165344423863279, - "step": 3200 + "epoch": 0.21, + "learning_rate": 0.0004995761055460543, + "loss": 1.8268, + "step": 850 }, { - "epoch": 3.25, - "learning_rate": 0.00029063293690788144, - "loss": 0.382, - "step": 3600 + "epoch": 0.21, + "learning_rate": 0.0004995455655998046, + "loss": 1.8359, + "step": 875 }, { - "epoch": 3.25, - "eval_loss": 0.22716625034809113, - "eval_runtime": 208.4179, - "eval_samples_per_second": 18.986, - "eval_steps_per_second": 2.375, - "eval_wer": 0.310103798972495, - "step": 3600 + "epoch": 0.22, + "learning_rate": 0.0004995150256535549, + "loss": 1.721, + "step": 900 }, { - "epoch": 3.61, - "learning_rate": 0.0002894235033259423, - "loss": 0.3636, - "step": 4000 + "epoch": 0.23, + "learning_rate": 0.0004994844857073051, + "loss": 1.7865, + "step": 925 }, { - "epoch": 3.61, - "eval_loss": 0.21131443977355957, - "eval_runtime": 206.1846, - "eval_samples_per_second": 19.192, - "eval_steps_per_second": 2.401, - "eval_wer": 0.30538566385908505, - "step": 4000 + "epoch": 0.23, + "learning_rate": 0.0004994539457610555, + "loss": 1.6867, + "step": 950 }, { - "epoch": 3.97, - "learning_rate": 0.00028821406974400323, - "loss": 0.3665, - "step": 4400 + "epoch": 0.24, + "learning_rate": 0.0004994234058148057, + "loss": 1.6645, + "step": 975 }, { - "epoch": 3.97, - "eval_loss": 0.21285590529441833, - "eval_runtime": 205.9986, - "eval_samples_per_second": 19.209, - "eval_steps_per_second": 2.403, - "eval_wer": 0.2907769195820082, - "step": 4400 + "epoch": 0.24, + "learning_rate": 0.0004993928658685561, + "loss": 1.6532, + "step": 1000 }, { - "epoch": 4.33, - "learning_rate": 0.00028700463616206405, - "loss": 0.333, - "step": 4800 + "epoch": 0.24, + "eval_cer": 0.4583123723088611, + "eval_loss": 1.3737213611602783, + "eval_runtime": 148.5107, + "eval_samples_per_second": 28.234, + "eval_steps_per_second": 7.063, + "eval_wer": 0.9951386623164763, + "step": 1000 }, { - "epoch": 4.33, - "eval_loss": 0.2077477127313614, - "eval_runtime": 208.1768, - "eval_samples_per_second": 19.008, - "eval_steps_per_second": 2.378, - "eval_wer": 0.2788243106280362, - "step": 4800 + "epoch": 0.25, + "learning_rate": 0.0004993623259223064, + "loss": 1.6458, + "step": 1025 }, { - "epoch": 4.69, - "learning_rate": 0.00028579520258012497, - "loss": 0.3313, - "step": 5200 + "epoch": 0.26, + "learning_rate": 0.0004993317859760567, + "loss": 1.6264, + "step": 1050 }, { - "epoch": 4.69, - "eval_loss": 0.18993255496025085, - "eval_runtime": 205.0681, - "eval_samples_per_second": 19.296, - "eval_steps_per_second": 2.414, - "eval_wer": 0.2659979729493587, - "step": 5200 + "epoch": 0.26, + "learning_rate": 0.0004993012460298069, + "loss": 1.6296, + "step": 1075 }, { - "epoch": 5.05, - "learning_rate": 0.00028458576899818584, - "loss": 0.3222, - "step": 5600 + "epoch": 0.27, + "learning_rate": 0.0004992707060835573, + "loss": 1.5512, + "step": 1100 }, { - "epoch": 5.05, - "eval_loss": 0.19064170122146606, - "eval_runtime": 205.7167, - "eval_samples_per_second": 19.235, - "eval_steps_per_second": 2.406, - "eval_wer": 0.2542201097403278, - "step": 5600 + "epoch": 0.27, + "learning_rate": 0.0004992401661373077, + "loss": 1.5247, + "step": 1125 }, { - "epoch": 5.41, - "learning_rate": 0.0002833763354162467, - "loss": 0.3003, - "step": 6000 + "epoch": 0.28, + "learning_rate": 0.0004992096261910579, + "loss": 1.5277, + "step": 1150 }, { - "epoch": 5.41, - "eval_loss": 0.1921728551387787, - "eval_runtime": 204.1327, - "eval_samples_per_second": 19.384, - "eval_steps_per_second": 2.425, - "eval_wer": 0.2612099395379722, - "step": 6000 + "epoch": 0.29, + "learning_rate": 0.0004991790862448083, + "loss": 1.5062, + "step": 1175 }, { - "epoch": 5.78, - "learning_rate": 0.00028216690183430757, - "loss": 0.3057, - "step": 6400 + "epoch": 0.29, + "learning_rate": 0.0004991485462985585, + "loss": 1.4983, + "step": 1200 }, { - "epoch": 5.78, - "eval_loss": 0.19207137823104858, - "eval_runtime": 205.293, - "eval_samples_per_second": 19.275, - "eval_steps_per_second": 2.411, - "eval_wer": 0.2560724146367036, - "step": 6400 + "epoch": 0.3, + "learning_rate": 0.0004991180063523088, + "loss": 1.5167, + "step": 1225 }, { - "epoch": 6.14, - "learning_rate": 0.0002809604918363233, - "loss": 0.297, - "step": 6800 + "epoch": 0.31, + "learning_rate": 0.0004990874664060591, + "loss": 1.4639, + "step": 1250 }, { - "epoch": 6.14, - "eval_loss": 0.1768147200345993, - "eval_runtime": 204.3464, - "eval_samples_per_second": 19.364, - "eval_steps_per_second": 2.422, - "eval_wer": 0.24146367035962674, - "step": 6800 + "epoch": 0.31, + "learning_rate": 0.0004990569264598095, + "loss": 1.4723, + "step": 1275 }, { - "epoch": 6.5, - "learning_rate": 0.0002797510582543842, - "loss": 0.2834, - "step": 7200 + "epoch": 0.32, + "learning_rate": 0.0004990263865135597, + "loss": 1.4641, + "step": 1300 }, { - "epoch": 6.5, - "eval_loss": 0.18651635944843292, - "eval_runtime": 205.3683, - "eval_samples_per_second": 19.268, - "eval_steps_per_second": 2.41, - "eval_wer": 0.24894278824310628, - "step": 7200 + "epoch": 0.32, + "learning_rate": 0.0004989958465673101, + "loss": 1.4708, + "step": 1325 }, { - "epoch": 6.86, - "learning_rate": 0.00027854162467244505, - "loss": 0.2787, - "step": 7600 + "epoch": 0.33, + "learning_rate": 0.0004989653066210603, + "loss": 1.4587, + "step": 1350 }, { - "epoch": 6.86, - "eval_loss": 0.18522889912128448, - "eval_runtime": 204.2237, - "eval_samples_per_second": 19.376, - "eval_steps_per_second": 2.424, - "eval_wer": 0.24726522909167162, - "step": 7600 + "epoch": 0.34, + "learning_rate": 0.0004989347666748106, + "loss": 1.3988, + "step": 1375 }, { - "epoch": 7.22, - "learning_rate": 0.0002773321910905059, - "loss": 0.2678, - "step": 8000 + "epoch": 0.34, + "learning_rate": 0.0004989042267285609, + "loss": 1.4353, + "step": 1400 }, { - "epoch": 7.22, - "eval_loss": 0.1824478805065155, - "eval_runtime": 203.4819, - "eval_samples_per_second": 19.446, - "eval_steps_per_second": 2.433, - "eval_wer": 0.23087407821619543, - "step": 8000 + "epoch": 0.35, + "learning_rate": 0.0004988736867823113, + "loss": 1.4303, + "step": 1425 }, { - "epoch": 7.58, - "learning_rate": 0.0002761227575085668, - "loss": 0.2665, - "step": 8400 + "epoch": 0.35, + "learning_rate": 0.0004988431468360615, + "loss": 1.4705, + "step": 1450 }, { - "epoch": 7.58, - "eval_loss": 0.17768050730228424, - "eval_runtime": 203.7918, - "eval_samples_per_second": 19.417, - "eval_steps_per_second": 2.429, - "eval_wer": 0.2309789256631601, - "step": 8400 + "epoch": 0.36, + "learning_rate": 0.0004988126068898119, + "loss": 1.3941, + "step": 1475 }, { - "epoch": 7.94, - "learning_rate": 0.00027491332392662766, - "loss": 0.2722, - "step": 8800 + "epoch": 0.37, + "learning_rate": 0.0004987820669435622, + "loss": 1.3941, + "step": 1500 }, { - "epoch": 7.94, - "eval_loss": 0.17655304074287415, - "eval_runtime": 203.4054, - "eval_samples_per_second": 19.454, - "eval_steps_per_second": 2.434, - "eval_wer": 0.23216719672875966, - "step": 8800 + "epoch": 0.37, + "eval_cer": 0.37091260022791905, + "eval_loss": 1.1033180952072144, + "eval_runtime": 148.9205, + "eval_samples_per_second": 28.156, + "eval_steps_per_second": 7.044, + "eval_wer": 0.9866231647634583, + "step": 1500 }, { - "epoch": 8.3, - "learning_rate": 0.0002737038903446885, - "loss": 0.2549, - "step": 9200 + "epoch": 0.37, + "learning_rate": 0.0004987515269973125, + "loss": 1.401, + "step": 1525 }, { - "epoch": 8.3, - "eval_loss": 0.18208913505077362, - "eval_runtime": 203.5406, - "eval_samples_per_second": 19.441, - "eval_steps_per_second": 2.432, - "eval_wer": 0.23590675567049943, - "step": 9200 + "epoch": 0.38, + "learning_rate": 0.0004987209870510628, + "loss": 1.3726, + "step": 1550 }, { - "epoch": 8.66, - "learning_rate": 0.00027249748034670427, - "loss": 0.2535, - "step": 9600 + "epoch": 0.38, + "learning_rate": 0.0004986904471048131, + "loss": 1.3804, + "step": 1575 }, { - "epoch": 8.66, - "eval_loss": 0.17272169888019562, - "eval_runtime": 204.5912, - "eval_samples_per_second": 19.341, - "eval_steps_per_second": 2.419, - "eval_wer": 0.22619089225177366, - "step": 9600 + "epoch": 0.39, + "learning_rate": 0.0004986599071585634, + "loss": 1.4081, + "step": 1600 }, { - "epoch": 9.03, - "learning_rate": 0.00027128804676476514, - "loss": 0.2508, - "step": 10000 + "epoch": 0.4, + "learning_rate": 0.0004986293672123137, + "loss": 1.392, + "step": 1625 }, { - "epoch": 9.03, - "eval_loss": 0.17887552082538605, - "eval_runtime": 202.6986, - "eval_samples_per_second": 19.522, - "eval_steps_per_second": 2.442, - "eval_wer": 0.22301051969384544, - "step": 10000 + "epoch": 0.4, + "learning_rate": 0.0004985988272660641, + "loss": 1.3433, + "step": 1650 }, { - "epoch": 9.39, - "learning_rate": 0.000270078613182826, - "loss": 0.2354, - "step": 10400 + "epoch": 0.41, + "learning_rate": 0.0004985682873198143, + "loss": 1.3965, + "step": 1675 }, { - "epoch": 9.39, - "eval_loss": 0.17052198946475983, - "eval_runtime": 202.2989, - "eval_samples_per_second": 19.56, - "eval_steps_per_second": 2.447, - "eval_wer": 0.2227658756509279, - "step": 10400 + "epoch": 0.41, + "learning_rate": 0.0004985377473735646, + "loss": 1.3149, + "step": 1700 }, { - "epoch": 9.75, - "learning_rate": 0.0002688691796008869, - "loss": 0.2449, - "step": 10800 + "epoch": 0.42, + "learning_rate": 0.0004985072074273149, + "loss": 1.3295, + "step": 1725 }, { - "epoch": 9.75, - "eval_loss": 0.17250895500183105, - "eval_runtime": 202.4538, - "eval_samples_per_second": 19.545, - "eval_steps_per_second": 2.445, - "eval_wer": 0.2203893335197288, - "step": 10800 + "epoch": 0.43, + "learning_rate": 0.0004984766674810652, + "loss": 1.3181, + "step": 1750 }, { - "epoch": 10.11, - "learning_rate": 0.0002676597460189478, - "loss": 0.2461, - "step": 11200 + "epoch": 0.43, + "learning_rate": 0.0004984461275348155, + "loss": 1.3353, + "step": 1775 }, { - "epoch": 10.11, - "eval_loss": 0.18136142194271088, - "eval_runtime": 202.9746, - "eval_samples_per_second": 19.495, - "eval_steps_per_second": 2.439, - "eval_wer": 0.23083912906720722, - "step": 11200 + "epoch": 0.44, + "learning_rate": 0.0004984155875885659, + "loss": 1.3267, + "step": 1800 }, { - "epoch": 10.47, - "learning_rate": 0.0002664533360209635, - "loss": 0.2354, - "step": 11600 + "epoch": 0.45, + "learning_rate": 0.0004983850476423162, + "loss": 1.3335, + "step": 1825 }, { - "epoch": 10.47, - "eval_loss": 0.17660640180110931, - "eval_runtime": 202.5754, - "eval_samples_per_second": 19.533, - "eval_steps_per_second": 2.444, - "eval_wer": 0.21902631670918812, - "step": 11600 + "epoch": 0.45, + "learning_rate": 0.0004983545076960664, + "loss": 1.3258, + "step": 1850 }, { - "epoch": 10.83, - "learning_rate": 0.00026524390243902435, - "loss": 0.2271, - "step": 12000 + "epoch": 0.46, + "learning_rate": 0.0004983239677498168, + "loss": 1.3543, + "step": 1875 }, { - "epoch": 10.83, - "eval_loss": 0.16712866723537445, - "eval_runtime": 204.6252, - "eval_samples_per_second": 19.338, - "eval_steps_per_second": 2.419, - "eval_wer": 0.22643553629469124, - "step": 12000 + "epoch": 0.46, + "learning_rate": 0.0004982934278035671, + "loss": 1.3208, + "step": 1900 }, { - "epoch": 11.19, - "learning_rate": 0.0002640344688570853, - "loss": 0.2262, - "step": 12400 + "epoch": 0.47, + "learning_rate": 0.0004982628878573174, + "loss": 1.3046, + "step": 1925 }, { - "epoch": 11.19, - "eval_loss": 0.16640537977218628, - "eval_runtime": 205.9457, - "eval_samples_per_second": 19.214, - "eval_steps_per_second": 2.404, - "eval_wer": 0.2237444518225981, - "step": 12400 + "epoch": 0.48, + "learning_rate": 0.0004982323479110677, + "loss": 1.3268, + "step": 1950 }, { - "epoch": 11.55, - "learning_rate": 0.0002628250352751461, - "loss": 0.222, - "step": 12800 + "epoch": 0.48, + "learning_rate": 0.000498201807964818, + "loss": 1.3152, + "step": 1975 }, { - "epoch": 11.55, - "eval_loss": 0.16319511830806732, - "eval_runtime": 203.9378, - "eval_samples_per_second": 19.403, - "eval_steps_per_second": 2.427, - "eval_wer": 0.20773774158599237, - "step": 12800 + "epoch": 0.49, + "learning_rate": 0.0004981712680185683, + "loss": 1.3275, + "step": 2000 }, { - "epoch": 11.91, - "learning_rate": 0.000261615601693207, - "loss": 0.2254, - "step": 13200 + "epoch": 0.49, + "eval_cer": 0.348711025327762, + "eval_loss": 1.093718409538269, + "eval_runtime": 154.6705, + "eval_samples_per_second": 27.109, + "eval_steps_per_second": 6.782, + "eval_wer": 0.9539641109298532, + "step": 2000 }, { - "epoch": 11.91, - "eval_loss": 0.16412602365016937, - "eval_runtime": 203.9337, - "eval_samples_per_second": 19.403, - "eval_steps_per_second": 2.427, - "eval_wer": 0.21906126585817634, - "step": 13200 + "epoch": 0.49, + "learning_rate": 0.0004981407280723186, + "loss": 1.3006, + "step": 2025 }, { - "epoch": 12.27, - "learning_rate": 0.0002604061681112679, - "loss": 0.2198, - "step": 13600 + "epoch": 0.5, + "learning_rate": 0.0004981101881260689, + "loss": 1.2848, + "step": 2050 }, { - "epoch": 12.27, - "eval_loss": 0.16197219491004944, - "eval_runtime": 202.2546, - "eval_samples_per_second": 19.564, - "eval_steps_per_second": 2.447, - "eval_wer": 0.2122112326564848, - "step": 13600 + "epoch": 0.51, + "learning_rate": 0.0004980796481798192, + "loss": 1.2935, + "step": 2075 }, { - "epoch": 12.63, - "learning_rate": 0.00025919673452932875, - "loss": 0.2167, - "step": 14000 + "epoch": 0.51, + "learning_rate": 0.0004980491082335695, + "loss": 1.3263, + "step": 2100 }, { - "epoch": 12.63, - "eval_loss": 0.15757694840431213, - "eval_runtime": 202.2278, - "eval_samples_per_second": 19.567, - "eval_steps_per_second": 2.448, - "eval_wer": 0.2082270296718275, - "step": 14000 + "epoch": 0.52, + "learning_rate": 0.0004980185682873198, + "loss": 1.3252, + "step": 2125 }, { - "epoch": 13.0, - "learning_rate": 0.0002579903245313445, - "loss": 0.2138, - "step": 14400 + "epoch": 0.52, + "learning_rate": 0.0004979880283410701, + "loss": 1.3055, + "step": 2150 }, { - "epoch": 13.0, - "eval_loss": 0.16401419043540955, - "eval_runtime": 202.7059, - "eval_samples_per_second": 19.521, - "eval_steps_per_second": 2.442, - "eval_wer": 0.2156711984063188, - "step": 14400 + "epoch": 0.53, + "learning_rate": 0.0004979574883948204, + "loss": 1.2801, + "step": 2175 }, { - "epoch": 13.36, - "learning_rate": 0.0002567808909494053, - "loss": 0.2112, - "step": 14800 + "epoch": 0.54, + "learning_rate": 0.0004979269484485708, + "loss": 1.2867, + "step": 2200 }, { - "epoch": 13.36, - "eval_loss": 0.17054887115955353, - "eval_runtime": 203.4699, - "eval_samples_per_second": 19.448, - "eval_steps_per_second": 2.433, - "eval_wer": 0.21696431691888302, - "step": 14800 + "epoch": 0.54, + "learning_rate": 0.000497896408502321, + "loss": 1.3295, + "step": 2225 }, { - "epoch": 13.72, - "learning_rate": 0.00025557145736746623, - "loss": 0.2038, - "step": 15200 + "epoch": 0.55, + "learning_rate": 0.0004978658685560714, + "loss": 1.3141, + "step": 2250 }, { - "epoch": 13.72, - "eval_loss": 0.1620979905128479, - "eval_runtime": 203.3439, - "eval_samples_per_second": 19.46, - "eval_steps_per_second": 2.434, - "eval_wer": 0.2075979449900395, - "step": 15200 + "epoch": 0.56, + "learning_rate": 0.0004978353286098217, + "loss": 1.2956, + "step": 2275 }, { - "epoch": 14.08, - "learning_rate": 0.0002543620237855271, - "loss": 0.2101, - "step": 15600 + "epoch": 0.56, + "learning_rate": 0.000497804788663572, + "loss": 1.2728, + "step": 2300 }, { - "epoch": 14.08, - "eval_loss": 0.16726231575012207, - "eval_runtime": 203.5727, - "eval_samples_per_second": 19.438, - "eval_steps_per_second": 2.432, - "eval_wer": 0.19962953902072483, - "step": 15600 + "epoch": 0.57, + "learning_rate": 0.0004977742487173222, + "loss": 1.2823, + "step": 2325 }, { - "epoch": 14.44, - "learning_rate": 0.00025315259020358797, - "loss": 0.2013, - "step": 16000 + "epoch": 0.57, + "learning_rate": 0.0004977437087710726, + "loss": 1.3055, + "step": 2350 }, { - "epoch": 14.44, - "eval_loss": 0.16415779292583466, - "eval_runtime": 202.8281, - "eval_samples_per_second": 19.509, - "eval_steps_per_second": 2.44, - "eval_wer": 0.20885611435361548, - "step": 16000 + "epoch": 0.58, + "learning_rate": 0.0004977131688248228, + "loss": 1.2819, + "step": 2375 }, { - "epoch": 14.8, - "learning_rate": 0.00025194315662164883, - "loss": 0.21, - "step": 16400 + "epoch": 0.59, + "learning_rate": 0.0004976826288785732, + "loss": 1.2821, + "step": 2400 }, { - "epoch": 14.8, - "eval_loss": 0.1616578996181488, - "eval_runtime": 203.1464, - "eval_samples_per_second": 19.479, - "eval_steps_per_second": 2.437, - "eval_wer": 0.2186768252193059, - "step": 16400 + "epoch": 0.59, + "learning_rate": 0.0004976520889323235, + "loss": 1.2981, + "step": 2425 }, { - "epoch": 15.16, - "learning_rate": 0.0002507337230397097, - "loss": 0.2002, - "step": 16800 + "epoch": 0.6, + "learning_rate": 0.0004976215489860738, + "loss": 1.2734, + "step": 2450 }, { - "epoch": 15.16, - "eval_loss": 0.1627209484577179, - "eval_runtime": 202.7336, - "eval_samples_per_second": 19.518, - "eval_steps_per_second": 2.442, - "eval_wer": 0.21839723202740013, - "step": 16800 + "epoch": 0.6, + "learning_rate": 0.0004975910090398241, + "loss": 1.2244, + "step": 2475 + }, + { + "epoch": 0.61, + "learning_rate": 0.0004975604690935744, + "loss": 1.2648, + "step": 2500 + }, + { + "epoch": 0.61, + "eval_cer": 0.3137429031960001, + "eval_loss": 0.9402545690536499, + "eval_runtime": 149.7438, + "eval_samples_per_second": 28.001, + "eval_steps_per_second": 7.005, + "eval_wer": 0.9449918433931485, + "step": 2500 + }, + { + "epoch": 0.62, + "learning_rate": 0.0004975299291473248, + "loss": 1.2673, + "step": 2525 + }, + { + "epoch": 0.62, + "learning_rate": 0.000497499389201075, + "loss": 1.2347, + "step": 2550 + }, + { + "epoch": 0.63, + "learning_rate": 0.0004974688492548254, + "loss": 1.2291, + "step": 2575 + }, + { + "epoch": 0.63, + "learning_rate": 0.0004974383093085756, + "loss": 1.2904, + "step": 2600 + }, + { + "epoch": 0.64, + "learning_rate": 0.000497407769362326, + "loss": 1.1844, + "step": 2625 + }, + { + "epoch": 0.65, + "learning_rate": 0.0004973772294160762, + "loss": 1.2243, + "step": 2650 + }, + { + "epoch": 0.65, + "learning_rate": 0.0004973466894698266, + "loss": 1.265, + "step": 2675 + }, + { + "epoch": 0.66, + "learning_rate": 0.0004973161495235768, + "loss": 1.2719, + "step": 2700 + }, + { + "epoch": 0.66, + "learning_rate": 0.0004972856095773272, + "loss": 1.2109, + "step": 2725 + }, + { + "epoch": 0.67, + "learning_rate": 0.0004972550696310774, + "loss": 1.2428, + "step": 2750 + }, + { + "epoch": 0.68, + "learning_rate": 0.0004972245296848278, + "loss": 1.2307, + "step": 2775 + }, + { + "epoch": 0.68, + "learning_rate": 0.000497193989738578, + "loss": 1.2242, + "step": 2800 + }, + { + "epoch": 0.69, + "learning_rate": 0.0004971634497923284, + "loss": 1.2375, + "step": 2825 + }, + { + "epoch": 0.7, + "learning_rate": 0.0004971329098460786, + "loss": 1.2087, + "step": 2850 + }, + { + "epoch": 0.7, + "learning_rate": 0.000497102369899829, + "loss": 1.2111, + "step": 2875 + }, + { + "epoch": 0.71, + "learning_rate": 0.0004970718299535792, + "loss": 1.2721, + "step": 2900 + }, + { + "epoch": 0.71, + "learning_rate": 0.0004970412900073296, + "loss": 1.2132, + "step": 2925 + }, + { + "epoch": 0.72, + "learning_rate": 0.00049701075006108, + "loss": 1.1936, + "step": 2950 + }, + { + "epoch": 0.73, + "learning_rate": 0.0004969802101148302, + "loss": 1.2966, + "step": 2975 + }, + { + "epoch": 0.73, + "learning_rate": 0.0004969496701685805, + "loss": 1.3085, + "step": 3000 + }, + { + "epoch": 0.73, + "eval_cer": 0.30896378961633625, + "eval_loss": 0.9274962544441223, + "eval_runtime": 149.1917, + "eval_samples_per_second": 28.105, + "eval_steps_per_second": 7.031, + "eval_wer": 0.9287765089722675, + "step": 3000 + }, + { + "epoch": 0.74, + "learning_rate": 0.0004969191302223308, + "loss": 1.2099, + "step": 3025 + }, + { + "epoch": 0.74, + "learning_rate": 0.0004968885902760812, + "loss": 1.2075, + "step": 3050 + }, + { + "epoch": 0.75, + "learning_rate": 0.0004968580503298314, + "loss": 1.2174, + "step": 3075 + }, + { + "epoch": 0.76, + "learning_rate": 0.0004968275103835818, + "loss": 1.2464, + "step": 3100 + }, + { + "epoch": 0.76, + "learning_rate": 0.000496796970437332, + "loss": 1.262, + "step": 3125 + }, + { + "epoch": 0.77, + "learning_rate": 0.0004967664304910823, + "loss": 1.2058, + "step": 3150 + }, + { + "epoch": 0.77, + "learning_rate": 0.0004967358905448326, + "loss": 1.2482, + "step": 3175 + }, + { + "epoch": 0.78, + "learning_rate": 0.000496705350598583, + "loss": 1.2172, + "step": 3200 + }, + { + "epoch": 0.79, + "learning_rate": 0.0004966748106523332, + "loss": 1.2177, + "step": 3225 + }, + { + "epoch": 0.79, + "learning_rate": 0.0004966442707060836, + "loss": 1.2189, + "step": 3250 + }, + { + "epoch": 0.8, + "learning_rate": 0.0004966137307598339, + "loss": 1.196, + "step": 3275 + }, + { + "epoch": 0.81, + "learning_rate": 0.0004965831908135842, + "loss": 1.1916, + "step": 3300 + }, + { + "epoch": 0.81, + "learning_rate": 0.0004965526508673345, + "loss": 1.1967, + "step": 3325 + }, + { + "epoch": 0.82, + "learning_rate": 0.0004965221109210848, + "loss": 1.2152, + "step": 3350 + }, + { + "epoch": 0.82, + "learning_rate": 0.0004964915709748351, + "loss": 1.2419, + "step": 3375 + }, + { + "epoch": 0.83, + "learning_rate": 0.0004964610310285854, + "loss": 1.1729, + "step": 3400 + }, + { + "epoch": 0.84, + "learning_rate": 0.0004964304910823357, + "loss": 1.1925, + "step": 3425 + }, + { + "epoch": 0.84, + "learning_rate": 0.000496399951136086, + "loss": 1.2207, + "step": 3450 + }, + { + "epoch": 0.85, + "learning_rate": 0.0004963694111898363, + "loss": 1.1863, + "step": 3475 + }, + { + "epoch": 0.85, + "learning_rate": 0.0004963388712435866, + "loss": 1.1934, + "step": 3500 + }, + { + "epoch": 0.85, + "eval_cer": 0.2815519029188013, + "eval_loss": 0.8737192153930664, + "eval_runtime": 147.4134, + "eval_samples_per_second": 28.444, + "eval_steps_per_second": 7.116, + "eval_wer": 0.8882218597063621, + "step": 3500 + }, + { + "epoch": 0.86, + "learning_rate": 0.0004963083312973369, + "loss": 1.1506, + "step": 3525 + }, + { + "epoch": 0.87, + "learning_rate": 0.0004962777913510872, + "loss": 1.1723, + "step": 3550 + }, + { + "epoch": 0.87, + "learning_rate": 0.0004962472514048376, + "loss": 1.1829, + "step": 3575 + }, + { + "epoch": 0.88, + "learning_rate": 0.0004962167114585879, + "loss": 1.2188, + "step": 3600 + }, + { + "epoch": 0.88, + "learning_rate": 0.0004961861715123381, + "loss": 1.179, + "step": 3625 + }, + { + "epoch": 0.89, + "learning_rate": 0.0004961556315660885, + "loss": 1.1642, + "step": 3650 + }, + { + "epoch": 0.9, + "learning_rate": 0.0004961250916198388, + "loss": 1.1982, + "step": 3675 + }, + { + "epoch": 0.9, + "learning_rate": 0.0004960945516735891, + "loss": 1.2169, + "step": 3700 + }, + { + "epoch": 0.91, + "learning_rate": 0.0004960640117273394, + "loss": 1.1939, + "step": 3725 + }, + { + "epoch": 0.92, + "learning_rate": 0.0004960334717810897, + "loss": 1.2329, + "step": 3750 + }, + { + "epoch": 0.92, + "learning_rate": 0.0004960029318348399, + "loss": 1.2036, + "step": 3775 + }, + { + "epoch": 0.93, + "learning_rate": 0.0004959723918885903, + "loss": 1.1609, + "step": 3800 + }, + { + "epoch": 0.93, + "learning_rate": 0.0004959418519423406, + "loss": 1.1622, + "step": 3825 + }, + { + "epoch": 0.94, + "learning_rate": 0.0004959113119960909, + "loss": 1.1903, + "step": 3850 + }, + { + "epoch": 0.95, + "learning_rate": 0.0004958807720498412, + "loss": 1.1552, + "step": 3875 + }, + { + "epoch": 0.95, + "learning_rate": 0.0004958502321035915, + "loss": 1.1445, + "step": 3900 + }, + { + "epoch": 0.96, + "learning_rate": 0.0004958196921573418, + "loss": 1.1968, + "step": 3925 + }, + { + "epoch": 0.96, + "learning_rate": 0.0004957891522110921, + "loss": 1.1482, + "step": 3950 + }, + { + "epoch": 0.97, + "learning_rate": 0.0004957586122648425, + "loss": 1.1879, + "step": 3975 + }, + { + "epoch": 0.98, + "learning_rate": 0.0004957280723185927, + "loss": 1.1909, + "step": 4000 + }, + { + "epoch": 0.98, + "eval_cer": 0.27801505087112305, + "eval_loss": 0.8657284379005432, + "eval_runtime": 148.1841, + "eval_samples_per_second": 28.296, + "eval_steps_per_second": 7.079, + "eval_wer": 0.8697879282218597, + "step": 4000 + }, + { + "epoch": 0.98, + "learning_rate": 0.0004956975323723431, + "loss": 1.1837, + "step": 4025 + }, + { + "epoch": 0.99, + "learning_rate": 0.0004956669924260934, + "loss": 1.1907, + "step": 4050 + }, + { + "epoch": 0.99, + "learning_rate": 0.0004956364524798437, + "loss": 1.181, + "step": 4075 + }, + { + "epoch": 1.0, + "learning_rate": 0.0004956059125335939, + "loss": 1.1887, + "step": 4100 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004955753725873443, + "loss": 1.1424, + "step": 4125 + }, + { + "epoch": 1.01, + "learning_rate": 0.0004955448326410945, + "loss": 1.2208, + "step": 4150 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004955142926948449, + "loss": 1.0992, + "step": 4175 + }, + { + "epoch": 1.02, + "learning_rate": 0.0004954837527485952, + "loss": 1.1928, + "step": 4200 + }, + { + "epoch": 1.03, + "learning_rate": 0.0004954532128023455, + "loss": 1.1475, + "step": 4225 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004954226728560957, + "loss": 1.1454, + "step": 4250 + }, + { + "epoch": 1.04, + "learning_rate": 0.0004953921329098461, + "loss": 1.1318, + "step": 4275 + }, + { + "epoch": 1.05, + "learning_rate": 0.0004953615929635963, + "loss": 1.0943, + "step": 4300 + }, + { + "epoch": 1.06, + "learning_rate": 0.0004953310530173467, + "loss": 1.1443, + "step": 4325 + }, + { + "epoch": 1.06, + "learning_rate": 0.0004953005130710971, + "loss": 1.14, + "step": 4350 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004952699731248473, + "loss": 1.1257, + "step": 4375 + }, + { + "epoch": 1.07, + "learning_rate": 0.0004952394331785976, + "loss": 1.1535, + "step": 4400 + }, + { + "epoch": 1.08, + "learning_rate": 0.0004952088932323479, + "loss": 1.1164, + "step": 4425 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004951783532860983, + "loss": 1.1142, + "step": 4450 + }, + { + "epoch": 1.09, + "learning_rate": 0.0004951478133398485, + "loss": 1.1491, + "step": 4475 + }, + { + "epoch": 1.1, + "learning_rate": 0.0004951172733935989, + "loss": 1.0647, + "step": 4500 + }, + { + "epoch": 1.1, + "eval_cer": 0.2660236337689804, + "eval_loss": 0.8246370553970337, + "eval_runtime": 149.8516, + "eval_samples_per_second": 27.981, + "eval_steps_per_second": 7.0, + "eval_wer": 0.8816639477977162, + "step": 4500 + }, + { + "epoch": 1.1, + "learning_rate": 0.0004950867334473491, + "loss": 1.1131, + "step": 4525 + }, + { + "epoch": 1.11, + "learning_rate": 0.0004950561935010994, + "loss": 1.1171, + "step": 4550 + }, + { + "epoch": 1.12, + "learning_rate": 0.0004950256535548497, + "loss": 1.14, + "step": 4575 + }, + { + "epoch": 1.12, + "learning_rate": 0.0004949951136086001, + "loss": 1.1237, + "step": 4600 + }, + { + "epoch": 1.13, + "learning_rate": 0.0004949645736623503, + "loss": 1.1444, + "step": 4625 + }, + { + "epoch": 1.13, + "learning_rate": 0.0004949340337161007, + "loss": 1.1466, + "step": 4650 + }, + { + "epoch": 1.14, + "learning_rate": 0.000494903493769851, + "loss": 1.0618, + "step": 4675 + }, + { + "epoch": 1.15, + "learning_rate": 0.0004948729538236013, + "loss": 1.128, + "step": 4700 + }, + { + "epoch": 1.15, + "learning_rate": 0.0004948424138773516, + "loss": 1.1266, + "step": 4725 + }, + { + "epoch": 1.16, + "learning_rate": 0.0004948130955289519, + "loss": 1.1306, + "step": 4750 + }, + { + "epoch": 1.17, + "learning_rate": 0.0004947825555827022, + "loss": 1.0861, + "step": 4775 + }, + { + "epoch": 1.17, + "learning_rate": 0.0004947520156364525, + "loss": 1.1126, + "step": 4800 + }, + { + "epoch": 1.18, + "learning_rate": 0.0004947214756902028, + "loss": 1.1643, + "step": 4825 + }, + { + "epoch": 1.18, + "learning_rate": 0.000494690935743953, + "loss": 1.1249, + "step": 4850 + }, + { + "epoch": 1.19, + "learning_rate": 0.0004946603957977034, + "loss": 1.0927, + "step": 4875 + }, + { + "epoch": 1.2, + "learning_rate": 0.0004946298558514537, + "loss": 1.0774, + "step": 4900 + }, + { + "epoch": 1.2, + "learning_rate": 0.000494599315905204, + "loss": 1.0776, + "step": 4925 + }, + { + "epoch": 1.21, + "learning_rate": 0.0004945687759589543, + "loss": 1.0937, + "step": 4950 + }, + { + "epoch": 1.21, + "learning_rate": 0.0004945382360127046, + "loss": 1.1052, + "step": 4975 + }, + { + "epoch": 1.22, + "learning_rate": 0.000494507696066455, + "loss": 1.1362, + "step": 5000 + }, + { + "epoch": 1.22, + "eval_cer": 0.27113127932404546, + "eval_loss": 0.8031673431396484, + "eval_runtime": 150.0559, + "eval_samples_per_second": 27.943, + "eval_steps_per_second": 6.991, + "eval_wer": 0.9086460032626428, + "step": 5000 + }, + { + "epoch": 1.23, + "learning_rate": 0.0004944771561202052, + "loss": 1.0782, + "step": 5025 + }, + { + "epoch": 1.23, + "learning_rate": 0.0004944466161739556, + "loss": 1.0927, + "step": 5050 + }, + { + "epoch": 1.24, + "learning_rate": 0.0004944160762277058, + "loss": 1.1011, + "step": 5075 + }, + { + "epoch": 1.24, + "learning_rate": 0.0004943855362814562, + "loss": 1.0837, + "step": 5100 + }, + { + "epoch": 1.25, + "learning_rate": 0.0004943549963352065, + "loss": 1.0993, + "step": 5125 + }, + { + "epoch": 1.26, + "learning_rate": 0.0004943244563889568, + "loss": 1.1002, + "step": 5150 + }, + { + "epoch": 1.26, + "learning_rate": 0.000494293916442707, + "loss": 1.0856, + "step": 5175 + }, + { + "epoch": 1.27, + "learning_rate": 0.0004942633764964574, + "loss": 1.1047, + "step": 5200 + }, + { + "epoch": 1.28, + "learning_rate": 0.0004942328365502076, + "loss": 1.1072, + "step": 5225 + }, + { + "epoch": 1.28, + "learning_rate": 0.000494202296603958, + "loss": 1.0748, + "step": 5250 + }, + { + "epoch": 1.29, + "learning_rate": 0.0004941717566577083, + "loss": 1.0535, + "step": 5275 + }, + { + "epoch": 1.29, + "learning_rate": 0.0004941412167114586, + "loss": 1.1443, + "step": 5300 + }, + { + "epoch": 1.3, + "learning_rate": 0.0004941106767652088, + "loss": 1.0943, + "step": 5325 + }, + { + "epoch": 1.31, + "learning_rate": 0.0004940801368189592, + "loss": 1.0904, + "step": 5350 + }, + { + "epoch": 1.31, + "learning_rate": 0.0004940495968727096, + "loss": 1.097, + "step": 5375 + }, + { + "epoch": 1.32, + "learning_rate": 0.0004940190569264598, + "loss": 1.1234, + "step": 5400 + }, + { + "epoch": 1.32, + "learning_rate": 0.0004939885169802102, + "loss": 1.1049, + "step": 5425 + }, + { + "epoch": 1.33, + "learning_rate": 0.0004939579770339604, + "loss": 1.0737, + "step": 5450 + }, + { + "epoch": 1.34, + "learning_rate": 0.0004939274370877108, + "loss": 1.0872, + "step": 5475 + }, + { + "epoch": 1.34, + "learning_rate": 0.000493896897141461, + "loss": 1.0994, + "step": 5500 + }, + { + "epoch": 1.34, + "eval_cer": 0.24623471556317567, + "eval_loss": 0.7718956470489502, + "eval_runtime": 150.4418, + "eval_samples_per_second": 27.871, + "eval_steps_per_second": 6.973, + "eval_wer": 0.8305709624796085, + "step": 5500 + }, + { + "epoch": 1.35, + "learning_rate": 0.0004938663571952114, + "loss": 1.0869, + "step": 5525 + }, + { + "epoch": 1.35, + "learning_rate": 0.0004938358172489616, + "loss": 1.0742, + "step": 5550 + }, + { + "epoch": 1.36, + "learning_rate": 0.000493805277302712, + "loss": 1.0867, + "step": 5575 + }, + { + "epoch": 1.37, + "learning_rate": 0.0004937747373564622, + "loss": 1.0516, + "step": 5600 + }, + { + "epoch": 1.37, + "learning_rate": 0.0004937441974102126, + "loss": 1.0562, + "step": 5625 + }, + { + "epoch": 1.38, + "learning_rate": 0.0004937136574639628, + "loss": 1.072, + "step": 5650 + }, + { + "epoch": 1.38, + "learning_rate": 0.0004936831175177132, + "loss": 1.0712, + "step": 5675 + }, + { + "epoch": 1.39, + "learning_rate": 0.0004936525775714634, + "loss": 1.0735, + "step": 5700 + }, + { + "epoch": 1.4, + "learning_rate": 0.0004936220376252138, + "loss": 1.0757, + "step": 5725 + }, + { + "epoch": 1.4, + "learning_rate": 0.0004935914976789642, + "loss": 1.0374, + "step": 5750 + }, + { + "epoch": 1.41, + "learning_rate": 0.0004935609577327144, + "loss": 1.0556, + "step": 5775 + }, + { + "epoch": 1.42, + "learning_rate": 0.0004935304177864647, + "loss": 1.0696, + "step": 5800 + }, + { + "epoch": 1.42, + "learning_rate": 0.000493499877840215, + "loss": 1.0751, + "step": 5825 + }, + { + "epoch": 1.43, + "learning_rate": 0.0004934693378939653, + "loss": 1.0841, + "step": 5850 + }, + { + "epoch": 1.43, + "learning_rate": 0.0004934387979477156, + "loss": 1.0686, + "step": 5875 + }, + { + "epoch": 1.44, + "learning_rate": 0.000493408258001466, + "loss": 1.062, + "step": 5900 + }, + { + "epoch": 1.45, + "learning_rate": 0.0004933777180552162, + "loss": 1.0416, + "step": 5925 + }, + { + "epoch": 1.45, + "learning_rate": 0.0004933471781089666, + "loss": 1.0138, + "step": 5950 + }, + { + "epoch": 1.46, + "learning_rate": 0.0004933166381627168, + "loss": 1.0089, + "step": 5975 + }, + { + "epoch": 1.46, + "learning_rate": 0.0004932860982164672, + "loss": 1.1, + "step": 6000 + }, + { + "epoch": 1.46, + "eval_cer": 0.25613174132213584, + "eval_loss": 0.7853134870529175, + "eval_runtime": 146.4034, + "eval_samples_per_second": 28.64, + "eval_steps_per_second": 7.165, + "eval_wer": 0.8400652528548124, + "step": 6000 + }, + { + "epoch": 1.47, + "learning_rate": 0.0004932555582702174, + "loss": 1.0436, + "step": 6025 + }, + { + "epoch": 1.48, + "learning_rate": 0.0004932250183239678, + "loss": 1.1361, + "step": 6050 + }, + { + "epoch": 1.48, + "learning_rate": 0.000493194478377718, + "loss": 1.0567, + "step": 6075 + }, + { + "epoch": 1.49, + "learning_rate": 0.0004931639384314684, + "loss": 1.1106, + "step": 6100 + }, + { + "epoch": 1.49, + "learning_rate": 0.0004931333984852187, + "loss": 1.0431, + "step": 6125 + }, + { + "epoch": 1.5, + "learning_rate": 0.000493102858538969, + "loss": 1.095, + "step": 6150 + }, + { + "epoch": 1.51, + "learning_rate": 0.0004930723185927193, + "loss": 1.0448, + "step": 6175 + }, + { + "epoch": 1.51, + "learning_rate": 0.0004930417786464696, + "loss": 1.0329, + "step": 6200 + }, + { + "epoch": 1.52, + "learning_rate": 0.0004930112387002199, + "loss": 1.0757, + "step": 6225 + }, + { + "epoch": 1.53, + "learning_rate": 0.0004929806987539702, + "loss": 1.0936, + "step": 6250 + }, + { + "epoch": 1.53, + "learning_rate": 0.0004929501588077205, + "loss": 1.0361, + "step": 6275 + }, + { + "epoch": 1.54, + "learning_rate": 0.0004929196188614708, + "loss": 1.0478, + "step": 6300 + }, + { + "epoch": 1.54, + "learning_rate": 0.0004928890789152211, + "loss": 1.0408, + "step": 6325 + }, + { + "epoch": 1.55, + "learning_rate": 0.0004928585389689714, + "loss": 1.0468, + "step": 6350 + }, + { + "epoch": 1.56, + "learning_rate": 0.0004928279990227217, + "loss": 1.0571, + "step": 6375 + }, + { + "epoch": 1.56, + "learning_rate": 0.000492797459076472, + "loss": 1.0958, + "step": 6400 + }, + { + "epoch": 1.57, + "learning_rate": 0.0004927669191302224, + "loss": 1.0402, + "step": 6425 + }, + { + "epoch": 1.57, + "learning_rate": 0.0004927363791839727, + "loss": 1.0423, + "step": 6450 + }, + { + "epoch": 1.58, + "learning_rate": 0.0004927058392377229, + "loss": 1.0132, + "step": 6475 + }, + { + "epoch": 1.59, + "learning_rate": 0.0004926752992914733, + "loss": 1.0629, + "step": 6500 + }, + { + "epoch": 1.59, + "eval_cer": 0.24587538371508064, + "eval_loss": 0.7808747887611389, + "eval_runtime": 150.3232, + "eval_samples_per_second": 27.893, + "eval_steps_per_second": 6.978, + "eval_wer": 0.8244698205546492, + "step": 6500 + }, + { + "epoch": 1.59, + "learning_rate": 0.0004926447593452236, + "loss": 1.0696, + "step": 6525 + }, + { + "epoch": 1.6, + "learning_rate": 0.0004926142193989739, + "loss": 1.0916, + "step": 6550 + }, + { + "epoch": 1.6, + "learning_rate": 0.0004925836794527242, + "loss": 1.0583, + "step": 6575 + }, + { + "epoch": 1.61, + "learning_rate": 0.0004925531395064745, + "loss": 1.0745, + "step": 6600 + }, + { + "epoch": 1.62, + "learning_rate": 0.0004925225995602247, + "loss": 1.0613, + "step": 6625 + }, + { + "epoch": 1.62, + "learning_rate": 0.0004924920596139751, + "loss": 1.0993, + "step": 6650 + }, + { + "epoch": 1.63, + "learning_rate": 0.0004924615196677254, + "loss": 1.0287, + "step": 6675 + }, + { + "epoch": 1.63, + "learning_rate": 0.0004924309797214757, + "loss": 1.0697, + "step": 6700 + }, + { + "epoch": 1.64, + "learning_rate": 0.000492400439775226, + "loss": 1.0078, + "step": 6725 + }, + { + "epoch": 1.65, + "learning_rate": 0.0004923698998289763, + "loss": 1.0758, + "step": 6750 + }, + { + "epoch": 1.65, + "learning_rate": 0.0004923393598827267, + "loss": 1.049, + "step": 6775 + }, + { + "epoch": 1.66, + "learning_rate": 0.0004923088199364769, + "loss": 1.0401, + "step": 6800 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004922782799902273, + "loss": 1.0468, + "step": 6825 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004922477400439775, + "loss": 1.0586, + "step": 6850 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004922172000977279, + "loss": 1.0428, + "step": 6875 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004921866601514781, + "loss": 1.0465, + "step": 6900 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004921561202052285, + "loss": 1.015, + "step": 6925 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004921255802589787, + "loss": 1.0893, + "step": 6950 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004920950403127291, + "loss": 1.071, + "step": 6975 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004920645003664793, + "loss": 1.1032, + "step": 7000 + }, + { + "epoch": 1.71, + "eval_cer": 0.24269786351549746, + "eval_loss": 0.7637730836868286, + "eval_runtime": 150.2038, + "eval_samples_per_second": 27.915, + "eval_steps_per_second": 6.984, + "eval_wer": 0.8227406199021207, + "step": 7000 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004920339604202297, + "loss": 1.0387, + "step": 7025 + }, + { + "epoch": 1.72, + "learning_rate": 0.00049200342047398, + "loss": 1.0642, + "step": 7050 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004919728805277303, + "loss": 1.0831, + "step": 7075 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004919423405814805, + "loss": 1.0667, + "step": 7100 + }, + { + "epoch": 1.74, + "learning_rate": 0.0004919118006352309, + "loss": 1.042, + "step": 7125 + }, + { + "epoch": 1.74, + "learning_rate": 0.0004918812606889813, + "loss": 1.0001, + "step": 7150 + }, + { + "epoch": 1.75, + "learning_rate": 0.0004918507207427315, + "loss": 1.0786, + "step": 7175 + }, + { + "epoch": 1.76, + "learning_rate": 0.0004918201807964819, + "loss": 1.0567, + "step": 7200 + }, + { + "epoch": 1.76, + "learning_rate": 0.0004917896408502321, + "loss": 1.0255, + "step": 7225 + }, + { + "epoch": 1.77, + "learning_rate": 0.0004917591009039824, + "loss": 1.0694, + "step": 7250 + }, + { + "epoch": 1.78, + "learning_rate": 0.0004917285609577327, + "loss": 1.0622, + "step": 7275 + }, + { + "epoch": 1.78, + "learning_rate": 0.0004916980210114831, + "loss": 1.0316, + "step": 7300 + }, + { + "epoch": 1.79, + "learning_rate": 0.0004916674810652333, + "loss": 1.0995, + "step": 7325 + }, + { + "epoch": 1.79, + "learning_rate": 0.0004916369411189837, + "loss": 1.0378, + "step": 7350 + }, + { + "epoch": 1.8, + "learning_rate": 0.0004916064011727339, + "loss": 1.0338, + "step": 7375 + }, + { + "epoch": 1.81, + "learning_rate": 0.0004915758612264842, + "loss": 1.0584, + "step": 7400 + }, + { + "epoch": 1.81, + "learning_rate": 0.0004915453212802345, + "loss": 1.0315, + "step": 7425 + }, + { + "epoch": 1.82, + "learning_rate": 0.0004915147813339849, + "loss": 1.0323, + "step": 7450 + }, + { + "epoch": 1.82, + "learning_rate": 0.0004914842413877351, + "loss": 0.9843, + "step": 7475 + }, + { + "epoch": 1.83, + "learning_rate": 0.0004914537014414855, + "loss": 1.0171, + "step": 7500 + }, + { + "epoch": 1.83, + "eval_cer": 0.23322690266213567, + "eval_loss": 0.74111008644104, + "eval_runtime": 150.5438, + "eval_samples_per_second": 27.852, + "eval_steps_per_second": 6.968, + "eval_wer": 0.8087112561174551, + "step": 7500 + }, + { + "epoch": 1.84, + "learning_rate": 0.0004914231614952358, + "loss": 1.0284, + "step": 7525 + }, + { + "epoch": 1.84, + "learning_rate": 0.0004913926215489861, + "loss": 1.0462, + "step": 7550 + }, + { + "epoch": 1.85, + "learning_rate": 0.0004913620816027364, + "loss": 1.0062, + "step": 7575 + }, + { + "epoch": 1.85, + "learning_rate": 0.0004913315416564867, + "loss": 1.0715, + "step": 7600 + }, + { + "epoch": 1.86, + "learning_rate": 0.000491301001710237, + "loss": 1.0672, + "step": 7625 + }, + { + "epoch": 1.87, + "learning_rate": 0.0004912704617639873, + "loss": 1.0077, + "step": 7650 + }, + { + "epoch": 1.87, + "learning_rate": 0.0004912399218177377, + "loss": 1.0668, + "step": 7675 + }, + { + "epoch": 1.88, + "learning_rate": 0.0004912093818714879, + "loss": 1.0582, + "step": 7700 + }, + { + "epoch": 1.89, + "learning_rate": 0.0004911788419252382, + "loss": 1.0758, + "step": 7725 + }, + { + "epoch": 1.89, + "learning_rate": 0.0004911483019789885, + "loss": 1.0678, + "step": 7750 + }, + { + "epoch": 1.9, + "learning_rate": 0.0004911177620327388, + "loss": 1.041, + "step": 7775 + }, + { + "epoch": 1.9, + "learning_rate": 0.0004910872220864891, + "loss": 1.0245, + "step": 7800 + }, + { + "epoch": 1.91, + "learning_rate": 0.0004910566821402395, + "loss": 1.0517, + "step": 7825 + }, + { + "epoch": 1.92, + "learning_rate": 0.0004910261421939897, + "loss": 1.0589, + "step": 7850 + }, + { + "epoch": 1.92, + "learning_rate": 0.00049099560224774, + "loss": 1.0315, + "step": 7875 + }, + { + "epoch": 1.93, + "learning_rate": 0.0004909650623014904, + "loss": 1.0659, + "step": 7900 + }, + { + "epoch": 1.93, + "learning_rate": 0.0004909345223552407, + "loss": 1.0559, + "step": 7925 + }, + { + "epoch": 1.94, + "learning_rate": 0.000490903982408991, + "loss": 1.0801, + "step": 7950 + }, + { + "epoch": 1.95, + "learning_rate": 0.0004908734424627413, + "loss": 1.0445, + "step": 7975 + }, + { + "epoch": 1.95, + "learning_rate": 0.0004908429025164916, + "loss": 1.0591, + "step": 8000 + }, + { + "epoch": 1.95, + "eval_cer": 0.23618882375286182, + "eval_loss": 0.7331734895706177, + "eval_runtime": 150.163, + "eval_samples_per_second": 27.923, + "eval_steps_per_second": 6.986, + "eval_wer": 0.8274061990212072, + "step": 8000 + }, + { + "epoch": 1.96, + "learning_rate": 0.0004908123625702418, + "loss": 1.0552, + "step": 8025 + }, + { + "epoch": 1.96, + "learning_rate": 0.0004907818226239922, + "loss": 1.0331, + "step": 8050 + }, + { + "epoch": 1.97, + "learning_rate": 0.0004907512826777425, + "loss": 1.0102, + "step": 8075 + }, + { + "epoch": 1.98, + "learning_rate": 0.0004907219643293428, + "loss": 0.9944, + "step": 8100 + }, + { + "epoch": 1.98, + "learning_rate": 0.0004906914243830931, + "loss": 0.9907, + "step": 8125 + }, + { + "epoch": 1.99, + "learning_rate": 0.0004906608844368434, + "loss": 1.0408, + "step": 8150 + }, + { + "epoch": 1.99, + "learning_rate": 0.0004906303444905936, + "loss": 1.0145, + "step": 8175 + }, + { + "epoch": 2.0, + "learning_rate": 0.000490599804544344, + "loss": 1.033, + "step": 8200 + }, + { + "epoch": 2.01, + "learning_rate": 0.0004905692645980944, + "loss": 0.9967, + "step": 8225 + }, + { + "epoch": 2.01, + "learning_rate": 0.0004905387246518446, + "loss": 1.0126, + "step": 8250 + }, + { + "epoch": 2.02, + "learning_rate": 0.000490508184705595, + "loss": 0.9957, + "step": 8275 + }, + { + "epoch": 2.03, + "learning_rate": 0.0004904776447593452, + "loss": 1.0066, + "step": 8300 + }, + { + "epoch": 2.03, + "learning_rate": 0.0004904471048130955, + "loss": 0.9957, + "step": 8325 + }, + { + "epoch": 2.04, + "learning_rate": 0.0004904165648668458, + "loss": 1.0412, + "step": 8350 + }, + { + "epoch": 2.04, + "learning_rate": 0.0004903860249205962, + "loss": 1.0109, + "step": 8375 + }, + { + "epoch": 2.05, + "learning_rate": 0.0004903554849743464, + "loss": 0.9944, + "step": 8400 + }, + { + "epoch": 2.06, + "learning_rate": 0.0004903249450280968, + "loss": 0.9917, + "step": 8425 + }, + { + "epoch": 2.06, + "learning_rate": 0.000490294405081847, + "loss": 1.0134, + "step": 8450 + }, + { + "epoch": 2.07, + "learning_rate": 0.0004902638651355974, + "loss": 0.9979, + "step": 8475 + }, + { + "epoch": 2.07, + "learning_rate": 0.0004902333251893476, + "loss": 0.9725, + "step": 8500 + }, + { + "epoch": 2.07, + "eval_cer": 0.22165641715347575, + "eval_loss": 0.7190037369728088, + "eval_runtime": 154.2309, + "eval_samples_per_second": 27.187, + "eval_steps_per_second": 6.801, + "eval_wer": 0.7847308319738988, + "step": 8500 + }, + { + "epoch": 2.08, + "learning_rate": 0.000490202785243098, + "loss": 0.9934, + "step": 8525 + }, + { + "epoch": 2.09, + "learning_rate": 0.0004901722452968482, + "loss": 0.9609, + "step": 8550 + }, + { + "epoch": 2.09, + "learning_rate": 0.0004901417053505986, + "loss": 0.9797, + "step": 8575 + }, + { + "epoch": 2.1, + "learning_rate": 0.000490111165404349, + "loss": 0.9612, + "step": 8600 + }, + { + "epoch": 2.1, + "learning_rate": 0.0004900806254580992, + "loss": 0.9582, + "step": 8625 + }, + { + "epoch": 2.11, + "learning_rate": 0.0004900500855118495, + "loss": 1.0047, + "step": 8650 + }, + { + "epoch": 2.12, + "learning_rate": 0.0004900195455655998, + "loss": 0.9842, + "step": 8675 + }, + { + "epoch": 2.12, + "learning_rate": 0.0004899890056193501, + "loss": 0.9559, + "step": 8700 + }, + { + "epoch": 2.13, + "learning_rate": 0.0004899584656731004, + "loss": 0.9806, + "step": 8725 + }, + { + "epoch": 2.14, + "learning_rate": 0.0004899279257268508, + "loss": 0.988, + "step": 8750 + }, + { + "epoch": 2.14, + "learning_rate": 0.000489897385780601, + "loss": 0.9616, + "step": 8775 + }, + { + "epoch": 2.15, + "learning_rate": 0.0004898668458343513, + "loss": 0.9586, + "step": 8800 + }, + { + "epoch": 2.15, + "learning_rate": 0.0004898363058881016, + "loss": 0.9778, + "step": 8825 + }, + { + "epoch": 2.16, + "learning_rate": 0.000489805765941852, + "loss": 1.0124, + "step": 8850 + }, + { + "epoch": 2.17, + "learning_rate": 0.0004897752259956022, + "loss": 1.0, + "step": 8875 + }, + { + "epoch": 2.17, + "learning_rate": 0.0004897446860493526, + "loss": 0.9949, + "step": 8900 + }, + { + "epoch": 2.18, + "learning_rate": 0.0004897141461031028, + "loss": 0.9904, + "step": 8925 + }, + { + "epoch": 2.18, + "learning_rate": 0.0004896836061568532, + "loss": 1.0132, + "step": 8950 + }, + { + "epoch": 2.19, + "learning_rate": 0.0004896530662106035, + "loss": 0.971, + "step": 8975 + }, + { + "epoch": 2.2, + "learning_rate": 0.0004896225262643538, + "loss": 1.03, + "step": 9000 + }, + { + "epoch": 2.2, + "eval_cer": 0.23557795961110028, + "eval_loss": 0.7176295518875122, + "eval_runtime": 149.5931, + "eval_samples_per_second": 28.029, + "eval_steps_per_second": 7.012, + "eval_wer": 0.8255138662316477, + "step": 9000 + }, + { + "epoch": 2.2, + "learning_rate": 0.0004895919863181041, + "loss": 0.9694, + "step": 9025 + }, + { + "epoch": 2.21, + "learning_rate": 0.0004895614463718544, + "loss": 0.9855, + "step": 9050 + }, + { + "epoch": 2.21, + "learning_rate": 0.0004895309064256047, + "loss": 0.986, + "step": 9075 + }, + { + "epoch": 2.22, + "learning_rate": 0.000489500366479355, + "loss": 1.0111, + "step": 9100 + }, + { + "epoch": 2.23, + "learning_rate": 0.0004894698265331053, + "loss": 0.9636, + "step": 9125 + }, + { + "epoch": 2.23, + "learning_rate": 0.0004894392865868556, + "loss": 0.9908, + "step": 9150 + }, + { + "epoch": 2.24, + "learning_rate": 0.0004894087466406059, + "loss": 0.9693, + "step": 9175 + }, + { + "epoch": 2.24, + "learning_rate": 0.0004893782066943562, + "loss": 1.0015, + "step": 9200 + }, + { + "epoch": 2.25, + "learning_rate": 0.0004893476667481066, + "loss": 0.9758, + "step": 9225 + }, + { + "epoch": 2.26, + "learning_rate": 0.0004893171268018568, + "loss": 1.0329, + "step": 9250 + }, + { + "epoch": 2.26, + "learning_rate": 0.0004892865868556071, + "loss": 0.9654, + "step": 9275 + }, + { + "epoch": 2.27, + "learning_rate": 0.0004892560469093575, + "loss": 0.9999, + "step": 9300 + }, + { + "epoch": 2.28, + "learning_rate": 0.0004892255069631077, + "loss": 0.9878, + "step": 9325 + }, + { + "epoch": 2.28, + "learning_rate": 0.0004891949670168581, + "loss": 0.9785, + "step": 9350 + }, + { + "epoch": 2.29, + "learning_rate": 0.0004891644270706084, + "loss": 0.9796, + "step": 9375 + }, + { + "epoch": 2.29, + "learning_rate": 0.0004891338871243587, + "loss": 1.0357, + "step": 9400 + }, + { + "epoch": 2.3, + "learning_rate": 0.000489103347178109, + "loss": 0.9666, + "step": 9425 + }, + { + "epoch": 2.31, + "learning_rate": 0.0004890728072318593, + "loss": 1.0062, + "step": 9450 + }, + { + "epoch": 2.31, + "learning_rate": 0.0004890422672856095, + "loss": 0.9699, + "step": 9475 + }, + { + "epoch": 2.32, + "learning_rate": 0.0004890117273393599, + "loss": 0.9939, + "step": 9500 + }, + { + "epoch": 2.32, + "eval_cer": 0.2471176452470663, + "eval_loss": 0.7189167141914368, + "eval_runtime": 153.4415, + "eval_samples_per_second": 27.326, + "eval_steps_per_second": 6.836, + "eval_wer": 0.8653181076672104, + "step": 9500 + }, + { + "epoch": 2.32, + "learning_rate": 0.0004889811873931102, + "loss": 0.9811, + "step": 9525 + }, + { + "epoch": 2.33, + "learning_rate": 0.0004889506474468605, + "loss": 1.0085, + "step": 9550 + }, + { + "epoch": 2.34, + "learning_rate": 0.0004889201075006108, + "loss": 0.9753, + "step": 9575 + }, + { + "epoch": 2.34, + "learning_rate": 0.0004888895675543611, + "loss": 0.9409, + "step": 9600 + }, + { + "epoch": 2.35, + "learning_rate": 0.0004888590276081115, + "loss": 0.9792, + "step": 9625 + }, + { + "epoch": 2.35, + "learning_rate": 0.0004888284876618617, + "loss": 1.0009, + "step": 9650 + }, + { + "epoch": 2.36, + "learning_rate": 0.0004887979477156121, + "loss": 0.9875, + "step": 9675 + }, + { + "epoch": 2.37, + "learning_rate": 0.0004887674077693623, + "loss": 1.0286, + "step": 9700 + }, + { + "epoch": 2.37, + "learning_rate": 0.0004887368678231127, + "loss": 0.96, + "step": 9725 + }, + { + "epoch": 2.38, + "learning_rate": 0.0004887063278768629, + "loss": 0.9712, + "step": 9750 + }, + { + "epoch": 2.39, + "learning_rate": 0.0004886757879306133, + "loss": 0.9919, + "step": 9775 + }, + { + "epoch": 2.39, + "learning_rate": 0.0004886452479843635, + "loss": 1.0148, + "step": 9800 + }, + { + "epoch": 2.4, + "learning_rate": 0.0004886147080381139, + "loss": 0.9762, + "step": 9825 + }, + { + "epoch": 2.4, + "learning_rate": 0.0004885841680918641, + "loss": 0.9539, + "step": 9850 + }, + { + "epoch": 2.41, + "learning_rate": 0.0004885536281456145, + "loss": 0.9814, + "step": 9875 + }, + { + "epoch": 2.42, + "learning_rate": 0.0004885230881993648, + "loss": 0.9418, + "step": 9900 + }, + { + "epoch": 2.42, + "learning_rate": 0.0004884925482531151, + "loss": 0.9613, + "step": 9925 + }, + { + "epoch": 2.43, + "learning_rate": 0.0004884620083068653, + "loss": 1.0212, + "step": 9950 + }, + { + "epoch": 2.43, + "learning_rate": 0.0004884314683606157, + "loss": 0.9608, + "step": 9975 + }, + { + "epoch": 2.44, + "learning_rate": 0.0004884009284143661, + "loss": 0.9564, + "step": 10000 + }, + { + "epoch": 2.44, + "eval_cer": 0.22702586162643862, + "eval_loss": 0.7050137519836426, + "eval_runtime": 153.9631, + "eval_samples_per_second": 27.234, + "eval_steps_per_second": 6.813, + "eval_wer": 0.7984339314845025, + "step": 10000 + }, + { + "epoch": 2.45, + "learning_rate": 0.0004883703884681163, + "loss": 0.977, + "step": 10025 + }, + { + "epoch": 2.45, + "learning_rate": 0.0004883398485218667, + "loss": 1.0024, + "step": 10050 + }, + { + "epoch": 2.46, + "learning_rate": 0.0004883093085756169, + "loss": 0.9681, + "step": 10075 + }, + { + "epoch": 2.46, + "learning_rate": 0.0004882787686293672, + "loss": 0.9711, + "step": 10100 + }, + { + "epoch": 2.47, + "learning_rate": 0.0004882482286831175, + "loss": 0.9421, + "step": 10125 + }, + { + "epoch": 2.48, + "learning_rate": 0.0004882176887368678, + "loss": 0.9543, + "step": 10150 + }, + { + "epoch": 2.48, + "learning_rate": 0.0004881871487906181, + "loss": 0.9585, + "step": 10175 + }, + { + "epoch": 2.49, + "learning_rate": 0.0004881566088443685, + "loss": 1.012, + "step": 10200 + }, + { + "epoch": 2.5, + "learning_rate": 0.00048812606889811873, + "loss": 0.9411, + "step": 10225 + }, + { + "epoch": 2.5, + "learning_rate": 0.00048809552895186904, + "loss": 0.9809, + "step": 10250 + }, + { + "epoch": 2.51, + "learning_rate": 0.00048806498900561934, + "loss": 0.9897, + "step": 10275 + }, + { + "epoch": 2.51, + "learning_rate": 0.00048803444905936964, + "loss": 0.9325, + "step": 10300 + }, + { + "epoch": 2.52, + "learning_rate": 0.00048800390911312, + "loss": 0.9752, + "step": 10325 + }, + { + "epoch": 2.53, + "learning_rate": 0.0004879733691668703, + "loss": 0.9296, + "step": 10350 + }, + { + "epoch": 2.53, + "learning_rate": 0.00048794282922062055, + "loss": 1.0148, + "step": 10375 + }, + { + "epoch": 2.54, + "learning_rate": 0.00048791228927437086, + "loss": 1.0025, + "step": 10400 + }, + { + "epoch": 2.54, + "learning_rate": 0.00048788174932812116, + "loss": 0.9625, + "step": 10425 + }, + { + "epoch": 2.55, + "learning_rate": 0.0004878512093818715, + "loss": 0.9829, + "step": 10450 + }, + { + "epoch": 2.56, + "learning_rate": 0.0004878206694356218, + "loss": 0.9655, + "step": 10475 + }, + { + "epoch": 2.56, + "learning_rate": 0.0004877901294893721, + "loss": 0.966, + "step": 10500 + }, + { + "epoch": 2.56, + "eval_cer": 0.22002915721281685, + "eval_loss": 0.698431134223938, + "eval_runtime": 151.9452, + "eval_samples_per_second": 27.595, + "eval_steps_per_second": 6.904, + "eval_wer": 0.7738009787928222, + "step": 10500 + }, + { + "epoch": 2.57, + "learning_rate": 0.0004877595895431224, + "loss": 0.946, + "step": 10525 + }, + { + "epoch": 2.57, + "learning_rate": 0.0004877290495968727, + "loss": 0.9189, + "step": 10550 + }, + { + "epoch": 2.58, + "learning_rate": 0.00048769850965062303, + "loss": 0.9545, + "step": 10575 + }, + { + "epoch": 2.59, + "learning_rate": 0.00048766796970437334, + "loss": 0.9564, + "step": 10600 + }, + { + "epoch": 2.59, + "learning_rate": 0.00048763742975812364, + "loss": 0.994, + "step": 10625 + }, + { + "epoch": 2.6, + "learning_rate": 0.00048760688981187394, + "loss": 1.0165, + "step": 10650 + }, + { + "epoch": 2.6, + "learning_rate": 0.00048757634986562425, + "loss": 0.9581, + "step": 10675 + }, + { + "epoch": 2.61, + "learning_rate": 0.00048754580991937455, + "loss": 0.9181, + "step": 10700 + }, + { + "epoch": 2.62, + "learning_rate": 0.00048751526997312485, + "loss": 0.9664, + "step": 10725 + }, + { + "epoch": 2.62, + "learning_rate": 0.00048748473002687516, + "loss": 0.995, + "step": 10750 + }, + { + "epoch": 2.63, + "learning_rate": 0.00048745419008062546, + "loss": 0.9565, + "step": 10775 + }, + { + "epoch": 2.64, + "learning_rate": 0.00048742365013437576, + "loss": 0.9906, + "step": 10800 + }, + { + "epoch": 2.64, + "learning_rate": 0.0004873931101881261, + "loss": 0.9804, + "step": 10825 + }, + { + "epoch": 2.65, + "learning_rate": 0.00048736257024187637, + "loss": 0.9643, + "step": 10850 + }, + { + "epoch": 2.65, + "learning_rate": 0.0004873320302956267, + "loss": 0.9544, + "step": 10875 + }, + { + "epoch": 2.66, + "learning_rate": 0.000487301490349377, + "loss": 1.0451, + "step": 10900 + }, + { + "epoch": 2.67, + "learning_rate": 0.0004872709504031273, + "loss": 0.9919, + "step": 10925 + }, + { + "epoch": 2.67, + "learning_rate": 0.00048724041045687764, + "loss": 1.007, + "step": 10950 + }, + { + "epoch": 2.68, + "learning_rate": 0.00048720987051062794, + "loss": 0.9678, + "step": 10975 + }, + { + "epoch": 2.68, + "learning_rate": 0.00048717933056437824, + "loss": 0.9858, + "step": 11000 + }, + { + "epoch": 2.68, + "eval_cer": 0.22549613461597692, + "eval_loss": 0.6884613633155823, + "eval_runtime": 147.9789, + "eval_samples_per_second": 28.335, + "eval_steps_per_second": 7.089, + "eval_wer": 0.8049592169657422, + "step": 11000 + }, + { + "epoch": 2.69, + "learning_rate": 0.0004871487906181285, + "loss": 0.9764, + "step": 11025 + }, + { + "epoch": 2.7, + "learning_rate": 0.0004871182506718788, + "loss": 0.9899, + "step": 11050 + }, + { + "epoch": 2.7, + "learning_rate": 0.00048708771072562915, + "loss": 0.9894, + "step": 11075 + }, + { + "epoch": 2.71, + "learning_rate": 0.00048705717077937946, + "loss": 0.9927, + "step": 11100 + }, + { + "epoch": 2.71, + "learning_rate": 0.00048702663083312976, + "loss": 0.9676, + "step": 11125 + }, + { + "epoch": 2.72, + "learning_rate": 0.00048699609088688006, + "loss": 1.0058, + "step": 11150 + }, + { + "epoch": 2.73, + "learning_rate": 0.0004869655509406303, + "loss": 0.9584, + "step": 11175 + }, + { + "epoch": 2.73, + "learning_rate": 0.00048693501099438067, + "loss": 0.9052, + "step": 11200 + }, + { + "epoch": 2.74, + "learning_rate": 0.000486904471048131, + "loss": 0.9558, + "step": 11225 + }, + { + "epoch": 2.75, + "learning_rate": 0.0004868739311018813, + "loss": 0.9989, + "step": 11250 + }, + { + "epoch": 2.75, + "learning_rate": 0.0004868433911556316, + "loss": 0.9705, + "step": 11275 + }, + { + "epoch": 2.76, + "learning_rate": 0.0004868128512093819, + "loss": 0.96, + "step": 11300 + }, + { + "epoch": 2.76, + "learning_rate": 0.00048678231126313213, + "loss": 0.9782, + "step": 11325 + }, + { + "epoch": 2.77, + "learning_rate": 0.0004867517713168825, + "loss": 0.9906, + "step": 11350 + }, + { + "epoch": 2.78, + "learning_rate": 0.0004867212313706328, + "loss": 0.9869, + "step": 11375 + }, + { + "epoch": 2.78, + "learning_rate": 0.0004866906914243831, + "loss": 0.9431, + "step": 11400 + }, + { + "epoch": 2.79, + "learning_rate": 0.0004866601514781334, + "loss": 0.9565, + "step": 11425 + }, + { + "epoch": 2.79, + "learning_rate": 0.0004866296115318837, + "loss": 0.9876, + "step": 11450 + }, + { + "epoch": 2.8, + "learning_rate": 0.00048659907158563406, + "loss": 0.9448, + "step": 11475 + }, + { + "epoch": 2.81, + "learning_rate": 0.0004865685316393843, + "loss": 0.9484, + "step": 11500 + }, + { + "epoch": 2.81, + "eval_cer": 0.21829923102984508, + "eval_loss": 0.6878862977027893, + "eval_runtime": 149.5721, + "eval_samples_per_second": 28.033, + "eval_steps_per_second": 7.013, + "eval_wer": 0.7645676998368679, + "step": 11500 + }, + { + "epoch": 2.81, + "learning_rate": 0.0004865379916931346, + "loss": 0.9508, + "step": 11525 + }, + { + "epoch": 2.82, + "learning_rate": 0.0004865074517468849, + "loss": 0.996, + "step": 11550 + }, + { + "epoch": 2.82, + "learning_rate": 0.0004864769118006352, + "loss": 0.9525, + "step": 11575 + }, + { + "epoch": 2.83, + "learning_rate": 0.0004864463718543856, + "loss": 1.0059, + "step": 11600 + }, + { + "epoch": 2.84, + "learning_rate": 0.0004864158319081359, + "loss": 0.9635, + "step": 11625 + }, + { + "epoch": 2.84, + "learning_rate": 0.00048638529196188613, + "loss": 0.96, + "step": 11650 + }, + { + "epoch": 2.85, + "learning_rate": 0.00048635475201563643, + "loss": 0.968, + "step": 11675 + }, + { + "epoch": 2.86, + "learning_rate": 0.00048632421206938674, + "loss": 0.9205, + "step": 11700 + }, + { + "epoch": 2.86, + "learning_rate": 0.0004862936721231371, + "loss": 0.9185, + "step": 11725 + }, + { + "epoch": 2.87, + "learning_rate": 0.0004862631321768874, + "loss": 0.9517, + "step": 11750 + }, + { + "epoch": 2.87, + "learning_rate": 0.0004862325922306377, + "loss": 1.0051, + "step": 11775 + }, + { + "epoch": 2.88, + "learning_rate": 0.00048620205228438795, + "loss": 0.9333, + "step": 11800 + }, + { + "epoch": 2.89, + "learning_rate": 0.00048617151233813825, + "loss": 0.9508, + "step": 11825 + }, + { + "epoch": 2.89, + "learning_rate": 0.0004861409723918886, + "loss": 0.9726, + "step": 11850 + }, + { + "epoch": 2.9, + "learning_rate": 0.0004861104324456389, + "loss": 0.9376, + "step": 11875 + }, + { + "epoch": 2.9, + "learning_rate": 0.0004860798924993892, + "loss": 0.9773, + "step": 11900 + }, + { + "epoch": 2.91, + "learning_rate": 0.0004860493525531395, + "loss": 0.9483, + "step": 11925 + }, + { + "epoch": 2.92, + "learning_rate": 0.0004860188126068898, + "loss": 0.9744, + "step": 11950 + }, + { + "epoch": 2.92, + "learning_rate": 0.00048598827266064013, + "loss": 0.9449, + "step": 11975 + }, + { + "epoch": 2.93, + "learning_rate": 0.00048595773271439043, + "loss": 0.9244, + "step": 12000 + }, + { + "epoch": 2.93, + "eval_cer": 0.21655390491052637, + "eval_loss": 0.6589547991752625, + "eval_runtime": 149.4696, + "eval_samples_per_second": 28.053, + "eval_steps_per_second": 7.018, + "eval_wer": 0.7743882544861338, + "step": 12000 + }, + { + "epoch": 2.93, + "learning_rate": 0.00048592719276814074, + "loss": 0.9488, + "step": 12025 + }, + { + "epoch": 2.94, + "learning_rate": 0.00048589665282189104, + "loss": 0.9111, + "step": 12050 + }, + { + "epoch": 2.95, + "learning_rate": 0.00048586611287564134, + "loss": 0.9263, + "step": 12075 + }, + { + "epoch": 2.95, + "learning_rate": 0.0004858355729293917, + "loss": 0.8932, + "step": 12100 + }, + { + "epoch": 2.96, + "learning_rate": 0.00048580503298314195, + "loss": 0.9376, + "step": 12125 + }, + { + "epoch": 2.96, + "learning_rate": 0.00048577449303689225, + "loss": 0.9569, + "step": 12150 + }, + { + "epoch": 2.97, + "learning_rate": 0.00048574395309064256, + "loss": 0.9335, + "step": 12175 + }, + { + "epoch": 2.98, + "learning_rate": 0.00048571341314439286, + "loss": 0.9099, + "step": 12200 + }, + { + "epoch": 2.98, + "learning_rate": 0.0004856828731981432, + "loss": 0.9444, + "step": 12225 + }, + { + "epoch": 2.99, + "learning_rate": 0.0004856523332518935, + "loss": 0.9528, + "step": 12250 + }, + { + "epoch": 3.0, + "learning_rate": 0.00048562179330564377, + "loss": 0.9481, + "step": 12275 + }, + { + "epoch": 3.0, + "learning_rate": 0.00048559125335939407, + "loss": 0.9301, + "step": 12300 + }, + { + "epoch": 3.01, + "learning_rate": 0.0004855607134131444, + "loss": 0.8993, + "step": 12325 + }, + { + "epoch": 3.01, + "learning_rate": 0.00048553017346689473, + "loss": 0.905, + "step": 12350 + }, + { + "epoch": 3.02, + "learning_rate": 0.00048549963352064504, + "loss": 0.9204, + "step": 12375 + }, + { + "epoch": 3.03, + "learning_rate": 0.00048546909357439534, + "loss": 0.9196, + "step": 12400 + }, + { + "epoch": 3.03, + "learning_rate": 0.00048543855362814564, + "loss": 0.9102, + "step": 12425 + }, + { + "epoch": 3.04, + "learning_rate": 0.0004854080136818959, + "loss": 0.9034, + "step": 12450 + }, + { + "epoch": 3.04, + "learning_rate": 0.00048537747373564625, + "loss": 0.8883, + "step": 12475 + }, + { + "epoch": 3.05, + "learning_rate": 0.00048534693378939655, + "loss": 0.9224, + "step": 12500 + }, + { + "epoch": 3.05, + "eval_cer": 0.2035255587610238, + "eval_loss": 0.6522818207740784, + "eval_runtime": 150.425, + "eval_samples_per_second": 27.874, + "eval_steps_per_second": 6.974, + "eval_wer": 0.7476672104404568, + "step": 12500 + }, + { + "epoch": 3.06, + "learning_rate": 0.00048531639384314686, + "loss": 0.9002, + "step": 12525 + }, + { + "epoch": 3.06, + "learning_rate": 0.00048528585389689716, + "loss": 0.9254, + "step": 12550 + }, + { + "epoch": 3.07, + "learning_rate": 0.00048525531395064746, + "loss": 0.9498, + "step": 12575 + }, + { + "epoch": 3.07, + "learning_rate": 0.00048522477400439777, + "loss": 0.9027, + "step": 12600 + }, + { + "epoch": 3.08, + "learning_rate": 0.00048519423405814807, + "loss": 0.9143, + "step": 12625 + }, + { + "epoch": 3.09, + "learning_rate": 0.0004851636941118984, + "loss": 0.9581, + "step": 12650 + }, + { + "epoch": 3.09, + "learning_rate": 0.0004851331541656487, + "loss": 0.9042, + "step": 12675 + }, + { + "epoch": 3.1, + "learning_rate": 0.000485102614219399, + "loss": 0.927, + "step": 12700 + }, + { + "epoch": 3.11, + "learning_rate": 0.00048507207427314934, + "loss": 0.9333, + "step": 12725 + }, + { + "epoch": 3.11, + "learning_rate": 0.0004850415343268996, + "loss": 0.8864, + "step": 12750 + }, + { + "epoch": 3.12, + "learning_rate": 0.0004850109943806499, + "loss": 0.9396, + "step": 12775 + }, + { + "epoch": 3.12, + "learning_rate": 0.0004849804544344002, + "loss": 0.9603, + "step": 12800 + }, + { + "epoch": 3.13, + "learning_rate": 0.0004849499144881505, + "loss": 0.9117, + "step": 12825 + }, + { + "epoch": 3.14, + "learning_rate": 0.0004849193745419008, + "loss": 0.9961, + "step": 12850 + }, + { + "epoch": 3.14, + "learning_rate": 0.00048488883459565116, + "loss": 0.9035, + "step": 12875 + }, + { + "epoch": 3.15, + "learning_rate": 0.00048485829464940146, + "loss": 0.8586, + "step": 12900 + }, + { + "epoch": 3.15, + "learning_rate": 0.0004848277547031517, + "loss": 0.9017, + "step": 12925 + }, + { + "epoch": 3.16, + "learning_rate": 0.000484797214756902, + "loss": 0.8265, + "step": 12950 + }, + { + "epoch": 3.17, + "learning_rate": 0.0004847666748106523, + "loss": 0.926, + "step": 12975 + }, + { + "epoch": 3.17, + "learning_rate": 0.0004847361348644027, + "loss": 0.9148, + "step": 13000 + }, + { + "epoch": 3.17, + "eval_cer": 0.20544028418015872, + "eval_loss": 0.6521516442298889, + "eval_runtime": 148.4584, + "eval_samples_per_second": 28.244, + "eval_steps_per_second": 7.066, + "eval_wer": 0.7506688417618271, + "step": 13000 + }, + { + "epoch": 3.18, + "learning_rate": 0.000484705594918153, + "loss": 0.885, + "step": 13025 + }, + { + "epoch": 3.18, + "learning_rate": 0.0004846750549719033, + "loss": 0.9175, + "step": 13050 + }, + { + "epoch": 3.19, + "learning_rate": 0.00048464451502565353, + "loss": 0.8873, + "step": 13075 + }, + { + "epoch": 3.2, + "learning_rate": 0.00048461397507940383, + "loss": 0.9484, + "step": 13100 + }, + { + "epoch": 3.2, + "learning_rate": 0.0004845834351331542, + "loss": 0.8753, + "step": 13125 + }, + { + "epoch": 3.21, + "learning_rate": 0.0004845528951869045, + "loss": 0.9427, + "step": 13150 + }, + { + "epoch": 3.21, + "learning_rate": 0.0004845223552406548, + "loss": 0.9135, + "step": 13175 + }, + { + "epoch": 3.22, + "learning_rate": 0.0004844918152944051, + "loss": 0.9313, + "step": 13200 + }, + { + "epoch": 3.23, + "learning_rate": 0.00048446127534815535, + "loss": 0.9239, + "step": 13225 + }, + { + "epoch": 3.23, + "learning_rate": 0.0004844307354019057, + "loss": 0.9113, + "step": 13250 + }, + { + "epoch": 3.24, + "learning_rate": 0.000484400195455656, + "loss": 0.8907, + "step": 13275 + }, + { + "epoch": 3.25, + "learning_rate": 0.0004843696555094063, + "loss": 0.9199, + "step": 13300 + }, + { + "epoch": 3.25, + "learning_rate": 0.0004843391155631566, + "loss": 0.9231, + "step": 13325 + }, + { + "epoch": 3.26, + "learning_rate": 0.0004843085756169069, + "loss": 0.9079, + "step": 13350 + }, + { + "epoch": 3.26, + "learning_rate": 0.0004842780356706572, + "loss": 0.8949, + "step": 13375 + }, + { + "epoch": 3.27, + "learning_rate": 0.00048424749572440753, + "loss": 0.9139, + "step": 13400 + }, + { + "epoch": 3.28, + "learning_rate": 0.00048421695577815783, + "loss": 0.9003, + "step": 13425 + }, + { + "epoch": 3.28, + "learning_rate": 0.00048418641583190813, + "loss": 0.9042, + "step": 13450 + }, + { + "epoch": 3.29, + "learning_rate": 0.00048415587588565844, + "loss": 0.9246, + "step": 13475 + }, + { + "epoch": 3.29, + "learning_rate": 0.0004841253359394088, + "loss": 0.9227, + "step": 13500 + }, + { + "epoch": 3.29, + "eval_cer": 0.20374629118199644, + "eval_loss": 0.6420453190803528, + "eval_runtime": 148.4286, + "eval_samples_per_second": 28.249, + "eval_steps_per_second": 7.067, + "eval_wer": 0.754094616639478, + "step": 13500 + }, + { + "epoch": 3.3, + "learning_rate": 0.0004840947959931591, + "loss": 0.9074, + "step": 13525 + }, + { + "epoch": 3.31, + "learning_rate": 0.00048406425604690935, + "loss": 0.8885, + "step": 13550 + }, + { + "epoch": 3.31, + "learning_rate": 0.00048403371610065965, + "loss": 0.9374, + "step": 13575 + }, + { + "epoch": 3.32, + "learning_rate": 0.00048400317615440995, + "loss": 0.9339, + "step": 13600 + }, + { + "epoch": 3.32, + "learning_rate": 0.0004839726362081603, + "loss": 0.8923, + "step": 13625 + }, + { + "epoch": 3.33, + "learning_rate": 0.0004839420962619106, + "loss": 0.9201, + "step": 13650 + }, + { + "epoch": 3.34, + "learning_rate": 0.0004839115563156609, + "loss": 0.9358, + "step": 13675 + }, + { + "epoch": 3.34, + "learning_rate": 0.00048388101636941117, + "loss": 0.9606, + "step": 13700 + }, + { + "epoch": 3.35, + "learning_rate": 0.0004838516980210115, + "loss": 0.894, + "step": 13725 + }, + { + "epoch": 3.36, + "learning_rate": 0.0004838211580747618, + "loss": 0.9257, + "step": 13750 + }, + { + "epoch": 3.36, + "learning_rate": 0.0004837906181285121, + "loss": 0.8742, + "step": 13775 + }, + { + "epoch": 3.37, + "learning_rate": 0.00048376007818226244, + "loss": 0.8619, + "step": 13800 + }, + { + "epoch": 3.37, + "learning_rate": 0.00048372953823601274, + "loss": 0.8761, + "step": 13825 + }, + { + "epoch": 3.38, + "learning_rate": 0.000483698998289763, + "loss": 0.9257, + "step": 13850 + }, + { + "epoch": 3.39, + "learning_rate": 0.0004836684583435133, + "loss": 0.9392, + "step": 13875 + }, + { + "epoch": 3.39, + "learning_rate": 0.0004836379183972636, + "loss": 0.9186, + "step": 13900 + }, + { + "epoch": 3.4, + "learning_rate": 0.00048360737845101396, + "loss": 0.9031, + "step": 13925 + }, + { + "epoch": 3.4, + "learning_rate": 0.00048357683850476426, + "loss": 0.8896, + "step": 13950 + }, + { + "epoch": 3.41, + "learning_rate": 0.00048354629855851456, + "loss": 0.9033, + "step": 13975 + }, + { + "epoch": 3.42, + "learning_rate": 0.00048351575861226487, + "loss": 0.8935, + "step": 14000 + }, + { + "epoch": 3.42, + "eval_cer": 0.2014260341057257, + "eval_loss": 0.6442487835884094, + "eval_runtime": 150.0535, + "eval_samples_per_second": 27.943, + "eval_steps_per_second": 6.991, + "eval_wer": 0.7415986949429038, + "step": 14000 + }, + { + "epoch": 3.42, + "learning_rate": 0.0004834852186660151, + "loss": 0.8764, + "step": 14025 + }, + { + "epoch": 3.43, + "learning_rate": 0.00048345467871976547, + "loss": 0.9076, + "step": 14050 + }, + { + "epoch": 3.43, + "learning_rate": 0.0004834241387735158, + "loss": 0.9242, + "step": 14075 + }, + { + "epoch": 3.44, + "learning_rate": 0.0004833935988272661, + "loss": 0.855, + "step": 14100 + }, + { + "epoch": 3.45, + "learning_rate": 0.0004833630588810164, + "loss": 0.9283, + "step": 14125 + }, + { + "epoch": 3.45, + "learning_rate": 0.0004833325189347667, + "loss": 0.9128, + "step": 14150 + }, + { + "epoch": 3.46, + "learning_rate": 0.000483301978988517, + "loss": 0.9126, + "step": 14175 + }, + { + "epoch": 3.47, + "learning_rate": 0.0004832714390422673, + "loss": 0.8883, + "step": 14200 + }, + { + "epoch": 3.47, + "learning_rate": 0.0004832408990960176, + "loss": 0.8974, + "step": 14225 + }, + { + "epoch": 3.48, + "learning_rate": 0.0004832103591497679, + "loss": 0.9776, + "step": 14250 + }, + { + "epoch": 3.48, + "learning_rate": 0.0004831798192035182, + "loss": 0.9265, + "step": 14275 + }, + { + "epoch": 3.49, + "learning_rate": 0.00048314927925726856, + "loss": 0.9559, + "step": 14300 + }, + { + "epoch": 3.5, + "learning_rate": 0.0004831187393110188, + "loss": 0.9448, + "step": 14325 + }, + { + "epoch": 3.5, + "learning_rate": 0.0004830881993647691, + "loss": 0.9357, + "step": 14350 + }, + { + "epoch": 3.51, + "learning_rate": 0.0004830576594185194, + "loss": 0.9283, + "step": 14375 + }, + { + "epoch": 3.51, + "learning_rate": 0.0004830271194722697, + "loss": 0.9365, + "step": 14400 + }, + { + "epoch": 3.52, + "learning_rate": 0.0004829965795260201, + "loss": 0.9369, + "step": 14425 + }, + { + "epoch": 3.53, + "learning_rate": 0.0004829660395797704, + "loss": 0.9185, + "step": 14450 + }, + { + "epoch": 3.53, + "learning_rate": 0.0004829354996335207, + "loss": 0.923, + "step": 14475 + }, + { + "epoch": 3.54, + "learning_rate": 0.00048290495968727093, + "loss": 0.9257, + "step": 14500 + }, + { + "epoch": 3.54, + "eval_cer": 0.1986027124421219, + "eval_loss": 0.6285128593444824, + "eval_runtime": 148.5155, + "eval_samples_per_second": 28.233, + "eval_steps_per_second": 7.063, + "eval_wer": 0.7263295269168026, + "step": 14500 + }, + { + "epoch": 3.54, + "learning_rate": 0.00048287441974102124, + "loss": 0.9144, + "step": 14525 + }, + { + "epoch": 3.55, + "learning_rate": 0.0004828438797947716, + "loss": 0.9176, + "step": 14550 + }, + { + "epoch": 3.56, + "learning_rate": 0.0004828133398485219, + "loss": 0.8861, + "step": 14575 + }, + { + "epoch": 3.56, + "learning_rate": 0.0004827827999022722, + "loss": 0.9533, + "step": 14600 + }, + { + "epoch": 3.57, + "learning_rate": 0.0004827522599560225, + "loss": 0.8651, + "step": 14625 + }, + { + "epoch": 3.57, + "learning_rate": 0.00048272172000977275, + "loss": 0.9017, + "step": 14650 + }, + { + "epoch": 3.58, + "learning_rate": 0.0004826911800635231, + "loss": 0.8858, + "step": 14675 + }, + { + "epoch": 3.59, + "learning_rate": 0.0004826606401172734, + "loss": 0.9246, + "step": 14700 + }, + { + "epoch": 3.59, + "learning_rate": 0.0004826301001710237, + "loss": 0.844, + "step": 14725 + }, + { + "epoch": 3.6, + "learning_rate": 0.000482599560224774, + "loss": 0.8826, + "step": 14750 + }, + { + "epoch": 3.61, + "learning_rate": 0.0004825690202785243, + "loss": 0.8788, + "step": 14775 + }, + { + "epoch": 3.61, + "learning_rate": 0.00048253848033227457, + "loss": 0.907, + "step": 14800 + }, + { + "epoch": 3.62, + "learning_rate": 0.00048250794038602493, + "loss": 0.9251, + "step": 14825 + }, + { + "epoch": 3.62, + "learning_rate": 0.00048247740043977523, + "loss": 0.8712, + "step": 14850 + }, + { + "epoch": 3.63, + "learning_rate": 0.00048244686049352554, + "loss": 0.9175, + "step": 14875 + }, + { + "epoch": 3.64, + "learning_rate": 0.00048241632054727584, + "loss": 0.9437, + "step": 14900 + }, + { + "epoch": 3.64, + "learning_rate": 0.00048238578060102614, + "loss": 0.9023, + "step": 14925 + }, + { + "epoch": 3.65, + "learning_rate": 0.0004823552406547765, + "loss": 0.9112, + "step": 14950 + }, + { + "epoch": 3.65, + "learning_rate": 0.00048232470070852675, + "loss": 0.8988, + "step": 14975 + }, + { + "epoch": 3.66, + "learning_rate": 0.00048229538236012706, + "loss": 0.9194, + "step": 15000 + }, + { + "epoch": 3.66, + "eval_cer": 0.19383386548668932, + "eval_loss": 0.6116518378257751, + "eval_runtime": 157.9954, + "eval_samples_per_second": 26.539, + "eval_steps_per_second": 6.639, + "eval_wer": 0.72, + "step": 15000 + }, + { + "epoch": 3.67, + "learning_rate": 0.00048226484241387736, + "loss": 0.8694, + "step": 15025 + }, + { + "epoch": 3.67, + "learning_rate": 0.00048223430246762766, + "loss": 0.9755, + "step": 15050 + }, + { + "epoch": 3.68, + "learning_rate": 0.00048220376252137797, + "loss": 0.9342, + "step": 15075 + }, + { + "epoch": 3.68, + "learning_rate": 0.0004821732225751283, + "loss": 0.9129, + "step": 15100 + }, + { + "epoch": 3.69, + "learning_rate": 0.0004821426826288786, + "loss": 0.9193, + "step": 15125 + }, + { + "epoch": 3.7, + "learning_rate": 0.0004821121426826289, + "loss": 0.9264, + "step": 15150 + }, + { + "epoch": 3.7, + "learning_rate": 0.0004820816027363792, + "loss": 0.916, + "step": 15175 + }, + { + "epoch": 3.71, + "learning_rate": 0.0004820510627901295, + "loss": 0.968, + "step": 15200 + }, + { + "epoch": 3.72, + "learning_rate": 0.00048202052284387984, + "loss": 0.919, + "step": 15225 + }, + { + "epoch": 3.72, + "learning_rate": 0.00048198998289763014, + "loss": 0.8958, + "step": 15250 + }, + { + "epoch": 3.73, + "learning_rate": 0.0004819594429513804, + "loss": 0.881, + "step": 15275 + }, + { + "epoch": 3.73, + "learning_rate": 0.0004819289030051307, + "loss": 0.8499, + "step": 15300 + }, + { + "epoch": 3.74, + "learning_rate": 0.000481898363058881, + "loss": 0.8722, + "step": 15325 + }, + { + "epoch": 3.75, + "learning_rate": 0.00048186782311263136, + "loss": 0.9201, + "step": 15350 + }, + { + "epoch": 3.75, + "learning_rate": 0.00048183728316638166, + "loss": 0.9017, + "step": 15375 + }, + { + "epoch": 3.76, + "learning_rate": 0.00048180674322013196, + "loss": 0.8766, + "step": 15400 + }, + { + "epoch": 3.76, + "learning_rate": 0.00048177620327388227, + "loss": 0.8692, + "step": 15425 + }, + { + "epoch": 3.77, + "learning_rate": 0.0004817456633276325, + "loss": 0.8803, + "step": 15450 + }, + { + "epoch": 3.78, + "learning_rate": 0.0004817151233813828, + "loss": 0.8915, + "step": 15475 + }, + { + "epoch": 3.78, + "learning_rate": 0.0004816845834351332, + "loss": 0.9158, + "step": 15500 + }, + { + "epoch": 3.78, + "eval_cer": 0.19416753077420612, + "eval_loss": 0.6197028160095215, + "eval_runtime": 156.8998, + "eval_samples_per_second": 26.724, + "eval_steps_per_second": 6.686, + "eval_wer": 0.7233605220228385, + "step": 15500 + }, + { + "epoch": 3.79, + "learning_rate": 0.0004816540434888835, + "loss": 0.8998, + "step": 15525 + }, + { + "epoch": 3.79, + "learning_rate": 0.0004816235035426338, + "loss": 0.8904, + "step": 15550 + }, + { + "epoch": 3.8, + "learning_rate": 0.0004815929635963841, + "loss": 0.8888, + "step": 15575 + }, + { + "epoch": 3.81, + "learning_rate": 0.00048156242365013434, + "loss": 0.9235, + "step": 15600 + }, + { + "epoch": 3.81, + "learning_rate": 0.0004815318837038847, + "loss": 0.9225, + "step": 15625 + }, + { + "epoch": 3.82, + "learning_rate": 0.000481501343757635, + "loss": 0.955, + "step": 15650 + }, + { + "epoch": 3.83, + "learning_rate": 0.0004814708038113853, + "loss": 0.9162, + "step": 15675 + }, + { + "epoch": 3.83, + "learning_rate": 0.0004814402638651356, + "loss": 0.9626, + "step": 15700 + }, + { + "epoch": 3.84, + "learning_rate": 0.0004814097239188859, + "loss": 0.9149, + "step": 15725 + }, + { + "epoch": 3.84, + "learning_rate": 0.0004813791839726362, + "loss": 0.9075, + "step": 15750 + }, + { + "epoch": 3.85, + "learning_rate": 0.0004813486440263865, + "loss": 0.9157, + "step": 15775 + }, + { + "epoch": 3.86, + "learning_rate": 0.0004813181040801368, + "loss": 0.9607, + "step": 15800 + }, + { + "epoch": 3.86, + "learning_rate": 0.0004812875641338871, + "loss": 0.9188, + "step": 15825 + }, + { + "epoch": 3.87, + "learning_rate": 0.0004812570241876374, + "loss": 0.9023, + "step": 15850 + }, + { + "epoch": 3.87, + "learning_rate": 0.0004812264842413878, + "loss": 0.8976, + "step": 15875 + }, + { + "epoch": 3.88, + "learning_rate": 0.0004811959442951381, + "loss": 0.9066, + "step": 15900 + }, + { + "epoch": 3.89, + "learning_rate": 0.00048116540434888833, + "loss": 0.869, + "step": 15925 + }, + { + "epoch": 3.89, + "learning_rate": 0.00048113486440263864, + "loss": 0.8878, + "step": 15950 + }, + { + "epoch": 3.9, + "learning_rate": 0.00048110432445638894, + "loss": 0.887, + "step": 15975 + }, + { + "epoch": 3.9, + "learning_rate": 0.0004810737845101393, + "loss": 0.9079, + "step": 16000 + }, + { + "epoch": 3.9, + "eval_cer": 0.19389546523207704, + "eval_loss": 0.6110395789146423, + "eval_runtime": 159.6702, + "eval_samples_per_second": 26.26, + "eval_steps_per_second": 6.57, + "eval_wer": 0.7186623164763458, + "step": 16000 + }, + { + "epoch": 3.91, + "learning_rate": 0.0004810432445638896, + "loss": 0.8978, + "step": 16025 + }, + { + "epoch": 3.92, + "learning_rate": 0.0004810127046176399, + "loss": 0.9334, + "step": 16050 + }, + { + "epoch": 3.92, + "learning_rate": 0.00048098216467139015, + "loss": 0.9075, + "step": 16075 + }, + { + "epoch": 3.93, + "learning_rate": 0.00048095162472514046, + "loss": 0.9095, + "step": 16100 + }, + { + "epoch": 3.93, + "learning_rate": 0.0004809210847788908, + "loss": 0.8562, + "step": 16125 + }, + { + "epoch": 3.94, + "learning_rate": 0.0004808905448326411, + "loss": 0.8754, + "step": 16150 + }, + { + "epoch": 3.95, + "learning_rate": 0.0004808600048863914, + "loss": 0.8995, + "step": 16175 + }, + { + "epoch": 3.95, + "learning_rate": 0.0004808294649401417, + "loss": 0.888, + "step": 16200 + }, + { + "epoch": 3.96, + "learning_rate": 0.000480798924993892, + "loss": 0.9029, + "step": 16225 + }, + { + "epoch": 3.97, + "learning_rate": 0.00048076838504764233, + "loss": 0.8989, + "step": 16250 + }, + { + "epoch": 3.97, + "learning_rate": 0.00048073784510139264, + "loss": 0.8953, + "step": 16275 + }, + { + "epoch": 3.98, + "learning_rate": 0.00048070730515514294, + "loss": 0.8848, + "step": 16300 + }, + { + "epoch": 3.98, + "learning_rate": 0.00048067676520889324, + "loss": 0.8959, + "step": 16325 + }, + { + "epoch": 3.99, + "learning_rate": 0.00048064622526264355, + "loss": 0.9037, + "step": 16350 + }, + { + "epoch": 4.0, + "learning_rate": 0.0004806156853163939, + "loss": 0.8861, + "step": 16375 + }, + { + "epoch": 4.0, + "learning_rate": 0.00048058514537014415, + "loss": 0.8714, + "step": 16400 + }, + { + "epoch": 4.01, + "learning_rate": 0.00048055460542389446, + "loss": 0.8466, + "step": 16425 + }, + { + "epoch": 4.01, + "learning_rate": 0.00048052406547764476, + "loss": 0.8683, + "step": 16450 + }, + { + "epoch": 4.02, + "learning_rate": 0.00048049352553139506, + "loss": 0.8804, + "step": 16475 + }, + { + "epoch": 4.03, + "learning_rate": 0.0004804629855851454, + "loss": 0.8748, + "step": 16500 + }, + { + "epoch": 4.03, + "eval_cer": 0.19239140478219358, + "eval_loss": 0.6182339191436768, + "eval_runtime": 155.8113, + "eval_samples_per_second": 26.911, + "eval_steps_per_second": 6.733, + "eval_wer": 0.7095595432300164, + "step": 16500 + }, + { + "epoch": 4.03, + "learning_rate": 0.0004804324456388957, + "loss": 0.8761, + "step": 16525 + }, + { + "epoch": 4.04, + "learning_rate": 0.00048040190569264597, + "loss": 0.8836, + "step": 16550 + }, + { + "epoch": 4.04, + "learning_rate": 0.0004803713657463963, + "loss": 0.8432, + "step": 16575 + }, + { + "epoch": 4.05, + "learning_rate": 0.0004803408258001466, + "loss": 0.8815, + "step": 16600 + }, + { + "epoch": 4.06, + "learning_rate": 0.00048031028585389694, + "loss": 0.8588, + "step": 16625 + }, + { + "epoch": 4.06, + "learning_rate": 0.00048027974590764724, + "loss": 0.8693, + "step": 16650 + }, + { + "epoch": 4.07, + "learning_rate": 0.00048024920596139754, + "loss": 0.8591, + "step": 16675 + }, + { + "epoch": 4.08, + "learning_rate": 0.0004802186660151478, + "loss": 0.826, + "step": 16700 + }, + { + "epoch": 4.08, + "learning_rate": 0.0004801881260688981, + "loss": 0.8454, + "step": 16725 + }, + { + "epoch": 4.09, + "learning_rate": 0.00048015758612264845, + "loss": 0.8355, + "step": 16750 + }, + { + "epoch": 4.09, + "learning_rate": 0.00048012704617639876, + "loss": 0.8605, + "step": 16775 + }, + { + "epoch": 4.1, + "learning_rate": 0.00048009650623014906, + "loss": 0.8632, + "step": 16800 + }, + { + "epoch": 4.11, + "learning_rate": 0.00048006596628389936, + "loss": 0.8736, + "step": 16825 + }, + { + "epoch": 4.11, + "learning_rate": 0.00048003542633764967, + "loss": 0.8854, + "step": 16850 + }, + { + "epoch": 4.12, + "learning_rate": 0.0004800048863913999, + "loss": 0.8112, + "step": 16875 + }, + { + "epoch": 4.12, + "learning_rate": 0.0004799743464451503, + "loss": 0.9039, + "step": 16900 + }, + { + "epoch": 4.13, + "learning_rate": 0.0004799438064989006, + "loss": 0.8413, + "step": 16925 + }, + { + "epoch": 4.14, + "learning_rate": 0.0004799132665526509, + "loss": 0.893, + "step": 16950 + }, + { + "epoch": 4.14, + "learning_rate": 0.0004798827266064012, + "loss": 0.8393, + "step": 16975 + }, + { + "epoch": 4.15, + "learning_rate": 0.0004798521866601515, + "loss": 0.8646, + "step": 17000 + }, + { + "epoch": 4.15, + "eval_cer": 0.1894038171308892, + "eval_loss": 0.610537588596344, + "eval_runtime": 151.6007, + "eval_samples_per_second": 27.658, + "eval_steps_per_second": 6.919, + "eval_wer": 0.7057096247960848, + "step": 17000 + }, + { + "epoch": 4.15, + "learning_rate": 0.0004798216467139018, + "loss": 0.8306, + "step": 17025 + }, + { + "epoch": 4.16, + "learning_rate": 0.0004797911067676521, + "loss": 0.8423, + "step": 17050 + }, + { + "epoch": 4.17, + "learning_rate": 0.0004797605668214024, + "loss": 0.8677, + "step": 17075 + }, + { + "epoch": 4.17, + "learning_rate": 0.0004797300268751527, + "loss": 0.881, + "step": 17100 + }, + { + "epoch": 4.18, + "learning_rate": 0.000479699486928903, + "loss": 0.8678, + "step": 17125 + }, + { + "epoch": 4.18, + "learning_rate": 0.00047966894698265336, + "loss": 0.8482, + "step": 17150 + }, + { + "epoch": 4.19, + "learning_rate": 0.0004796384070364036, + "loss": 0.8506, + "step": 17175 + }, + { + "epoch": 4.2, + "learning_rate": 0.0004796078670901539, + "loss": 0.865, + "step": 17200 + }, + { + "epoch": 4.2, + "learning_rate": 0.0004795773271439042, + "loss": 0.8473, + "step": 17225 + }, + { + "epoch": 4.21, + "learning_rate": 0.0004795467871976545, + "loss": 0.8935, + "step": 17250 + }, + { + "epoch": 4.22, + "learning_rate": 0.0004795162472514049, + "loss": 0.8363, + "step": 17275 + }, + { + "epoch": 4.22, + "learning_rate": 0.0004794857073051552, + "loss": 0.8998, + "step": 17300 + }, + { + "epoch": 4.23, + "learning_rate": 0.00047945516735890543, + "loss": 0.8064, + "step": 17325 + }, + { + "epoch": 4.23, + "learning_rate": 0.00047942462741265573, + "loss": 0.8821, + "step": 17350 + }, + { + "epoch": 4.24, + "learning_rate": 0.00047939408746640604, + "loss": 0.8698, + "step": 17375 + }, + { + "epoch": 4.25, + "learning_rate": 0.0004793635475201564, + "loss": 0.8981, + "step": 17400 + }, + { + "epoch": 4.25, + "learning_rate": 0.0004793330075739067, + "loss": 0.89, + "step": 17425 + }, + { + "epoch": 4.26, + "learning_rate": 0.000479302467627657, + "loss": 0.9013, + "step": 17450 + }, + { + "epoch": 4.26, + "learning_rate": 0.0004792719276814073, + "loss": 0.8582, + "step": 17475 + }, + { + "epoch": 4.27, + "learning_rate": 0.00047924138773515755, + "loss": 0.8455, + "step": 17500 + }, + { + "epoch": 4.27, + "eval_cer": 0.19123640955617383, + "eval_loss": 0.6235982775688171, + "eval_runtime": 151.4202, + "eval_samples_per_second": 27.691, + "eval_steps_per_second": 6.928, + "eval_wer": 0.7036215334420881, + "step": 17500 + }, + { + "epoch": 4.28, + "learning_rate": 0.0004792108477889079, + "loss": 0.8973, + "step": 17525 + }, + { + "epoch": 4.28, + "learning_rate": 0.0004791803078426582, + "loss": 0.9159, + "step": 17550 + }, + { + "epoch": 4.29, + "learning_rate": 0.0004791497678964085, + "loss": 0.891, + "step": 17575 + }, + { + "epoch": 4.29, + "learning_rate": 0.0004791192279501588, + "loss": 0.8436, + "step": 17600 + }, + { + "epoch": 4.3, + "learning_rate": 0.0004790886880039091, + "loss": 0.8194, + "step": 17625 + }, + { + "epoch": 4.31, + "learning_rate": 0.00047905814805765943, + "loss": 0.9107, + "step": 17650 + }, + { + "epoch": 4.31, + "learning_rate": 0.00047902760811140973, + "loss": 0.8197, + "step": 17675 + }, + { + "epoch": 4.32, + "learning_rate": 0.00047899706816516003, + "loss": 0.8804, + "step": 17700 + }, + { + "epoch": 4.33, + "learning_rate": 0.00047896652821891034, + "loss": 0.8347, + "step": 17725 + }, + { + "epoch": 4.33, + "learning_rate": 0.00047893598827266064, + "loss": 0.8829, + "step": 17750 + }, + { + "epoch": 4.34, + "learning_rate": 0.000478905448326411, + "loss": 0.8283, + "step": 17775 + }, + { + "epoch": 4.34, + "learning_rate": 0.00047887490838016125, + "loss": 0.9252, + "step": 17800 + }, + { + "epoch": 4.35, + "learning_rate": 0.00047884436843391155, + "loss": 0.8479, + "step": 17825 + }, + { + "epoch": 4.36, + "learning_rate": 0.00047881382848766185, + "loss": 0.8377, + "step": 17850 + }, + { + "epoch": 4.36, + "learning_rate": 0.00047878328854141216, + "loss": 0.839, + "step": 17875 + }, + { + "epoch": 4.37, + "learning_rate": 0.0004787527485951625, + "loss": 0.8441, + "step": 17900 + }, + { + "epoch": 4.37, + "learning_rate": 0.0004787222086489128, + "loss": 0.8075, + "step": 17925 + }, + { + "epoch": 4.38, + "learning_rate": 0.0004786916687026631, + "loss": 0.8223, + "step": 17950 + }, + { + "epoch": 4.39, + "learning_rate": 0.00047866112875641337, + "loss": 0.8505, + "step": 17975 + }, + { + "epoch": 4.39, + "learning_rate": 0.0004786305888101637, + "loss": 0.8922, + "step": 18000 + }, + { + "epoch": 4.39, + "eval_cer": 0.1920988059916019, + "eval_loss": 0.5946230888366699, + "eval_runtime": 153.06, + "eval_samples_per_second": 27.394, + "eval_steps_per_second": 6.854, + "eval_wer": 0.7341272430668841, + "step": 18000 + }, + { + "epoch": 4.4, + "learning_rate": 0.00047860004886391403, + "loss": 0.8649, + "step": 18025 + }, + { + "epoch": 4.4, + "learning_rate": 0.00047856950891766434, + "loss": 0.8993, + "step": 18050 + }, + { + "epoch": 4.41, + "learning_rate": 0.00047853896897141464, + "loss": 0.8717, + "step": 18075 + }, + { + "epoch": 4.42, + "learning_rate": 0.00047850842902516494, + "loss": 0.8664, + "step": 18100 + }, + { + "epoch": 4.42, + "learning_rate": 0.0004784778890789152, + "loss": 0.8581, + "step": 18125 + }, + { + "epoch": 4.43, + "learning_rate": 0.0004784473491326655, + "loss": 0.88, + "step": 18150 + }, + { + "epoch": 4.44, + "learning_rate": 0.00047841680918641585, + "loss": 0.882, + "step": 18175 + }, + { + "epoch": 4.44, + "learning_rate": 0.00047838626924016616, + "loss": 0.8509, + "step": 18200 + }, + { + "epoch": 4.45, + "learning_rate": 0.00047835572929391646, + "loss": 0.8531, + "step": 18225 + }, + { + "epoch": 4.45, + "learning_rate": 0.00047832518934766676, + "loss": 0.8309, + "step": 18250 + }, + { + "epoch": 4.46, + "learning_rate": 0.000478294649401417, + "loss": 0.8175, + "step": 18275 + }, + { + "epoch": 4.47, + "learning_rate": 0.00047826410945516737, + "loss": 0.8153, + "step": 18300 + }, + { + "epoch": 4.47, + "learning_rate": 0.00047823356950891767, + "loss": 0.8628, + "step": 18325 + }, + { + "epoch": 4.48, + "learning_rate": 0.000478203029562668, + "loss": 0.8184, + "step": 18350 + }, + { + "epoch": 4.48, + "learning_rate": 0.0004781724896164183, + "loss": 0.8636, + "step": 18375 + }, + { + "epoch": 4.49, + "learning_rate": 0.0004781419496701686, + "loss": 0.9017, + "step": 18400 + }, + { + "epoch": 4.5, + "learning_rate": 0.00047811140972391894, + "loss": 0.8521, + "step": 18425 + }, + { + "epoch": 4.5, + "learning_rate": 0.0004780808697776692, + "loss": 0.8823, + "step": 18450 + }, + { + "epoch": 4.51, + "learning_rate": 0.0004780503298314195, + "loss": 0.8743, + "step": 18475 + }, + { + "epoch": 4.51, + "learning_rate": 0.0004780197898851698, + "loss": 0.892, + "step": 18500 + }, + { + "epoch": 4.51, + "eval_cer": 0.1869244273790335, + "eval_loss": 0.5911566615104675, + "eval_runtime": 154.1004, + "eval_samples_per_second": 27.21, + "eval_steps_per_second": 6.807, + "eval_wer": 0.7141924959216965, + "step": 18500 + }, + { + "epoch": 4.52, + "learning_rate": 0.0004779892499389201, + "loss": 0.819, + "step": 18525 + }, + { + "epoch": 4.53, + "learning_rate": 0.00047795870999267046, + "loss": 0.8848, + "step": 18550 + }, + { + "epoch": 4.53, + "learning_rate": 0.00047792817004642076, + "loss": 0.866, + "step": 18575 + }, + { + "epoch": 4.54, + "learning_rate": 0.000477897630100171, + "loss": 0.8542, + "step": 18600 + }, + { + "epoch": 4.54, + "learning_rate": 0.0004778670901539213, + "loss": 0.8467, + "step": 18625 + }, + { + "epoch": 4.55, + "learning_rate": 0.0004778365502076716, + "loss": 0.8299, + "step": 18650 + }, + { + "epoch": 4.56, + "learning_rate": 0.000477806010261422, + "loss": 0.8438, + "step": 18675 + }, + { + "epoch": 4.56, + "learning_rate": 0.0004777754703151723, + "loss": 0.9114, + "step": 18700 + }, + { + "epoch": 4.57, + "learning_rate": 0.0004777449303689226, + "loss": 0.8342, + "step": 18725 + }, + { + "epoch": 4.58, + "learning_rate": 0.00047771561202052283, + "loss": 0.8113, + "step": 18750 + }, + { + "epoch": 4.58, + "learning_rate": 0.00047768507207427314, + "loss": 0.8987, + "step": 18775 + }, + { + "epoch": 4.59, + "learning_rate": 0.00047765453212802344, + "loss": 0.9497, + "step": 18800 + }, + { + "epoch": 4.59, + "learning_rate": 0.0004776239921817738, + "loss": 0.8582, + "step": 18825 + }, + { + "epoch": 4.6, + "learning_rate": 0.0004775934522355241, + "loss": 0.8603, + "step": 18850 + }, + { + "epoch": 4.61, + "learning_rate": 0.0004775629122892744, + "loss": 0.8849, + "step": 18875 + }, + { + "epoch": 4.61, + "learning_rate": 0.0004775323723430247, + "loss": 0.7985, + "step": 18900 + }, + { + "epoch": 4.62, + "learning_rate": 0.00047750183239677496, + "loss": 0.8452, + "step": 18925 + }, + { + "epoch": 4.62, + "learning_rate": 0.00047747129245052526, + "loss": 0.8839, + "step": 18950 + }, + { + "epoch": 4.63, + "learning_rate": 0.0004774407525042756, + "loss": 0.875, + "step": 18975 + }, + { + "epoch": 4.64, + "learning_rate": 0.0004774102125580259, + "loss": 0.8652, + "step": 19000 + }, + { + "epoch": 4.64, + "eval_cer": 0.18706816011827151, + "eval_loss": 0.6004529595375061, + "eval_runtime": 153.7951, + "eval_samples_per_second": 27.264, + "eval_steps_per_second": 6.821, + "eval_wer": 0.6966068515497553, + "step": 19000 + }, + { + "epoch": 4.64, + "learning_rate": 0.0004773796726117762, + "loss": 0.8351, + "step": 19025 + }, + { + "epoch": 4.65, + "learning_rate": 0.0004773491326655265, + "loss": 0.8282, + "step": 19050 + }, + { + "epoch": 4.65, + "learning_rate": 0.0004773185927192768, + "loss": 0.8422, + "step": 19075 + }, + { + "epoch": 4.66, + "learning_rate": 0.00047728805277302713, + "loss": 0.8612, + "step": 19100 + }, + { + "epoch": 4.67, + "learning_rate": 0.00047725751282677744, + "loss": 0.843, + "step": 19125 + }, + { + "epoch": 4.67, + "learning_rate": 0.00047722697288052774, + "loss": 0.8185, + "step": 19150 + }, + { + "epoch": 4.68, + "learning_rate": 0.00047719643293427804, + "loss": 0.8069, + "step": 19175 + }, + { + "epoch": 4.69, + "learning_rate": 0.00047716589298802835, + "loss": 0.8473, + "step": 19200 + }, + { + "epoch": 4.69, + "learning_rate": 0.00047713535304177865, + "loss": 0.8486, + "step": 19225 + }, + { + "epoch": 4.7, + "learning_rate": 0.00047710481309552895, + "loss": 0.8625, + "step": 19250 + }, + { + "epoch": 4.7, + "learning_rate": 0.00047707427314927926, + "loss": 0.8526, + "step": 19275 + }, + { + "epoch": 4.71, + "learning_rate": 0.00047704373320302956, + "loss": 0.8784, + "step": 19300 + }, + { + "epoch": 4.72, + "learning_rate": 0.00047701319325677986, + "loss": 0.8541, + "step": 19325 + }, + { + "epoch": 4.72, + "learning_rate": 0.0004769826533105302, + "loss": 0.8885, + "step": 19350 + }, + { + "epoch": 4.73, + "learning_rate": 0.0004769521133642805, + "loss": 0.8381, + "step": 19375 + }, + { + "epoch": 4.73, + "learning_rate": 0.0004769215734180308, + "loss": 0.8414, + "step": 19400 + }, + { + "epoch": 4.74, + "learning_rate": 0.0004768910334717811, + "loss": 0.8571, + "step": 19425 + }, + { + "epoch": 4.75, + "learning_rate": 0.0004768604935255314, + "loss": 0.8505, + "step": 19450 + }, + { + "epoch": 4.75, + "learning_rate": 0.00047682995357928174, + "loss": 0.8485, + "step": 19475 + }, + { + "epoch": 4.76, + "learning_rate": 0.00047679941363303204, + "loss": 0.899, + "step": 19500 + }, + { + "epoch": 4.76, + "eval_cer": 0.18276131125324682, + "eval_loss": 0.5773286819458008, + "eval_runtime": 154.5433, + "eval_samples_per_second": 27.132, + "eval_steps_per_second": 6.788, + "eval_wer": 0.6981402936378467, + "step": 19500 + }, + { + "epoch": 4.76, + "learning_rate": 0.00047676887368678234, + "loss": 0.8769, + "step": 19525 + }, + { + "epoch": 4.77, + "learning_rate": 0.0004767383337405326, + "loss": 0.9001, + "step": 19550 + }, + { + "epoch": 4.78, + "learning_rate": 0.0004767077937942829, + "loss": 0.8733, + "step": 19575 + }, + { + "epoch": 4.78, + "learning_rate": 0.00047667725384803325, + "loss": 0.8425, + "step": 19600 + }, + { + "epoch": 4.79, + "learning_rate": 0.00047664671390178356, + "loss": 0.8404, + "step": 19625 + }, + { + "epoch": 4.8, + "learning_rate": 0.00047661617395553386, + "loss": 0.8385, + "step": 19650 + }, + { + "epoch": 4.8, + "learning_rate": 0.00047658563400928416, + "loss": 0.8495, + "step": 19675 + }, + { + "epoch": 4.81, + "learning_rate": 0.0004765550940630344, + "loss": 0.8986, + "step": 19700 + }, + { + "epoch": 4.81, + "learning_rate": 0.00047652455411678477, + "loss": 0.847, + "step": 19725 + }, + { + "epoch": 4.82, + "learning_rate": 0.0004764940141705351, + "loss": 0.8786, + "step": 19750 + }, + { + "epoch": 4.83, + "learning_rate": 0.0004764634742242854, + "loss": 0.857, + "step": 19775 + }, + { + "epoch": 4.83, + "learning_rate": 0.0004764329342780357, + "loss": 0.8316, + "step": 19800 + }, + { + "epoch": 4.84, + "learning_rate": 0.000476402394331786, + "loss": 0.8361, + "step": 19825 + }, + { + "epoch": 4.84, + "learning_rate": 0.00047637185438553634, + "loss": 0.8672, + "step": 19850 + }, + { + "epoch": 4.85, + "learning_rate": 0.0004763413144392866, + "loss": 0.82, + "step": 19875 + }, + { + "epoch": 4.86, + "learning_rate": 0.0004763107744930369, + "loss": 0.9363, + "step": 19900 + }, + { + "epoch": 4.86, + "learning_rate": 0.0004762802345467872, + "loss": 0.8214, + "step": 19925 + }, + { + "epoch": 4.87, + "learning_rate": 0.0004762496946005375, + "loss": 0.8463, + "step": 19950 + }, + { + "epoch": 4.87, + "learning_rate": 0.00047621915465428786, + "loss": 0.8159, + "step": 19975 + }, + { + "epoch": 4.88, + "learning_rate": 0.00047618861470803816, + "loss": 0.8552, + "step": 20000 + }, + { + "epoch": 4.88, + "eval_cer": 0.18054372041928893, + "eval_loss": 0.5839799642562866, + "eval_runtime": 155.5746, + "eval_samples_per_second": 26.952, + "eval_steps_per_second": 6.743, + "eval_wer": 0.687536704730832, + "step": 20000 + }, + { + "epoch": 4.89, + "learning_rate": 0.0004761580747617884, + "loss": 0.8316, + "step": 20025 + }, + { + "epoch": 4.89, + "learning_rate": 0.0004761275348155387, + "loss": 0.8426, + "step": 20050 + }, + { + "epoch": 4.9, + "learning_rate": 0.000476096994869289, + "loss": 0.8167, + "step": 20075 + }, + { + "epoch": 4.9, + "learning_rate": 0.0004760664549230394, + "loss": 0.8331, + "step": 20100 + }, + { + "epoch": 4.91, + "learning_rate": 0.0004760359149767897, + "loss": 0.8494, + "step": 20125 + }, + { + "epoch": 4.92, + "learning_rate": 0.00047600537503054, + "loss": 0.8332, + "step": 20150 + }, + { + "epoch": 4.92, + "learning_rate": 0.00047597483508429023, + "loss": 0.8497, + "step": 20175 + }, + { + "epoch": 4.93, + "learning_rate": 0.00047594429513804054, + "loss": 0.8528, + "step": 20200 + }, + { + "epoch": 4.94, + "learning_rate": 0.00047591375519179084, + "loss": 0.8209, + "step": 20225 + }, + { + "epoch": 4.94, + "learning_rate": 0.0004758832152455412, + "loss": 0.8663, + "step": 20250 + }, + { + "epoch": 4.95, + "learning_rate": 0.0004758526752992915, + "loss": 0.8484, + "step": 20275 + }, + { + "epoch": 4.95, + "learning_rate": 0.0004758221353530418, + "loss": 0.9051, + "step": 20300 + }, + { + "epoch": 4.96, + "learning_rate": 0.0004757915954067921, + "loss": 0.8601, + "step": 20325 + }, + { + "epoch": 4.97, + "learning_rate": 0.00047576105546054236, + "loss": 0.8726, + "step": 20350 + }, + { + "epoch": 4.97, + "learning_rate": 0.0004757305155142927, + "loss": 0.8709, + "step": 20375 + }, + { + "epoch": 4.98, + "learning_rate": 0.000475699975568043, + "loss": 0.8691, + "step": 20400 + }, + { + "epoch": 4.98, + "learning_rate": 0.0004756694356217933, + "loss": 0.8425, + "step": 20425 + }, + { + "epoch": 4.99, + "learning_rate": 0.0004756388956755436, + "loss": 0.9021, + "step": 20450 + }, + { + "epoch": 5.0, + "learning_rate": 0.0004756083557292939, + "loss": 0.8877, + "step": 20475 + }, + { + "epoch": 5.0, + "learning_rate": 0.00047557781578304423, + "loss": 0.8581, + "step": 20500 + }, + { + "epoch": 5.0, + "eval_cer": 0.18998901471207252, + "eval_loss": 0.5940809845924377, + "eval_runtime": 154.3505, + "eval_samples_per_second": 27.165, + "eval_steps_per_second": 6.796, + "eval_wer": 0.7326916802610114, + "step": 20500 + }, + { + "epoch": 5.01, + "learning_rate": 0.00047554727583679453, + "loss": 0.8584, + "step": 20525 + }, + { + "epoch": 5.01, + "learning_rate": 0.00047551673589054484, + "loss": 0.8564, + "step": 20550 + }, + { + "epoch": 5.02, + "learning_rate": 0.00047548619594429514, + "loss": 0.7907, + "step": 20575 + }, + { + "epoch": 5.03, + "learning_rate": 0.00047545565599804544, + "loss": 0.7891, + "step": 20600 + }, + { + "epoch": 5.03, + "learning_rate": 0.0004754251160517958, + "loss": 0.7914, + "step": 20625 + }, + { + "epoch": 5.04, + "learning_rate": 0.00047539457610554605, + "loss": 0.8744, + "step": 20650 + }, + { + "epoch": 5.05, + "learning_rate": 0.00047536403615929635, + "loss": 0.813, + "step": 20675 + }, + { + "epoch": 5.05, + "learning_rate": 0.00047533349621304666, + "loss": 0.8361, + "step": 20700 + }, + { + "epoch": 5.06, + "learning_rate": 0.00047530295626679696, + "loss": 0.7998, + "step": 20725 + }, + { + "epoch": 5.06, + "learning_rate": 0.0004752724163205473, + "loss": 0.7892, + "step": 20750 + }, + { + "epoch": 5.07, + "learning_rate": 0.0004752418763742976, + "loss": 0.7928, + "step": 20775 + }, + { + "epoch": 5.08, + "learning_rate": 0.00047521133642804787, + "loss": 0.826, + "step": 20800 + }, + { + "epoch": 5.08, + "learning_rate": 0.00047518079648179817, + "loss": 0.8311, + "step": 20825 + }, + { + "epoch": 5.09, + "learning_rate": 0.0004751502565355485, + "loss": 0.8117, + "step": 20850 + }, + { + "epoch": 5.09, + "learning_rate": 0.00047511971658929883, + "loss": 0.8047, + "step": 20875 + }, + { + "epoch": 5.1, + "learning_rate": 0.00047508917664304914, + "loss": 0.7799, + "step": 20900 + }, + { + "epoch": 5.11, + "learning_rate": 0.00047505863669679944, + "loss": 0.8633, + "step": 20925 + }, + { + "epoch": 5.11, + "learning_rate": 0.00047502809675054974, + "loss": 0.817, + "step": 20950 + }, + { + "epoch": 5.12, + "learning_rate": 0.0004749975568043, + "loss": 0.782, + "step": 20975 + }, + { + "epoch": 5.12, + "learning_rate": 0.00047496701685805035, + "loss": 0.8571, + "step": 21000 + }, + { + "epoch": 5.12, + "eval_cer": 0.18460417030276274, + "eval_loss": 0.591896116733551, + "eval_runtime": 154.5066, + "eval_samples_per_second": 27.138, + "eval_steps_per_second": 6.789, + "eval_wer": 0.7048939641109299, + "step": 21000 + }, + { + "epoch": 5.13, + "learning_rate": 0.00047493647691180065, + "loss": 0.842, + "step": 21025 + }, + { + "epoch": 5.14, + "learning_rate": 0.00047490593696555096, + "loss": 0.8247, + "step": 21050 + }, + { + "epoch": 5.14, + "learning_rate": 0.00047487539701930126, + "loss": 0.7865, + "step": 21075 + }, + { + "epoch": 5.15, + "learning_rate": 0.00047484485707305156, + "loss": 0.8372, + "step": 21100 + }, + { + "epoch": 5.15, + "learning_rate": 0.00047481431712680187, + "loss": 0.8344, + "step": 21125 + }, + { + "epoch": 5.16, + "learning_rate": 0.00047478377718055217, + "loss": 0.8012, + "step": 21150 + }, + { + "epoch": 5.17, + "learning_rate": 0.0004747532372343025, + "loss": 0.8137, + "step": 21175 + }, + { + "epoch": 5.17, + "learning_rate": 0.0004747226972880528, + "loss": 0.8604, + "step": 21200 + }, + { + "epoch": 5.18, + "learning_rate": 0.0004746921573418031, + "loss": 0.8123, + "step": 21225 + }, + { + "epoch": 5.19, + "learning_rate": 0.00047466161739555344, + "loss": 0.7806, + "step": 21250 + }, + { + "epoch": 5.19, + "learning_rate": 0.0004746310774493037, + "loss": 0.8092, + "step": 21275 + }, + { + "epoch": 5.2, + "learning_rate": 0.000474600537503054, + "loss": 0.8068, + "step": 21300 + }, + { + "epoch": 5.2, + "learning_rate": 0.0004745699975568043, + "loss": 0.792, + "step": 21325 + }, + { + "epoch": 5.21, + "learning_rate": 0.0004745394576105546, + "loss": 0.7547, + "step": 21350 + }, + { + "epoch": 5.22, + "learning_rate": 0.00047450891766430495, + "loss": 0.8371, + "step": 21375 + }, + { + "epoch": 5.22, + "learning_rate": 0.00047447837771805526, + "loss": 0.819, + "step": 21400 + }, + { + "epoch": 5.23, + "learning_rate": 0.00047444783777180556, + "loss": 0.7873, + "step": 21425 + }, + { + "epoch": 5.23, + "learning_rate": 0.0004744172978255558, + "loss": 0.8598, + "step": 21450 + }, + { + "epoch": 5.24, + "learning_rate": 0.0004743867578793061, + "loss": 0.8331, + "step": 21475 + }, + { + "epoch": 5.25, + "learning_rate": 0.0004743562179330564, + "loss": 0.7979, + "step": 21500 + }, + { + "epoch": 5.25, + "eval_cer": 0.1748200774103467, + "eval_loss": 0.5703975558280945, + "eval_runtime": 154.9079, + "eval_samples_per_second": 27.068, + "eval_steps_per_second": 6.772, + "eval_wer": 0.6698205546492659, + "step": 21500 + }, + { + "epoch": 5.25, + "learning_rate": 0.0004743256779868068, + "loss": 0.83, + "step": 21525 + }, + { + "epoch": 5.26, + "learning_rate": 0.0004742951380405571, + "loss": 0.85, + "step": 21550 + }, + { + "epoch": 5.26, + "learning_rate": 0.0004742645980943074, + "loss": 0.8218, + "step": 21575 + }, + { + "epoch": 5.27, + "learning_rate": 0.00047423405814805763, + "loss": 0.8249, + "step": 21600 + }, + { + "epoch": 5.28, + "learning_rate": 0.00047420351820180793, + "loss": 0.8485, + "step": 21625 + }, + { + "epoch": 5.28, + "learning_rate": 0.0004741729782555583, + "loss": 0.8386, + "step": 21650 + }, + { + "epoch": 5.29, + "learning_rate": 0.0004741424383093086, + "loss": 0.797, + "step": 21675 + }, + { + "epoch": 5.3, + "learning_rate": 0.0004741118983630589, + "loss": 0.854, + "step": 21700 + }, + { + "epoch": 5.3, + "learning_rate": 0.0004740813584168092, + "loss": 0.7792, + "step": 21725 + }, + { + "epoch": 5.31, + "learning_rate": 0.00047405081847055945, + "loss": 0.804, + "step": 21750 + }, + { + "epoch": 5.31, + "learning_rate": 0.0004740202785243098, + "loss": 0.7898, + "step": 21775 + }, + { + "epoch": 5.32, + "learning_rate": 0.0004739897385780601, + "loss": 0.7937, + "step": 21800 + }, + { + "epoch": 5.33, + "learning_rate": 0.0004739591986318104, + "loss": 0.8173, + "step": 21825 + }, + { + "epoch": 5.33, + "learning_rate": 0.0004739286586855607, + "loss": 0.8347, + "step": 21850 + }, + { + "epoch": 5.34, + "learning_rate": 0.000473898118739311, + "loss": 0.8076, + "step": 21875 + }, + { + "epoch": 5.34, + "learning_rate": 0.0004738675787930614, + "loss": 0.8352, + "step": 21900 + }, + { + "epoch": 5.35, + "learning_rate": 0.00047383703884681163, + "loss": 0.8279, + "step": 21925 + }, + { + "epoch": 5.36, + "learning_rate": 0.00047380649890056193, + "loss": 0.784, + "step": 21950 + }, + { + "epoch": 5.36, + "learning_rate": 0.00047377595895431224, + "loss": 0.8001, + "step": 21975 + }, + { + "epoch": 5.37, + "learning_rate": 0.00047374541900806254, + "loss": 0.8348, + "step": 22000 + }, + { + "epoch": 5.37, + "eval_cer": 0.1788907939180518, + "eval_loss": 0.5868992805480957, + "eval_runtime": 154.2562, + "eval_samples_per_second": 27.182, + "eval_steps_per_second": 6.8, + "eval_wer": 0.6766068515497553, + "step": 22000 + }, + { + "epoch": 5.37, + "learning_rate": 0.0004737148790618129, + "loss": 0.8137, + "step": 22025 + }, + { + "epoch": 5.38, + "learning_rate": 0.0004736843391155632, + "loss": 0.8458, + "step": 22050 + }, + { + "epoch": 5.39, + "learning_rate": 0.00047365379916931345, + "loss": 0.8318, + "step": 22075 + }, + { + "epoch": 5.39, + "learning_rate": 0.00047362325922306375, + "loss": 0.8083, + "step": 22100 + }, + { + "epoch": 5.4, + "learning_rate": 0.00047359271927681406, + "loss": 0.7662, + "step": 22125 + }, + { + "epoch": 5.41, + "learning_rate": 0.0004735621793305644, + "loss": 0.8556, + "step": 22150 + }, + { + "epoch": 5.41, + "learning_rate": 0.0004735316393843147, + "loss": 0.8289, + "step": 22175 + }, + { + "epoch": 5.42, + "learning_rate": 0.000473501099438065, + "loss": 0.7828, + "step": 22200 + }, + { + "epoch": 5.42, + "learning_rate": 0.00047347055949181527, + "loss": 0.7481, + "step": 22225 + }, + { + "epoch": 5.43, + "learning_rate": 0.00047344001954556557, + "loss": 0.8216, + "step": 22250 + }, + { + "epoch": 5.44, + "learning_rate": 0.00047340947959931593, + "loss": 0.8051, + "step": 22275 + }, + { + "epoch": 5.44, + "learning_rate": 0.00047337893965306623, + "loss": 0.7921, + "step": 22300 + }, + { + "epoch": 5.45, + "learning_rate": 0.00047334839970681654, + "loss": 0.8073, + "step": 22325 + }, + { + "epoch": 5.45, + "learning_rate": 0.00047331785976056684, + "loss": 0.8664, + "step": 22350 + }, + { + "epoch": 5.46, + "learning_rate": 0.00047328731981431714, + "loss": 0.8147, + "step": 22375 + }, + { + "epoch": 5.47, + "learning_rate": 0.00047325677986806745, + "loss": 0.8146, + "step": 22400 + }, + { + "epoch": 5.47, + "learning_rate": 0.00047322623992181775, + "loss": 0.7966, + "step": 22425 + }, + { + "epoch": 5.48, + "learning_rate": 0.00047319569997556805, + "loss": 0.8359, + "step": 22450 + }, + { + "epoch": 5.48, + "learning_rate": 0.00047316516002931836, + "loss": 0.8292, + "step": 22475 + }, + { + "epoch": 5.49, + "learning_rate": 0.00047313462008306866, + "loss": 0.7843, + "step": 22500 + }, + { + "epoch": 5.49, + "eval_cer": 0.1750356765192037, + "eval_loss": 0.5732399821281433, + "eval_runtime": 154.5633, + "eval_samples_per_second": 27.128, + "eval_steps_per_second": 6.787, + "eval_wer": 0.6731810766721044, + "step": 22500 + }, + { + "epoch": 5.5, + "learning_rate": 0.000473104080136819, + "loss": 0.7897, + "step": 22525 + }, + { + "epoch": 5.5, + "learning_rate": 0.00047307354019056927, + "loss": 0.7618, + "step": 22550 + }, + { + "epoch": 5.51, + "learning_rate": 0.00047304300024431957, + "loss": 0.8309, + "step": 22575 + }, + { + "epoch": 5.51, + "learning_rate": 0.0004730124602980699, + "loss": 0.7635, + "step": 22600 + }, + { + "epoch": 5.52, + "learning_rate": 0.0004729819203518202, + "loss": 0.818, + "step": 22625 + }, + { + "epoch": 5.53, + "learning_rate": 0.00047295138040557053, + "loss": 0.8215, + "step": 22650 + }, + { + "epoch": 5.53, + "learning_rate": 0.00047292084045932084, + "loss": 0.8412, + "step": 22675 + }, + { + "epoch": 5.54, + "learning_rate": 0.0004728903005130711, + "loss": 0.7867, + "step": 22700 + }, + { + "epoch": 5.55, + "learning_rate": 0.0004728597605668214, + "loss": 0.7692, + "step": 22725 + }, + { + "epoch": 5.55, + "learning_rate": 0.0004728292206205717, + "loss": 0.8446, + "step": 22750 + }, + { + "epoch": 5.56, + "learning_rate": 0.00047279868067432205, + "loss": 0.8351, + "step": 22775 + }, + { + "epoch": 5.56, + "learning_rate": 0.00047276814072807235, + "loss": 0.7931, + "step": 22800 + }, + { + "epoch": 5.57, + "learning_rate": 0.00047273760078182266, + "loss": 0.862, + "step": 22825 + }, + { + "epoch": 5.58, + "learning_rate": 0.00047270706083557296, + "loss": 0.88, + "step": 22850 + }, + { + "epoch": 5.58, + "learning_rate": 0.0004726765208893232, + "loss": 0.785, + "step": 22875 + }, + { + "epoch": 5.59, + "learning_rate": 0.0004726459809430735, + "loss": 0.8098, + "step": 22900 + }, + { + "epoch": 5.59, + "learning_rate": 0.00047261544099682387, + "loss": 0.7932, + "step": 22925 + }, + { + "epoch": 5.6, + "learning_rate": 0.0004725849010505742, + "loss": 0.8176, + "step": 22950 + }, + { + "epoch": 5.61, + "learning_rate": 0.0004725543611043245, + "loss": 0.8033, + "step": 22975 + }, + { + "epoch": 5.61, + "learning_rate": 0.0004725250427559248, + "loss": 0.855, + "step": 23000 + }, + { + "epoch": 5.61, + "eval_cer": 0.1686601028715748, + "eval_loss": 0.5447995662689209, + "eval_runtime": 154.9215, + "eval_samples_per_second": 27.065, + "eval_steps_per_second": 6.771, + "eval_wer": 0.6520065252854812, + "step": 23000 + }, + { + "epoch": 5.62, + "learning_rate": 0.00047249450280967503, + "loss": 0.7908, + "step": 23025 + }, + { + "epoch": 5.62, + "learning_rate": 0.00047246396286342534, + "loss": 0.8381, + "step": 23050 + }, + { + "epoch": 5.63, + "learning_rate": 0.0004724334229171757, + "loss": 0.8155, + "step": 23075 + }, + { + "epoch": 5.64, + "learning_rate": 0.000472402882970926, + "loss": 0.8471, + "step": 23100 + }, + { + "epoch": 5.64, + "learning_rate": 0.0004723723430246763, + "loss": 0.8259, + "step": 23125 + }, + { + "epoch": 5.65, + "learning_rate": 0.0004723418030784266, + "loss": 0.8709, + "step": 23150 + }, + { + "epoch": 5.66, + "learning_rate": 0.00047231126313217685, + "loss": 0.7902, + "step": 23175 + }, + { + "epoch": 5.66, + "learning_rate": 0.0004722807231859272, + "loss": 0.8795, + "step": 23200 + }, + { + "epoch": 5.67, + "learning_rate": 0.0004722501832396775, + "loss": 0.8107, + "step": 23225 + }, + { + "epoch": 5.67, + "learning_rate": 0.0004722196432934278, + "loss": 0.7959, + "step": 23250 + }, + { + "epoch": 5.68, + "learning_rate": 0.0004721891033471781, + "loss": 0.7615, + "step": 23275 + }, + { + "epoch": 5.69, + "learning_rate": 0.0004721585634009284, + "loss": 0.8344, + "step": 23300 + }, + { + "epoch": 5.69, + "learning_rate": 0.0004721280234546788, + "loss": 0.8545, + "step": 23325 + }, + { + "epoch": 5.7, + "learning_rate": 0.00047209748350842903, + "loss": 0.8713, + "step": 23350 + }, + { + "epoch": 5.7, + "learning_rate": 0.00047206694356217933, + "loss": 0.7914, + "step": 23375 + }, + { + "epoch": 5.71, + "learning_rate": 0.00047203640361592964, + "loss": 0.8725, + "step": 23400 + }, + { + "epoch": 5.72, + "learning_rate": 0.00047200586366967994, + "loss": 0.834, + "step": 23425 + }, + { + "epoch": 5.72, + "learning_rate": 0.0004719753237234303, + "loss": 0.8515, + "step": 23450 + }, + { + "epoch": 5.73, + "learning_rate": 0.0004719447837771806, + "loss": 0.7854, + "step": 23475 + }, + { + "epoch": 5.73, + "learning_rate": 0.00047191424383093085, + "loss": 0.7774, + "step": 23500 + }, + { + "epoch": 5.73, + "eval_cer": 0.17590320626674744, + "eval_loss": 0.5685146450996399, + "eval_runtime": 150.6401, + "eval_samples_per_second": 27.835, + "eval_steps_per_second": 6.964, + "eval_wer": 0.6818270799347471, + "step": 23500 + }, + { + "epoch": 5.74, + "learning_rate": 0.00047188370388468115, + "loss": 0.8371, + "step": 23525 + }, + { + "epoch": 5.75, + "learning_rate": 0.00047185316393843146, + "loss": 0.7747, + "step": 23550 + }, + { + "epoch": 5.75, + "learning_rate": 0.00047182262399218176, + "loss": 0.801, + "step": 23575 + }, + { + "epoch": 5.76, + "learning_rate": 0.0004717920840459321, + "loss": 0.7689, + "step": 23600 + }, + { + "epoch": 5.77, + "learning_rate": 0.0004717615440996824, + "loss": 0.8017, + "step": 23625 + }, + { + "epoch": 5.77, + "learning_rate": 0.00047173100415343267, + "loss": 0.849, + "step": 23650 + }, + { + "epoch": 5.78, + "learning_rate": 0.000471700464207183, + "loss": 0.7922, + "step": 23675 + }, + { + "epoch": 5.78, + "learning_rate": 0.0004716699242609333, + "loss": 0.849, + "step": 23700 + }, + { + "epoch": 5.79, + "learning_rate": 0.00047163938431468364, + "loss": 0.8138, + "step": 23725 + }, + { + "epoch": 5.8, + "learning_rate": 0.00047160884436843394, + "loss": 0.8949, + "step": 23750 + }, + { + "epoch": 5.8, + "learning_rate": 0.00047157830442218424, + "loss": 0.8182, + "step": 23775 + }, + { + "epoch": 5.81, + "learning_rate": 0.00047154776447593455, + "loss": 0.8002, + "step": 23800 + }, + { + "epoch": 5.81, + "learning_rate": 0.0004715172245296848, + "loss": 0.825, + "step": 23825 + }, + { + "epoch": 5.82, + "learning_rate": 0.00047148668458343515, + "loss": 0.8962, + "step": 23850 + }, + { + "epoch": 5.83, + "learning_rate": 0.00047145614463718546, + "loss": 0.816, + "step": 23875 + }, + { + "epoch": 5.83, + "learning_rate": 0.00047142560469093576, + "loss": 0.7518, + "step": 23900 + }, + { + "epoch": 5.84, + "learning_rate": 0.00047139506474468606, + "loss": 0.812, + "step": 23925 + }, + { + "epoch": 5.84, + "learning_rate": 0.00047136452479843637, + "loss": 0.8034, + "step": 23950 + }, + { + "epoch": 5.85, + "learning_rate": 0.00047133398485218667, + "loss": 0.8022, + "step": 23975 + }, + { + "epoch": 5.86, + "learning_rate": 0.00047130344490593697, + "loss": 0.8622, + "step": 24000 + }, + { + "epoch": 5.86, + "eval_cer": 0.17418868002012258, + "eval_loss": 0.5598137378692627, + "eval_runtime": 151.7552, + "eval_samples_per_second": 27.63, + "eval_steps_per_second": 6.912, + "eval_wer": 0.6687438825448614, + "step": 24000 + }, + { + "epoch": 5.86, + "learning_rate": 0.0004712729049596873, + "loss": 0.8301, + "step": 24025 + }, + { + "epoch": 5.87, + "learning_rate": 0.0004712423650134376, + "loss": 0.7974, + "step": 24050 + }, + { + "epoch": 5.87, + "learning_rate": 0.0004712118250671879, + "loss": 0.788, + "step": 24075 + }, + { + "epoch": 5.88, + "learning_rate": 0.00047118128512093824, + "loss": 0.8011, + "step": 24100 + }, + { + "epoch": 5.89, + "learning_rate": 0.0004711507451746885, + "loss": 0.8189, + "step": 24125 + }, + { + "epoch": 5.89, + "learning_rate": 0.0004711202052284388, + "loss": 0.8521, + "step": 24150 + }, + { + "epoch": 5.9, + "learning_rate": 0.0004710896652821891, + "loss": 0.832, + "step": 24175 + }, + { + "epoch": 5.91, + "learning_rate": 0.0004710591253359394, + "loss": 0.8306, + "step": 24200 + }, + { + "epoch": 5.91, + "learning_rate": 0.00047102858538968976, + "loss": 0.8189, + "step": 24225 + }, + { + "epoch": 5.92, + "learning_rate": 0.00047099804544344006, + "loss": 0.8372, + "step": 24250 + }, + { + "epoch": 5.92, + "learning_rate": 0.0004709675054971903, + "loss": 0.8268, + "step": 24275 + }, + { + "epoch": 5.93, + "learning_rate": 0.0004709369655509406, + "loss": 0.8726, + "step": 24300 + }, + { + "epoch": 5.94, + "learning_rate": 0.0004709064256046909, + "loss": 0.816, + "step": 24325 + }, + { + "epoch": 5.94, + "learning_rate": 0.0004708758856584413, + "loss": 0.8516, + "step": 24350 + }, + { + "epoch": 5.95, + "learning_rate": 0.0004708453457121916, + "loss": 0.7799, + "step": 24375 + }, + { + "epoch": 5.95, + "learning_rate": 0.0004708148057659419, + "loss": 0.825, + "step": 24400 + }, + { + "epoch": 5.96, + "learning_rate": 0.0004707842658196922, + "loss": 0.767, + "step": 24425 + }, + { + "epoch": 5.97, + "learning_rate": 0.00047075372587344243, + "loss": 0.8352, + "step": 24450 + }, + { + "epoch": 5.97, + "learning_rate": 0.0004707231859271928, + "loss": 0.8106, + "step": 24475 + }, + { + "epoch": 5.98, + "learning_rate": 0.0004706926459809431, + "loss": 0.7968, + "step": 24500 + }, + { + "epoch": 5.98, + "eval_cer": 0.16986643121875097, + "eval_loss": 0.5589384436607361, + "eval_runtime": 150.8942, + "eval_samples_per_second": 27.788, + "eval_steps_per_second": 6.952, + "eval_wer": 0.657716150081566, + "step": 24500 + }, + { + "epoch": 5.98, + "learning_rate": 0.0004706621060346934, + "loss": 0.8186, + "step": 24525 + }, + { + "epoch": 5.99, + "learning_rate": 0.0004706315660884437, + "loss": 0.8581, + "step": 24550 + }, + { + "epoch": 6.0, + "learning_rate": 0.000470601026142194, + "loss": 0.7809, + "step": 24575 + }, + { + "epoch": 6.0, + "learning_rate": 0.0004705704861959443, + "loss": 0.8235, + "step": 24600 + }, + { + "epoch": 6.01, + "learning_rate": 0.0004705399462496946, + "loss": 0.8245, + "step": 24625 + }, + { + "epoch": 6.02, + "learning_rate": 0.0004705094063034449, + "loss": 0.8341, + "step": 24650 + }, + { + "epoch": 6.02, + "learning_rate": 0.0004704788663571952, + "loss": 0.7669, + "step": 24675 + }, + { + "epoch": 6.03, + "learning_rate": 0.0004704483264109455, + "loss": 0.775, + "step": 24700 + }, + { + "epoch": 6.03, + "learning_rate": 0.0004704177864646959, + "loss": 0.7697, + "step": 24725 + }, + { + "epoch": 6.04, + "learning_rate": 0.0004703872465184461, + "loss": 0.775, + "step": 24750 + }, + { + "epoch": 6.05, + "learning_rate": 0.00047035670657219643, + "loss": 0.7845, + "step": 24775 + }, + { + "epoch": 6.05, + "learning_rate": 0.00047032616662594673, + "loss": 0.8577, + "step": 24800 + }, + { + "epoch": 6.06, + "learning_rate": 0.00047029562667969704, + "loss": 0.7583, + "step": 24825 + }, + { + "epoch": 6.06, + "learning_rate": 0.0004702650867334474, + "loss": 0.777, + "step": 24850 + }, + { + "epoch": 6.07, + "learning_rate": 0.0004702345467871977, + "loss": 0.7411, + "step": 24875 + }, + { + "epoch": 6.08, + "learning_rate": 0.000470204006840948, + "loss": 0.7703, + "step": 24900 + }, + { + "epoch": 6.08, + "learning_rate": 0.00047017346689469825, + "loss": 0.7881, + "step": 24925 + }, + { + "epoch": 6.09, + "learning_rate": 0.00047014292694844855, + "loss": 0.7471, + "step": 24950 + }, + { + "epoch": 6.09, + "learning_rate": 0.00047011238700219886, + "loss": 0.8077, + "step": 24975 + }, + { + "epoch": 6.1, + "learning_rate": 0.0004700818470559492, + "loss": 0.8253, + "step": 25000 + }, + { + "epoch": 6.1, + "eval_cer": 0.16891676847735695, + "eval_loss": 0.5600982308387756, + "eval_runtime": 152.7105, + "eval_samples_per_second": 27.457, + "eval_steps_per_second": 6.869, + "eval_wer": 0.6617292006525285, + "step": 25000 + }, + { + "epoch": 6.11, + "learning_rate": 0.0004700513071096995, + "loss": 0.774, + "step": 25025 + }, + { + "epoch": 6.11, + "learning_rate": 0.0004700207671634498, + "loss": 0.7965, + "step": 25050 + }, + { + "epoch": 6.12, + "learning_rate": 0.00046999022721720007, + "loss": 0.7859, + "step": 25075 + }, + { + "epoch": 6.12, + "learning_rate": 0.0004699596872709504, + "loss": 0.7834, + "step": 25100 + }, + { + "epoch": 6.13, + "learning_rate": 0.00046992914732470073, + "loss": 0.7398, + "step": 25125 + }, + { + "epoch": 6.14, + "learning_rate": 0.00046989860737845103, + "loss": 0.8568, + "step": 25150 + }, + { + "epoch": 6.14, + "learning_rate": 0.00046986806743220134, + "loss": 0.783, + "step": 25175 + }, + { + "epoch": 6.15, + "learning_rate": 0.00046983752748595164, + "loss": 0.8308, + "step": 25200 + }, + { + "epoch": 6.16, + "learning_rate": 0.0004698069875397019, + "loss": 0.7543, + "step": 25225 + }, + { + "epoch": 6.16, + "learning_rate": 0.00046977644759345225, + "loss": 0.8413, + "step": 25250 + }, + { + "epoch": 6.17, + "learning_rate": 0.00046974590764720255, + "loss": 0.7851, + "step": 25275 + }, + { + "epoch": 6.17, + "learning_rate": 0.00046971536770095285, + "loss": 0.7815, + "step": 25300 + }, + { + "epoch": 6.18, + "learning_rate": 0.00046968482775470316, + "loss": 0.7607, + "step": 25325 + }, + { + "epoch": 6.19, + "learning_rate": 0.00046965428780845346, + "loss": 0.7827, + "step": 25350 + }, + { + "epoch": 6.19, + "learning_rate": 0.0004696237478622038, + "loss": 0.7891, + "step": 25375 + }, + { + "epoch": 6.2, + "learning_rate": 0.00046959320791595407, + "loss": 0.7708, + "step": 25400 + }, + { + "epoch": 6.2, + "learning_rate": 0.00046956266796970437, + "loss": 0.7806, + "step": 25425 + }, + { + "epoch": 6.21, + "learning_rate": 0.0004695321280234547, + "loss": 0.8272, + "step": 25450 + }, + { + "epoch": 6.22, + "learning_rate": 0.000469501588077205, + "loss": 0.7922, + "step": 25475 + }, + { + "epoch": 6.22, + "learning_rate": 0.00046947104813095534, + "loss": 0.7947, + "step": 25500 + }, + { + "epoch": 6.22, + "eval_cer": 0.16775663993922157, + "eval_loss": 0.5526652932167053, + "eval_runtime": 153.2005, + "eval_samples_per_second": 27.369, + "eval_steps_per_second": 6.847, + "eval_wer": 0.6471778140293638, + "step": 25500 + }, + { + "epoch": 6.23, + "learning_rate": 0.00046944050818470564, + "loss": 0.7896, + "step": 25525 + }, + { + "epoch": 6.23, + "learning_rate": 0.0004694099682384559, + "loss": 0.7802, + "step": 25550 + }, + { + "epoch": 6.24, + "learning_rate": 0.0004693806498900562, + "loss": 0.7681, + "step": 25575 + }, + { + "epoch": 6.25, + "learning_rate": 0.0004693501099438065, + "loss": 0.7726, + "step": 25600 + }, + { + "epoch": 6.25, + "learning_rate": 0.0004693207915954068, + "loss": 0.7731, + "step": 25625 + }, + { + "epoch": 6.26, + "learning_rate": 0.0004692902516491571, + "loss": 0.7475, + "step": 25650 + }, + { + "epoch": 6.27, + "learning_rate": 0.0004692597117029074, + "loss": 0.7772, + "step": 25675 + }, + { + "epoch": 6.27, + "learning_rate": 0.0004692291717566577, + "loss": 0.7563, + "step": 25700 + }, + { + "epoch": 6.28, + "learning_rate": 0.000469198631810408, + "loss": 0.7887, + "step": 25725 + }, + { + "epoch": 6.28, + "learning_rate": 0.0004691680918641583, + "loss": 0.8447, + "step": 25750 + }, + { + "epoch": 6.29, + "learning_rate": 0.0004691375519179086, + "loss": 0.7684, + "step": 25775 + }, + { + "epoch": 6.3, + "learning_rate": 0.00046910701197165893, + "loss": 0.8256, + "step": 25800 + }, + { + "epoch": 6.3, + "learning_rate": 0.0004690764720254093, + "loss": 0.7834, + "step": 25825 + }, + { + "epoch": 6.31, + "learning_rate": 0.0004690459320791596, + "loss": 0.7856, + "step": 25850 + }, + { + "epoch": 6.31, + "learning_rate": 0.00046901539213290984, + "loss": 0.7571, + "step": 25875 + }, + { + "epoch": 6.32, + "learning_rate": 0.00046898485218666014, + "loss": 0.8078, + "step": 25900 + }, + { + "epoch": 6.33, + "learning_rate": 0.00046895431224041044, + "loss": 0.7851, + "step": 25925 + }, + { + "epoch": 6.33, + "learning_rate": 0.0004689237722941608, + "loss": 0.8066, + "step": 25950 + }, + { + "epoch": 6.34, + "learning_rate": 0.0004688932323479111, + "loss": 0.7699, + "step": 25975 + }, + { + "epoch": 6.34, + "learning_rate": 0.0004688626924016614, + "loss": 0.8273, + "step": 26000 + }, + { + "epoch": 6.34, + "eval_cer": 0.17227908791310328, + "eval_loss": 0.5425549745559692, + "eval_runtime": 153.5111, + "eval_samples_per_second": 27.314, + "eval_steps_per_second": 6.833, + "eval_wer": 0.6673083197389886, + "step": 26000 + }, + { + "epoch": 6.35, + "learning_rate": 0.00046883215245541166, + "loss": 0.8126, + "step": 26025 + }, + { + "epoch": 6.36, + "learning_rate": 0.00046880161250916196, + "loss": 0.8578, + "step": 26050 + }, + { + "epoch": 6.36, + "learning_rate": 0.0004687710725629123, + "loss": 0.7734, + "step": 26075 + }, + { + "epoch": 6.37, + "learning_rate": 0.0004687405326166626, + "loss": 0.7617, + "step": 26100 + }, + { + "epoch": 6.38, + "learning_rate": 0.0004687099926704129, + "loss": 0.7766, + "step": 26125 + }, + { + "epoch": 6.38, + "learning_rate": 0.00046867945272416323, + "loss": 0.8196, + "step": 26150 + }, + { + "epoch": 6.39, + "learning_rate": 0.0004686489127779135, + "loss": 0.7303, + "step": 26175 + }, + { + "epoch": 6.39, + "learning_rate": 0.00046861837283166384, + "loss": 0.7622, + "step": 26200 + }, + { + "epoch": 6.4, + "learning_rate": 0.00046858783288541414, + "loss": 0.7714, + "step": 26225 + }, + { + "epoch": 6.41, + "learning_rate": 0.00046855729293916444, + "loss": 0.7608, + "step": 26250 + }, + { + "epoch": 6.41, + "learning_rate": 0.00046852675299291475, + "loss": 0.8122, + "step": 26275 + }, + { + "epoch": 6.42, + "learning_rate": 0.00046849621304666505, + "loss": 0.7717, + "step": 26300 + }, + { + "epoch": 6.42, + "learning_rate": 0.0004684656731004154, + "loss": 0.741, + "step": 26325 + }, + { + "epoch": 6.43, + "learning_rate": 0.00046843513315416566, + "loss": 0.7665, + "step": 26350 + }, + { + "epoch": 6.44, + "learning_rate": 0.00046840459320791596, + "loss": 0.81, + "step": 26375 + }, + { + "epoch": 6.44, + "learning_rate": 0.00046837405326166626, + "loss": 0.8025, + "step": 26400 + }, + { + "epoch": 6.45, + "learning_rate": 0.00046834351331541657, + "loss": 0.7949, + "step": 26425 + }, + { + "epoch": 6.45, + "learning_rate": 0.00046831297336916687, + "loss": 0.8085, + "step": 26450 + }, + { + "epoch": 6.46, + "learning_rate": 0.0004682824334229172, + "loss": 0.8072, + "step": 26475 + }, + { + "epoch": 6.47, + "learning_rate": 0.0004682518934766675, + "loss": 0.8085, + "step": 26500 + }, + { + "epoch": 6.47, + "eval_cer": 0.1681621715963574, + "eval_loss": 0.5464115142822266, + "eval_runtime": 151.2701, + "eval_samples_per_second": 27.719, + "eval_steps_per_second": 6.935, + "eval_wer": 0.6475693311582382, + "step": 26500 + }, + { + "epoch": 6.47, + "learning_rate": 0.0004682213535304178, + "loss": 0.7243, + "step": 26525 + }, + { + "epoch": 6.48, + "learning_rate": 0.0004681908135841681, + "loss": 0.8214, + "step": 26550 + }, + { + "epoch": 6.48, + "learning_rate": 0.0004681602736379184, + "loss": 0.7823, + "step": 26575 + }, + { + "epoch": 6.49, + "learning_rate": 0.00046812973369166874, + "loss": 0.7737, + "step": 26600 + }, + { + "epoch": 6.5, + "learning_rate": 0.00046809919374541905, + "loss": 0.7714, + "step": 26625 + }, + { + "epoch": 6.5, + "learning_rate": 0.0004680686537991693, + "loss": 0.7848, + "step": 26650 + }, + { + "epoch": 6.51, + "learning_rate": 0.0004680381138529196, + "loss": 0.8329, + "step": 26675 + }, + { + "epoch": 6.52, + "learning_rate": 0.0004680075739066699, + "loss": 0.802, + "step": 26700 + }, + { + "epoch": 6.52, + "learning_rate": 0.00046797703396042026, + "loss": 0.8132, + "step": 26725 + }, + { + "epoch": 6.53, + "learning_rate": 0.00046794649401417056, + "loss": 0.8287, + "step": 26750 + }, + { + "epoch": 6.53, + "learning_rate": 0.00046791595406792087, + "loss": 0.7784, + "step": 26775 + }, + { + "epoch": 6.54, + "learning_rate": 0.00046788541412167117, + "loss": 0.803, + "step": 26800 + }, + { + "epoch": 6.55, + "learning_rate": 0.0004678548741754214, + "loss": 0.7928, + "step": 26825 + }, + { + "epoch": 6.55, + "learning_rate": 0.0004678243342291718, + "loss": 0.8156, + "step": 26850 + }, + { + "epoch": 6.56, + "learning_rate": 0.0004677937942829221, + "loss": 0.7577, + "step": 26875 + }, + { + "epoch": 6.56, + "learning_rate": 0.0004677632543366724, + "loss": 0.7651, + "step": 26900 + }, + { + "epoch": 6.57, + "learning_rate": 0.0004677327143904227, + "loss": 0.7585, + "step": 26925 + }, + { + "epoch": 6.58, + "learning_rate": 0.000467702174444173, + "loss": 0.8167, + "step": 26950 + }, + { + "epoch": 6.58, + "learning_rate": 0.0004676716344979233, + "loss": 0.7781, + "step": 26975 + }, + { + "epoch": 6.59, + "learning_rate": 0.0004676410945516736, + "loss": 0.8164, + "step": 27000 + }, + { + "epoch": 6.59, + "eval_cer": 0.1653131833721754, + "eval_loss": 0.5459656715393066, + "eval_runtime": 153.5643, + "eval_samples_per_second": 27.305, + "eval_steps_per_second": 6.831, + "eval_wer": 0.6328548123980424, + "step": 27000 + }, + { + "epoch": 6.59, + "learning_rate": 0.0004676105546054239, + "loss": 0.7949, + "step": 27025 + }, + { + "epoch": 6.6, + "learning_rate": 0.0004675800146591742, + "loss": 0.7673, + "step": 27050 + }, + { + "epoch": 6.61, + "learning_rate": 0.0004675494747129245, + "loss": 0.7335, + "step": 27075 + }, + { + "epoch": 6.61, + "learning_rate": 0.00046751893476667486, + "loss": 0.8251, + "step": 27100 + }, + { + "epoch": 6.62, + "learning_rate": 0.0004674883948204251, + "loss": 0.7464, + "step": 27125 + }, + { + "epoch": 6.63, + "learning_rate": 0.0004674578548741754, + "loss": 0.8075, + "step": 27150 + }, + { + "epoch": 6.63, + "learning_rate": 0.0004674273149279257, + "loss": 0.7601, + "step": 27175 + }, + { + "epoch": 6.64, + "learning_rate": 0.000467396774981676, + "loss": 0.8107, + "step": 27200 + }, + { + "epoch": 6.64, + "learning_rate": 0.0004673662350354264, + "loss": 0.7774, + "step": 27225 + }, + { + "epoch": 6.65, + "learning_rate": 0.0004673356950891767, + "loss": 0.8015, + "step": 27250 + }, + { + "epoch": 6.66, + "learning_rate": 0.000467305155142927, + "loss": 0.7453, + "step": 27275 + }, + { + "epoch": 6.66, + "learning_rate": 0.00046727461519667724, + "loss": 0.8042, + "step": 27300 + }, + { + "epoch": 6.67, + "learning_rate": 0.00046724407525042754, + "loss": 0.7639, + "step": 27325 + }, + { + "epoch": 6.67, + "learning_rate": 0.0004672135353041779, + "loss": 0.7875, + "step": 27350 + }, + { + "epoch": 6.68, + "learning_rate": 0.0004671829953579282, + "loss": 0.7677, + "step": 27375 + }, + { + "epoch": 6.69, + "learning_rate": 0.0004671524554116785, + "loss": 0.8096, + "step": 27400 + }, + { + "epoch": 6.69, + "learning_rate": 0.0004671219154654288, + "loss": 0.7775, + "step": 27425 + }, + { + "epoch": 6.7, + "learning_rate": 0.00046709137551917906, + "loss": 0.8353, + "step": 27450 + }, + { + "epoch": 6.7, + "learning_rate": 0.0004670608355729294, + "loss": 0.8382, + "step": 27475 + }, + { + "epoch": 6.71, + "learning_rate": 0.0004670302956266797, + "loss": 0.755, + "step": 27500 + }, + { + "epoch": 6.71, + "eval_cer": 0.16939929981622742, + "eval_loss": 0.5419759154319763, + "eval_runtime": 152.9956, + "eval_samples_per_second": 27.406, + "eval_steps_per_second": 6.856, + "eval_wer": 0.6614355628058728, + "step": 27500 + }, + { + "epoch": 6.72, + "learning_rate": 0.00046699975568043, + "loss": 0.7685, + "step": 27525 + }, + { + "epoch": 6.72, + "learning_rate": 0.0004669692157341803, + "loss": 0.7839, + "step": 27550 + }, + { + "epoch": 6.73, + "learning_rate": 0.00046693867578793063, + "loss": 0.7775, + "step": 27575 + }, + { + "epoch": 6.73, + "learning_rate": 0.0004669081358416809, + "loss": 0.8121, + "step": 27600 + }, + { + "epoch": 6.74, + "learning_rate": 0.00046687759589543123, + "loss": 0.765, + "step": 27625 + }, + { + "epoch": 6.75, + "learning_rate": 0.00046684705594918154, + "loss": 0.8056, + "step": 27650 + }, + { + "epoch": 6.75, + "learning_rate": 0.00046681651600293184, + "loss": 0.733, + "step": 27675 + }, + { + "epoch": 6.76, + "learning_rate": 0.00046678597605668214, + "loss": 0.8103, + "step": 27700 + }, + { + "epoch": 6.77, + "learning_rate": 0.00046675543611043245, + "loss": 0.7478, + "step": 27725 + }, + { + "epoch": 6.77, + "learning_rate": 0.0004667248961641828, + "loss": 0.7973, + "step": 27750 + }, + { + "epoch": 6.78, + "learning_rate": 0.00046669435621793305, + "loss": 0.7877, + "step": 27775 + }, + { + "epoch": 6.78, + "learning_rate": 0.00046666381627168336, + "loss": 0.8024, + "step": 27800 + }, + { + "epoch": 6.79, + "learning_rate": 0.00046663327632543366, + "loss": 0.7701, + "step": 27825 + }, + { + "epoch": 6.8, + "learning_rate": 0.00046660273637918396, + "loss": 0.8046, + "step": 27850 + }, + { + "epoch": 6.8, + "learning_rate": 0.0004665721964329343, + "loss": 0.7917, + "step": 27875 + }, + { + "epoch": 6.81, + "learning_rate": 0.0004665416564866846, + "loss": 0.8223, + "step": 27900 + }, + { + "epoch": 6.81, + "learning_rate": 0.0004665111165404349, + "loss": 0.7697, + "step": 27925 + }, + { + "epoch": 6.82, + "learning_rate": 0.0004664805765941852, + "loss": 0.8104, + "step": 27950 + }, + { + "epoch": 6.83, + "learning_rate": 0.0004664500366479355, + "loss": 0.7723, + "step": 27975 + }, + { + "epoch": 6.83, + "learning_rate": 0.00046641949670168584, + "loss": 0.822, + "step": 28000 + }, + { + "epoch": 6.83, + "eval_cer": 0.1698561645945197, + "eval_loss": 0.5540247559547424, + "eval_runtime": 153.0638, + "eval_samples_per_second": 27.394, + "eval_steps_per_second": 6.853, + "eval_wer": 0.6492985318107667, + "step": 28000 + }, + { + "epoch": 6.84, + "learning_rate": 0.00046638895675543614, + "loss": 0.7624, + "step": 28025 + }, + { + "epoch": 6.84, + "learning_rate": 0.00046635841680918645, + "loss": 0.8005, + "step": 28050 + }, + { + "epoch": 6.85, + "learning_rate": 0.0004663278768629367, + "loss": 0.7542, + "step": 28075 + }, + { + "epoch": 6.86, + "learning_rate": 0.000466297336916687, + "loss": 0.8048, + "step": 28100 + }, + { + "epoch": 6.86, + "learning_rate": 0.00046626679697043736, + "loss": 0.7846, + "step": 28125 + }, + { + "epoch": 6.87, + "learning_rate": 0.00046623625702418766, + "loss": 0.7999, + "step": 28150 + }, + { + "epoch": 6.88, + "learning_rate": 0.00046620571707793796, + "loss": 0.7547, + "step": 28175 + }, + { + "epoch": 6.88, + "learning_rate": 0.00046617517713168827, + "loss": 0.7975, + "step": 28200 + }, + { + "epoch": 6.89, + "learning_rate": 0.0004661446371854385, + "loss": 0.7271, + "step": 28225 + }, + { + "epoch": 6.89, + "learning_rate": 0.00046611409723918887, + "loss": 0.8168, + "step": 28250 + }, + { + "epoch": 6.9, + "learning_rate": 0.0004660835572929392, + "loss": 0.7559, + "step": 28275 + }, + { + "epoch": 6.91, + "learning_rate": 0.0004660530173466895, + "loss": 0.7618, + "step": 28300 + }, + { + "epoch": 6.91, + "learning_rate": 0.0004660224774004398, + "loss": 0.811, + "step": 28325 + }, + { + "epoch": 6.92, + "learning_rate": 0.0004659919374541901, + "loss": 0.7985, + "step": 28350 + }, + { + "epoch": 6.92, + "learning_rate": 0.00046596139750794044, + "loss": 0.779, + "step": 28375 + }, + { + "epoch": 6.93, + "learning_rate": 0.0004659308575616907, + "loss": 0.8269, + "step": 28400 + }, + { + "epoch": 6.94, + "learning_rate": 0.000465900317615441, + "loss": 0.7372, + "step": 28425 + }, + { + "epoch": 6.94, + "learning_rate": 0.0004658697776691913, + "loss": 0.8145, + "step": 28450 + }, + { + "epoch": 6.95, + "learning_rate": 0.0004658392377229416, + "loss": 0.7761, + "step": 28475 + }, + { + "epoch": 6.95, + "learning_rate": 0.00046580869777669196, + "loss": 0.7957, + "step": 28500 + }, + { + "epoch": 6.95, + "eval_cer": 0.16304425941706108, + "eval_loss": 0.5358180403709412, + "eval_runtime": 151.3883, + "eval_samples_per_second": 27.697, + "eval_steps_per_second": 6.929, + "eval_wer": 0.6373246329526917, + "step": 28500 + }, + { + "epoch": 6.96, + "learning_rate": 0.00046577815783044226, + "loss": 0.7879, + "step": 28525 + }, + { + "epoch": 6.97, + "learning_rate": 0.0004657476178841925, + "loss": 0.8106, + "step": 28550 + }, + { + "epoch": 6.97, + "learning_rate": 0.0004657170779379428, + "loss": 0.7716, + "step": 28575 + }, + { + "epoch": 6.98, + "learning_rate": 0.0004656877595895431, + "loss": 0.7921, + "step": 28600 + }, + { + "epoch": 6.99, + "learning_rate": 0.0004656572196432934, + "loss": 0.7744, + "step": 28625 + }, + { + "epoch": 6.99, + "learning_rate": 0.00046562667969704373, + "loss": 0.7707, + "step": 28650 + }, + { + "epoch": 7.0, + "learning_rate": 0.0004655961397507941, + "loss": 0.7645, + "step": 28675 + }, + { + "epoch": 7.0, + "learning_rate": 0.00046556559980454434, + "loss": 0.8178, + "step": 28700 + }, + { + "epoch": 7.01, + "learning_rate": 0.00046553505985829464, + "loss": 0.7335, + "step": 28725 + }, + { + "epoch": 7.02, + "learning_rate": 0.00046550451991204494, + "loss": 0.7847, + "step": 28750 + }, + { + "epoch": 7.02, + "learning_rate": 0.00046547397996579525, + "loss": 0.7395, + "step": 28775 + }, + { + "epoch": 7.03, + "learning_rate": 0.0004654434400195456, + "loss": 0.7532, + "step": 28800 + }, + { + "epoch": 7.03, + "learning_rate": 0.0004654129000732959, + "loss": 0.7882, + "step": 28825 + }, + { + "epoch": 7.04, + "learning_rate": 0.0004653823601270462, + "loss": 0.7519, + "step": 28850 + }, + { + "epoch": 7.05, + "learning_rate": 0.00046535182018079646, + "loss": 0.6923, + "step": 28875 + }, + { + "epoch": 7.05, + "learning_rate": 0.00046532128023454676, + "loss": 0.7965, + "step": 28900 + }, + { + "epoch": 7.06, + "learning_rate": 0.0004652907402882971, + "loss": 0.703, + "step": 28925 + }, + { + "epoch": 7.06, + "learning_rate": 0.0004652602003420474, + "loss": 0.752, + "step": 28950 + }, + { + "epoch": 7.07, + "learning_rate": 0.0004652296603957977, + "loss": 0.6877, + "step": 28975 + }, + { + "epoch": 7.08, + "learning_rate": 0.00046519912044954803, + "loss": 0.7739, + "step": 29000 + }, + { + "epoch": 7.08, + "eval_cer": 0.17274621931562684, + "eval_loss": 0.5662298202514648, + "eval_runtime": 153.6801, + "eval_samples_per_second": 27.284, + "eval_steps_per_second": 6.826, + "eval_wer": 0.6695595432300163, + "step": 29000 + }, + { + "epoch": 7.08, + "learning_rate": 0.0004651685805032983, + "loss": 0.7574, + "step": 29025 + }, + { + "epoch": 7.09, + "learning_rate": 0.00046513804055704864, + "loss": 0.8008, + "step": 29050 + }, + { + "epoch": 7.09, + "learning_rate": 0.00046510750061079894, + "loss": 0.7341, + "step": 29075 + }, + { + "epoch": 7.1, + "learning_rate": 0.00046507696066454924, + "loss": 0.7556, + "step": 29100 + }, + { + "epoch": 7.11, + "learning_rate": 0.00046504642071829955, + "loss": 0.7353, + "step": 29125 + }, + { + "epoch": 7.11, + "learning_rate": 0.00046501588077204985, + "loss": 0.7788, + "step": 29150 + }, + { + "epoch": 7.12, + "learning_rate": 0.00046498534082580015, + "loss": 0.75, + "step": 29175 + }, + { + "epoch": 7.13, + "learning_rate": 0.00046495480087955046, + "loss": 0.7361, + "step": 29200 + }, + { + "epoch": 7.13, + "learning_rate": 0.00046492426093330076, + "loss": 0.7574, + "step": 29225 + }, + { + "epoch": 7.14, + "learning_rate": 0.00046489372098705106, + "loss": 0.7727, + "step": 29250 + }, + { + "epoch": 7.14, + "learning_rate": 0.00046486318104080137, + "loss": 0.74, + "step": 29275 + }, + { + "epoch": 7.15, + "learning_rate": 0.0004648326410945517, + "loss": 0.7178, + "step": 29300 + }, + { + "epoch": 7.16, + "learning_rate": 0.00046480210114830203, + "loss": 0.7438, + "step": 29325 + }, + { + "epoch": 7.16, + "learning_rate": 0.0004647715612020523, + "loss": 0.7835, + "step": 29350 + }, + { + "epoch": 7.17, + "learning_rate": 0.0004647410212558026, + "loss": 0.7028, + "step": 29375 + }, + { + "epoch": 7.17, + "learning_rate": 0.0004647104813095529, + "loss": 0.784, + "step": 29400 + }, + { + "epoch": 7.18, + "learning_rate": 0.00046467994136330324, + "loss": 0.7249, + "step": 29425 + }, + { + "epoch": 7.19, + "learning_rate": 0.00046464940141705354, + "loss": 0.7371, + "step": 29450 + }, + { + "epoch": 7.19, + "learning_rate": 0.00046461886147080385, + "loss": 0.7614, + "step": 29475 + }, + { + "epoch": 7.2, + "learning_rate": 0.0004645883215245541, + "loss": 0.7833, + "step": 29500 + }, + { + "epoch": 7.2, + "eval_cer": 0.15938420787860744, + "eval_loss": 0.5323081016540527, + "eval_runtime": 153.6339, + "eval_samples_per_second": 27.292, + "eval_steps_per_second": 6.828, + "eval_wer": 0.6227079934747145, + "step": 29500 + }, + { + "epoch": 7.2, + "learning_rate": 0.0004645577815783044, + "loss": 0.7305, + "step": 29525 + }, + { + "epoch": 7.21, + "learning_rate": 0.00046452724163205476, + "loss": 0.7645, + "step": 29550 + }, + { + "epoch": 7.22, + "learning_rate": 0.00046449670168580506, + "loss": 0.7863, + "step": 29575 + }, + { + "epoch": 7.22, + "learning_rate": 0.00046446616173955536, + "loss": 0.7635, + "step": 29600 + }, + { + "epoch": 7.23, + "learning_rate": 0.00046443562179330567, + "loss": 0.7263, + "step": 29625 + }, + { + "epoch": 7.24, + "learning_rate": 0.0004644050818470559, + "loss": 0.7765, + "step": 29650 + }, + { + "epoch": 7.24, + "learning_rate": 0.0004643745419008062, + "loss": 0.7977, + "step": 29675 + }, + { + "epoch": 7.25, + "learning_rate": 0.0004643440019545566, + "loss": 0.7765, + "step": 29700 + }, + { + "epoch": 7.25, + "learning_rate": 0.0004643134620083069, + "loss": 0.7449, + "step": 29725 + }, + { + "epoch": 7.26, + "learning_rate": 0.0004642829220620572, + "loss": 0.7772, + "step": 29750 + }, + { + "epoch": 7.27, + "learning_rate": 0.0004642523821158075, + "loss": 0.7407, + "step": 29775 + }, + { + "epoch": 7.27, + "learning_rate": 0.0004642218421695578, + "loss": 0.7405, + "step": 29800 + }, + { + "epoch": 7.28, + "learning_rate": 0.0004641913022233081, + "loss": 0.7628, + "step": 29825 + }, + { + "epoch": 7.28, + "learning_rate": 0.0004641607622770584, + "loss": 0.7384, + "step": 29850 + }, + { + "epoch": 7.29, + "learning_rate": 0.0004641302223308087, + "loss": 0.7202, + "step": 29875 + }, + { + "epoch": 7.3, + "learning_rate": 0.000464099682384559, + "loss": 0.8118, + "step": 29900 + }, + { + "epoch": 7.3, + "learning_rate": 0.0004640691424383093, + "loss": 0.7478, + "step": 29925 + }, + { + "epoch": 7.31, + "learning_rate": 0.00046403860249205967, + "loss": 0.7712, + "step": 29950 + }, + { + "epoch": 7.31, + "learning_rate": 0.0004640080625458099, + "loss": 0.729, + "step": 29975 + }, + { + "epoch": 7.32, + "learning_rate": 0.0004639775225995602, + "loss": 0.7737, + "step": 30000 + }, + { + "epoch": 7.32, + "eval_cer": 0.1612784000492798, + "eval_loss": 0.5348503589630127, + "eval_runtime": 151.5191, + "eval_samples_per_second": 27.673, + "eval_steps_per_second": 6.923, + "eval_wer": 0.6303425774877651, + "step": 30000 + }, + { + "epoch": 7.33, + "learning_rate": 0.0004639469826533105, + "loss": 0.7539, + "step": 30025 + }, + { + "epoch": 7.33, + "learning_rate": 0.0004639164427070608, + "loss": 0.7372, + "step": 30050 + }, + { + "epoch": 7.34, + "learning_rate": 0.0004638859027608112, + "loss": 0.7137, + "step": 30075 + }, + { + "epoch": 7.35, + "learning_rate": 0.0004638553628145615, + "loss": 0.7689, + "step": 30100 + }, + { + "epoch": 7.35, + "learning_rate": 0.00046382482286831173, + "loss": 0.7584, + "step": 30125 + }, + { + "epoch": 7.36, + "learning_rate": 0.00046379428292206204, + "loss": 0.7275, + "step": 30150 + }, + { + "epoch": 7.36, + "learning_rate": 0.00046376374297581234, + "loss": 0.7524, + "step": 30175 + }, + { + "epoch": 7.37, + "learning_rate": 0.0004637332030295627, + "loss": 0.7609, + "step": 30200 + }, + { + "epoch": 7.38, + "learning_rate": 0.000463702663083313, + "loss": 0.6847, + "step": 30225 + }, + { + "epoch": 7.38, + "learning_rate": 0.0004636721231370633, + "loss": 0.7438, + "step": 30250 + }, + { + "epoch": 7.39, + "learning_rate": 0.0004636415831908136, + "loss": 0.7237, + "step": 30275 + }, + { + "epoch": 7.39, + "learning_rate": 0.00046361104324456386, + "loss": 0.8116, + "step": 30300 + }, + { + "epoch": 7.4, + "learning_rate": 0.0004635805032983142, + "loss": 0.7247, + "step": 30325 + }, + { + "epoch": 7.41, + "learning_rate": 0.0004635499633520645, + "loss": 0.8259, + "step": 30350 + }, + { + "epoch": 7.41, + "learning_rate": 0.0004635194234058148, + "loss": 0.7375, + "step": 30375 + }, + { + "epoch": 7.42, + "learning_rate": 0.0004634888834595651, + "loss": 0.7721, + "step": 30400 + }, + { + "epoch": 7.42, + "learning_rate": 0.00046345834351331543, + "loss": 0.7388, + "step": 30425 + }, + { + "epoch": 7.43, + "learning_rate": 0.00046342780356706573, + "loss": 0.7617, + "step": 30450 + }, + { + "epoch": 7.44, + "learning_rate": 0.00046339726362081604, + "loss": 0.7408, + "step": 30475 + }, + { + "epoch": 7.44, + "learning_rate": 0.00046336672367456634, + "loss": 0.7697, + "step": 30500 + }, + { + "epoch": 7.44, + "eval_cer": 0.1623358623451023, + "eval_loss": 0.531502366065979, + "eval_runtime": 153.2868, + "eval_samples_per_second": 27.354, + "eval_steps_per_second": 6.843, + "eval_wer": 0.6386296900489397, + "step": 30500 + }, + { + "epoch": 7.45, + "learning_rate": 0.00046333618372831664, + "loss": 0.7369, + "step": 30525 + }, + { + "epoch": 7.45, + "learning_rate": 0.00046330564378206695, + "loss": 0.7767, + "step": 30550 + }, + { + "epoch": 7.46, + "learning_rate": 0.0004632751038358173, + "loss": 0.7329, + "step": 30575 + }, + { + "epoch": 7.47, + "learning_rate": 0.00046324456388956755, + "loss": 0.7998, + "step": 30600 + }, + { + "epoch": 7.47, + "learning_rate": 0.00046321402394331786, + "loss": 0.7511, + "step": 30625 + }, + { + "epoch": 7.48, + "learning_rate": 0.00046318348399706816, + "loss": 0.775, + "step": 30650 + }, + { + "epoch": 7.49, + "learning_rate": 0.00046315294405081846, + "loss": 0.7321, + "step": 30675 + }, + { + "epoch": 7.49, + "learning_rate": 0.0004631224041045688, + "loss": 0.7492, + "step": 30700 + }, + { + "epoch": 7.5, + "learning_rate": 0.0004630918641583191, + "loss": 0.7255, + "step": 30725 + }, + { + "epoch": 7.5, + "learning_rate": 0.0004630613242120694, + "loss": 0.8, + "step": 30750 + }, + { + "epoch": 7.51, + "learning_rate": 0.0004630307842658197, + "loss": 0.7936, + "step": 30775 + }, + { + "epoch": 7.52, + "learning_rate": 0.00046300024431957, + "loss": 0.8171, + "step": 30800 + }, + { + "epoch": 7.52, + "learning_rate": 0.00046296970437332034, + "loss": 0.7838, + "step": 30825 + }, + { + "epoch": 7.53, + "learning_rate": 0.00046293916442707064, + "loss": 0.7683, + "step": 30850 + }, + { + "epoch": 7.53, + "learning_rate": 0.00046290862448082094, + "loss": 0.754, + "step": 30875 + }, + { + "epoch": 7.54, + "learning_rate": 0.00046287808453457125, + "loss": 0.723, + "step": 30900 + }, + { + "epoch": 7.55, + "learning_rate": 0.0004628475445883215, + "loss": 0.7296, + "step": 30925 + }, + { + "epoch": 7.55, + "learning_rate": 0.0004628170046420718, + "loss": 0.7375, + "step": 30950 + }, + { + "epoch": 7.56, + "learning_rate": 0.00046278646469582216, + "loss": 0.7338, + "step": 30975 + }, + { + "epoch": 7.56, + "learning_rate": 0.00046275592474957246, + "loss": 0.7647, + "step": 31000 + }, + { + "epoch": 7.56, + "eval_cer": 0.16078560208617804, + "eval_loss": 0.5345603823661804, + "eval_runtime": 152.8664, + "eval_samples_per_second": 27.429, + "eval_steps_per_second": 6.862, + "eval_wer": 0.6219249592169658, + "step": 31000 + }, + { + "epoch": 7.57, + "learning_rate": 0.00046272538480332276, + "loss": 0.7339, + "step": 31025 + }, + { + "epoch": 7.58, + "learning_rate": 0.00046269484485707307, + "loss": 0.8613, + "step": 31050 + }, + { + "epoch": 7.58, + "learning_rate": 0.0004626643049108233, + "loss": 0.7179, + "step": 31075 + }, + { + "epoch": 7.59, + "learning_rate": 0.0004626337649645737, + "loss": 0.8002, + "step": 31100 + }, + { + "epoch": 7.6, + "learning_rate": 0.000462603225018324, + "loss": 0.7486, + "step": 31125 + }, + { + "epoch": 7.6, + "learning_rate": 0.0004625726850720743, + "loss": 0.7804, + "step": 31150 + }, + { + "epoch": 7.61, + "learning_rate": 0.0004625421451258246, + "loss": 0.7206, + "step": 31175 + }, + { + "epoch": 7.61, + "learning_rate": 0.0004625116051795749, + "loss": 0.7351, + "step": 31200 + }, + { + "epoch": 7.62, + "learning_rate": 0.00046248106523332524, + "loss": 0.7299, + "step": 31225 + }, + { + "epoch": 7.63, + "learning_rate": 0.0004624505252870755, + "loss": 0.776, + "step": 31250 + }, + { + "epoch": 7.63, + "learning_rate": 0.0004624199853408258, + "loss": 0.753, + "step": 31275 + }, + { + "epoch": 7.64, + "learning_rate": 0.0004623894453945761, + "loss": 0.7613, + "step": 31300 + }, + { + "epoch": 7.64, + "learning_rate": 0.0004623589054483264, + "loss": 0.7381, + "step": 31325 + }, + { + "epoch": 7.65, + "learning_rate": 0.00046232836550207676, + "loss": 0.7744, + "step": 31350 + }, + { + "epoch": 7.66, + "learning_rate": 0.00046229782555582706, + "loss": 0.7205, + "step": 31375 + }, + { + "epoch": 7.66, + "learning_rate": 0.0004622672856095773, + "loss": 0.7958, + "step": 31400 + }, + { + "epoch": 7.67, + "learning_rate": 0.0004622367456633276, + "loss": 0.8055, + "step": 31425 + }, + { + "epoch": 7.67, + "learning_rate": 0.0004622062057170779, + "loss": 0.8087, + "step": 31450 + }, + { + "epoch": 7.68, + "learning_rate": 0.0004621756657708283, + "loss": 0.7123, + "step": 31475 + }, + { + "epoch": 7.69, + "learning_rate": 0.0004621451258245786, + "loss": 0.7123, + "step": 31500 + }, + { + "epoch": 7.69, + "eval_cer": 0.15610915474882703, + "eval_loss": 0.5194910764694214, + "eval_runtime": 154.4911, + "eval_samples_per_second": 27.141, + "eval_steps_per_second": 6.79, + "eval_wer": 0.6110277324632952, + "step": 31500 + }, + { + "epoch": 7.69, + "learning_rate": 0.0004621145858783289, + "loss": 0.7202, + "step": 31525 + }, + { + "epoch": 7.7, + "learning_rate": 0.00046208404593207913, + "loss": 0.7416, + "step": 31550 + }, + { + "epoch": 7.7, + "learning_rate": 0.00046205350598582944, + "loss": 0.7489, + "step": 31575 + }, + { + "epoch": 7.71, + "learning_rate": 0.0004620229660395798, + "loss": 0.7806, + "step": 31600 + }, + { + "epoch": 7.72, + "learning_rate": 0.0004619924260933301, + "loss": 0.7351, + "step": 31625 + }, + { + "epoch": 7.72, + "learning_rate": 0.0004619618861470804, + "loss": 0.7592, + "step": 31650 + }, + { + "epoch": 7.73, + "learning_rate": 0.0004619313462008307, + "loss": 0.7057, + "step": 31675 + }, + { + "epoch": 7.74, + "learning_rate": 0.00046190080625458095, + "loss": 0.7845, + "step": 31700 + }, + { + "epoch": 7.74, + "learning_rate": 0.0004618702663083313, + "loss": 0.7061, + "step": 31725 + }, + { + "epoch": 7.75, + "learning_rate": 0.0004618397263620816, + "loss": 0.7245, + "step": 31750 + }, + { + "epoch": 7.75, + "learning_rate": 0.0004618091864158319, + "loss": 0.7343, + "step": 31775 + }, + { + "epoch": 7.76, + "learning_rate": 0.0004617786464695822, + "loss": 0.7688, + "step": 31800 + }, + { + "epoch": 7.77, + "learning_rate": 0.0004617481065233325, + "loss": 0.7333, + "step": 31825 + }, + { + "epoch": 7.77, + "learning_rate": 0.0004617175665770829, + "loss": 0.7634, + "step": 31850 + }, + { + "epoch": 7.78, + "learning_rate": 0.00046168702663083313, + "loss": 0.781, + "step": 31875 + }, + { + "epoch": 7.78, + "learning_rate": 0.00046165648668458343, + "loss": 0.8163, + "step": 31900 + }, + { + "epoch": 7.79, + "learning_rate": 0.00046162594673833374, + "loss": 0.7101, + "step": 31925 + }, + { + "epoch": 7.8, + "learning_rate": 0.00046159540679208404, + "loss": 0.7749, + "step": 31950 + }, + { + "epoch": 7.8, + "learning_rate": 0.0004615648668458344, + "loss": 0.7374, + "step": 31975 + }, + { + "epoch": 7.81, + "learning_rate": 0.0004615343268995847, + "loss": 0.7412, + "step": 32000 + }, + { + "epoch": 7.81, + "eval_cer": 0.1613245998583206, + "eval_loss": 0.5384941697120667, + "eval_runtime": 151.6218, + "eval_samples_per_second": 27.654, + "eval_steps_per_second": 6.919, + "eval_wer": 0.6256117455138662, + "step": 32000 + }, + { + "epoch": 7.81, + "learning_rate": 0.00046150378695333495, + "loss": 0.7464, + "step": 32025 + }, + { + "epoch": 7.82, + "learning_rate": 0.00046147324700708525, + "loss": 0.789, + "step": 32050 + }, + { + "epoch": 7.83, + "learning_rate": 0.00046144270706083556, + "loss": 0.7565, + "step": 32075 + }, + { + "epoch": 7.83, + "learning_rate": 0.0004614121671145859, + "loss": 0.7613, + "step": 32100 + }, + { + "epoch": 7.84, + "learning_rate": 0.0004613816271683362, + "loss": 0.732, + "step": 32125 + }, + { + "epoch": 7.85, + "learning_rate": 0.0004613510872220865, + "loss": 0.7272, + "step": 32150 + }, + { + "epoch": 7.85, + "learning_rate": 0.00046132054727583677, + "loss": 0.7103, + "step": 32175 + }, + { + "epoch": 7.86, + "learning_rate": 0.0004612900073295871, + "loss": 0.7953, + "step": 32200 + }, + { + "epoch": 7.86, + "learning_rate": 0.00046125946738333743, + "loss": 0.7259, + "step": 32225 + }, + { + "epoch": 7.87, + "learning_rate": 0.00046122892743708774, + "loss": 0.7467, + "step": 32250 + }, + { + "epoch": 7.88, + "learning_rate": 0.00046119838749083804, + "loss": 0.7153, + "step": 32275 + }, + { + "epoch": 7.88, + "learning_rate": 0.00046116784754458834, + "loss": 0.6801, + "step": 32300 + }, + { + "epoch": 7.89, + "learning_rate": 0.00046113730759833865, + "loss": 0.6988, + "step": 32325 + }, + { + "epoch": 7.89, + "learning_rate": 0.0004611067676520889, + "loss": 0.8216, + "step": 32350 + }, + { + "epoch": 7.9, + "learning_rate": 0.00046107622770583925, + "loss": 0.7436, + "step": 32375 + }, + { + "epoch": 7.91, + "learning_rate": 0.00046104568775958956, + "loss": 0.802, + "step": 32400 + }, + { + "epoch": 7.91, + "learning_rate": 0.00046101514781333986, + "loss": 0.7254, + "step": 32425 + }, + { + "epoch": 7.92, + "learning_rate": 0.00046098460786709016, + "loss": 0.7719, + "step": 32450 + }, + { + "epoch": 7.92, + "learning_rate": 0.00046095406792084047, + "loss": 0.7155, + "step": 32475 + }, + { + "epoch": 7.93, + "learning_rate": 0.00046092352797459077, + "loss": 0.7702, + "step": 32500 + }, + { + "epoch": 7.93, + "eval_cer": 0.16136053304313008, + "eval_loss": 0.5290741920471191, + "eval_runtime": 152.6414, + "eval_samples_per_second": 27.47, + "eval_steps_per_second": 6.872, + "eval_wer": 0.6342903752039152, + "step": 32500 + }, + { + "epoch": 7.94, + "learning_rate": 0.00045748786240159785, + "loss": 0.7358, + "step": 32525 + }, + { + "epoch": 7.94, + "learning_rate": 0.0004574546632812417, + "loss": 0.8072, + "step": 32550 + }, + { + "epoch": 7.95, + "learning_rate": 0.0004574214641608856, + "loss": 0.7435, + "step": 32575 + }, + { + "epoch": 7.96, + "learning_rate": 0.0004573882650405295, + "loss": 0.7616, + "step": 32600 + }, + { + "epoch": 7.96, + "learning_rate": 0.0004573550659201734, + "loss": 0.75, + "step": 32625 + }, + { + "epoch": 7.97, + "learning_rate": 0.0004573218667998173, + "loss": 0.7756, + "step": 32650 + }, + { + "epoch": 7.97, + "learning_rate": 0.0004572886676794612, + "loss": 0.7521, + "step": 32675 + }, + { + "epoch": 7.98, + "learning_rate": 0.0004572567965239193, + "loss": 0.7256, + "step": 32700 + }, + { + "epoch": 7.99, + "learning_rate": 0.00045722359740356323, + "loss": 0.7392, + "step": 32725 + }, + { + "epoch": 7.99, + "learning_rate": 0.0004571903982832071, + "loss": 0.7464, + "step": 32750 + }, + { + "epoch": 8.0, + "learning_rate": 0.00045715719916285095, + "loss": 0.71, + "step": 32775 + }, + { + "epoch": 8.0, + "learning_rate": 0.00045712400004249487, + "loss": 0.7379, + "step": 32800 + }, + { + "epoch": 8.01, + "learning_rate": 0.0004570908009221388, + "loss": 0.69, + "step": 32825 + }, + { + "epoch": 8.02, + "learning_rate": 0.0004570576018017827, + "loss": 0.7467, + "step": 32850 + }, + { + "epoch": 8.02, + "learning_rate": 0.0004570244026814266, + "loss": 0.6749, + "step": 32875 + }, + { + "epoch": 8.03, + "learning_rate": 0.0004569912035610704, + "loss": 0.7433, + "step": 32900 + }, + { + "epoch": 8.03, + "learning_rate": 0.00045695800444071433, + "loss": 0.6778, + "step": 32925 + }, + { + "epoch": 8.04, + "learning_rate": 0.00045692480532035824, + "loss": 0.7142, + "step": 32950 + }, + { + "epoch": 8.05, + "learning_rate": 0.00045689160620000216, + "loss": 0.683, + "step": 32975 + }, + { + "epoch": 8.05, + "learning_rate": 0.00045685840707964607, + "loss": 0.7561, + "step": 33000 + }, + { + "epoch": 8.05, + "eval_cer": 0.1552724248739772, + "eval_loss": 0.5043615102767944, + "eval_runtime": 142.7702, + "eval_samples_per_second": 29.369, + "eval_steps_per_second": 7.347, + "eval_wer": 0.6138336052202283, + "step": 33000 + }, + { + "epoch": 8.06, + "learning_rate": 0.00045682520795928993, + "loss": 0.6955, + "step": 33025 + }, + { + "epoch": 8.06, + "learning_rate": 0.0004567920088389338, + "loss": 0.7009, + "step": 33050 + }, + { + "epoch": 8.07, + "learning_rate": 0.0004567588097185777, + "loss": 0.6887, + "step": 33075 + }, + { + "epoch": 8.08, + "learning_rate": 0.0004567256105982216, + "loss": 0.7224, + "step": 33100 + }, + { + "epoch": 8.08, + "learning_rate": 0.0004566924114778655, + "loss": 0.7305, + "step": 33125 + }, + { + "epoch": 8.09, + "learning_rate": 0.0004566592123575094, + "loss": 0.7314, + "step": 33150 + }, + { + "epoch": 8.1, + "learning_rate": 0.0004566260132371533, + "loss": 0.7016, + "step": 33175 + }, + { + "epoch": 8.1, + "learning_rate": 0.00045659281411679716, + "loss": 0.7451, + "step": 33200 + }, + { + "epoch": 8.11, + "learning_rate": 0.0004565596149964411, + "loss": 0.7097, + "step": 33225 + }, + { + "epoch": 8.11, + "learning_rate": 0.00045652641587608494, + "loss": 0.6997, + "step": 33250 + }, + { + "epoch": 8.12, + "learning_rate": 0.00045649321675572885, + "loss": 0.6959, + "step": 33275 + }, + { + "epoch": 8.13, + "learning_rate": 0.00045646001763537277, + "loss": 0.7657, + "step": 33300 + }, + { + "epoch": 8.13, + "learning_rate": 0.0004564268185150167, + "loss": 0.7058, + "step": 33325 + }, + { + "epoch": 8.14, + "learning_rate": 0.0004563936193946605, + "loss": 0.7508, + "step": 33350 + }, + { + "epoch": 8.14, + "learning_rate": 0.0004563604202743044, + "loss": 0.6738, + "step": 33375 + }, + { + "epoch": 8.15, + "learning_rate": 0.0004563272211539483, + "loss": 0.7368, + "step": 33400 + }, + { + "epoch": 8.16, + "learning_rate": 0.00045629402203359223, + "loss": 0.7343, + "step": 33425 + }, + { + "epoch": 8.16, + "learning_rate": 0.00045626082291323614, + "loss": 0.709, + "step": 33450 + }, + { + "epoch": 8.17, + "learning_rate": 0.00045622762379288, + "loss": 0.7208, + "step": 33475 + }, + { + "epoch": 8.17, + "learning_rate": 0.00045619442467252386, + "loss": 0.7045, + "step": 33500 + }, + { + "epoch": 8.18, + "learning_rate": 0.0004561612255521678, + "loss": 0.7289, + "step": 33525 + }, + { + "epoch": 8.19, + "learning_rate": 0.0004561280264318117, + "loss": 0.7799, + "step": 33550 + }, + { + "epoch": 8.19, + "learning_rate": 0.00045609482731145555, + "loss": 0.7295, + "step": 33575 + }, + { + "epoch": 8.2, + "learning_rate": 0.00045606162819109946, + "loss": 0.7468, + "step": 33600 + }, + { + "epoch": 8.21, + "learning_rate": 0.0004560284290707434, + "loss": 0.711, + "step": 33625 + }, + { + "epoch": 8.21, + "learning_rate": 0.00045599522995038724, + "loss": 0.7462, + "step": 33650 + }, + { + "epoch": 8.22, + "learning_rate": 0.00045596203083003115, + "loss": 0.6793, + "step": 33675 + }, + { + "epoch": 8.22, + "learning_rate": 0.000455928831709675, + "loss": 0.7026, + "step": 33700 + }, + { + "epoch": 8.23, + "learning_rate": 0.0004558956325893189, + "loss": 0.707, + "step": 33725 + }, + { + "epoch": 8.24, + "learning_rate": 0.00045586243346896284, + "loss": 0.7465, + "step": 33750 + }, + { + "epoch": 8.24, + "learning_rate": 0.00045582923434860675, + "loss": 0.7105, + "step": 33775 + }, + { + "epoch": 8.25, + "learning_rate": 0.00045579603522825056, + "loss": 0.7257, + "step": 33800 + }, + { + "epoch": 8.25, + "learning_rate": 0.00045576283610789447, + "loss": 0.6767, + "step": 33825 + }, + { + "epoch": 8.26, + "learning_rate": 0.0004557296369875384, + "loss": 0.7343, + "step": 33850 + }, + { + "epoch": 8.27, + "learning_rate": 0.0004556964378671823, + "loss": 0.6389, + "step": 33875 + }, + { + "epoch": 8.27, + "learning_rate": 0.0004556632387468262, + "loss": 0.7362, + "step": 33900 + }, + { + "epoch": 8.28, + "learning_rate": 0.0004556300396264701, + "loss": 0.66, + "step": 33925 + }, + { + "epoch": 8.28, + "learning_rate": 0.00045559684050611393, + "loss": 0.7329, + "step": 33950 + }, + { + "epoch": 8.29, + "learning_rate": 0.00045556364138575785, + "loss": 0.6778, + "step": 33975 + }, + { + "epoch": 8.3, + "learning_rate": 0.00045553044226540176, + "loss": 0.7017, + "step": 34000 + }, + { + "epoch": 8.3, + "learning_rate": 0.0004554972431450456, + "loss": 0.6709, + "step": 34025 + }, + { + "epoch": 8.31, + "learning_rate": 0.00045546404402468954, + "loss": 0.7861, + "step": 34050 + }, + { + "epoch": 8.32, + "learning_rate": 0.0004554308449043334, + "loss": 0.7241, + "step": 34075 + }, + { + "epoch": 8.32, + "learning_rate": 0.0004553976457839773, + "loss": 0.6993, + "step": 34100 + }, + { + "epoch": 8.33, + "learning_rate": 0.0004553644466636212, + "loss": 0.6818, + "step": 34125 + }, + { + "epoch": 8.33, + "learning_rate": 0.0004553312475432651, + "loss": 0.7136, + "step": 34150 + }, + { + "epoch": 8.34, + "learning_rate": 0.000455298048422909, + "loss": 0.725, + "step": 34175 + }, + { + "epoch": 8.35, + "learning_rate": 0.0004552648493025529, + "loss": 0.7254, + "step": 34200 + }, + { + "epoch": 8.35, + "learning_rate": 0.00045523165018219677, + "loss": 0.7135, + "step": 34225 + }, + { + "epoch": 8.36, + "learning_rate": 0.00045519845106184063, + "loss": 0.7367, + "step": 34250 + }, + { + "epoch": 8.36, + "learning_rate": 0.00045516525194148454, + "loss": 0.7019, + "step": 34275 + }, + { + "epoch": 8.37, + "learning_rate": 0.00045513205282112846, + "loss": 0.7287, + "step": 34300 + }, + { + "epoch": 8.38, + "learning_rate": 0.00045509885370077237, + "loss": 0.7241, + "step": 34325 + }, + { + "epoch": 8.38, + "learning_rate": 0.0004550656545804163, + "loss": 0.749, + "step": 34350 + }, + { + "epoch": 8.39, + "learning_rate": 0.0004550324554600601, + "loss": 0.7361, + "step": 34375 + }, + { + "epoch": 8.39, + "learning_rate": 0.000454999256339704, + "loss": 0.7496, + "step": 34400 + }, + { + "epoch": 8.4, + "learning_rate": 0.0004549660572193479, + "loss": 0.6714, + "step": 34425 + }, + { + "epoch": 8.41, + "learning_rate": 0.00045493285809899183, + "loss": 0.7154, + "step": 34450 + }, + { + "epoch": 8.41, + "learning_rate": 0.00045489965897863575, + "loss": 0.7159, + "step": 34475 + }, + { + "epoch": 8.42, + "learning_rate": 0.0004548664598582796, + "loss": 0.6873, + "step": 34500 + }, + { + "epoch": 8.42, + "learning_rate": 0.00045483326073792347, + "loss": 0.7398, + "step": 34525 + }, + { + "epoch": 8.43, + "learning_rate": 0.0004548000616175674, + "loss": 0.7187, + "step": 34550 + }, + { + "epoch": 8.44, + "learning_rate": 0.0004547668624972113, + "loss": 0.7376, + "step": 34575 + }, + { + "epoch": 8.44, + "learning_rate": 0.00045473366337685515, + "loss": 0.7299, + "step": 34600 + }, + { + "epoch": 8.45, + "learning_rate": 0.00045470046425649907, + "loss": 0.7037, + "step": 34625 + }, + { + "epoch": 8.46, + "learning_rate": 0.000454667265136143, + "loss": 0.7256, + "step": 34650 + }, + { + "epoch": 8.46, + "learning_rate": 0.00045463406601578684, + "loss": 0.6814, + "step": 34675 + }, + { + "epoch": 8.47, + "learning_rate": 0.00045460086689543076, + "loss": 0.7661, + "step": 34700 + }, + { + "epoch": 8.47, + "learning_rate": 0.0004545676677750746, + "loss": 0.7051, + "step": 34725 + }, + { + "epoch": 8.48, + "learning_rate": 0.00045453446865471853, + "loss": 0.7034, + "step": 34750 + }, + { + "epoch": 8.49, + "learning_rate": 0.00045450126953436244, + "loss": 0.6999, + "step": 34775 + }, + { + "epoch": 8.49, + "learning_rate": 0.00045446807041400636, + "loss": 0.7787, + "step": 34800 + }, + { + "epoch": 8.5, + "learning_rate": 0.00045443487129365016, + "loss": 0.6958, + "step": 34825 + }, + { + "epoch": 8.5, + "learning_rate": 0.0004544016721732941, + "loss": 0.7198, + "step": 34850 + }, + { + "epoch": 8.51, + "learning_rate": 0.000454368473052938, + "loss": 0.7049, + "step": 34875 + }, + { + "epoch": 8.52, + "learning_rate": 0.0004543352739325819, + "loss": 0.7153, + "step": 34900 + }, + { + "epoch": 8.52, + "learning_rate": 0.0004543020748122258, + "loss": 0.6683, + "step": 34925 + }, + { + "epoch": 8.53, + "learning_rate": 0.0004542688756918697, + "loss": 0.7465, + "step": 34950 + }, + { + "epoch": 8.53, + "learning_rate": 0.0004542370045363278, + "loss": 0.7218, + "step": 34975 + }, + { + "epoch": 8.54, + "learning_rate": 0.00045420380541597174, + "loss": 0.7668, + "step": 35000 + }, + { + "epoch": 8.55, + "learning_rate": 0.0004541706062956156, + "loss": 0.7447, + "step": 35025 + }, + { + "epoch": 8.55, + "learning_rate": 0.00045413740717525946, + "loss": 0.7514, + "step": 35050 + }, + { + "epoch": 8.56, + "learning_rate": 0.00045410420805490337, + "loss": 0.6962, + "step": 35075 + }, + { + "epoch": 8.57, + "learning_rate": 0.0004540710089345473, + "loss": 0.7447, + "step": 35100 + }, + { + "epoch": 8.57, + "learning_rate": 0.0004540378098141912, + "loss": 0.6955, + "step": 35125 + }, + { + "epoch": 8.58, + "learning_rate": 0.00045400461069383506, + "loss": 0.7442, + "step": 35150 + }, + { + "epoch": 8.58, + "learning_rate": 0.0004539714115734789, + "loss": 0.7125, + "step": 35175 + }, + { + "epoch": 8.59, + "learning_rate": 0.00045393821245312283, + "loss": 0.6657, + "step": 35200 + }, + { + "epoch": 8.6, + "learning_rate": 0.00045390501333276675, + "loss": 0.7187, + "step": 35225 + }, + { + "epoch": 8.6, + "learning_rate": 0.00045387181421241066, + "loss": 0.7508, + "step": 35250 + }, + { + "epoch": 8.61, + "learning_rate": 0.0004538386150920545, + "loss": 0.6859, + "step": 35275 + }, + { + "epoch": 8.61, + "learning_rate": 0.00045380541597169843, + "loss": 0.735, + "step": 35300 + }, + { + "epoch": 8.62, + "learning_rate": 0.0004537722168513423, + "loss": 0.7471, + "step": 35325 + }, + { + "epoch": 8.63, + "learning_rate": 0.0004537390177309862, + "loss": 0.7225, + "step": 35350 + }, + { + "epoch": 8.63, + "learning_rate": 0.00045370581861063007, + "loss": 0.6906, + "step": 35375 + }, + { + "epoch": 8.64, + "learning_rate": 0.000453672619490274, + "loss": 0.7514, + "step": 35400 + }, + { + "epoch": 8.64, + "learning_rate": 0.0004536394203699179, + "loss": 0.6694, + "step": 35425 + }, + { + "epoch": 8.65, + "learning_rate": 0.0004536062212495618, + "loss": 0.7746, + "step": 35450 + }, + { + "epoch": 8.66, + "learning_rate": 0.00045357302212920567, + "loss": 0.701, + "step": 35475 + }, + { + "epoch": 8.66, + "learning_rate": 0.00045353982300884953, + "loss": 0.7392, + "step": 35500 + }, + { + "epoch": 8.67, + "learning_rate": 0.00045350662388849344, + "loss": 0.6876, + "step": 35525 + }, + { + "epoch": 8.67, + "learning_rate": 0.00045347342476813736, + "loss": 0.7694, + "step": 35550 + }, + { + "epoch": 8.68, + "learning_rate": 0.00045344022564778127, + "loss": 0.7055, + "step": 35575 + }, + { + "epoch": 8.69, + "learning_rate": 0.0004534070265274252, + "loss": 0.7324, + "step": 35600 + }, + { + "epoch": 8.69, + "learning_rate": 0.000453373827407069, + "loss": 0.6626, + "step": 35625 + }, + { + "epoch": 8.7, + "learning_rate": 0.0004533406282867129, + "loss": 0.7154, + "step": 35650 + }, + { + "epoch": 8.71, + "learning_rate": 0.0004533074291663568, + "loss": 0.6535, + "step": 35675 + }, + { + "epoch": 8.71, + "learning_rate": 0.00045327423004600073, + "loss": 0.7425, + "step": 35700 + }, + { + "epoch": 8.72, + "learning_rate": 0.0004532410309256446, + "loss": 0.6725, + "step": 35725 + }, + { + "epoch": 8.72, + "learning_rate": 0.0004532078318052885, + "loss": 0.7673, + "step": 35750 + }, + { + "epoch": 8.73, + "learning_rate": 0.00045317463268493237, + "loss": 0.7024, + "step": 35775 + }, + { + "epoch": 8.74, + "learning_rate": 0.0004531414335645763, + "loss": 0.7646, + "step": 35800 + }, + { + "epoch": 8.74, + "learning_rate": 0.0004531082344442202, + "loss": 0.6934, + "step": 35825 + }, + { + "epoch": 8.75, + "learning_rate": 0.00045307503532386405, + "loss": 0.7679, + "step": 35850 + }, + { + "epoch": 8.75, + "learning_rate": 0.00045304183620350797, + "loss": 0.7127, + "step": 35875 + }, + { + "epoch": 8.76, + "learning_rate": 0.0004530086370831519, + "loss": 0.7156, + "step": 35900 + }, + { + "epoch": 8.77, + "learning_rate": 0.00045297543796279574, + "loss": 0.7257, + "step": 35925 + }, + { + "epoch": 8.77, + "learning_rate": 0.0004529422388424396, + "loss": 0.7511, + "step": 35950 + }, + { + "epoch": 8.78, + "learning_rate": 0.0004529090397220835, + "loss": 0.716, + "step": 35975 + }, + { + "epoch": 8.78, + "learning_rate": 0.00045287584060172743, + "loss": 0.6707, + "step": 36000 + }, + { + "epoch": 8.78, + "eval_cer": 0.1483578534542057, + "eval_loss": 0.4949270784854889, + "eval_runtime": 144.1661, + "eval_samples_per_second": 29.085, + "eval_steps_per_second": 7.276, + "eval_wer": 0.5880587275693312, + "step": 36000 + }, + { + "epoch": 8.79, + "learning_rate": 0.00045284264148137134, + "loss": 0.7008, + "step": 36025 + }, + { + "epoch": 8.8, + "learning_rate": 0.00045280944236101526, + "loss": 0.7192, + "step": 36050 + }, + { + "epoch": 8.8, + "learning_rate": 0.00045277624324065906, + "loss": 0.6832, + "step": 36075 + }, + { + "epoch": 8.81, + "learning_rate": 0.000452743044120303, + "loss": 0.6916, + "step": 36100 + }, + { + "epoch": 8.82, + "learning_rate": 0.0004527098449999469, + "loss": 0.7466, + "step": 36125 + }, + { + "epoch": 8.82, + "learning_rate": 0.0004526766458795908, + "loss": 0.7268, + "step": 36150 + }, + { + "epoch": 8.83, + "learning_rate": 0.0004526447747240489, + "loss": 0.7509, + "step": 36175 + }, + { + "epoch": 8.83, + "learning_rate": 0.0004526115756036928, + "loss": 0.7412, + "step": 36200 + }, + { + "epoch": 8.84, + "learning_rate": 0.0004525783764833367, + "loss": 0.7099, + "step": 36225 + }, + { + "epoch": 8.85, + "learning_rate": 0.00045254517736298064, + "loss": 0.7817, + "step": 36250 + }, + { + "epoch": 8.85, + "learning_rate": 0.00045251197824262444, + "loss": 0.7181, + "step": 36275 + }, + { + "epoch": 8.86, + "learning_rate": 0.00045247877912226836, + "loss": 0.7417, + "step": 36300 + }, + { + "epoch": 8.86, + "learning_rate": 0.00045244558000191227, + "loss": 0.7523, + "step": 36325 + }, + { + "epoch": 8.87, + "learning_rate": 0.0004524123808815562, + "loss": 0.7523, + "step": 36350 + }, + { + "epoch": 8.88, + "learning_rate": 0.0004523791817612001, + "loss": 0.6954, + "step": 36375 + }, + { + "epoch": 8.88, + "learning_rate": 0.00045234598264084396, + "loss": 0.7373, + "step": 36400 + }, + { + "epoch": 8.89, + "learning_rate": 0.0004523127835204878, + "loss": 0.6966, + "step": 36425 + }, + { + "epoch": 8.89, + "learning_rate": 0.00045227958440013173, + "loss": 0.7854, + "step": 36450 + }, + { + "epoch": 8.9, + "learning_rate": 0.00045224638527977565, + "loss": 0.7014, + "step": 36475 + }, + { + "epoch": 8.91, + "learning_rate": 0.0004522131861594195, + "loss": 0.6959, + "step": 36500 + }, + { + "epoch": 8.91, + "learning_rate": 0.0004521799870390634, + "loss": 0.6655, + "step": 36525 + }, + { + "epoch": 8.92, + "learning_rate": 0.00045214678791870733, + "loss": 0.7365, + "step": 36550 + }, + { + "epoch": 8.93, + "learning_rate": 0.0004521135887983512, + "loss": 0.7066, + "step": 36575 + }, + { + "epoch": 8.93, + "learning_rate": 0.0004520803896779951, + "loss": 0.7764, + "step": 36600 + }, + { + "epoch": 8.94, + "learning_rate": 0.00045204719055763897, + "loss": 0.7355, + "step": 36625 + }, + { + "epoch": 8.94, + "learning_rate": 0.0004520139914372829, + "loss": 0.737, + "step": 36650 + }, + { + "epoch": 8.95, + "learning_rate": 0.0004519807923169268, + "loss": 0.6743, + "step": 36675 + }, + { + "epoch": 8.96, + "learning_rate": 0.0004519475931965707, + "loss": 0.7412, + "step": 36700 + }, + { + "epoch": 8.96, + "learning_rate": 0.0004519143940762145, + "loss": 0.6972, + "step": 36725 + }, + { + "epoch": 8.97, + "learning_rate": 0.00045188119495585843, + "loss": 0.6959, + "step": 36750 + }, + { + "epoch": 8.97, + "learning_rate": 0.00045184799583550234, + "loss": 0.7406, + "step": 36775 + }, + { + "epoch": 8.98, + "learning_rate": 0.00045181479671514626, + "loss": 0.7489, + "step": 36800 + }, + { + "epoch": 8.99, + "learning_rate": 0.00045178159759479017, + "loss": 0.7189, + "step": 36825 + }, + { + "epoch": 8.99, + "learning_rate": 0.00045174839847443403, + "loss": 0.7095, + "step": 36850 + }, + { + "epoch": 9.0, + "learning_rate": 0.0004517151993540779, + "loss": 0.6805, + "step": 36875 + }, + { + "epoch": 9.0, + "learning_rate": 0.0004516820002337218, + "loss": 0.7752, + "step": 36900 + }, + { + "epoch": 9.01, + "learning_rate": 0.0004516488011133657, + "loss": 0.6744, + "step": 36925 + }, + { + "epoch": 9.02, + "learning_rate": 0.00045161560199300963, + "loss": 0.7001, + "step": 36950 + }, + { + "epoch": 9.02, + "learning_rate": 0.0004515824028726535, + "loss": 0.6452, + "step": 36975 + }, + { + "epoch": 9.03, + "learning_rate": 0.0004515492037522974, + "loss": 0.7344, + "step": 37000 + }, + { + "epoch": 9.03, + "learning_rate": 0.00045151600463194127, + "loss": 0.6445, + "step": 37025 + }, + { + "epoch": 9.04, + "learning_rate": 0.0004514828055115852, + "loss": 0.7017, + "step": 37050 + }, + { + "epoch": 9.05, + "learning_rate": 0.00045144960639122904, + "loss": 0.6833, + "step": 37075 + }, + { + "epoch": 9.05, + "learning_rate": 0.00045141640727087295, + "loss": 0.724, + "step": 37100 + }, + { + "epoch": 9.06, + "learning_rate": 0.00045138320815051687, + "loss": 0.7056, + "step": 37125 + }, + { + "epoch": 9.07, + "learning_rate": 0.0004513500090301608, + "loss": 0.7139, + "step": 37150 + }, + { + "epoch": 9.07, + "learning_rate": 0.00045131680990980464, + "loss": 0.6972, + "step": 37175 + }, + { + "epoch": 9.08, + "learning_rate": 0.0004512836107894485, + "loss": 0.6807, + "step": 37200 + }, + { + "epoch": 9.08, + "learning_rate": 0.0004512504116690924, + "loss": 0.7068, + "step": 37225 + }, + { + "epoch": 9.09, + "learning_rate": 0.00045121721254873633, + "loss": 0.763, + "step": 37250 + }, + { + "epoch": 9.1, + "learning_rate": 0.00045118401342838024, + "loss": 0.6558, + "step": 37275 + }, + { + "epoch": 9.1, + "learning_rate": 0.0004511508143080241, + "loss": 0.7469, + "step": 37300 + }, + { + "epoch": 9.11, + "learning_rate": 0.00045111761518766796, + "loss": 0.6294, + "step": 37325 + }, + { + "epoch": 9.11, + "learning_rate": 0.0004510844160673119, + "loss": 0.7112, + "step": 37350 + }, + { + "epoch": 9.12, + "learning_rate": 0.0004510512169469558, + "loss": 0.6873, + "step": 37375 + }, + { + "epoch": 9.13, + "learning_rate": 0.0004510180178265997, + "loss": 0.7776, + "step": 37400 + }, + { + "epoch": 9.13, + "learning_rate": 0.00045098481870624356, + "loss": 0.6728, + "step": 37425 + }, + { + "epoch": 9.14, + "learning_rate": 0.0004509516195858875, + "loss": 0.747, + "step": 37450 + }, + { + "epoch": 9.14, + "learning_rate": 0.00045091842046553134, + "loss": 0.6623, + "step": 37475 + }, + { + "epoch": 9.15, + "learning_rate": 0.00045088522134517525, + "loss": 0.7196, + "step": 37500 + }, + { + "epoch": 9.16, + "learning_rate": 0.0004508520222248191, + "loss": 0.7017, + "step": 37525 + }, + { + "epoch": 9.16, + "learning_rate": 0.000450818823104463, + "loss": 0.723, + "step": 37550 + }, + { + "epoch": 9.17, + "learning_rate": 0.00045078562398410694, + "loss": 0.66, + "step": 37575 + }, + { + "epoch": 9.18, + "learning_rate": 0.00045075242486375085, + "loss": 0.7111, + "step": 37600 + }, + { + "epoch": 9.18, + "learning_rate": 0.0004507192257433947, + "loss": 0.7159, + "step": 37625 + }, + { + "epoch": 9.19, + "learning_rate": 0.0004506860266230386, + "loss": 0.7171, + "step": 37650 + }, + { + "epoch": 9.19, + "learning_rate": 0.0004506528275026825, + "loss": 0.6743, + "step": 37675 + }, + { + "epoch": 9.2, + "learning_rate": 0.0004506196283823264, + "loss": 0.7218, + "step": 37700 + }, + { + "epoch": 9.21, + "learning_rate": 0.0004505864292619703, + "loss": 0.6664, + "step": 37725 + }, + { + "epoch": 9.21, + "learning_rate": 0.0004505532301416142, + "loss": 0.7363, + "step": 37750 + }, + { + "epoch": 9.22, + "learning_rate": 0.00045052003102125803, + "loss": 0.6426, + "step": 37775 + }, + { + "epoch": 9.22, + "learning_rate": 0.00045048683190090195, + "loss": 0.664, + "step": 37800 + }, + { + "epoch": 9.23, + "learning_rate": 0.00045045363278054586, + "loss": 0.7016, + "step": 37825 + }, + { + "epoch": 9.24, + "learning_rate": 0.0004504204336601898, + "loss": 0.6749, + "step": 37850 + }, + { + "epoch": 9.24, + "learning_rate": 0.00045038723453983364, + "loss": 0.6577, + "step": 37875 + }, + { + "epoch": 9.25, + "learning_rate": 0.00045035403541947755, + "loss": 0.744, + "step": 37900 + }, + { + "epoch": 9.25, + "learning_rate": 0.0004503208362991214, + "loss": 0.6835, + "step": 37925 + }, + { + "epoch": 9.26, + "learning_rate": 0.0004502876371787653, + "loss": 0.7322, + "step": 37950 + }, + { + "epoch": 9.27, + "learning_rate": 0.0004502544380584092, + "loss": 0.708, + "step": 37975 + }, + { + "epoch": 9.27, + "learning_rate": 0.0004502212389380531, + "loss": 0.7195, + "step": 38000 + }, + { + "epoch": 9.28, + "learning_rate": 0.000450188039817697, + "loss": 0.6804, + "step": 38025 + }, + { + "epoch": 9.29, + "learning_rate": 0.0004501548406973409, + "loss": 0.7341, + "step": 38050 + }, + { + "epoch": 9.29, + "learning_rate": 0.0004501216415769848, + "loss": 0.7179, + "step": 38075 + }, + { + "epoch": 9.3, + "learning_rate": 0.00045008844245662865, + "loss": 0.7163, + "step": 38100 + }, + { + "epoch": 9.3, + "learning_rate": 0.00045005524333627256, + "loss": 0.6866, + "step": 38125 + }, + { + "epoch": 9.31, + "learning_rate": 0.0004500220442159165, + "loss": 0.7201, + "step": 38150 + }, + { + "epoch": 9.32, + "learning_rate": 0.0004499888450955604, + "loss": 0.6692, + "step": 38175 + }, + { + "epoch": 9.32, + "learning_rate": 0.0004499556459752043, + "loss": 0.6772, + "step": 38200 + }, + { + "epoch": 9.33, + "learning_rate": 0.0004499224468548481, + "loss": 0.6355, + "step": 38225 + }, + { + "epoch": 9.33, + "learning_rate": 0.000449889247734492, + "loss": 0.7786, + "step": 38250 + }, + { + "epoch": 9.34, + "learning_rate": 0.00044985604861413593, + "loss": 0.691, + "step": 38275 + }, + { + "epoch": 9.35, + "learning_rate": 0.00044982284949377985, + "loss": 0.6757, + "step": 38300 + }, + { + "epoch": 9.35, + "learning_rate": 0.0004497896503734237, + "loss": 0.6706, + "step": 38325 + }, + { + "epoch": 9.36, + "learning_rate": 0.0004497564512530676, + "loss": 0.709, + "step": 38350 + }, + { + "epoch": 9.36, + "learning_rate": 0.0004497232521327115, + "loss": 0.6798, + "step": 38375 + }, + { + "epoch": 9.37, + "learning_rate": 0.0004496900530123554, + "loss": 0.7252, + "step": 38400 + }, + { + "epoch": 9.38, + "learning_rate": 0.0004496568538919993, + "loss": 0.6908, + "step": 38425 + }, + { + "epoch": 9.38, + "learning_rate": 0.00044962365477164317, + "loss": 0.7345, + "step": 38450 + }, + { + "epoch": 9.39, + "learning_rate": 0.0004495904556512871, + "loss": 0.7017, + "step": 38475 + }, + { + "epoch": 9.39, + "learning_rate": 0.000449557256530931, + "loss": 0.7145, + "step": 38500 + }, + { + "epoch": 9.4, + "learning_rate": 0.00044952405741057486, + "loss": 0.6815, + "step": 38525 + }, + { + "epoch": 9.41, + "learning_rate": 0.0004494908582902187, + "loss": 0.7273, + "step": 38550 + }, + { + "epoch": 9.41, + "learning_rate": 0.00044945765916986263, + "loss": 0.6296, + "step": 38575 + }, + { + "epoch": 9.42, + "learning_rate": 0.00044942446004950655, + "loss": 0.7299, + "step": 38600 + }, + { + "epoch": 9.43, + "learning_rate": 0.00044939126092915046, + "loss": 0.6673, + "step": 38625 + }, + { + "epoch": 9.43, + "learning_rate": 0.0004493580618087944, + "loss": 0.6781, + "step": 38650 + }, + { + "epoch": 9.44, + "learning_rate": 0.0004493248626884382, + "loss": 0.6999, + "step": 38675 + }, + { + "epoch": 9.44, + "learning_rate": 0.0004492916635680821, + "loss": 0.6705, + "step": 38700 + }, + { + "epoch": 9.45, + "learning_rate": 0.000449258464447726, + "loss": 0.6873, + "step": 38725 + }, + { + "epoch": 9.46, + "learning_rate": 0.0004492252653273699, + "loss": 0.7198, + "step": 38750 + }, + { + "epoch": 9.46, + "learning_rate": 0.0004491920662070138, + "loss": 0.6728, + "step": 38775 + }, + { + "epoch": 9.47, + "learning_rate": 0.0004491588670866577, + "loss": 0.7017, + "step": 38800 + }, + { + "epoch": 9.47, + "learning_rate": 0.00044912566796630155, + "loss": 0.7148, + "step": 38825 + }, + { + "epoch": 9.48, + "learning_rate": 0.00044909246884594547, + "loss": 0.7188, + "step": 38850 + }, + { + "epoch": 9.49, + "learning_rate": 0.0004490592697255894, + "loss": 0.6564, + "step": 38875 + }, + { + "epoch": 9.49, + "learning_rate": 0.00044902607060523324, + "loss": 0.6816, + "step": 38900 + }, + { + "epoch": 9.5, + "learning_rate": 0.00044899287148487716, + "loss": 0.6847, + "step": 38925 + }, + { + "epoch": 9.5, + "learning_rate": 0.00044895967236452107, + "loss": 0.6948, + "step": 38950 + }, + { + "epoch": 9.51, + "learning_rate": 0.00044892647324416493, + "loss": 0.7111, + "step": 38975 + }, + { + "epoch": 9.52, + "learning_rate": 0.0004488932741238088, + "loss": 0.719, + "step": 39000 + }, + { + "epoch": 9.52, + "eval_cer": 0.15075511021221114, + "eval_loss": 0.5013872385025024, + "eval_runtime": 145.9791, + "eval_samples_per_second": 28.723, + "eval_steps_per_second": 7.186, + "eval_wer": 0.5959216965742251, + "step": 39000 + }, + { + "epoch": 9.52, + "learning_rate": 0.0004488600750034527, + "loss": 0.6854, + "step": 39025 + }, + { + "epoch": 9.53, + "learning_rate": 0.0004488268758830966, + "loss": 0.678, + "step": 39050 + }, + { + "epoch": 9.54, + "learning_rate": 0.00044879367676274053, + "loss": 0.6631, + "step": 39075 + }, + { + "epoch": 9.54, + "learning_rate": 0.00044876047764238445, + "loss": 0.7081, + "step": 39100 + }, + { + "epoch": 9.55, + "learning_rate": 0.00044872727852202825, + "loss": 0.6705, + "step": 39125 + }, + { + "epoch": 9.55, + "learning_rate": 0.00044869407940167216, + "loss": 0.729, + "step": 39150 + }, + { + "epoch": 9.56, + "learning_rate": 0.0004486608802813161, + "loss": 0.7027, + "step": 39175 + }, + { + "epoch": 9.57, + "learning_rate": 0.00044862768116096, + "loss": 0.7308, + "step": 39200 + }, + { + "epoch": 9.57, + "learning_rate": 0.0004485944820406039, + "loss": 0.7288, + "step": 39225 + }, + { + "epoch": 9.58, + "learning_rate": 0.00044856128292024777, + "loss": 0.7452, + "step": 39250 + }, + { + "epoch": 9.58, + "learning_rate": 0.0004485280837998916, + "loss": 0.6672, + "step": 39275 + }, + { + "epoch": 9.59, + "learning_rate": 0.00044849488467953554, + "loss": 0.7339, + "step": 39300 + }, + { + "epoch": 9.6, + "learning_rate": 0.00044846168555917945, + "loss": 0.6634, + "step": 39325 + }, + { + "epoch": 9.6, + "learning_rate": 0.0004484284864388233, + "loss": 0.753, + "step": 39350 + }, + { + "epoch": 9.61, + "learning_rate": 0.00044839528731846723, + "loss": 0.7163, + "step": 39375 + }, + { + "epoch": 9.61, + "learning_rate": 0.00044836208819811114, + "loss": 0.688, + "step": 39400 + }, + { + "epoch": 9.62, + "learning_rate": 0.000448328889077755, + "loss": 0.6879, + "step": 39425 + }, + { + "epoch": 9.63, + "learning_rate": 0.00044829701792221315, + "loss": 0.6762, + "step": 39450 + }, + { + "epoch": 9.63, + "learning_rate": 0.000448263818801857, + "loss": 0.6697, + "step": 39475 + }, + { + "epoch": 9.64, + "learning_rate": 0.0004482306196815009, + "loss": 0.7131, + "step": 39500 + }, + { + "epoch": 9.64, + "learning_rate": 0.00044819742056114483, + "loss": 0.6714, + "step": 39525 + }, + { + "epoch": 9.65, + "learning_rate": 0.00044816422144078875, + "loss": 0.7331, + "step": 39550 + }, + { + "epoch": 9.66, + "learning_rate": 0.0004481310223204326, + "loss": 0.669, + "step": 39575 + }, + { + "epoch": 9.66, + "learning_rate": 0.0004480978232000765, + "loss": 0.7278, + "step": 39600 + }, + { + "epoch": 9.67, + "learning_rate": 0.0004480646240797204, + "loss": 0.71, + "step": 39625 + }, + { + "epoch": 9.68, + "learning_rate": 0.0004480314249593643, + "loss": 0.7189, + "step": 39650 + }, + { + "epoch": 9.68, + "learning_rate": 0.00044799822583900815, + "loss": 0.6807, + "step": 39675 + }, + { + "epoch": 9.69, + "learning_rate": 0.00044796502671865207, + "loss": 0.7424, + "step": 39700 + }, + { + "epoch": 9.69, + "learning_rate": 0.000447931827598296, + "loss": 0.6599, + "step": 39725 + }, + { + "epoch": 9.7, + "learning_rate": 0.0004478986284779399, + "loss": 0.7126, + "step": 39750 + }, + { + "epoch": 9.71, + "learning_rate": 0.00044786542935758376, + "loss": 0.6809, + "step": 39775 + }, + { + "epoch": 9.71, + "learning_rate": 0.0004478322302372276, + "loss": 0.7082, + "step": 39800 + }, + { + "epoch": 9.72, + "learning_rate": 0.00044779903111687153, + "loss": 0.6746, + "step": 39825 + }, + { + "epoch": 9.72, + "learning_rate": 0.00044776583199651544, + "loss": 0.7128, + "step": 39850 + }, + { + "epoch": 9.73, + "learning_rate": 0.00044773263287615936, + "loss": 0.6563, + "step": 39875 + }, + { + "epoch": 9.74, + "learning_rate": 0.0004476994337558032, + "loss": 0.7062, + "step": 39900 + }, + { + "epoch": 9.74, + "learning_rate": 0.0004476662346354471, + "loss": 0.7103, + "step": 39925 + }, + { + "epoch": 9.75, + "learning_rate": 0.000447633035515091, + "loss": 0.7658, + "step": 39950 + }, + { + "epoch": 9.75, + "learning_rate": 0.0004475998363947349, + "loss": 0.71, + "step": 39975 + }, + { + "epoch": 9.76, + "learning_rate": 0.0004475666372743788, + "loss": 0.7136, + "step": 40000 + }, + { + "epoch": 9.77, + "learning_rate": 0.0004475334381540227, + "loss": 0.6374, + "step": 40025 + }, + { + "epoch": 9.77, + "learning_rate": 0.0004475002390336666, + "loss": 0.7416, + "step": 40050 + }, + { + "epoch": 9.78, + "learning_rate": 0.00044746703991331045, + "loss": 0.6768, + "step": 40075 + }, + { + "epoch": 9.79, + "learning_rate": 0.00044743384079295437, + "loss": 0.7113, + "step": 40100 + }, + { + "epoch": 9.79, + "learning_rate": 0.0004474006416725982, + "loss": 0.7097, + "step": 40125 + }, + { + "epoch": 9.8, + "learning_rate": 0.00044736744255224214, + "loss": 0.73, + "step": 40150 + }, + { + "epoch": 9.8, + "learning_rate": 0.00044733424343188606, + "loss": 0.6649, + "step": 40175 + }, + { + "epoch": 9.81, + "learning_rate": 0.0004473010443115299, + "loss": 0.7055, + "step": 40200 + }, + { + "epoch": 9.82, + "learning_rate": 0.00044726784519117383, + "loss": 0.7035, + "step": 40225 + }, + { + "epoch": 9.82, + "learning_rate": 0.0004472346460708177, + "loss": 0.6875, + "step": 40250 + }, + { + "epoch": 9.83, + "learning_rate": 0.0004472014469504616, + "loss": 0.6591, + "step": 40275 + }, + { + "epoch": 9.83, + "learning_rate": 0.0004471682478301055, + "loss": 0.7477, + "step": 40300 + }, + { + "epoch": 9.84, + "learning_rate": 0.00044713504870974943, + "loss": 0.6654, + "step": 40325 + }, + { + "epoch": 9.85, + "learning_rate": 0.00044710184958939324, + "loss": 0.7281, + "step": 40350 + }, + { + "epoch": 9.85, + "learning_rate": 0.00044706865046903715, + "loss": 0.7106, + "step": 40375 + }, + { + "epoch": 9.86, + "learning_rate": 0.00044703545134868106, + "loss": 0.6784, + "step": 40400 + }, + { + "epoch": 9.86, + "learning_rate": 0.000447002252228325, + "loss": 0.7191, + "step": 40425 + }, + { + "epoch": 9.87, + "learning_rate": 0.0004469690531079689, + "loss": 0.7231, + "step": 40450 + }, + { + "epoch": 9.88, + "learning_rate": 0.00044693585398761275, + "loss": 0.6801, + "step": 40475 + }, + { + "epoch": 9.88, + "learning_rate": 0.0004469026548672566, + "loss": 0.7126, + "step": 40500 + }, + { + "epoch": 9.89, + "learning_rate": 0.0004468694557469005, + "loss": 0.6579, + "step": 40525 + }, + { + "epoch": 9.9, + "learning_rate": 0.00044683625662654444, + "loss": 0.7128, + "step": 40550 + }, + { + "epoch": 9.9, + "learning_rate": 0.0004468030575061883, + "loss": 0.677, + "step": 40575 + }, + { + "epoch": 9.91, + "learning_rate": 0.0004467698583858322, + "loss": 0.707, + "step": 40600 + }, + { + "epoch": 9.91, + "learning_rate": 0.00044673665926547613, + "loss": 0.6787, + "step": 40625 + }, + { + "epoch": 9.92, + "learning_rate": 0.00044670346014512, + "loss": 0.7532, + "step": 40650 + }, + { + "epoch": 9.93, + "learning_rate": 0.0004466702610247639, + "loss": 0.6928, + "step": 40675 + }, + { + "epoch": 9.93, + "learning_rate": 0.00044663706190440776, + "loss": 0.7258, + "step": 40700 + }, + { + "epoch": 9.94, + "learning_rate": 0.0004466038627840517, + "loss": 0.6488, + "step": 40725 + }, + { + "epoch": 9.94, + "learning_rate": 0.0004465706636636956, + "loss": 0.731, + "step": 40750 + }, + { + "epoch": 9.95, + "learning_rate": 0.0004465374645433395, + "loss": 0.6426, + "step": 40775 + }, + { + "epoch": 9.96, + "learning_rate": 0.00044650426542298336, + "loss": 0.7102, + "step": 40800 + }, + { + "epoch": 9.96, + "learning_rate": 0.0004464710663026272, + "loss": 0.6771, + "step": 40825 + }, + { + "epoch": 9.97, + "learning_rate": 0.00044643786718227114, + "loss": 0.7049, + "step": 40850 + }, + { + "epoch": 9.97, + "learning_rate": 0.00044640466806191505, + "loss": 0.6875, + "step": 40875 + }, + { + "epoch": 9.98, + "learning_rate": 0.00044637146894155896, + "loss": 0.7471, + "step": 40900 + }, + { + "epoch": 9.99, + "learning_rate": 0.0004463382698212028, + "loss": 0.6649, + "step": 40925 + }, + { + "epoch": 9.99, + "learning_rate": 0.0004463050707008467, + "loss": 0.7104, + "step": 40950 + }, + { + "epoch": 10.0, + "learning_rate": 0.0004462718715804906, + "loss": 0.6589, + "step": 40975 + }, + { + "epoch": 10.0, + "learning_rate": 0.0004462386724601345, + "loss": 0.7005, + "step": 41000 + }, + { + "epoch": 10.01, + "learning_rate": 0.0004462054733397784, + "loss": 0.661, + "step": 41025 + }, + { + "epoch": 10.02, + "learning_rate": 0.0004461722742194223, + "loss": 0.6775, + "step": 41050 + }, + { + "epoch": 10.02, + "learning_rate": 0.0004461390750990662, + "loss": 0.6869, + "step": 41075 + }, + { + "epoch": 10.03, + "learning_rate": 0.00044610587597871006, + "loss": 0.6901, + "step": 41100 + }, + { + "epoch": 10.04, + "learning_rate": 0.000446072676858354, + "loss": 0.6488, + "step": 41125 + }, + { + "epoch": 10.04, + "learning_rate": 0.00044603947773799783, + "loss": 0.6936, + "step": 41150 + }, + { + "epoch": 10.05, + "learning_rate": 0.00044600627861764175, + "loss": 0.6753, + "step": 41175 + }, + { + "epoch": 10.05, + "learning_rate": 0.00044597307949728566, + "loss": 0.6729, + "step": 41200 + }, + { + "epoch": 10.06, + "learning_rate": 0.0004459398803769296, + "loss": 0.6251, + "step": 41225 + }, + { + "epoch": 10.07, + "learning_rate": 0.00044590668125657343, + "loss": 0.6957, + "step": 41250 + }, + { + "epoch": 10.07, + "learning_rate": 0.0004458734821362173, + "loss": 0.6599, + "step": 41275 + }, + { + "epoch": 10.08, + "learning_rate": 0.0004458402830158612, + "loss": 0.6987, + "step": 41300 + }, + { + "epoch": 10.08, + "learning_rate": 0.0004458070838955051, + "loss": 0.6458, + "step": 41325 + }, + { + "epoch": 10.09, + "learning_rate": 0.00044577388477514904, + "loss": 0.6997, + "step": 41350 + }, + { + "epoch": 10.1, + "learning_rate": 0.0004457406856547929, + "loss": 0.6358, + "step": 41375 + }, + { + "epoch": 10.1, + "learning_rate": 0.00044570748653443676, + "loss": 0.6762, + "step": 41400 + }, + { + "epoch": 10.11, + "learning_rate": 0.00044567428741408067, + "loss": 0.65, + "step": 41425 + }, + { + "epoch": 10.11, + "learning_rate": 0.0004456410882937246, + "loss": 0.6963, + "step": 41450 + }, + { + "epoch": 10.12, + "learning_rate": 0.0004456078891733685, + "loss": 0.6206, + "step": 41475 + }, + { + "epoch": 10.13, + "learning_rate": 0.00044557469005301236, + "loss": 0.7114, + "step": 41500 + }, + { + "epoch": 10.13, + "learning_rate": 0.00044554149093265627, + "loss": 0.6766, + "step": 41525 + }, + { + "epoch": 10.14, + "learning_rate": 0.00044550829181230013, + "loss": 0.6714, + "step": 41550 + }, + { + "epoch": 10.15, + "learning_rate": 0.00044547509269194405, + "loss": 0.6488, + "step": 41575 + }, + { + "epoch": 10.15, + "learning_rate": 0.0004454418935715879, + "loss": 0.689, + "step": 41600 + }, + { + "epoch": 10.16, + "learning_rate": 0.0004454086944512318, + "loss": 0.6763, + "step": 41625 + }, + { + "epoch": 10.16, + "learning_rate": 0.00044537549533087573, + "loss": 0.6771, + "step": 41650 + }, + { + "epoch": 10.17, + "learning_rate": 0.00044534229621051965, + "loss": 0.6449, + "step": 41675 + }, + { + "epoch": 10.18, + "learning_rate": 0.0004453090970901635, + "loss": 0.7202, + "step": 41700 + }, + { + "epoch": 10.18, + "learning_rate": 0.00044527589796980737, + "loss": 0.6936, + "step": 41725 + }, + { + "epoch": 10.19, + "learning_rate": 0.0004452426988494513, + "loss": 0.7044, + "step": 41750 + }, + { + "epoch": 10.19, + "learning_rate": 0.0004452094997290952, + "loss": 0.6643, + "step": 41775 + }, + { + "epoch": 10.2, + "learning_rate": 0.0004451763006087391, + "loss": 0.6966, + "step": 41800 + }, + { + "epoch": 10.21, + "learning_rate": 0.000445143101488383, + "loss": 0.6873, + "step": 41825 + }, + { + "epoch": 10.21, + "learning_rate": 0.00044510990236802683, + "loss": 0.7328, + "step": 41850 + }, + { + "epoch": 10.22, + "learning_rate": 0.00044507670324767074, + "loss": 0.6346, + "step": 41875 + }, + { + "epoch": 10.22, + "learning_rate": 0.00044504350412731466, + "loss": 0.6716, + "step": 41900 + }, + { + "epoch": 10.23, + "learning_rate": 0.00044501030500695857, + "loss": 0.6719, + "step": 41925 + }, + { + "epoch": 10.24, + "learning_rate": 0.00044497710588660243, + "loss": 0.7415, + "step": 41950 + }, + { + "epoch": 10.24, + "learning_rate": 0.00044494390676624634, + "loss": 0.6444, + "step": 41975 + }, + { + "epoch": 10.25, + "learning_rate": 0.0004449107076458902, + "loss": 0.6563, + "step": 42000 + }, + { + "epoch": 10.25, + "eval_cer": 0.14417420407995646, + "eval_loss": 0.4852425754070282, + "eval_runtime": 146.8969, + "eval_samples_per_second": 28.544, + "eval_steps_per_second": 7.141, + "eval_wer": 0.5690701468189233, + "step": 42000 + }, + { + "epoch": 10.26, + "learning_rate": 0.0004448775085255341, + "loss": 0.6437, + "step": 42025 + }, + { + "epoch": 10.26, + "learning_rate": 0.00044484430940517803, + "loss": 0.7146, + "step": 42050 + }, + { + "epoch": 10.27, + "learning_rate": 0.0004448111102848219, + "loss": 0.6791, + "step": 42075 + }, + { + "epoch": 10.27, + "learning_rate": 0.0004447779111644658, + "loss": 0.7027, + "step": 42100 + }, + { + "epoch": 10.28, + "learning_rate": 0.0004447447120441097, + "loss": 0.6643, + "step": 42125 + }, + { + "epoch": 10.29, + "learning_rate": 0.0004447115129237536, + "loss": 0.693, + "step": 42150 + }, + { + "epoch": 10.29, + "learning_rate": 0.00044467831380339744, + "loss": 0.6317, + "step": 42175 + }, + { + "epoch": 10.3, + "learning_rate": 0.00044464511468304135, + "loss": 0.72, + "step": 42200 + }, + { + "epoch": 10.3, + "learning_rate": 0.00044461191556268527, + "loss": 0.6405, + "step": 42225 + }, + { + "epoch": 10.31, + "learning_rate": 0.0004445787164423292, + "loss": 0.7249, + "step": 42250 + }, + { + "epoch": 10.32, + "learning_rate": 0.0004445455173219731, + "loss": 0.7042, + "step": 42275 + }, + { + "epoch": 10.32, + "learning_rate": 0.0004445123182016169, + "loss": 0.7549, + "step": 42300 + }, + { + "epoch": 10.33, + "learning_rate": 0.0004444791190812608, + "loss": 0.6494, + "step": 42325 + }, + { + "epoch": 10.33, + "learning_rate": 0.00044444591996090473, + "loss": 0.6912, + "step": 42350 + }, + { + "epoch": 10.34, + "learning_rate": 0.00044441272084054864, + "loss": 0.6709, + "step": 42375 + }, + { + "epoch": 10.35, + "learning_rate": 0.0004443795217201925, + "loss": 0.6731, + "step": 42400 + }, + { + "epoch": 10.35, + "learning_rate": 0.0004443463225998364, + "loss": 0.6616, + "step": 42425 + }, + { + "epoch": 10.36, + "learning_rate": 0.0004443131234794803, + "loss": 0.6595, + "step": 42450 + }, + { + "epoch": 10.36, + "learning_rate": 0.0004442799243591242, + "loss": 0.671, + "step": 42475 + }, + { + "epoch": 10.37, + "learning_rate": 0.0004442467252387681, + "loss": 0.7151, + "step": 42500 + }, + { + "epoch": 10.38, + "learning_rate": 0.00044421352611841196, + "loss": 0.7016, + "step": 42525 + }, + { + "epoch": 10.38, + "learning_rate": 0.0004441803269980559, + "loss": 0.6729, + "step": 42550 + }, + { + "epoch": 10.39, + "learning_rate": 0.0004441471278776998, + "loss": 0.6412, + "step": 42575 + }, + { + "epoch": 10.4, + "learning_rate": 0.00044411392875734365, + "loss": 0.6664, + "step": 42600 + }, + { + "epoch": 10.4, + "learning_rate": 0.0004440807296369875, + "loss": 0.6066, + "step": 42625 + }, + { + "epoch": 10.41, + "learning_rate": 0.0004440475305166314, + "loss": 0.7433, + "step": 42650 + }, + { + "epoch": 10.41, + "learning_rate": 0.00044401433139627534, + "loss": 0.6678, + "step": 42675 + }, + { + "epoch": 10.42, + "learning_rate": 0.00044398113227591925, + "loss": 0.7147, + "step": 42700 + }, + { + "epoch": 10.43, + "learning_rate": 0.00044394793315556317, + "loss": 0.6558, + "step": 42725 + }, + { + "epoch": 10.43, + "learning_rate": 0.00044391473403520697, + "loss": 0.7616, + "step": 42750 + }, + { + "epoch": 10.44, + "learning_rate": 0.0004438815349148509, + "loss": 0.6852, + "step": 42775 + }, + { + "epoch": 10.44, + "learning_rate": 0.0004438483357944948, + "loss": 0.6825, + "step": 42800 + }, + { + "epoch": 10.45, + "learning_rate": 0.0004438151366741387, + "loss": 0.6371, + "step": 42825 + }, + { + "epoch": 10.46, + "learning_rate": 0.0004437819375537826, + "loss": 0.6984, + "step": 42850 + }, + { + "epoch": 10.46, + "learning_rate": 0.0004437487384334265, + "loss": 0.64, + "step": 42875 + }, + { + "epoch": 10.47, + "learning_rate": 0.00044371553931307035, + "loss": 0.6893, + "step": 42900 + }, + { + "epoch": 10.47, + "learning_rate": 0.00044368234019271426, + "loss": 0.6656, + "step": 42925 + }, + { + "epoch": 10.48, + "learning_rate": 0.0004436491410723582, + "loss": 0.6727, + "step": 42950 + }, + { + "epoch": 10.49, + "learning_rate": 0.00044361594195200204, + "loss": 0.5953, + "step": 42975 + }, + { + "epoch": 10.49, + "learning_rate": 0.00044358274283164595, + "loss": 0.7229, + "step": 43000 + }, + { + "epoch": 10.5, + "learning_rate": 0.00044354954371128986, + "loss": 0.6533, + "step": 43025 + }, + { + "epoch": 10.51, + "learning_rate": 0.0004435163445909337, + "loss": 0.6537, + "step": 43050 + }, + { + "epoch": 10.51, + "learning_rate": 0.0004434831454705776, + "loss": 0.6482, + "step": 43075 + }, + { + "epoch": 10.52, + "learning_rate": 0.0004434499463502215, + "loss": 0.684, + "step": 43100 + }, + { + "epoch": 10.52, + "learning_rate": 0.0004434167472298654, + "loss": 0.5997, + "step": 43125 + }, + { + "epoch": 10.53, + "learning_rate": 0.0004433835481095093, + "loss": 0.6668, + "step": 43150 + }, + { + "epoch": 10.54, + "learning_rate": 0.00044335034898915324, + "loss": 0.6491, + "step": 43175 + }, + { + "epoch": 10.54, + "learning_rate": 0.00044331714986879704, + "loss": 0.7128, + "step": 43200 + }, + { + "epoch": 10.55, + "learning_rate": 0.00044328395074844096, + "loss": 0.6342, + "step": 43225 + }, + { + "epoch": 10.55, + "learning_rate": 0.00044325075162808487, + "loss": 0.6943, + "step": 43250 + }, + { + "epoch": 10.56, + "learning_rate": 0.0004432175525077288, + "loss": 0.6803, + "step": 43275 + }, + { + "epoch": 10.57, + "learning_rate": 0.0004431843533873727, + "loss": 0.7371, + "step": 43300 + }, + { + "epoch": 10.57, + "learning_rate": 0.00044315115426701656, + "loss": 0.6904, + "step": 43325 + }, + { + "epoch": 10.58, + "learning_rate": 0.0004431179551466604, + "loss": 0.6995, + "step": 43350 + }, + { + "epoch": 10.58, + "learning_rate": 0.00044308475602630433, + "loss": 0.6529, + "step": 43375 + }, + { + "epoch": 10.59, + "learning_rate": 0.00044305155690594825, + "loss": 0.7138, + "step": 43400 + }, + { + "epoch": 10.6, + "learning_rate": 0.0004430183577855921, + "loss": 0.6653, + "step": 43425 + }, + { + "epoch": 10.6, + "learning_rate": 0.000442985158665236, + "loss": 0.6868, + "step": 43450 + }, + { + "epoch": 10.61, + "learning_rate": 0.00044295195954487994, + "loss": 0.6545, + "step": 43475 + }, + { + "epoch": 10.61, + "learning_rate": 0.0004429187604245238, + "loss": 0.696, + "step": 43500 + }, + { + "epoch": 10.62, + "learning_rate": 0.0004428855613041677, + "loss": 0.6071, + "step": 43525 + }, + { + "epoch": 10.63, + "learning_rate": 0.00044285236218381157, + "loss": 0.6957, + "step": 43550 + }, + { + "epoch": 10.63, + "learning_rate": 0.0004428191630634555, + "loss": 0.6626, + "step": 43575 + }, + { + "epoch": 10.64, + "learning_rate": 0.0004427859639430994, + "loss": 0.706, + "step": 43600 + }, + { + "epoch": 10.65, + "learning_rate": 0.0004427527648227433, + "loss": 0.6271, + "step": 43625 + }, + { + "epoch": 10.65, + "learning_rate": 0.0004427195657023871, + "loss": 0.6782, + "step": 43650 + }, + { + "epoch": 10.66, + "learning_rate": 0.00044268636658203103, + "loss": 0.6682, + "step": 43675 + }, + { + "epoch": 10.66, + "learning_rate": 0.00044265316746167494, + "loss": 0.6901, + "step": 43700 + }, + { + "epoch": 10.67, + "learning_rate": 0.00044261996834131886, + "loss": 0.6317, + "step": 43725 + }, + { + "epoch": 10.68, + "learning_rate": 0.00044258676922096277, + "loss": 0.6766, + "step": 43750 + }, + { + "epoch": 10.68, + "learning_rate": 0.00044255357010060663, + "loss": 0.5699, + "step": 43775 + }, + { + "epoch": 10.69, + "learning_rate": 0.0004425203709802505, + "loss": 0.72, + "step": 43800 + }, + { + "epoch": 10.69, + "learning_rate": 0.0004424871718598944, + "loss": 0.635, + "step": 43825 + }, + { + "epoch": 10.7, + "learning_rate": 0.0004424539727395383, + "loss": 0.7373, + "step": 43850 + }, + { + "epoch": 10.71, + "learning_rate": 0.0004424207736191822, + "loss": 0.6996, + "step": 43875 + }, + { + "epoch": 10.71, + "learning_rate": 0.0004423875744988261, + "loss": 0.6847, + "step": 43900 + }, + { + "epoch": 10.72, + "learning_rate": 0.00044235570334328424, + "loss": 0.6777, + "step": 43925 + }, + { + "epoch": 10.72, + "learning_rate": 0.00044232250422292815, + "loss": 0.7208, + "step": 43950 + }, + { + "epoch": 10.73, + "learning_rate": 0.000442289305102572, + "loss": 0.6545, + "step": 43975 + }, + { + "epoch": 10.74, + "learning_rate": 0.00044225610598221587, + "loss": 0.6631, + "step": 44000 + }, + { + "epoch": 10.74, + "learning_rate": 0.0004422229068618598, + "loss": 0.6274, + "step": 44025 + }, + { + "epoch": 10.75, + "learning_rate": 0.0004421897077415037, + "loss": 0.688, + "step": 44050 + }, + { + "epoch": 10.76, + "learning_rate": 0.0004421565086211476, + "loss": 0.6188, + "step": 44075 + }, + { + "epoch": 10.76, + "learning_rate": 0.00044212330950079147, + "loss": 0.6948, + "step": 44100 + }, + { + "epoch": 10.77, + "learning_rate": 0.0004420901103804354, + "loss": 0.6858, + "step": 44125 + }, + { + "epoch": 10.77, + "learning_rate": 0.00044205691126007925, + "loss": 0.7341, + "step": 44150 + }, + { + "epoch": 10.78, + "learning_rate": 0.00044202371213972316, + "loss": 0.6184, + "step": 44175 + }, + { + "epoch": 10.79, + "learning_rate": 0.000441990513019367, + "loss": 0.6862, + "step": 44200 + }, + { + "epoch": 10.79, + "learning_rate": 0.00044195731389901093, + "loss": 0.6461, + "step": 44225 + }, + { + "epoch": 10.8, + "learning_rate": 0.00044192411477865485, + "loss": 0.7194, + "step": 44250 + }, + { + "epoch": 10.8, + "learning_rate": 0.00044189091565829876, + "loss": 0.6877, + "step": 44275 + }, + { + "epoch": 10.81, + "learning_rate": 0.0004418577165379426, + "loss": 0.7203, + "step": 44300 + }, + { + "epoch": 10.82, + "learning_rate": 0.0004418245174175865, + "loss": 0.6138, + "step": 44325 + }, + { + "epoch": 10.82, + "learning_rate": 0.0004417913182972304, + "loss": 0.7073, + "step": 44350 + }, + { + "epoch": 10.83, + "learning_rate": 0.0004417581191768743, + "loss": 0.6408, + "step": 44375 + }, + { + "epoch": 10.83, + "learning_rate": 0.0004417249200565182, + "loss": 0.6973, + "step": 44400 + }, + { + "epoch": 10.84, + "learning_rate": 0.00044169172093616214, + "loss": 0.6758, + "step": 44425 + }, + { + "epoch": 10.85, + "learning_rate": 0.00044165852181580594, + "loss": 0.717, + "step": 44450 + }, + { + "epoch": 10.85, + "learning_rate": 0.00044162532269544986, + "loss": 0.6669, + "step": 44475 + }, + { + "epoch": 10.86, + "learning_rate": 0.00044159212357509377, + "loss": 0.7094, + "step": 44500 + }, + { + "epoch": 10.87, + "learning_rate": 0.0004415589244547377, + "loss": 0.6459, + "step": 44525 + }, + { + "epoch": 10.87, + "learning_rate": 0.00044152572533438154, + "loss": 0.6706, + "step": 44550 + }, + { + "epoch": 10.88, + "learning_rate": 0.00044149252621402546, + "loss": 0.6072, + "step": 44575 + }, + { + "epoch": 10.88, + "learning_rate": 0.0004414593270936693, + "loss": 0.7027, + "step": 44600 + }, + { + "epoch": 10.89, + "learning_rate": 0.00044142612797331323, + "loss": 0.637, + "step": 44625 + }, + { + "epoch": 10.9, + "learning_rate": 0.00044139292885295715, + "loss": 0.7063, + "step": 44650 + }, + { + "epoch": 10.9, + "learning_rate": 0.000441359729732601, + "loss": 0.7203, + "step": 44675 + }, + { + "epoch": 10.91, + "learning_rate": 0.0004413265306122449, + "loss": 0.6884, + "step": 44700 + }, + { + "epoch": 10.91, + "learning_rate": 0.00044129333149188883, + "loss": 0.6446, + "step": 44725 + }, + { + "epoch": 10.92, + "learning_rate": 0.0004412601323715327, + "loss": 0.739, + "step": 44750 + }, + { + "epoch": 10.93, + "learning_rate": 0.00044122693325117655, + "loss": 0.6525, + "step": 44775 + }, + { + "epoch": 10.93, + "learning_rate": 0.00044119373413082047, + "loss": 0.7124, + "step": 44800 + }, + { + "epoch": 10.94, + "learning_rate": 0.0004411605350104644, + "loss": 0.6768, + "step": 44825 + }, + { + "epoch": 10.94, + "learning_rate": 0.0004411273358901083, + "loss": 0.7047, + "step": 44850 + }, + { + "epoch": 10.95, + "learning_rate": 0.00044109413676975216, + "loss": 0.6307, + "step": 44875 + }, + { + "epoch": 10.96, + "learning_rate": 0.000441060937649396, + "loss": 0.6887, + "step": 44900 + }, + { + "epoch": 10.96, + "learning_rate": 0.00044102773852903993, + "loss": 0.6407, + "step": 44925 + }, + { + "epoch": 10.97, + "learning_rate": 0.00044099453940868384, + "loss": 0.7153, + "step": 44950 + }, + { + "epoch": 10.97, + "learning_rate": 0.00044096134028832776, + "loss": 0.6612, + "step": 44975 + }, + { + "epoch": 10.98, + "learning_rate": 0.0004409281411679716, + "loss": 0.7166, + "step": 45000 + }, + { + "epoch": 10.98, + "eval_cer": 0.14372247261377985, + "eval_loss": 0.4731488525867462, + "eval_runtime": 144.4871, + "eval_samples_per_second": 29.02, + "eval_steps_per_second": 7.26, + "eval_wer": 0.5718433931484502, + "step": 45000 + }, + { + "epoch": 10.99, + "learning_rate": 0.0004408949420476155, + "loss": 0.6463, + "step": 45025 + }, + { + "epoch": 10.99, + "learning_rate": 0.0004408617429272594, + "loss": 0.7169, + "step": 45050 + }, + { + "epoch": 11.0, + "learning_rate": 0.0004408285438069033, + "loss": 0.6929, + "step": 45075 + }, + { + "epoch": 11.01, + "learning_rate": 0.0004407953446865472, + "loss": 0.7587, + "step": 45100 + }, + { + "epoch": 11.01, + "learning_rate": 0.0004407621455661911, + "loss": 0.6414, + "step": 45125 + }, + { + "epoch": 11.02, + "learning_rate": 0.000440728946445835, + "loss": 0.7008, + "step": 45150 + }, + { + "epoch": 11.02, + "learning_rate": 0.00044069574732547885, + "loss": 0.6039, + "step": 45175 + }, + { + "epoch": 11.03, + "learning_rate": 0.00044066254820512277, + "loss": 0.6642, + "step": 45200 + }, + { + "epoch": 11.04, + "learning_rate": 0.0004406293490847666, + "loss": 0.5708, + "step": 45225 + }, + { + "epoch": 11.04, + "learning_rate": 0.00044059614996441054, + "loss": 0.6622, + "step": 45250 + }, + { + "epoch": 11.05, + "learning_rate": 0.00044056295084405445, + "loss": 0.6563, + "step": 45275 + }, + { + "epoch": 11.05, + "learning_rate": 0.00044052975172369837, + "loss": 0.682, + "step": 45300 + }, + { + "epoch": 11.06, + "learning_rate": 0.00044049655260334223, + "loss": 0.6252, + "step": 45325 + }, + { + "epoch": 11.07, + "learning_rate": 0.0004404633534829861, + "loss": 0.6542, + "step": 45350 + }, + { + "epoch": 11.07, + "learning_rate": 0.00044043015436263, + "loss": 0.6675, + "step": 45375 + }, + { + "epoch": 11.08, + "learning_rate": 0.0004403969552422739, + "loss": 0.6733, + "step": 45400 + }, + { + "epoch": 11.08, + "learning_rate": 0.00044036375612191783, + "loss": 0.603, + "step": 45425 + }, + { + "epoch": 11.09, + "learning_rate": 0.0004403305570015617, + "loss": 0.6562, + "step": 45450 + }, + { + "epoch": 11.1, + "learning_rate": 0.00044029735788120555, + "loss": 0.6738, + "step": 45475 + }, + { + "epoch": 11.1, + "learning_rate": 0.00044026415876084946, + "loss": 0.6869, + "step": 45500 + }, + { + "epoch": 11.11, + "learning_rate": 0.0004402309596404934, + "loss": 0.639, + "step": 45525 + }, + { + "epoch": 11.12, + "learning_rate": 0.0004401977605201373, + "loss": 0.6751, + "step": 45550 + }, + { + "epoch": 11.12, + "learning_rate": 0.00044016456139978115, + "loss": 0.5983, + "step": 45575 + }, + { + "epoch": 11.13, + "learning_rate": 0.00044013136227942506, + "loss": 0.6827, + "step": 45600 + }, + { + "epoch": 11.13, + "learning_rate": 0.0004400981631590689, + "loss": 0.6128, + "step": 45625 + }, + { + "epoch": 11.14, + "learning_rate": 0.00044006496403871284, + "loss": 0.6782, + "step": 45650 + }, + { + "epoch": 11.15, + "learning_rate": 0.0004400317649183567, + "loss": 0.6196, + "step": 45675 + }, + { + "epoch": 11.15, + "learning_rate": 0.0004399985657980006, + "loss": 0.6424, + "step": 45700 + }, + { + "epoch": 11.16, + "learning_rate": 0.0004399653666776445, + "loss": 0.5857, + "step": 45725 + }, + { + "epoch": 11.16, + "learning_rate": 0.00043993216755728844, + "loss": 0.6674, + "step": 45750 + }, + { + "epoch": 11.17, + "learning_rate": 0.0004398989684369323, + "loss": 0.6245, + "step": 45775 + }, + { + "epoch": 11.18, + "learning_rate": 0.00043986576931657616, + "loss": 0.6766, + "step": 45800 + }, + { + "epoch": 11.18, + "learning_rate": 0.0004398325701962201, + "loss": 0.64, + "step": 45825 + }, + { + "epoch": 11.19, + "learning_rate": 0.000439799371075864, + "loss": 0.6693, + "step": 45850 + }, + { + "epoch": 11.19, + "learning_rate": 0.00043976749992032213, + "loss": 0.654, + "step": 45875 + }, + { + "epoch": 11.2, + "learning_rate": 0.000439734300799966, + "loss": 0.6695, + "step": 45900 + }, + { + "epoch": 11.21, + "learning_rate": 0.0004397011016796099, + "loss": 0.6548, + "step": 45925 + }, + { + "epoch": 11.21, + "learning_rate": 0.0004396679025592538, + "loss": 0.6577, + "step": 45950 + }, + { + "epoch": 11.22, + "learning_rate": 0.0004396347034388977, + "loss": 0.5869, + "step": 45975 + }, + { + "epoch": 11.22, + "learning_rate": 0.0004396015043185416, + "loss": 0.6876, + "step": 46000 + }, + { + "epoch": 11.23, + "learning_rate": 0.00043956830519818545, + "loss": 0.5679, + "step": 46025 + }, + { + "epoch": 11.24, + "learning_rate": 0.00043953510607782937, + "loss": 0.6973, + "step": 46050 + }, + { + "epoch": 11.24, + "learning_rate": 0.0004395019069574733, + "loss": 0.6237, + "step": 46075 + }, + { + "epoch": 11.25, + "learning_rate": 0.0004394687078371172, + "loss": 0.6779, + "step": 46100 + }, + { + "epoch": 11.26, + "learning_rate": 0.000439435508716761, + "loss": 0.6205, + "step": 46125 + }, + { + "epoch": 11.26, + "learning_rate": 0.0004394023095964049, + "loss": 0.6393, + "step": 46150 + }, + { + "epoch": 11.27, + "learning_rate": 0.00043936911047604883, + "loss": 0.6353, + "step": 46175 + }, + { + "epoch": 11.27, + "learning_rate": 0.00043933591135569274, + "loss": 0.6752, + "step": 46200 + }, + { + "epoch": 11.28, + "learning_rate": 0.00043930271223533666, + "loss": 0.6567, + "step": 46225 + }, + { + "epoch": 11.29, + "learning_rate": 0.0004392695131149805, + "loss": 0.6625, + "step": 46250 + }, + { + "epoch": 11.29, + "learning_rate": 0.0004392363139946244, + "loss": 0.6082, + "step": 46275 + }, + { + "epoch": 11.3, + "learning_rate": 0.0004392031148742683, + "loss": 0.6796, + "step": 46300 + }, + { + "epoch": 11.3, + "learning_rate": 0.0004391699157539122, + "loss": 0.6016, + "step": 46325 + }, + { + "epoch": 11.31, + "learning_rate": 0.00043913671663355606, + "loss": 0.6826, + "step": 46350 + }, + { + "epoch": 11.32, + "learning_rate": 0.0004391035175132, + "loss": 0.6277, + "step": 46375 + }, + { + "epoch": 11.32, + "learning_rate": 0.0004390703183928439, + "loss": 0.705, + "step": 46400 + }, + { + "epoch": 11.33, + "learning_rate": 0.00043903711927248775, + "loss": 0.6284, + "step": 46425 + }, + { + "epoch": 11.33, + "learning_rate": 0.00043900392015213167, + "loss": 0.6422, + "step": 46450 + }, + { + "epoch": 11.34, + "learning_rate": 0.0004389707210317755, + "loss": 0.6124, + "step": 46475 + }, + { + "epoch": 11.35, + "learning_rate": 0.00043893752191141944, + "loss": 0.7005, + "step": 46500 + }, + { + "epoch": 11.35, + "learning_rate": 0.00043890432279106335, + "loss": 0.638, + "step": 46525 + }, + { + "epoch": 11.36, + "learning_rate": 0.00043887112367070727, + "loss": 0.6668, + "step": 46550 + }, + { + "epoch": 11.37, + "learning_rate": 0.00043883792455035107, + "loss": 0.629, + "step": 46575 + }, + { + "epoch": 11.37, + "learning_rate": 0.000438804725429995, + "loss": 0.6606, + "step": 46600 + }, + { + "epoch": 11.38, + "learning_rate": 0.0004387715263096389, + "loss": 0.622, + "step": 46625 + }, + { + "epoch": 11.38, + "learning_rate": 0.0004387383271892828, + "loss": 0.6692, + "step": 46650 + }, + { + "epoch": 11.39, + "learning_rate": 0.00043870512806892673, + "loss": 0.6024, + "step": 46675 + }, + { + "epoch": 11.4, + "learning_rate": 0.0004386719289485706, + "loss": 0.6572, + "step": 46700 + }, + { + "epoch": 11.4, + "learning_rate": 0.00043863872982821445, + "loss": 0.6421, + "step": 46725 + }, + { + "epoch": 11.41, + "learning_rate": 0.00043860553070785836, + "loss": 0.6752, + "step": 46750 + }, + { + "epoch": 11.41, + "learning_rate": 0.0004385723315875023, + "loss": 0.6175, + "step": 46775 + }, + { + "epoch": 11.42, + "learning_rate": 0.00043853913246714614, + "loss": 0.7093, + "step": 46800 + }, + { + "epoch": 11.43, + "learning_rate": 0.00043850593334679005, + "loss": 0.6018, + "step": 46825 + }, + { + "epoch": 11.43, + "learning_rate": 0.00043847273422643396, + "loss": 0.7242, + "step": 46850 + }, + { + "epoch": 11.44, + "learning_rate": 0.0004384395351060778, + "loss": 0.6118, + "step": 46875 + }, + { + "epoch": 11.44, + "learning_rate": 0.00043840633598572174, + "loss": 0.6412, + "step": 46900 + }, + { + "epoch": 11.45, + "learning_rate": 0.0004383731368653656, + "loss": 0.6692, + "step": 46925 + }, + { + "epoch": 11.46, + "learning_rate": 0.0004383399377450095, + "loss": 0.6875, + "step": 46950 + }, + { + "epoch": 11.46, + "learning_rate": 0.0004383067386246534, + "loss": 0.6527, + "step": 46975 + }, + { + "epoch": 11.47, + "learning_rate": 0.00043827353950429734, + "loss": 0.6862, + "step": 47000 + }, + { + "epoch": 11.48, + "learning_rate": 0.00043824034038394114, + "loss": 0.6665, + "step": 47025 + }, + { + "epoch": 11.48, + "learning_rate": 0.00043820714126358506, + "loss": 0.6639, + "step": 47050 + }, + { + "epoch": 11.49, + "learning_rate": 0.00043817394214322897, + "loss": 0.6384, + "step": 47075 + }, + { + "epoch": 11.49, + "learning_rate": 0.0004381407430228729, + "loss": 0.6528, + "step": 47100 + }, + { + "epoch": 11.5, + "learning_rate": 0.0004381075439025168, + "loss": 0.6745, + "step": 47125 + }, + { + "epoch": 11.51, + "learning_rate": 0.00043807434478216066, + "loss": 0.671, + "step": 47150 + }, + { + "epoch": 11.51, + "learning_rate": 0.0004380411456618045, + "loss": 0.6352, + "step": 47175 + }, + { + "epoch": 11.52, + "learning_rate": 0.00043800794654144843, + "loss": 0.645, + "step": 47200 + }, + { + "epoch": 11.52, + "learning_rate": 0.00043797474742109235, + "loss": 0.6738, + "step": 47225 + }, + { + "epoch": 11.53, + "learning_rate": 0.00043794154830073626, + "loss": 0.6946, + "step": 47250 + }, + { + "epoch": 11.54, + "learning_rate": 0.0004379083491803801, + "loss": 0.6427, + "step": 47275 + }, + { + "epoch": 11.54, + "learning_rate": 0.00043787515006002404, + "loss": 0.6668, + "step": 47300 + }, + { + "epoch": 11.55, + "learning_rate": 0.0004378419509396679, + "loss": 0.6233, + "step": 47325 + }, + { + "epoch": 11.55, + "learning_rate": 0.0004378087518193118, + "loss": 0.6855, + "step": 47350 + }, + { + "epoch": 11.56, + "learning_rate": 0.00043777555269895567, + "loss": 0.6396, + "step": 47375 + }, + { + "epoch": 11.57, + "learning_rate": 0.0004377423535785996, + "loss": 0.6812, + "step": 47400 + }, + { + "epoch": 11.57, + "learning_rate": 0.0004377091544582435, + "loss": 0.626, + "step": 47425 + }, + { + "epoch": 11.58, + "learning_rate": 0.0004376759553378874, + "loss": 0.655, + "step": 47450 + }, + { + "epoch": 11.58, + "learning_rate": 0.00043764275621753127, + "loss": 0.6244, + "step": 47475 + }, + { + "epoch": 11.59, + "learning_rate": 0.00043760955709717513, + "loss": 0.6704, + "step": 47500 + }, + { + "epoch": 11.6, + "learning_rate": 0.00043757635797681904, + "loss": 0.6312, + "step": 47525 + }, + { + "epoch": 11.6, + "learning_rate": 0.00043754315885646296, + "loss": 0.7087, + "step": 47550 + }, + { + "epoch": 11.61, + "learning_rate": 0.00043750995973610687, + "loss": 0.5872, + "step": 47575 + }, + { + "epoch": 11.62, + "learning_rate": 0.00043747676061575073, + "loss": 0.655, + "step": 47600 + }, + { + "epoch": 11.62, + "learning_rate": 0.0004374435614953946, + "loss": 0.6432, + "step": 47625 + }, + { + "epoch": 11.63, + "learning_rate": 0.0004374103623750385, + "loss": 0.6731, + "step": 47650 + }, + { + "epoch": 11.63, + "learning_rate": 0.0004373771632546824, + "loss": 0.6227, + "step": 47675 + }, + { + "epoch": 11.64, + "learning_rate": 0.00043734396413432633, + "loss": 0.7036, + "step": 47700 + }, + { + "epoch": 11.65, + "learning_rate": 0.0004373107650139702, + "loss": 0.6288, + "step": 47725 + }, + { + "epoch": 11.65, + "learning_rate": 0.0004372775658936141, + "loss": 0.659, + "step": 47750 + }, + { + "epoch": 11.66, + "learning_rate": 0.00043724436677325797, + "loss": 0.6138, + "step": 47775 + }, + { + "epoch": 11.66, + "learning_rate": 0.0004372111676529019, + "loss": 0.6878, + "step": 47800 + }, + { + "epoch": 11.67, + "learning_rate": 0.00043717796853254574, + "loss": 0.6326, + "step": 47825 + }, + { + "epoch": 11.68, + "learning_rate": 0.00043714476941218966, + "loss": 0.6692, + "step": 47850 + }, + { + "epoch": 11.68, + "learning_rate": 0.00043711157029183357, + "loss": 0.6122, + "step": 47875 + }, + { + "epoch": 11.69, + "learning_rate": 0.0004370783711714775, + "loss": 0.7086, + "step": 47900 + }, + { + "epoch": 11.69, + "learning_rate": 0.00043704517205112134, + "loss": 0.6116, + "step": 47925 + }, + { + "epoch": 11.7, + "learning_rate": 0.0004370119729307652, + "loss": 0.6945, + "step": 47950 + }, + { + "epoch": 11.71, + "learning_rate": 0.0004369787738104091, + "loss": 0.5723, + "step": 47975 + }, + { + "epoch": 11.71, + "learning_rate": 0.00043694557469005303, + "loss": 0.6627, + "step": 48000 + }, + { + "epoch": 11.71, + "eval_cer": 0.14209521267312095, + "eval_loss": 0.47871026396751404, + "eval_runtime": 145.6062, + "eval_samples_per_second": 28.797, + "eval_steps_per_second": 7.204, + "eval_wer": 0.559510603588907, + "step": 48000 + }, + { + "epoch": 11.72, + "learning_rate": 0.00043691237556969694, + "loss": 0.5936, + "step": 48025 + }, + { + "epoch": 11.73, + "learning_rate": 0.0004368791764493408, + "loss": 0.6948, + "step": 48050 + }, + { + "epoch": 11.73, + "learning_rate": 0.00043684597732898466, + "loss": 0.6084, + "step": 48075 + }, + { + "epoch": 11.74, + "learning_rate": 0.0004368127782086286, + "loss": 0.6846, + "step": 48100 + }, + { + "epoch": 11.74, + "learning_rate": 0.0004367795790882725, + "loss": 0.6348, + "step": 48125 + }, + { + "epoch": 11.75, + "learning_rate": 0.0004367463799679164, + "loss": 0.6736, + "step": 48150 + }, + { + "epoch": 11.76, + "learning_rate": 0.00043671318084756027, + "loss": 0.6213, + "step": 48175 + }, + { + "epoch": 11.76, + "learning_rate": 0.0004366799817272042, + "loss": 0.7163, + "step": 48200 + }, + { + "epoch": 11.77, + "learning_rate": 0.00043664678260684804, + "loss": 0.6381, + "step": 48225 + }, + { + "epoch": 11.77, + "learning_rate": 0.00043661358348649195, + "loss": 0.7344, + "step": 48250 + }, + { + "epoch": 11.78, + "learning_rate": 0.00043658038436613587, + "loss": 0.6165, + "step": 48275 + }, + { + "epoch": 11.79, + "learning_rate": 0.00043654718524577973, + "loss": 0.6836, + "step": 48300 + }, + { + "epoch": 11.79, + "learning_rate": 0.00043651398612542364, + "loss": 0.6184, + "step": 48325 + }, + { + "epoch": 11.8, + "learning_rate": 0.00043648078700506756, + "loss": 0.7038, + "step": 48350 + }, + { + "epoch": 11.8, + "learning_rate": 0.0004364475878847114, + "loss": 0.6353, + "step": 48375 + }, + { + "epoch": 11.81, + "learning_rate": 0.0004364143887643553, + "loss": 0.6672, + "step": 48400 + }, + { + "epoch": 11.82, + "learning_rate": 0.0004363811896439992, + "loss": 0.613, + "step": 48425 + }, + { + "epoch": 11.82, + "learning_rate": 0.0004363479905236431, + "loss": 0.7012, + "step": 48450 + }, + { + "epoch": 11.83, + "learning_rate": 0.000436314791403287, + "loss": 0.6223, + "step": 48475 + }, + { + "epoch": 11.84, + "learning_rate": 0.00043628159228293093, + "loss": 0.6902, + "step": 48500 + }, + { + "epoch": 11.84, + "learning_rate": 0.00043624839316257474, + "loss": 0.5867, + "step": 48525 + }, + { + "epoch": 11.85, + "learning_rate": 0.00043621519404221865, + "loss": 0.6947, + "step": 48550 + }, + { + "epoch": 11.85, + "learning_rate": 0.00043618199492186256, + "loss": 0.6178, + "step": 48575 + }, + { + "epoch": 11.86, + "learning_rate": 0.0004361487958015065, + "loss": 0.6746, + "step": 48600 + }, + { + "epoch": 11.87, + "learning_rate": 0.00043611559668115034, + "loss": 0.6568, + "step": 48625 + }, + { + "epoch": 11.87, + "learning_rate": 0.00043608239756079425, + "loss": 0.6817, + "step": 48650 + }, + { + "epoch": 11.88, + "learning_rate": 0.0004360491984404381, + "loss": 0.6562, + "step": 48675 + }, + { + "epoch": 11.88, + "learning_rate": 0.000436015999320082, + "loss": 0.6814, + "step": 48700 + }, + { + "epoch": 11.89, + "learning_rate": 0.0004359841281645401, + "loss": 0.6593, + "step": 48725 + }, + { + "epoch": 11.9, + "learning_rate": 0.00043595092904418403, + "loss": 0.7107, + "step": 48750 + }, + { + "epoch": 11.9, + "learning_rate": 0.00043591772992382794, + "loss": 0.6651, + "step": 48775 + }, + { + "epoch": 11.91, + "learning_rate": 0.00043588453080347186, + "loss": 0.7025, + "step": 48800 + }, + { + "epoch": 11.91, + "learning_rate": 0.00043585133168311577, + "loss": 0.638, + "step": 48825 + }, + { + "epoch": 11.92, + "learning_rate": 0.00043581813256275963, + "loss": 0.6696, + "step": 48850 + }, + { + "epoch": 11.93, + "learning_rate": 0.0004357849334424035, + "loss": 0.6291, + "step": 48875 + }, + { + "epoch": 11.93, + "learning_rate": 0.0004357517343220474, + "loss": 0.6475, + "step": 48900 + }, + { + "epoch": 11.94, + "learning_rate": 0.0004357185352016913, + "loss": 0.6309, + "step": 48925 + }, + { + "epoch": 11.94, + "learning_rate": 0.0004356853360813352, + "loss": 0.6623, + "step": 48950 + }, + { + "epoch": 11.95, + "learning_rate": 0.0004356521369609791, + "loss": 0.6565, + "step": 48975 + }, + { + "epoch": 11.96, + "learning_rate": 0.000435618937840623, + "loss": 0.6518, + "step": 49000 + }, + { + "epoch": 11.96, + "learning_rate": 0.00043558573872026687, + "loss": 0.6328, + "step": 49025 + }, + { + "epoch": 11.97, + "learning_rate": 0.0004355525395999108, + "loss": 0.6526, + "step": 49050 + }, + { + "epoch": 11.98, + "learning_rate": 0.00043551934047955464, + "loss": 0.6355, + "step": 49075 + }, + { + "epoch": 11.98, + "learning_rate": 0.00043548614135919855, + "loss": 0.7023, + "step": 49100 + }, + { + "epoch": 11.99, + "learning_rate": 0.00043545294223884247, + "loss": 0.6291, + "step": 49125 + }, + { + "epoch": 11.99, + "learning_rate": 0.0004354197431184864, + "loss": 0.6556, + "step": 49150 + }, + { + "epoch": 12.0, + "learning_rate": 0.0004353865439981302, + "loss": 0.631, + "step": 49175 + }, + { + "epoch": 12.01, + "learning_rate": 0.0004353533448777741, + "loss": 0.69, + "step": 49200 + }, + { + "epoch": 12.01, + "learning_rate": 0.000435320145757418, + "loss": 0.5947, + "step": 49225 + }, + { + "epoch": 12.02, + "learning_rate": 0.00043528694663706193, + "loss": 0.6668, + "step": 49250 + }, + { + "epoch": 12.02, + "learning_rate": 0.00043525374751670584, + "loss": 0.6321, + "step": 49275 + }, + { + "epoch": 12.03, + "learning_rate": 0.0004352205483963497, + "loss": 0.644, + "step": 49300 + }, + { + "epoch": 12.04, + "learning_rate": 0.00043518734927599356, + "loss": 0.628, + "step": 49325 + }, + { + "epoch": 12.04, + "learning_rate": 0.0004351541501556375, + "loss": 0.639, + "step": 49350 + }, + { + "epoch": 12.05, + "learning_rate": 0.0004351209510352814, + "loss": 0.5915, + "step": 49375 + }, + { + "epoch": 12.05, + "learning_rate": 0.00043508775191492525, + "loss": 0.6678, + "step": 49400 + }, + { + "epoch": 12.06, + "learning_rate": 0.00043505455279456917, + "loss": 0.6273, + "step": 49425 + }, + { + "epoch": 12.07, + "learning_rate": 0.0004350213536742131, + "loss": 0.6117, + "step": 49450 + }, + { + "epoch": 12.07, + "learning_rate": 0.00043498815455385694, + "loss": 0.5568, + "step": 49475 + }, + { + "epoch": 12.08, + "learning_rate": 0.00043495495543350085, + "loss": 0.6563, + "step": 49500 + }, + { + "epoch": 12.09, + "learning_rate": 0.0004349217563131447, + "loss": 0.5866, + "step": 49525 + }, + { + "epoch": 12.09, + "learning_rate": 0.0004348885571927886, + "loss": 0.6908, + "step": 49550 + }, + { + "epoch": 12.1, + "learning_rate": 0.00043485535807243254, + "loss": 0.6039, + "step": 49575 + }, + { + "epoch": 12.1, + "learning_rate": 0.00043482215895207645, + "loss": 0.6675, + "step": 49600 + }, + { + "epoch": 12.11, + "learning_rate": 0.0004347889598317203, + "loss": 0.5785, + "step": 49625 + }, + { + "epoch": 12.12, + "learning_rate": 0.0004347557607113642, + "loss": 0.6426, + "step": 49650 + }, + { + "epoch": 12.12, + "learning_rate": 0.0004347225615910081, + "loss": 0.658, + "step": 49675 + }, + { + "epoch": 12.13, + "learning_rate": 0.000434689362470652, + "loss": 0.6528, + "step": 49700 + }, + { + "epoch": 12.13, + "learning_rate": 0.0004346561633502959, + "loss": 0.5638, + "step": 49725 + }, + { + "epoch": 12.14, + "learning_rate": 0.0004346229642299398, + "loss": 0.6568, + "step": 49750 + }, + { + "epoch": 12.15, + "learning_rate": 0.00043458976510958364, + "loss": 0.6403, + "step": 49775 + }, + { + "epoch": 12.15, + "learning_rate": 0.00043455656598922755, + "loss": 0.6668, + "step": 49800 + }, + { + "epoch": 12.16, + "learning_rate": 0.00043452336686887146, + "loss": 0.6377, + "step": 49825 + }, + { + "epoch": 12.16, + "learning_rate": 0.0004344901677485154, + "loss": 0.6156, + "step": 49850 + }, + { + "epoch": 12.17, + "learning_rate": 0.00043445696862815924, + "loss": 0.5868, + "step": 49875 + }, + { + "epoch": 12.18, + "learning_rate": 0.00043442376950780315, + "loss": 0.6497, + "step": 49900 + }, + { + "epoch": 12.18, + "learning_rate": 0.000434390570387447, + "loss": 0.618, + "step": 49925 + }, + { + "epoch": 12.19, + "learning_rate": 0.0004343573712670909, + "loss": 0.6685, + "step": 49950 + }, + { + "epoch": 12.19, + "learning_rate": 0.0004343241721467348, + "loss": 0.6276, + "step": 49975 + }, + { + "epoch": 12.2, + "learning_rate": 0.0004342909730263787, + "loss": 0.6609, + "step": 50000 + }, + { + "epoch": 12.21, + "learning_rate": 0.0004342577739060226, + "loss": 0.5746, + "step": 50025 + }, + { + "epoch": 12.21, + "learning_rate": 0.0004342245747856665, + "loss": 0.6416, + "step": 50050 + }, + { + "epoch": 12.22, + "learning_rate": 0.0004341913756653104, + "loss": 0.5834, + "step": 50075 + }, + { + "epoch": 12.23, + "learning_rate": 0.00043415817654495425, + "loss": 0.6515, + "step": 50100 + }, + { + "epoch": 12.23, + "learning_rate": 0.00043412497742459816, + "loss": 0.5516, + "step": 50125 + }, + { + "epoch": 12.24, + "learning_rate": 0.0004340917783042421, + "loss": 0.6494, + "step": 50150 + }, + { + "epoch": 12.24, + "learning_rate": 0.000434058579183886, + "loss": 0.5935, + "step": 50175 + }, + { + "epoch": 12.25, + "learning_rate": 0.00043402538006352985, + "loss": 0.6556, + "step": 50200 + }, + { + "epoch": 12.26, + "learning_rate": 0.0004339921809431737, + "loss": 0.6083, + "step": 50225 + }, + { + "epoch": 12.26, + "learning_rate": 0.0004339589818228176, + "loss": 0.6471, + "step": 50250 + }, + { + "epoch": 12.27, + "learning_rate": 0.00043392711066727577, + "loss": 0.5967, + "step": 50275 + }, + { + "epoch": 12.27, + "learning_rate": 0.0004338939115469196, + "loss": 0.6667, + "step": 50300 + }, + { + "epoch": 12.28, + "learning_rate": 0.00043386071242656354, + "loss": 0.5851, + "step": 50325 + }, + { + "epoch": 12.29, + "learning_rate": 0.00043382751330620745, + "loss": 0.683, + "step": 50350 + }, + { + "epoch": 12.29, + "learning_rate": 0.00043379431418585137, + "loss": 0.6329, + "step": 50375 + }, + { + "epoch": 12.3, + "learning_rate": 0.0004337611150654953, + "loss": 0.64, + "step": 50400 + }, + { + "epoch": 12.3, + "learning_rate": 0.0004337279159451391, + "loss": 0.6474, + "step": 50425 + }, + { + "epoch": 12.31, + "learning_rate": 0.000433694716824783, + "loss": 0.6692, + "step": 50450 + }, + { + "epoch": 12.32, + "learning_rate": 0.0004336615177044269, + "loss": 0.6072, + "step": 50475 + }, + { + "epoch": 12.32, + "learning_rate": 0.00043362831858407083, + "loss": 0.6352, + "step": 50500 + }, + { + "epoch": 12.33, + "learning_rate": 0.0004335951194637147, + "loss": 0.5983, + "step": 50525 + }, + { + "epoch": 12.34, + "learning_rate": 0.0004335619203433586, + "loss": 0.6722, + "step": 50550 + }, + { + "epoch": 12.34, + "learning_rate": 0.00043352872122300246, + "loss": 0.6317, + "step": 50575 + }, + { + "epoch": 12.35, + "learning_rate": 0.0004334955221026464, + "loss": 0.6641, + "step": 50600 + }, + { + "epoch": 12.35, + "learning_rate": 0.0004334623229822903, + "loss": 0.613, + "step": 50625 + }, + { + "epoch": 12.36, + "learning_rate": 0.00043342912386193415, + "loss": 0.638, + "step": 50650 + }, + { + "epoch": 12.37, + "learning_rate": 0.00043339592474157806, + "loss": 0.5691, + "step": 50675 + }, + { + "epoch": 12.37, + "learning_rate": 0.000433362725621222, + "loss": 0.638, + "step": 50700 + }, + { + "epoch": 12.38, + "learning_rate": 0.00043332952650086584, + "loss": 0.6625, + "step": 50725 + }, + { + "epoch": 12.38, + "learning_rate": 0.0004332963273805097, + "loss": 0.6371, + "step": 50750 + }, + { + "epoch": 12.39, + "learning_rate": 0.0004332631282601536, + "loss": 0.5906, + "step": 50775 + }, + { + "epoch": 12.4, + "learning_rate": 0.0004332299291397975, + "loss": 0.6377, + "step": 50800 + }, + { + "epoch": 12.4, + "learning_rate": 0.00043319673001944144, + "loss": 0.5568, + "step": 50825 + }, + { + "epoch": 12.41, + "learning_rate": 0.00043316353089908535, + "loss": 0.6468, + "step": 50850 + }, + { + "epoch": 12.41, + "learning_rate": 0.00043313033177872916, + "loss": 0.5864, + "step": 50875 + }, + { + "epoch": 12.42, + "learning_rate": 0.0004330971326583731, + "loss": 0.6945, + "step": 50900 + }, + { + "epoch": 12.43, + "learning_rate": 0.000433063933538017, + "loss": 0.6353, + "step": 50925 + }, + { + "epoch": 12.43, + "learning_rate": 0.0004330307344176609, + "loss": 0.689, + "step": 50950 + }, + { + "epoch": 12.44, + "learning_rate": 0.0004329975352973048, + "loss": 0.6057, + "step": 50975 + }, + { + "epoch": 12.45, + "learning_rate": 0.0004329643361769487, + "loss": 0.6642, + "step": 51000 + }, + { + "epoch": 12.45, + "eval_cer": 0.135288440807778, + "eval_loss": 0.4786597192287445, + "eval_runtime": 145.9643, + "eval_samples_per_second": 28.726, + "eval_steps_per_second": 7.187, + "eval_wer": 0.5417292006525285, + "step": 51000 + }, + { + "epoch": 12.45, + "learning_rate": 0.00043293113705659254, + "loss": 0.5972, + "step": 51025 + }, + { + "epoch": 12.46, + "learning_rate": 0.00043289793793623645, + "loss": 0.6796, + "step": 51050 + }, + { + "epoch": 12.46, + "learning_rate": 0.00043286473881588036, + "loss": 0.5829, + "step": 51075 + }, + { + "epoch": 12.47, + "learning_rate": 0.0004328315396955242, + "loss": 0.6555, + "step": 51100 + }, + { + "epoch": 12.48, + "learning_rate": 0.00043279834057516814, + "loss": 0.638, + "step": 51125 + }, + { + "epoch": 12.48, + "learning_rate": 0.000432765141454812, + "loss": 0.6506, + "step": 51150 + }, + { + "epoch": 12.49, + "learning_rate": 0.0004327319423344559, + "loss": 0.5731, + "step": 51175 + }, + { + "epoch": 12.49, + "learning_rate": 0.0004326987432140998, + "loss": 0.6235, + "step": 51200 + }, + { + "epoch": 12.5, + "learning_rate": 0.0004326655440937437, + "loss": 0.6339, + "step": 51225 + }, + { + "epoch": 12.51, + "learning_rate": 0.0004326323449733876, + "loss": 0.6643, + "step": 51250 + }, + { + "epoch": 12.51, + "learning_rate": 0.0004325991458530315, + "loss": 0.6002, + "step": 51275 + }, + { + "epoch": 12.52, + "learning_rate": 0.00043256594673267537, + "loss": 0.6213, + "step": 51300 + }, + { + "epoch": 12.52, + "learning_rate": 0.00043253274761231923, + "loss": 0.6105, + "step": 51325 + }, + { + "epoch": 12.53, + "learning_rate": 0.00043249954849196315, + "loss": 0.6795, + "step": 51350 + }, + { + "epoch": 12.54, + "learning_rate": 0.00043246634937160706, + "loss": 0.6539, + "step": 51375 + }, + { + "epoch": 12.54, + "learning_rate": 0.000432433150251251, + "loss": 0.6513, + "step": 51400 + }, + { + "epoch": 12.55, + "learning_rate": 0.0004323999511308949, + "loss": 0.6141, + "step": 51425 + }, + { + "epoch": 12.55, + "learning_rate": 0.0004323667520105387, + "loss": 0.6625, + "step": 51450 + }, + { + "epoch": 12.56, + "learning_rate": 0.0004323335528901826, + "loss": 0.601, + "step": 51475 + }, + { + "epoch": 12.57, + "learning_rate": 0.0004323003537698265, + "loss": 0.6888, + "step": 51500 + }, + { + "epoch": 12.57, + "learning_rate": 0.00043226715464947044, + "loss": 0.6562, + "step": 51525 + }, + { + "epoch": 12.58, + "learning_rate": 0.0004322339555291143, + "loss": 0.6252, + "step": 51550 + }, + { + "epoch": 12.59, + "learning_rate": 0.0004322007564087582, + "loss": 0.6727, + "step": 51575 + }, + { + "epoch": 12.59, + "learning_rate": 0.00043216755728840207, + "loss": 0.6696, + "step": 51600 + }, + { + "epoch": 12.6, + "learning_rate": 0.000432134358168046, + "loss": 0.5774, + "step": 51625 + }, + { + "epoch": 12.6, + "learning_rate": 0.0004321011590476899, + "loss": 0.6587, + "step": 51650 + }, + { + "epoch": 12.61, + "learning_rate": 0.00043206795992733376, + "loss": 0.5901, + "step": 51675 + }, + { + "epoch": 12.62, + "learning_rate": 0.00043203476080697767, + "loss": 0.66, + "step": 51700 + }, + { + "epoch": 12.62, + "learning_rate": 0.0004320015616866216, + "loss": 0.6307, + "step": 51725 + }, + { + "epoch": 12.63, + "learning_rate": 0.00043196836256626544, + "loss": 0.6557, + "step": 51750 + }, + { + "epoch": 12.63, + "learning_rate": 0.0004319351634459093, + "loss": 0.6062, + "step": 51775 + }, + { + "epoch": 12.64, + "learning_rate": 0.0004319019643255532, + "loss": 0.6771, + "step": 51800 + }, + { + "epoch": 12.65, + "learning_rate": 0.00043186876520519713, + "loss": 0.5835, + "step": 51825 + }, + { + "epoch": 12.65, + "learning_rate": 0.00043183556608484105, + "loss": 0.6817, + "step": 51850 + }, + { + "epoch": 12.66, + "learning_rate": 0.00043180236696448496, + "loss": 0.5813, + "step": 51875 + }, + { + "epoch": 12.66, + "learning_rate": 0.00043176916784412877, + "loss": 0.6822, + "step": 51900 + }, + { + "epoch": 12.67, + "learning_rate": 0.0004317359687237727, + "loss": 0.624, + "step": 51925 + }, + { + "epoch": 12.68, + "learning_rate": 0.0004317027696034166, + "loss": 0.6184, + "step": 51950 + }, + { + "epoch": 12.68, + "learning_rate": 0.0004316695704830605, + "loss": 0.5797, + "step": 51975 + }, + { + "epoch": 12.69, + "learning_rate": 0.0004316363713627044, + "loss": 0.6656, + "step": 52000 + }, + { + "epoch": 12.7, + "learning_rate": 0.0004316031722423483, + "loss": 0.6369, + "step": 52025 + }, + { + "epoch": 12.7, + "learning_rate": 0.00043156997312199214, + "loss": 0.6581, + "step": 52050 + }, + { + "epoch": 12.71, + "learning_rate": 0.00043153677400163605, + "loss": 0.6149, + "step": 52075 + }, + { + "epoch": 12.71, + "learning_rate": 0.00043150357488127997, + "loss": 0.6381, + "step": 52100 + }, + { + "epoch": 12.72, + "learning_rate": 0.00043147037576092383, + "loss": 0.6081, + "step": 52125 + }, + { + "epoch": 12.73, + "learning_rate": 0.00043143717664056774, + "loss": 0.6467, + "step": 52150 + }, + { + "epoch": 12.73, + "learning_rate": 0.00043140397752021166, + "loss": 0.6111, + "step": 52175 + }, + { + "epoch": 12.74, + "learning_rate": 0.0004313707783998555, + "loss": 0.6133, + "step": 52200 + }, + { + "epoch": 12.74, + "learning_rate": 0.00043133757927949943, + "loss": 0.6808, + "step": 52225 + }, + { + "epoch": 12.75, + "learning_rate": 0.0004313043801591433, + "loss": 0.6614, + "step": 52250 + }, + { + "epoch": 12.76, + "learning_rate": 0.0004312711810387872, + "loss": 0.6509, + "step": 52275 + }, + { + "epoch": 12.76, + "learning_rate": 0.0004312379819184311, + "loss": 0.6602, + "step": 52300 + }, + { + "epoch": 12.77, + "learning_rate": 0.00043120478279807503, + "loss": 0.6146, + "step": 52325 + }, + { + "epoch": 12.77, + "learning_rate": 0.00043117158367771884, + "loss": 0.6843, + "step": 52350 + }, + { + "epoch": 12.78, + "learning_rate": 0.00043113838455736275, + "loss": 0.6288, + "step": 52375 + }, + { + "epoch": 12.79, + "learning_rate": 0.00043110518543700667, + "loss": 0.6445, + "step": 52400 + }, + { + "epoch": 12.79, + "learning_rate": 0.0004310719863166506, + "loss": 0.5682, + "step": 52425 + }, + { + "epoch": 12.8, + "learning_rate": 0.0004310387871962945, + "loss": 0.7003, + "step": 52450 + }, + { + "epoch": 12.81, + "learning_rate": 0.00043100558807593835, + "loss": 0.5748, + "step": 52475 + }, + { + "epoch": 12.81, + "learning_rate": 0.0004309723889555822, + "loss": 0.6869, + "step": 52500 + }, + { + "epoch": 12.82, + "learning_rate": 0.0004309391898352261, + "loss": 0.5552, + "step": 52525 + }, + { + "epoch": 12.82, + "learning_rate": 0.00043090599071487004, + "loss": 0.6504, + "step": 52550 + }, + { + "epoch": 12.83, + "learning_rate": 0.0004308727915945139, + "loss": 0.6439, + "step": 52575 + }, + { + "epoch": 12.84, + "learning_rate": 0.0004308395924741578, + "loss": 0.6415, + "step": 52600 + }, + { + "epoch": 12.84, + "learning_rate": 0.00043080639335380173, + "loss": 0.6279, + "step": 52625 + }, + { + "epoch": 12.85, + "learning_rate": 0.0004307731942334456, + "loss": 0.6609, + "step": 52650 + }, + { + "epoch": 12.85, + "learning_rate": 0.0004307399951130895, + "loss": 0.628, + "step": 52675 + }, + { + "epoch": 12.86, + "learning_rate": 0.00043070679599273336, + "loss": 0.6844, + "step": 52700 + }, + { + "epoch": 12.87, + "learning_rate": 0.0004306735968723773, + "loss": 0.6197, + "step": 52725 + }, + { + "epoch": 12.87, + "learning_rate": 0.0004306403977520212, + "loss": 0.6395, + "step": 52750 + }, + { + "epoch": 12.88, + "learning_rate": 0.0004306071986316651, + "loss": 0.6112, + "step": 52775 + }, + { + "epoch": 12.88, + "learning_rate": 0.0004305739995113089, + "loss": 0.6495, + "step": 52800 + }, + { + "epoch": 12.89, + "learning_rate": 0.0004305408003909528, + "loss": 0.5714, + "step": 52825 + }, + { + "epoch": 12.9, + "learning_rate": 0.00043050760127059674, + "loss": 0.6368, + "step": 52850 + }, + { + "epoch": 12.9, + "learning_rate": 0.00043047440215024065, + "loss": 0.6219, + "step": 52875 + }, + { + "epoch": 12.91, + "learning_rate": 0.00043044120302988457, + "loss": 0.6374, + "step": 52900 + }, + { + "epoch": 12.91, + "learning_rate": 0.0004304080039095284, + "loss": 0.6305, + "step": 52925 + }, + { + "epoch": 12.92, + "learning_rate": 0.0004303748047891723, + "loss": 0.6444, + "step": 52950 + }, + { + "epoch": 12.93, + "learning_rate": 0.0004303416056688162, + "loss": 0.6064, + "step": 52975 + }, + { + "epoch": 12.93, + "learning_rate": 0.0004303084065484601, + "loss": 0.6849, + "step": 53000 + }, + { + "epoch": 12.94, + "learning_rate": 0.00043027520742810397, + "loss": 0.6103, + "step": 53025 + }, + { + "epoch": 12.95, + "learning_rate": 0.0004302420083077479, + "loss": 0.6676, + "step": 53050 + }, + { + "epoch": 12.95, + "learning_rate": 0.0004302088091873918, + "loss": 0.6101, + "step": 53075 + }, + { + "epoch": 12.96, + "learning_rate": 0.00043017561006703566, + "loss": 0.6528, + "step": 53100 + }, + { + "epoch": 12.96, + "learning_rate": 0.0004301424109466796, + "loss": 0.6113, + "step": 53125 + }, + { + "epoch": 12.97, + "learning_rate": 0.00043010921182632343, + "loss": 0.6564, + "step": 53150 + }, + { + "epoch": 12.98, + "learning_rate": 0.00043007601270596735, + "loss": 0.6153, + "step": 53175 + }, + { + "epoch": 12.98, + "learning_rate": 0.00043004281358561126, + "loss": 0.6683, + "step": 53200 + }, + { + "epoch": 12.99, + "learning_rate": 0.0004300096144652552, + "loss": 0.616, + "step": 53225 + }, + { + "epoch": 12.99, + "learning_rate": 0.000429976415344899, + "loss": 0.6465, + "step": 53250 + }, + { + "epoch": 13.0, + "learning_rate": 0.0004299432162245429, + "loss": 0.6009, + "step": 53275 + }, + { + "epoch": 13.01, + "learning_rate": 0.0004299100171041868, + "loss": 0.5988, + "step": 53300 + }, + { + "epoch": 13.01, + "learning_rate": 0.0004298768179838307, + "loss": 0.6029, + "step": 53325 + }, + { + "epoch": 13.02, + "learning_rate": 0.00042984361886347464, + "loss": 0.6456, + "step": 53350 + }, + { + "epoch": 13.02, + "learning_rate": 0.0004298104197431185, + "loss": 0.5629, + "step": 53375 + }, + { + "epoch": 13.03, + "learning_rate": 0.00042977722062276236, + "loss": 0.6884, + "step": 53400 + }, + { + "epoch": 13.04, + "learning_rate": 0.00042974402150240627, + "loss": 0.5485, + "step": 53425 + }, + { + "epoch": 13.04, + "learning_rate": 0.0004297108223820502, + "loss": 0.6364, + "step": 53450 + }, + { + "epoch": 13.05, + "learning_rate": 0.0004296776232616941, + "loss": 0.6216, + "step": 53475 + }, + { + "epoch": 13.06, + "learning_rate": 0.00042964442414133796, + "loss": 0.6327, + "step": 53500 + }, + { + "epoch": 13.06, + "learning_rate": 0.00042961122502098187, + "loss": 0.5482, + "step": 53525 + }, + { + "epoch": 13.07, + "learning_rate": 0.00042957802590062573, + "loss": 0.6113, + "step": 53550 + }, + { + "epoch": 13.07, + "learning_rate": 0.00042954482678026965, + "loss": 0.6428, + "step": 53575 + }, + { + "epoch": 13.08, + "learning_rate": 0.0004295116276599135, + "loss": 0.6235, + "step": 53600 + }, + { + "epoch": 13.09, + "learning_rate": 0.0004294784285395574, + "loss": 0.5614, + "step": 53625 + }, + { + "epoch": 13.09, + "learning_rate": 0.00042944522941920133, + "loss": 0.6227, + "step": 53650 + }, + { + "epoch": 13.1, + "learning_rate": 0.00042941203029884525, + "loss": 0.6198, + "step": 53675 + }, + { + "epoch": 13.1, + "learning_rate": 0.0004293788311784891, + "loss": 0.6465, + "step": 53700 + }, + { + "epoch": 13.11, + "learning_rate": 0.00042934563205813297, + "loss": 0.5627, + "step": 53725 + }, + { + "epoch": 13.12, + "learning_rate": 0.0004293124329377769, + "loss": 0.5748, + "step": 53750 + }, + { + "epoch": 13.12, + "learning_rate": 0.0004292792338174208, + "loss": 0.6012, + "step": 53775 + }, + { + "epoch": 13.13, + "learning_rate": 0.0004292460346970647, + "loss": 0.6468, + "step": 53800 + }, + { + "epoch": 13.13, + "learning_rate": 0.00042921283557670857, + "loss": 0.5995, + "step": 53825 + }, + { + "epoch": 13.14, + "learning_rate": 0.00042917963645635243, + "loss": 0.6065, + "step": 53850 + }, + { + "epoch": 13.15, + "learning_rate": 0.00042914643733599634, + "loss": 0.5887, + "step": 53875 + }, + { + "epoch": 13.15, + "learning_rate": 0.00042911323821564026, + "loss": 0.63, + "step": 53900 + }, + { + "epoch": 13.16, + "learning_rate": 0.00042908003909528417, + "loss": 0.5393, + "step": 53925 + }, + { + "epoch": 13.16, + "learning_rate": 0.00042904683997492803, + "loss": 0.5984, + "step": 53950 + }, + { + "epoch": 13.17, + "learning_rate": 0.00042901364085457194, + "loss": 0.626, + "step": 53975 + }, + { + "epoch": 13.18, + "learning_rate": 0.0004289804417342158, + "loss": 0.615, + "step": 54000 + }, + { + "epoch": 13.18, + "eval_cer": 0.13237785283820827, + "eval_loss": 0.4704066812992096, + "eval_runtime": 146.2141, + "eval_samples_per_second": 28.677, + "eval_steps_per_second": 7.174, + "eval_wer": 0.5296900489396411, + "step": 54000 + }, + { + "epoch": 13.18, + "learning_rate": 0.0004289472426138597, + "loss": 0.5829, + "step": 54025 + }, + { + "epoch": 13.19, + "learning_rate": 0.0004289140434935036, + "loss": 0.6365, + "step": 54050 + }, + { + "epoch": 13.2, + "learning_rate": 0.0004288808443731475, + "loss": 0.6134, + "step": 54075 + }, + { + "epoch": 13.2, + "learning_rate": 0.0004288476452527914, + "loss": 0.6517, + "step": 54100 + }, + { + "epoch": 13.21, + "learning_rate": 0.0004288144461324353, + "loss": 0.5775, + "step": 54125 + }, + { + "epoch": 13.21, + "learning_rate": 0.0004287812470120792, + "loss": 0.6561, + "step": 54150 + }, + { + "epoch": 13.22, + "learning_rate": 0.00042874804789172304, + "loss": 0.5299, + "step": 54175 + }, + { + "epoch": 13.23, + "learning_rate": 0.00042871484877136695, + "loss": 0.608, + "step": 54200 + }, + { + "epoch": 13.23, + "learning_rate": 0.00042868164965101087, + "loss": 0.5702, + "step": 54225 + }, + { + "epoch": 13.24, + "learning_rate": 0.0004286484505306548, + "loss": 0.6428, + "step": 54250 + }, + { + "epoch": 13.24, + "learning_rate": 0.00042861525141029864, + "loss": 0.5802, + "step": 54275 + }, + { + "epoch": 13.25, + "learning_rate": 0.0004285820522899425, + "loss": 0.5996, + "step": 54300 + }, + { + "epoch": 13.26, + "learning_rate": 0.0004285488531695864, + "loss": 0.5291, + "step": 54325 + }, + { + "epoch": 13.26, + "learning_rate": 0.00042851565404923033, + "loss": 0.6271, + "step": 54350 + }, + { + "epoch": 13.27, + "learning_rate": 0.00042848245492887424, + "loss": 0.5607, + "step": 54375 + }, + { + "epoch": 13.27, + "learning_rate": 0.0004284492558085181, + "loss": 0.6246, + "step": 54400 + }, + { + "epoch": 13.28, + "learning_rate": 0.000428416056688162, + "loss": 0.5731, + "step": 54425 + }, + { + "epoch": 13.29, + "learning_rate": 0.0004283828575678059, + "loss": 0.6058, + "step": 54450 + }, + { + "epoch": 13.29, + "learning_rate": 0.0004283496584474498, + "loss": 0.5722, + "step": 54475 + }, + { + "epoch": 13.3, + "learning_rate": 0.00042831645932709365, + "loss": 0.614, + "step": 54500 + }, + { + "epoch": 13.31, + "learning_rate": 0.00042828326020673756, + "loss": 0.6, + "step": 54525 + }, + { + "epoch": 13.31, + "learning_rate": 0.0004282500610863815, + "loss": 0.6331, + "step": 54550 + }, + { + "epoch": 13.32, + "learning_rate": 0.0004282168619660254, + "loss": 0.6208, + "step": 54575 + }, + { + "epoch": 13.32, + "learning_rate": 0.00042818366284566925, + "loss": 0.6295, + "step": 54600 + }, + { + "epoch": 13.33, + "learning_rate": 0.0004281504637253131, + "loss": 0.6451, + "step": 54625 + }, + { + "epoch": 13.34, + "learning_rate": 0.000428117264604957, + "loss": 0.6238, + "step": 54650 + }, + { + "epoch": 13.34, + "learning_rate": 0.00042808406548460094, + "loss": 0.5815, + "step": 54675 + }, + { + "epoch": 13.35, + "learning_rate": 0.00042805086636424485, + "loss": 0.6429, + "step": 54700 + }, + { + "epoch": 13.35, + "learning_rate": 0.00042801766724388877, + "loss": 0.6381, + "step": 54725 + }, + { + "epoch": 13.36, + "learning_rate": 0.0004279844681235326, + "loss": 0.5901, + "step": 54750 + }, + { + "epoch": 13.37, + "learning_rate": 0.0004279512690031765, + "loss": 0.5912, + "step": 54775 + }, + { + "epoch": 13.37, + "learning_rate": 0.0004279180698828204, + "loss": 0.6324, + "step": 54800 + }, + { + "epoch": 13.38, + "learning_rate": 0.0004278848707624643, + "loss": 0.6042, + "step": 54825 + }, + { + "epoch": 13.38, + "learning_rate": 0.0004278516716421082, + "loss": 0.653, + "step": 54850 + }, + { + "epoch": 13.39, + "learning_rate": 0.0004278184725217521, + "loss": 0.5603, + "step": 54875 + }, + { + "epoch": 13.4, + "learning_rate": 0.00042778527340139595, + "loss": 0.6358, + "step": 54900 + }, + { + "epoch": 13.4, + "learning_rate": 0.00042775207428103986, + "loss": 0.5259, + "step": 54925 + }, + { + "epoch": 13.41, + "learning_rate": 0.0004277188751606838, + "loss": 0.6624, + "step": 54950 + }, + { + "epoch": 13.42, + "learning_rate": 0.00042768567604032764, + "loss": 0.5836, + "step": 54975 + }, + { + "epoch": 13.42, + "learning_rate": 0.00042765247691997155, + "loss": 0.659, + "step": 55000 + }, + { + "epoch": 13.43, + "learning_rate": 0.0004276192777996154, + "loss": 0.5618, + "step": 55025 + }, + { + "epoch": 13.43, + "learning_rate": 0.0004275860786792593, + "loss": 0.6365, + "step": 55050 + }, + { + "epoch": 13.44, + "learning_rate": 0.0004275528795589032, + "loss": 0.596, + "step": 55075 + }, + { + "epoch": 13.45, + "learning_rate": 0.0004275196804385471, + "loss": 0.6246, + "step": 55100 + }, + { + "epoch": 13.45, + "learning_rate": 0.000427486481318191, + "loss": 0.6119, + "step": 55125 + }, + { + "epoch": 13.46, + "learning_rate": 0.0004274532821978349, + "loss": 0.6495, + "step": 55150 + }, + { + "epoch": 13.46, + "learning_rate": 0.0004274200830774788, + "loss": 0.5684, + "step": 55175 + }, + { + "epoch": 13.47, + "learning_rate": 0.00042738688395712265, + "loss": 0.6245, + "step": 55200 + }, + { + "epoch": 13.48, + "learning_rate": 0.00042735501280158084, + "loss": 0.5476, + "step": 55225 + }, + { + "epoch": 13.48, + "learning_rate": 0.0004273218136812247, + "loss": 0.6062, + "step": 55250 + }, + { + "epoch": 13.49, + "learning_rate": 0.0004272886145608686, + "loss": 0.5916, + "step": 55275 + }, + { + "epoch": 13.49, + "learning_rate": 0.0004272554154405125, + "loss": 0.6337, + "step": 55300 + }, + { + "epoch": 13.5, + "learning_rate": 0.0004272222163201564, + "loss": 0.5957, + "step": 55325 + }, + { + "epoch": 13.51, + "learning_rate": 0.0004271890171998003, + "loss": 0.6467, + "step": 55350 + }, + { + "epoch": 13.51, + "learning_rate": 0.0004271558180794442, + "loss": 0.5772, + "step": 55375 + }, + { + "epoch": 13.52, + "learning_rate": 0.000427122618959088, + "loss": 0.649, + "step": 55400 + }, + { + "epoch": 13.52, + "learning_rate": 0.00042708941983873194, + "loss": 0.5464, + "step": 55425 + }, + { + "epoch": 13.53, + "learning_rate": 0.00042705622071837585, + "loss": 0.6423, + "step": 55450 + }, + { + "epoch": 13.54, + "learning_rate": 0.00042702302159801977, + "loss": 0.6658, + "step": 55475 + }, + { + "epoch": 13.54, + "learning_rate": 0.0004269898224776637, + "loss": 0.6415, + "step": 55500 + }, + { + "epoch": 13.55, + "learning_rate": 0.00042695662335730754, + "loss": 0.5512, + "step": 55525 + }, + { + "epoch": 13.56, + "learning_rate": 0.0004269234242369514, + "loss": 0.6279, + "step": 55550 + }, + { + "epoch": 13.56, + "learning_rate": 0.0004268902251165953, + "loss": 0.6403, + "step": 55575 + }, + { + "epoch": 13.57, + "learning_rate": 0.00042685702599623923, + "loss": 0.6368, + "step": 55600 + }, + { + "epoch": 13.57, + "learning_rate": 0.0004268238268758831, + "loss": 0.6262, + "step": 55625 + }, + { + "epoch": 13.58, + "learning_rate": 0.000426790627755527, + "loss": 0.6254, + "step": 55650 + }, + { + "epoch": 13.59, + "learning_rate": 0.0004267574286351709, + "loss": 0.5924, + "step": 55675 + }, + { + "epoch": 13.59, + "learning_rate": 0.0004267242295148148, + "loss": 0.6158, + "step": 55700 + }, + { + "epoch": 13.6, + "learning_rate": 0.0004266910303944587, + "loss": 0.6169, + "step": 55725 + }, + { + "epoch": 13.6, + "learning_rate": 0.00042665783127410255, + "loss": 0.617, + "step": 55750 + }, + { + "epoch": 13.61, + "learning_rate": 0.00042662463215374646, + "loss": 0.5882, + "step": 55775 + }, + { + "epoch": 13.62, + "learning_rate": 0.0004265914330333904, + "loss": 0.6228, + "step": 55800 + }, + { + "epoch": 13.62, + "learning_rate": 0.00042655823391303424, + "loss": 0.5645, + "step": 55825 + }, + { + "epoch": 13.63, + "learning_rate": 0.0004265250347926781, + "loss": 0.6124, + "step": 55850 + }, + { + "epoch": 13.63, + "learning_rate": 0.000426491835672322, + "loss": 0.6378, + "step": 55875 + }, + { + "epoch": 13.64, + "learning_rate": 0.0004264586365519659, + "loss": 0.6315, + "step": 55900 + }, + { + "epoch": 13.65, + "learning_rate": 0.00042642543743160984, + "loss": 0.5701, + "step": 55925 + }, + { + "epoch": 13.65, + "learning_rate": 0.00042639223831125375, + "loss": 0.6325, + "step": 55950 + }, + { + "epoch": 13.66, + "learning_rate": 0.00042635903919089756, + "loss": 0.5678, + "step": 55975 + }, + { + "epoch": 13.67, + "learning_rate": 0.00042632584007054147, + "loss": 0.6605, + "step": 56000 + }, + { + "epoch": 13.67, + "learning_rate": 0.0004262926409501854, + "loss": 0.5455, + "step": 56025 + }, + { + "epoch": 13.68, + "learning_rate": 0.0004262594418298293, + "loss": 0.6301, + "step": 56050 + }, + { + "epoch": 13.68, + "learning_rate": 0.0004262262427094732, + "loss": 0.6023, + "step": 56075 + }, + { + "epoch": 13.69, + "learning_rate": 0.0004261930435891171, + "loss": 0.6524, + "step": 56100 + }, + { + "epoch": 13.7, + "learning_rate": 0.00042615984446876093, + "loss": 0.5723, + "step": 56125 + }, + { + "epoch": 13.7, + "learning_rate": 0.00042612664534840485, + "loss": 0.6332, + "step": 56150 + }, + { + "epoch": 13.71, + "learning_rate": 0.00042609344622804876, + "loss": 0.4887, + "step": 56175 + }, + { + "epoch": 13.71, + "learning_rate": 0.0004260602471076926, + "loss": 0.6688, + "step": 56200 + }, + { + "epoch": 13.72, + "learning_rate": 0.00042602704798733654, + "loss": 0.6288, + "step": 56225 + }, + { + "epoch": 13.73, + "learning_rate": 0.00042599384886698045, + "loss": 0.6548, + "step": 56250 + }, + { + "epoch": 13.73, + "learning_rate": 0.0004259606497466243, + "loss": 0.6337, + "step": 56275 + }, + { + "epoch": 13.74, + "learning_rate": 0.0004259274506262682, + "loss": 0.6278, + "step": 56300 + }, + { + "epoch": 13.74, + "learning_rate": 0.0004258942515059121, + "loss": 0.6219, + "step": 56325 + }, + { + "epoch": 13.75, + "learning_rate": 0.000425861052385556, + "loss": 0.6294, + "step": 56350 + }, + { + "epoch": 13.76, + "learning_rate": 0.0004258278532651999, + "loss": 0.5719, + "step": 56375 + }, + { + "epoch": 13.76, + "learning_rate": 0.0004257946541448438, + "loss": 0.6342, + "step": 56400 + }, + { + "epoch": 13.77, + "learning_rate": 0.00042576145502448763, + "loss": 0.6385, + "step": 56425 + }, + { + "epoch": 13.78, + "learning_rate": 0.00042572825590413154, + "loss": 0.6423, + "step": 56450 + }, + { + "epoch": 13.78, + "learning_rate": 0.00042569505678377546, + "loss": 0.5712, + "step": 56475 + }, + { + "epoch": 13.79, + "learning_rate": 0.00042566185766341937, + "loss": 0.5906, + "step": 56500 + }, + { + "epoch": 13.79, + "learning_rate": 0.0004256286585430633, + "loss": 0.6113, + "step": 56525 + }, + { + "epoch": 13.8, + "learning_rate": 0.00042559545942270715, + "loss": 0.6131, + "step": 56550 + }, + { + "epoch": 13.81, + "learning_rate": 0.000425562260302351, + "loss": 0.5752, + "step": 56575 + }, + { + "epoch": 13.81, + "learning_rate": 0.0004255290611819949, + "loss": 0.6672, + "step": 56600 + }, + { + "epoch": 13.82, + "learning_rate": 0.00042549586206163883, + "loss": 0.6447, + "step": 56625 + }, + { + "epoch": 13.82, + "learning_rate": 0.0004254626629412827, + "loss": 0.611, + "step": 56650 + }, + { + "epoch": 13.83, + "learning_rate": 0.0004254294638209266, + "loss": 0.5499, + "step": 56675 + }, + { + "epoch": 13.84, + "learning_rate": 0.0004253962647005705, + "loss": 0.6201, + "step": 56700 + }, + { + "epoch": 13.84, + "learning_rate": 0.0004253630655802144, + "loss": 0.6202, + "step": 56725 + }, + { + "epoch": 13.85, + "learning_rate": 0.0004253298664598583, + "loss": 0.6132, + "step": 56750 + }, + { + "epoch": 13.85, + "learning_rate": 0.00042529666733950216, + "loss": 0.5538, + "step": 56775 + }, + { + "epoch": 13.86, + "learning_rate": 0.00042526346821914607, + "loss": 0.6536, + "step": 56800 + }, + { + "epoch": 13.87, + "learning_rate": 0.00042523026909879, + "loss": 0.5926, + "step": 56825 + }, + { + "epoch": 13.87, + "learning_rate": 0.0004251970699784339, + "loss": 0.6069, + "step": 56850 + }, + { + "epoch": 13.88, + "learning_rate": 0.0004251638708580777, + "loss": 0.5366, + "step": 56875 + }, + { + "epoch": 13.88, + "learning_rate": 0.0004251306717377216, + "loss": 0.6103, + "step": 56900 + }, + { + "epoch": 13.89, + "learning_rate": 0.00042509747261736553, + "loss": 0.6493, + "step": 56925 + }, + { + "epoch": 13.9, + "learning_rate": 0.00042506427349700944, + "loss": 0.6284, + "step": 56950 + }, + { + "epoch": 13.9, + "learning_rate": 0.00042503107437665336, + "loss": 0.6125, + "step": 56975 + }, + { + "epoch": 13.91, + "learning_rate": 0.0004249978752562972, + "loss": 0.6308, + "step": 57000 + }, + { + "epoch": 13.91, + "eval_cer": 0.1298163300925023, + "eval_loss": 0.4570181965827942, + "eval_runtime": 145.5018, + "eval_samples_per_second": 28.818, + "eval_steps_per_second": 7.21, + "eval_wer": 0.5181402936378466, + "step": 57000 + }, + { + "epoch": 13.92, + "learning_rate": 0.0004249646761359411, + "loss": 0.591, + "step": 57025 + }, + { + "epoch": 13.92, + "learning_rate": 0.000424931477015585, + "loss": 0.6476, + "step": 57050 + }, + { + "epoch": 13.93, + "learning_rate": 0.0004248982778952289, + "loss": 0.6229, + "step": 57075 + }, + { + "epoch": 13.93, + "learning_rate": 0.00042486507877487277, + "loss": 0.6675, + "step": 57100 + }, + { + "epoch": 13.94, + "learning_rate": 0.0004248318796545167, + "loss": 0.6594, + "step": 57125 + }, + { + "epoch": 13.95, + "learning_rate": 0.0004247986805341606, + "loss": 0.623, + "step": 57150 + }, + { + "epoch": 13.95, + "learning_rate": 0.00042476548141380445, + "loss": 0.5794, + "step": 57175 + }, + { + "epoch": 13.96, + "learning_rate": 0.00042473228229344837, + "loss": 0.6319, + "step": 57200 + }, + { + "epoch": 13.96, + "learning_rate": 0.00042469908317309223, + "loss": 0.5749, + "step": 57225 + }, + { + "epoch": 13.97, + "learning_rate": 0.00042466588405273614, + "loss": 0.6396, + "step": 57250 + }, + { + "epoch": 13.98, + "learning_rate": 0.00042463268493238006, + "loss": 0.5968, + "step": 57275 + }, + { + "epoch": 13.98, + "learning_rate": 0.00042459948581202397, + "loss": 0.6442, + "step": 57300 + }, + { + "epoch": 13.99, + "learning_rate": 0.00042456628669166783, + "loss": 0.561, + "step": 57325 + }, + { + "epoch": 13.99, + "learning_rate": 0.0004245330875713117, + "loss": 0.617, + "step": 57350 + }, + { + "epoch": 14.0, + "learning_rate": 0.0004244998884509556, + "loss": 0.5744, + "step": 57375 + }, + { + "epoch": 14.01, + "learning_rate": 0.0004244666893305995, + "loss": 0.6043, + "step": 57400 + }, + { + "epoch": 14.01, + "learning_rate": 0.00042443349021024343, + "loss": 0.5643, + "step": 57425 + }, + { + "epoch": 14.02, + "learning_rate": 0.0004244002910898873, + "loss": 0.6069, + "step": 57450 + }, + { + "epoch": 14.03, + "learning_rate": 0.00042436709196953115, + "loss": 0.5898, + "step": 57475 + }, + { + "epoch": 14.03, + "learning_rate": 0.00042433389284917506, + "loss": 0.5904, + "step": 57500 + }, + { + "epoch": 14.04, + "learning_rate": 0.000424300693728819, + "loss": 0.5918, + "step": 57525 + }, + { + "epoch": 14.04, + "learning_rate": 0.0004242674946084629, + "loss": 0.5941, + "step": 57550 + }, + { + "epoch": 14.05, + "learning_rate": 0.00042423429548810675, + "loss": 0.6079, + "step": 57575 + }, + { + "epoch": 14.06, + "learning_rate": 0.00042420109636775067, + "loss": 0.5946, + "step": 57600 + }, + { + "epoch": 14.06, + "learning_rate": 0.0004241678972473945, + "loss": 0.6464, + "step": 57625 + }, + { + "epoch": 14.07, + "learning_rate": 0.00042413469812703844, + "loss": 0.6279, + "step": 57650 + }, + { + "epoch": 14.07, + "learning_rate": 0.00042410282697149653, + "loss": 0.5383, + "step": 57675 + }, + { + "epoch": 14.08, + "learning_rate": 0.00042406962785114044, + "loss": 0.5984, + "step": 57700 + }, + { + "epoch": 14.09, + "learning_rate": 0.00042403642873078436, + "loss": 0.588, + "step": 57725 + }, + { + "epoch": 14.09, + "learning_rate": 0.00042400322961042827, + "loss": 0.6184, + "step": 57750 + }, + { + "epoch": 14.1, + "learning_rate": 0.00042397003049007213, + "loss": 0.5526, + "step": 57775 + }, + { + "epoch": 14.1, + "learning_rate": 0.00042393683136971605, + "loss": 0.6482, + "step": 57800 + }, + { + "epoch": 14.11, + "learning_rate": 0.0004239036322493599, + "loss": 0.5692, + "step": 57825 + }, + { + "epoch": 14.12, + "learning_rate": 0.0004238704331290038, + "loss": 0.5955, + "step": 57850 + }, + { + "epoch": 14.12, + "learning_rate": 0.00042383723400864773, + "loss": 0.6025, + "step": 57875 + }, + { + "epoch": 14.13, + "learning_rate": 0.0004238040348882916, + "loss": 0.6018, + "step": 57900 + }, + { + "epoch": 14.13, + "learning_rate": 0.0004237708357679355, + "loss": 0.5857, + "step": 57925 + }, + { + "epoch": 14.14, + "learning_rate": 0.0004237376366475794, + "loss": 0.5763, + "step": 57950 + }, + { + "epoch": 14.15, + "learning_rate": 0.0004237044375272233, + "loss": 0.6155, + "step": 57975 + }, + { + "epoch": 14.15, + "learning_rate": 0.00042367123840686714, + "loss": 0.6198, + "step": 58000 + }, + { + "epoch": 14.16, + "learning_rate": 0.00042363803928651105, + "loss": 0.5932, + "step": 58025 + }, + { + "epoch": 14.17, + "learning_rate": 0.00042360484016615497, + "loss": 0.5814, + "step": 58050 + }, + { + "epoch": 14.17, + "learning_rate": 0.0004235716410457989, + "loss": 0.5931, + "step": 58075 + }, + { + "epoch": 14.18, + "learning_rate": 0.0004235384419254428, + "loss": 0.5842, + "step": 58100 + }, + { + "epoch": 14.18, + "learning_rate": 0.0004235052428050866, + "loss": 0.5457, + "step": 58125 + }, + { + "epoch": 14.19, + "learning_rate": 0.0004234720436847305, + "loss": 0.6123, + "step": 58150 + }, + { + "epoch": 14.2, + "learning_rate": 0.00042343884456437443, + "loss": 0.5326, + "step": 58175 + }, + { + "epoch": 14.2, + "learning_rate": 0.00042340564544401834, + "loss": 0.5919, + "step": 58200 + }, + { + "epoch": 14.21, + "learning_rate": 0.0004233724463236622, + "loss": 0.5965, + "step": 58225 + }, + { + "epoch": 14.21, + "learning_rate": 0.0004233392472033061, + "loss": 0.5863, + "step": 58250 + }, + { + "epoch": 14.22, + "learning_rate": 0.00042330604808295, + "loss": 0.5605, + "step": 58275 + }, + { + "epoch": 14.23, + "learning_rate": 0.0004232728489625939, + "loss": 0.614, + "step": 58300 + }, + { + "epoch": 14.23, + "learning_rate": 0.0004232396498422378, + "loss": 0.5654, + "step": 58325 + }, + { + "epoch": 14.24, + "learning_rate": 0.00042320645072188167, + "loss": 0.5933, + "step": 58350 + }, + { + "epoch": 14.24, + "learning_rate": 0.0004231732516015256, + "loss": 0.5873, + "step": 58375 + }, + { + "epoch": 14.25, + "learning_rate": 0.0004231400524811695, + "loss": 0.5915, + "step": 58400 + }, + { + "epoch": 14.26, + "learning_rate": 0.00042310685336081335, + "loss": 0.6126, + "step": 58425 + }, + { + "epoch": 14.26, + "learning_rate": 0.0004230736542404572, + "loss": 0.6042, + "step": 58450 + }, + { + "epoch": 14.27, + "learning_rate": 0.0004230404551201011, + "loss": 0.5961, + "step": 58475 + }, + { + "epoch": 14.28, + "learning_rate": 0.00042300725599974504, + "loss": 0.6288, + "step": 58500 + }, + { + "epoch": 14.28, + "learning_rate": 0.00042297405687938895, + "loss": 0.4981, + "step": 58525 + }, + { + "epoch": 14.29, + "learning_rate": 0.00042294085775903287, + "loss": 0.5907, + "step": 58550 + }, + { + "epoch": 14.29, + "learning_rate": 0.0004229076586386767, + "loss": 0.5619, + "step": 58575 + }, + { + "epoch": 14.3, + "learning_rate": 0.0004228744595183206, + "loss": 0.6181, + "step": 58600 + }, + { + "epoch": 14.31, + "learning_rate": 0.0004228412603979645, + "loss": 0.5144, + "step": 58625 + }, + { + "epoch": 14.31, + "learning_rate": 0.0004228080612776084, + "loss": 0.6199, + "step": 58650 + }, + { + "epoch": 14.32, + "learning_rate": 0.00042277486215725233, + "loss": 0.6018, + "step": 58675 + }, + { + "epoch": 14.32, + "learning_rate": 0.0004227416630368962, + "loss": 0.5986, + "step": 58700 + }, + { + "epoch": 14.33, + "learning_rate": 0.00042270846391654005, + "loss": 0.5543, + "step": 58725 + }, + { + "epoch": 14.34, + "learning_rate": 0.00042267526479618396, + "loss": 0.6112, + "step": 58750 + }, + { + "epoch": 14.34, + "learning_rate": 0.0004226420656758279, + "loss": 0.5911, + "step": 58775 + }, + { + "epoch": 14.35, + "learning_rate": 0.00042260886655547174, + "loss": 0.6487, + "step": 58800 + }, + { + "epoch": 14.35, + "learning_rate": 0.00042257566743511565, + "loss": 0.5668, + "step": 58825 + }, + { + "epoch": 14.36, + "learning_rate": 0.00042254246831475957, + "loss": 0.5784, + "step": 58850 + }, + { + "epoch": 14.37, + "learning_rate": 0.0004225092691944034, + "loss": 0.5174, + "step": 58875 + }, + { + "epoch": 14.37, + "learning_rate": 0.00042247607007404734, + "loss": 0.5878, + "step": 58900 + }, + { + "epoch": 14.38, + "learning_rate": 0.0004224428709536912, + "loss": 0.5745, + "step": 58925 + }, + { + "epoch": 14.39, + "learning_rate": 0.0004224096718333351, + "loss": 0.6411, + "step": 58950 + }, + { + "epoch": 14.39, + "learning_rate": 0.000422376472712979, + "loss": 0.5667, + "step": 58975 + }, + { + "epoch": 14.4, + "learning_rate": 0.00042234327359262294, + "loss": 0.6156, + "step": 59000 + }, + { + "epoch": 14.4, + "learning_rate": 0.00042231007447226675, + "loss": 0.5767, + "step": 59025 + }, + { + "epoch": 14.41, + "learning_rate": 0.00042227687535191066, + "loss": 0.6067, + "step": 59050 + }, + { + "epoch": 14.42, + "learning_rate": 0.0004222436762315546, + "loss": 0.5967, + "step": 59075 + }, + { + "epoch": 14.42, + "learning_rate": 0.0004222104771111985, + "loss": 0.6227, + "step": 59100 + }, + { + "epoch": 14.43, + "learning_rate": 0.0004221772779908424, + "loss": 0.5626, + "step": 59125 + }, + { + "epoch": 14.43, + "learning_rate": 0.00042214407887048626, + "loss": 0.6133, + "step": 59150 + }, + { + "epoch": 14.44, + "learning_rate": 0.0004221108797501301, + "loss": 0.5761, + "step": 59175 + }, + { + "epoch": 14.45, + "learning_rate": 0.00042207768062977404, + "loss": 0.5861, + "step": 59200 + }, + { + "epoch": 14.45, + "learning_rate": 0.00042204448150941795, + "loss": 0.5882, + "step": 59225 + }, + { + "epoch": 14.46, + "learning_rate": 0.0004220112823890618, + "loss": 0.6155, + "step": 59250 + }, + { + "epoch": 14.46, + "learning_rate": 0.0004219780832687057, + "loss": 0.5599, + "step": 59275 + }, + { + "epoch": 14.47, + "learning_rate": 0.00042194488414834964, + "loss": 0.5907, + "step": 59300 + }, + { + "epoch": 14.48, + "learning_rate": 0.0004219116850279935, + "loss": 0.5632, + "step": 59325 + }, + { + "epoch": 14.48, + "learning_rate": 0.0004218784859076374, + "loss": 0.6302, + "step": 59350 + }, + { + "epoch": 14.49, + "learning_rate": 0.00042184528678728127, + "loss": 0.5725, + "step": 59375 + }, + { + "epoch": 14.49, + "learning_rate": 0.0004218120876669252, + "loss": 0.639, + "step": 59400 + }, + { + "epoch": 14.5, + "learning_rate": 0.0004217788885465691, + "loss": 0.5299, + "step": 59425 + }, + { + "epoch": 14.51, + "learning_rate": 0.000421745689426213, + "loss": 0.6035, + "step": 59450 + }, + { + "epoch": 14.51, + "learning_rate": 0.0004217124903058568, + "loss": 0.5558, + "step": 59475 + }, + { + "epoch": 14.52, + "learning_rate": 0.00042167929118550073, + "loss": 0.6101, + "step": 59500 + }, + { + "epoch": 14.53, + "learning_rate": 0.00042164609206514465, + "loss": 0.6208, + "step": 59525 + }, + { + "epoch": 14.53, + "learning_rate": 0.00042161289294478856, + "loss": 0.6033, + "step": 59550 + }, + { + "epoch": 14.54, + "learning_rate": 0.0004215796938244325, + "loss": 0.598, + "step": 59575 + }, + { + "epoch": 14.54, + "learning_rate": 0.00042154649470407633, + "loss": 0.6098, + "step": 59600 + }, + { + "epoch": 14.55, + "learning_rate": 0.0004215132955837202, + "loss": 0.5855, + "step": 59625 + }, + { + "epoch": 14.56, + "learning_rate": 0.0004214800964633641, + "loss": 0.5699, + "step": 59650 + }, + { + "epoch": 14.56, + "learning_rate": 0.000421446897343008, + "loss": 0.5767, + "step": 59675 + }, + { + "epoch": 14.57, + "learning_rate": 0.00042141369822265194, + "loss": 0.6179, + "step": 59700 + }, + { + "epoch": 14.57, + "learning_rate": 0.0004213804991022958, + "loss": 0.5859, + "step": 59725 + }, + { + "epoch": 14.58, + "learning_rate": 0.0004213472999819397, + "loss": 0.6002, + "step": 59750 + }, + { + "epoch": 14.59, + "learning_rate": 0.00042131410086158357, + "loss": 0.6104, + "step": 59775 + }, + { + "epoch": 14.59, + "learning_rate": 0.0004212809017412275, + "loss": 0.6178, + "step": 59800 + }, + { + "epoch": 14.6, + "learning_rate": 0.00042124770262087134, + "loss": 0.6554, + "step": 59825 + }, + { + "epoch": 14.6, + "learning_rate": 0.00042121450350051526, + "loss": 0.6093, + "step": 59850 + }, + { + "epoch": 14.61, + "learning_rate": 0.00042118130438015917, + "loss": 0.5681, + "step": 59875 + }, + { + "epoch": 14.62, + "learning_rate": 0.0004211481052598031, + "loss": 0.5955, + "step": 59900 + }, + { + "epoch": 14.62, + "learning_rate": 0.00042111490613944694, + "loss": 0.5824, + "step": 59925 + }, + { + "epoch": 14.63, + "learning_rate": 0.0004210817070190908, + "loss": 0.5922, + "step": 59950 + }, + { + "epoch": 14.64, + "learning_rate": 0.0004210485078987347, + "loss": 0.6048, + "step": 59975 + }, + { + "epoch": 14.64, + "learning_rate": 0.00042101530877837863, + "loss": 0.6169, + "step": 60000 + }, + { + "epoch": 14.64, + "eval_cer": 0.12906173321150272, + "eval_loss": 0.45141759514808655, + "eval_runtime": 146.1787, + "eval_samples_per_second": 28.684, + "eval_steps_per_second": 7.176, + "eval_wer": 0.5106362153344208, + "step": 60000 + }, + { + "epoch": 14.65, + "learning_rate": 0.00042098210965802255, + "loss": 0.5448, + "step": 60025 + }, + { + "epoch": 14.65, + "learning_rate": 0.0004209489105376664, + "loss": 0.5884, + "step": 60050 + }, + { + "epoch": 14.66, + "learning_rate": 0.00042091571141731027, + "loss": 0.6039, + "step": 60075 + }, + { + "epoch": 14.67, + "learning_rate": 0.0004208825122969542, + "loss": 0.5554, + "step": 60100 + }, + { + "epoch": 14.67, + "learning_rate": 0.0004208493131765981, + "loss": 0.5541, + "step": 60125 + }, + { + "epoch": 14.68, + "learning_rate": 0.000420816114056242, + "loss": 0.6163, + "step": 60150 + }, + { + "epoch": 14.68, + "learning_rate": 0.00042078291493588587, + "loss": 0.5741, + "step": 60175 + }, + { + "epoch": 14.69, + "learning_rate": 0.0004207497158155298, + "loss": 0.6034, + "step": 60200 + }, + { + "epoch": 14.7, + "learning_rate": 0.00042071651669517364, + "loss": 0.6086, + "step": 60225 + }, + { + "epoch": 14.7, + "learning_rate": 0.00042068331757481756, + "loss": 0.5983, + "step": 60250 + }, + { + "epoch": 14.71, + "learning_rate": 0.0004206501184544614, + "loss": 0.5811, + "step": 60275 + }, + { + "epoch": 14.71, + "learning_rate": 0.00042061691933410533, + "loss": 0.629, + "step": 60300 + }, + { + "epoch": 14.72, + "learning_rate": 0.00042058372021374924, + "loss": 0.5687, + "step": 60325 + }, + { + "epoch": 14.73, + "learning_rate": 0.00042055052109339316, + "loss": 0.5759, + "step": 60350 + }, + { + "epoch": 14.73, + "learning_rate": 0.000420517321973037, + "loss": 0.6268, + "step": 60375 + }, + { + "epoch": 14.74, + "learning_rate": 0.0004204841228526809, + "loss": 0.6366, + "step": 60400 + }, + { + "epoch": 14.74, + "learning_rate": 0.0004204509237323248, + "loss": 0.5926, + "step": 60425 + }, + { + "epoch": 14.75, + "learning_rate": 0.0004204177246119687, + "loss": 0.5949, + "step": 60450 + }, + { + "epoch": 14.76, + "learning_rate": 0.0004203845254916126, + "loss": 0.5102, + "step": 60475 + }, + { + "epoch": 14.76, + "learning_rate": 0.0004203513263712564, + "loss": 0.5873, + "step": 60500 + }, + { + "epoch": 14.77, + "learning_rate": 0.00042031812725090034, + "loss": 0.5693, + "step": 60525 + }, + { + "epoch": 14.78, + "learning_rate": 0.00042028492813054425, + "loss": 0.6257, + "step": 60550 + }, + { + "epoch": 14.78, + "learning_rate": 0.00042025172901018817, + "loss": 0.6004, + "step": 60575 + }, + { + "epoch": 14.79, + "learning_rate": 0.0004202185298898321, + "loss": 0.6049, + "step": 60600 + }, + { + "epoch": 14.79, + "learning_rate": 0.00042018533076947594, + "loss": 0.5733, + "step": 60625 + }, + { + "epoch": 14.8, + "learning_rate": 0.0004201521316491198, + "loss": 0.6075, + "step": 60650 + }, + { + "epoch": 14.81, + "learning_rate": 0.0004201189325287637, + "loss": 0.5729, + "step": 60675 + }, + { + "epoch": 14.81, + "learning_rate": 0.00042008573340840763, + "loss": 0.6376, + "step": 60700 + }, + { + "epoch": 14.82, + "learning_rate": 0.0004200525342880515, + "loss": 0.5921, + "step": 60725 + }, + { + "epoch": 14.82, + "learning_rate": 0.0004200193351676954, + "loss": 0.6365, + "step": 60750 + }, + { + "epoch": 14.83, + "learning_rate": 0.0004199861360473393, + "loss": 0.5834, + "step": 60775 + }, + { + "epoch": 14.84, + "learning_rate": 0.0004199529369269832, + "loss": 0.6236, + "step": 60800 + }, + { + "epoch": 14.84, + "learning_rate": 0.0004199197378066271, + "loss": 0.5911, + "step": 60825 + }, + { + "epoch": 14.85, + "learning_rate": 0.00041988653868627095, + "loss": 0.597, + "step": 60850 + }, + { + "epoch": 14.85, + "learning_rate": 0.00041985333956591486, + "loss": 0.5702, + "step": 60875 + }, + { + "epoch": 14.86, + "learning_rate": 0.0004198201404455588, + "loss": 0.5864, + "step": 60900 + }, + { + "epoch": 14.87, + "learning_rate": 0.0004197869413252027, + "loss": 0.5568, + "step": 60925 + }, + { + "epoch": 14.87, + "learning_rate": 0.0004197537422048465, + "loss": 0.6031, + "step": 60950 + }, + { + "epoch": 14.88, + "learning_rate": 0.0004197205430844904, + "loss": 0.6211, + "step": 60975 + }, + { + "epoch": 14.89, + "learning_rate": 0.0004196873439641343, + "loss": 0.624, + "step": 61000 + }, + { + "epoch": 14.89, + "learning_rate": 0.00041965414484377824, + "loss": 0.5962, + "step": 61025 + }, + { + "epoch": 14.9, + "learning_rate": 0.00041962094572342215, + "loss": 0.6123, + "step": 61050 + }, + { + "epoch": 14.9, + "learning_rate": 0.000419587746603066, + "loss": 0.5665, + "step": 61075 + }, + { + "epoch": 14.91, + "learning_rate": 0.00041955454748270987, + "loss": 0.623, + "step": 61100 + }, + { + "epoch": 14.92, + "learning_rate": 0.0004195213483623538, + "loss": 0.5411, + "step": 61125 + }, + { + "epoch": 14.92, + "learning_rate": 0.0004194881492419977, + "loss": 0.6203, + "step": 61150 + }, + { + "epoch": 14.93, + "learning_rate": 0.0004194549501216416, + "loss": 0.5577, + "step": 61175 + }, + { + "epoch": 14.93, + "learning_rate": 0.0004194217510012855, + "loss": 0.6094, + "step": 61200 + }, + { + "epoch": 14.94, + "learning_rate": 0.0004193885518809294, + "loss": 0.6089, + "step": 61225 + }, + { + "epoch": 14.95, + "learning_rate": 0.00041935535276057325, + "loss": 0.6125, + "step": 61250 + }, + { + "epoch": 14.95, + "learning_rate": 0.00041932215364021716, + "loss": 0.5804, + "step": 61275 + }, + { + "epoch": 14.96, + "learning_rate": 0.000419288954519861, + "loss": 0.5942, + "step": 61300 + }, + { + "epoch": 14.96, + "learning_rate": 0.00041925575539950493, + "loss": 0.6231, + "step": 61325 + }, + { + "epoch": 14.97, + "learning_rate": 0.00041922255627914885, + "loss": 0.6048, + "step": 61350 + }, + { + "epoch": 14.98, + "learning_rate": 0.00041918935715879276, + "loss": 0.5772, + "step": 61375 + }, + { + "epoch": 14.98, + "learning_rate": 0.0004191561580384366, + "loss": 0.6248, + "step": 61400 + }, + { + "epoch": 14.99, + "learning_rate": 0.0004191229589180805, + "loss": 0.6252, + "step": 61425 + }, + { + "epoch": 15.0, + "learning_rate": 0.0004190897597977244, + "loss": 0.6205, + "step": 61450 + }, + { + "epoch": 15.0, + "learning_rate": 0.0004190565606773683, + "loss": 0.5726, + "step": 61475 + }, + { + "epoch": 15.01, + "learning_rate": 0.0004190233615570122, + "loss": 0.5984, + "step": 61500 + }, + { + "epoch": 15.01, + "learning_rate": 0.0004189901624366561, + "loss": 0.5569, + "step": 61525 + }, + { + "epoch": 15.02, + "learning_rate": 0.00041895696331629994, + "loss": 0.6261, + "step": 61550 + }, + { + "epoch": 15.03, + "learning_rate": 0.00041892376419594386, + "loss": 0.5558, + "step": 61575 + }, + { + "epoch": 15.03, + "learning_rate": 0.00041889056507558777, + "loss": 0.5589, + "step": 61600 + }, + { + "epoch": 15.04, + "learning_rate": 0.0004188573659552317, + "loss": 0.6264, + "step": 61625 + }, + { + "epoch": 15.04, + "learning_rate": 0.00041882416683487555, + "loss": 0.5598, + "step": 61650 + }, + { + "epoch": 15.05, + "learning_rate": 0.0004187922956793337, + "loss": 0.5917, + "step": 61675 + }, + { + "epoch": 15.06, + "learning_rate": 0.0004187590965589776, + "loss": 0.6053, + "step": 61700 + }, + { + "epoch": 15.06, + "learning_rate": 0.0004187258974386215, + "loss": 0.5212, + "step": 61725 + }, + { + "epoch": 15.07, + "learning_rate": 0.0004186926983182653, + "loss": 0.6262, + "step": 61750 + }, + { + "epoch": 15.07, + "learning_rate": 0.00041865949919790924, + "loss": 0.5495, + "step": 61775 + }, + { + "epoch": 15.08, + "learning_rate": 0.00041862630007755315, + "loss": 0.6077, + "step": 61800 + }, + { + "epoch": 15.09, + "learning_rate": 0.00041859310095719707, + "loss": 0.5933, + "step": 61825 + }, + { + "epoch": 15.09, + "learning_rate": 0.0004185599018368409, + "loss": 0.5604, + "step": 61850 + }, + { + "epoch": 15.1, + "learning_rate": 0.00041852670271648484, + "loss": 0.5932, + "step": 61875 + }, + { + "epoch": 15.1, + "learning_rate": 0.0004184935035961287, + "loss": 0.5503, + "step": 61900 + }, + { + "epoch": 15.11, + "learning_rate": 0.0004184603044757726, + "loss": 0.5703, + "step": 61925 + }, + { + "epoch": 15.12, + "learning_rate": 0.0004184271053554165, + "loss": 0.5733, + "step": 61950 + }, + { + "epoch": 15.12, + "learning_rate": 0.0004183939062350604, + "loss": 0.5573, + "step": 61975 + }, + { + "epoch": 15.13, + "learning_rate": 0.0004183607071147043, + "loss": 0.598, + "step": 62000 + }, + { + "epoch": 15.14, + "learning_rate": 0.0004183275079943482, + "loss": 0.579, + "step": 62025 + }, + { + "epoch": 15.14, + "learning_rate": 0.0004182943088739921, + "loss": 0.572, + "step": 62050 + }, + { + "epoch": 15.15, + "learning_rate": 0.00041826110975363593, + "loss": 0.5451, + "step": 62075 + }, + { + "epoch": 15.15, + "learning_rate": 0.00041822791063327985, + "loss": 0.5816, + "step": 62100 + }, + { + "epoch": 15.16, + "learning_rate": 0.00041819471151292376, + "loss": 0.5448, + "step": 62125 + }, + { + "epoch": 15.17, + "learning_rate": 0.0004181615123925677, + "loss": 0.5673, + "step": 62150 + }, + { + "epoch": 15.17, + "learning_rate": 0.0004181283132722116, + "loss": 0.5592, + "step": 62175 + }, + { + "epoch": 15.18, + "learning_rate": 0.0004180951141518554, + "loss": 0.5821, + "step": 62200 + }, + { + "epoch": 15.18, + "learning_rate": 0.0004180619150314993, + "loss": 0.5912, + "step": 62225 + }, + { + "epoch": 15.19, + "learning_rate": 0.0004180287159111432, + "loss": 0.5935, + "step": 62250 + }, + { + "epoch": 15.2, + "learning_rate": 0.00041799551679078714, + "loss": 0.5177, + "step": 62275 + }, + { + "epoch": 15.2, + "learning_rate": 0.00041796231767043105, + "loss": 0.6028, + "step": 62300 + }, + { + "epoch": 15.21, + "learning_rate": 0.0004179291185500749, + "loss": 0.5421, + "step": 62325 + }, + { + "epoch": 15.21, + "learning_rate": 0.00041789591942971877, + "loss": 0.5825, + "step": 62350 + }, + { + "epoch": 15.22, + "learning_rate": 0.0004178627203093627, + "loss": 0.5568, + "step": 62375 + }, + { + "epoch": 15.23, + "learning_rate": 0.0004178295211890066, + "loss": 0.5786, + "step": 62400 + }, + { + "epoch": 15.23, + "learning_rate": 0.00041779632206865046, + "loss": 0.59, + "step": 62425 + }, + { + "epoch": 15.24, + "learning_rate": 0.00041776312294829437, + "loss": 0.5885, + "step": 62450 + }, + { + "epoch": 15.25, + "learning_rate": 0.0004177299238279383, + "loss": 0.5425, + "step": 62475 + }, + { + "epoch": 15.25, + "learning_rate": 0.00041769672470758215, + "loss": 0.5888, + "step": 62500 + }, + { + "epoch": 15.26, + "learning_rate": 0.00041766352558722606, + "loss": 0.5933, + "step": 62525 + }, + { + "epoch": 15.26, + "learning_rate": 0.0004176303264668699, + "loss": 0.5985, + "step": 62550 + }, + { + "epoch": 15.27, + "learning_rate": 0.00041759712734651383, + "loss": 0.5137, + "step": 62575 + }, + { + "epoch": 15.28, + "learning_rate": 0.00041756392822615775, + "loss": 0.5934, + "step": 62600 + }, + { + "epoch": 15.28, + "learning_rate": 0.00041753072910580166, + "loss": 0.5218, + "step": 62625 + }, + { + "epoch": 15.29, + "learning_rate": 0.00041749752998544547, + "loss": 0.6012, + "step": 62650 + }, + { + "epoch": 15.29, + "learning_rate": 0.0004174643308650894, + "loss": 0.6265, + "step": 62675 + }, + { + "epoch": 15.3, + "learning_rate": 0.0004174311317447333, + "loss": 0.5904, + "step": 62700 + }, + { + "epoch": 15.31, + "learning_rate": 0.0004173979326243772, + "loss": 0.582, + "step": 62725 + }, + { + "epoch": 15.31, + "learning_rate": 0.0004173647335040211, + "loss": 0.5837, + "step": 62750 + }, + { + "epoch": 15.32, + "learning_rate": 0.000417331534383665, + "loss": 0.5676, + "step": 62775 + }, + { + "epoch": 15.32, + "learning_rate": 0.00041729833526330884, + "loss": 0.5988, + "step": 62800 + }, + { + "epoch": 15.33, + "learning_rate": 0.00041726513614295276, + "loss": 0.5467, + "step": 62825 + }, + { + "epoch": 15.34, + "learning_rate": 0.00041723193702259667, + "loss": 0.5601, + "step": 62850 + }, + { + "epoch": 15.34, + "learning_rate": 0.00041719873790224053, + "loss": 0.5655, + "step": 62875 + }, + { + "epoch": 15.35, + "learning_rate": 0.00041716553878188444, + "loss": 0.5704, + "step": 62900 + }, + { + "epoch": 15.36, + "learning_rate": 0.00041713233966152836, + "loss": 0.555, + "step": 62925 + }, + { + "epoch": 15.36, + "learning_rate": 0.0004170991405411722, + "loss": 0.5744, + "step": 62950 + }, + { + "epoch": 15.37, + "learning_rate": 0.00041706594142081613, + "loss": 0.5445, + "step": 62975 + }, + { + "epoch": 15.37, + "learning_rate": 0.00041703274230046, + "loss": 0.5731, + "step": 63000 + }, + { + "epoch": 15.37, + "eval_cer": 0.12588421301191954, + "eval_loss": 0.44619035720825195, + "eval_runtime": 146.3854, + "eval_samples_per_second": 28.644, + "eval_steps_per_second": 7.166, + "eval_wer": 0.5028058727569331, + "step": 63000 + }, + { + "epoch": 15.38, + "learning_rate": 0.0004169995431801039, + "loss": 0.5442, + "step": 63025 + }, + { + "epoch": 15.39, + "learning_rate": 0.0004169663440597478, + "loss": 0.6078, + "step": 63050 + }, + { + "epoch": 15.39, + "learning_rate": 0.00041693314493939173, + "loss": 0.575, + "step": 63075 + }, + { + "epoch": 15.4, + "learning_rate": 0.00041689994581903554, + "loss": 0.5903, + "step": 63100 + }, + { + "epoch": 15.4, + "learning_rate": 0.00041686674669867945, + "loss": 0.5715, + "step": 63125 + }, + { + "epoch": 15.41, + "learning_rate": 0.00041683354757832337, + "loss": 0.6195, + "step": 63150 + }, + { + "epoch": 15.42, + "learning_rate": 0.0004168003484579673, + "loss": 0.5652, + "step": 63175 + }, + { + "epoch": 15.42, + "learning_rate": 0.0004167671493376112, + "loss": 0.5955, + "step": 63200 + }, + { + "epoch": 15.43, + "learning_rate": 0.00041673395021725506, + "loss": 0.5727, + "step": 63225 + }, + { + "epoch": 15.43, + "learning_rate": 0.0004167007510968989, + "loss": 0.6131, + "step": 63250 + }, + { + "epoch": 15.44, + "learning_rate": 0.00041666755197654283, + "loss": 0.5705, + "step": 63275 + }, + { + "epoch": 15.45, + "learning_rate": 0.00041663435285618674, + "loss": 0.6169, + "step": 63300 + }, + { + "epoch": 15.45, + "learning_rate": 0.0004166011537358306, + "loss": 0.6131, + "step": 63325 + }, + { + "epoch": 15.46, + "learning_rate": 0.0004165679546154745, + "loss": 0.5592, + "step": 63350 + }, + { + "epoch": 15.46, + "learning_rate": 0.00041653475549511843, + "loss": 0.5564, + "step": 63375 + }, + { + "epoch": 15.47, + "learning_rate": 0.0004165028843395766, + "loss": 0.5988, + "step": 63400 + }, + { + "epoch": 15.48, + "learning_rate": 0.0004164696852192205, + "loss": 0.5358, + "step": 63425 + }, + { + "epoch": 15.48, + "learning_rate": 0.0004164364860988643, + "loss": 0.5594, + "step": 63450 + }, + { + "epoch": 15.49, + "learning_rate": 0.0004164032869785082, + "loss": 0.5878, + "step": 63475 + }, + { + "epoch": 15.5, + "learning_rate": 0.0004163700878581521, + "loss": 0.606, + "step": 63500 + }, + { + "epoch": 15.5, + "learning_rate": 0.00041633688873779604, + "loss": 0.5355, + "step": 63525 + }, + { + "epoch": 15.51, + "learning_rate": 0.0004163036896174399, + "loss": 0.6155, + "step": 63550 + }, + { + "epoch": 15.51, + "learning_rate": 0.0004162704904970838, + "loss": 0.5276, + "step": 63575 + }, + { + "epoch": 15.52, + "learning_rate": 0.00041623729137672767, + "loss": 0.569, + "step": 63600 + }, + { + "epoch": 15.53, + "learning_rate": 0.0004162040922563716, + "loss": 0.5634, + "step": 63625 + }, + { + "epoch": 15.53, + "learning_rate": 0.0004161708931360155, + "loss": 0.5897, + "step": 63650 + }, + { + "epoch": 15.54, + "learning_rate": 0.00041613769401565936, + "loss": 0.5776, + "step": 63675 + }, + { + "epoch": 15.54, + "learning_rate": 0.00041610449489530327, + "loss": 0.5752, + "step": 63700 + }, + { + "epoch": 15.55, + "learning_rate": 0.0004160712957749472, + "loss": 0.5591, + "step": 63725 + }, + { + "epoch": 15.56, + "learning_rate": 0.00041603809665459105, + "loss": 0.6018, + "step": 63750 + }, + { + "epoch": 15.56, + "learning_rate": 0.0004160048975342349, + "loss": 0.5902, + "step": 63775 + }, + { + "epoch": 15.57, + "learning_rate": 0.0004159716984138788, + "loss": 0.5798, + "step": 63800 + }, + { + "epoch": 15.57, + "learning_rate": 0.00041593849929352273, + "loss": 0.5805, + "step": 63825 + }, + { + "epoch": 15.58, + "learning_rate": 0.00041590530017316665, + "loss": 0.5771, + "step": 63850 + }, + { + "epoch": 15.59, + "learning_rate": 0.00041587210105281056, + "loss": 0.5451, + "step": 63875 + }, + { + "epoch": 15.59, + "learning_rate": 0.00041583890193245437, + "loss": 0.5912, + "step": 63900 + }, + { + "epoch": 15.6, + "learning_rate": 0.0004158057028120983, + "loss": 0.5415, + "step": 63925 + }, + { + "epoch": 15.61, + "learning_rate": 0.0004157725036917422, + "loss": 0.5909, + "step": 63950 + }, + { + "epoch": 15.61, + "learning_rate": 0.0004157393045713861, + "loss": 0.6075, + "step": 63975 + }, + { + "epoch": 15.62, + "learning_rate": 0.00041570610545102997, + "loss": 0.5866, + "step": 64000 + }, + { + "epoch": 15.62, + "learning_rate": 0.0004156729063306739, + "loss": 0.548, + "step": 64025 + }, + { + "epoch": 15.63, + "learning_rate": 0.00041563970721031774, + "loss": 0.566, + "step": 64050 + }, + { + "epoch": 15.64, + "learning_rate": 0.00041560650808996166, + "loss": 0.5828, + "step": 64075 + }, + { + "epoch": 15.64, + "learning_rate": 0.00041557330896960557, + "loss": 0.6185, + "step": 64100 + }, + { + "epoch": 15.65, + "learning_rate": 0.00041554010984924943, + "loss": 0.5782, + "step": 64125 + }, + { + "epoch": 15.65, + "learning_rate": 0.00041550691072889334, + "loss": 0.6042, + "step": 64150 + }, + { + "epoch": 15.66, + "learning_rate": 0.00041547371160853726, + "loss": 0.5636, + "step": 64175 + }, + { + "epoch": 15.67, + "learning_rate": 0.0004154405124881811, + "loss": 0.6106, + "step": 64200 + }, + { + "epoch": 15.67, + "learning_rate": 0.000415407313367825, + "loss": 0.5675, + "step": 64225 + }, + { + "epoch": 15.68, + "learning_rate": 0.0004153741142474689, + "loss": 0.5768, + "step": 64250 + }, + { + "epoch": 15.68, + "learning_rate": 0.0004153409151271128, + "loss": 0.5954, + "step": 64275 + }, + { + "epoch": 15.69, + "learning_rate": 0.0004153077160067567, + "loss": 0.5635, + "step": 64300 + }, + { + "epoch": 15.7, + "learning_rate": 0.00041527451688640063, + "loss": 0.5603, + "step": 64325 + }, + { + "epoch": 15.7, + "learning_rate": 0.00041524131776604444, + "loss": 0.5893, + "step": 64350 + }, + { + "epoch": 15.71, + "learning_rate": 0.00041520811864568835, + "loss": 0.5608, + "step": 64375 + }, + { + "epoch": 15.71, + "learning_rate": 0.00041517491952533227, + "loss": 0.5534, + "step": 64400 + }, + { + "epoch": 15.72, + "learning_rate": 0.0004151417204049762, + "loss": 0.5961, + "step": 64425 + }, + { + "epoch": 15.73, + "learning_rate": 0.00041510852128462004, + "loss": 0.5614, + "step": 64450 + }, + { + "epoch": 15.73, + "learning_rate": 0.00041507532216426395, + "loss": 0.5431, + "step": 64475 + }, + { + "epoch": 15.74, + "learning_rate": 0.0004150421230439078, + "loss": 0.588, + "step": 64500 + }, + { + "epoch": 15.75, + "learning_rate": 0.00041500892392355173, + "loss": 0.616, + "step": 64525 + }, + { + "epoch": 15.75, + "learning_rate": 0.00041497572480319564, + "loss": 0.6145, + "step": 64550 + }, + { + "epoch": 15.76, + "learning_rate": 0.0004149425256828395, + "loss": 0.5783, + "step": 64575 + }, + { + "epoch": 15.76, + "learning_rate": 0.0004149093265624834, + "loss": 0.5769, + "step": 64600 + }, + { + "epoch": 15.77, + "learning_rate": 0.00041487612744212733, + "loss": 0.6041, + "step": 64625 + }, + { + "epoch": 15.78, + "learning_rate": 0.0004148429283217712, + "loss": 0.5768, + "step": 64650 + }, + { + "epoch": 15.78, + "learning_rate": 0.00041480972920141505, + "loss": 0.5923, + "step": 64675 + }, + { + "epoch": 15.79, + "learning_rate": 0.00041477653008105896, + "loss": 0.5551, + "step": 64700 + }, + { + "epoch": 15.79, + "learning_rate": 0.0004147433309607029, + "loss": 0.5495, + "step": 64725 + }, + { + "epoch": 15.8, + "learning_rate": 0.0004147101318403468, + "loss": 0.6238, + "step": 64750 + }, + { + "epoch": 15.81, + "learning_rate": 0.0004146769327199907, + "loss": 0.5442, + "step": 64775 + }, + { + "epoch": 15.81, + "learning_rate": 0.0004146437335996345, + "loss": 0.5986, + "step": 64800 + }, + { + "epoch": 15.82, + "learning_rate": 0.0004146105344792784, + "loss": 0.6223, + "step": 64825 + }, + { + "epoch": 15.82, + "learning_rate": 0.00041457733535892234, + "loss": 0.5737, + "step": 64850 + }, + { + "epoch": 15.83, + "learning_rate": 0.00041454413623856625, + "loss": 0.528, + "step": 64875 + }, + { + "epoch": 15.84, + "learning_rate": 0.00041451093711821017, + "loss": 0.615, + "step": 64900 + }, + { + "epoch": 15.84, + "learning_rate": 0.000414477737997854, + "loss": 0.5476, + "step": 64925 + }, + { + "epoch": 15.85, + "learning_rate": 0.0004144445388774979, + "loss": 0.603, + "step": 64950 + }, + { + "epoch": 15.86, + "learning_rate": 0.0004144113397571418, + "loss": 0.5325, + "step": 64975 + }, + { + "epoch": 15.86, + "learning_rate": 0.0004143781406367857, + "loss": 0.6006, + "step": 65000 + }, + { + "epoch": 15.87, + "learning_rate": 0.0004143449415164296, + "loss": 0.5636, + "step": 65025 + }, + { + "epoch": 15.87, + "learning_rate": 0.0004143117423960735, + "loss": 0.6104, + "step": 65050 + }, + { + "epoch": 15.88, + "learning_rate": 0.0004142785432757174, + "loss": 0.5742, + "step": 65075 + }, + { + "epoch": 15.89, + "learning_rate": 0.00041424534415536126, + "loss": 0.5944, + "step": 65100 + }, + { + "epoch": 15.89, + "learning_rate": 0.0004142121450350052, + "loss": 0.6145, + "step": 65125 + }, + { + "epoch": 15.9, + "learning_rate": 0.00041417894591464904, + "loss": 0.5822, + "step": 65150 + }, + { + "epoch": 15.9, + "learning_rate": 0.00041414574679429295, + "loss": 0.6058, + "step": 65175 + }, + { + "epoch": 15.91, + "learning_rate": 0.00041411254767393686, + "loss": 0.6146, + "step": 65200 + }, + { + "epoch": 15.92, + "learning_rate": 0.0004140793485535808, + "loss": 0.5819, + "step": 65225 + }, + { + "epoch": 15.92, + "learning_rate": 0.0004140461494332246, + "loss": 0.5744, + "step": 65250 + }, + { + "epoch": 15.93, + "learning_rate": 0.0004140129503128685, + "loss": 0.5917, + "step": 65275 + }, + { + "epoch": 15.93, + "learning_rate": 0.0004139797511925124, + "loss": 0.5648, + "step": 65300 + }, + { + "epoch": 15.94, + "learning_rate": 0.0004139465520721563, + "loss": 0.6056, + "step": 65325 + }, + { + "epoch": 15.95, + "learning_rate": 0.00041391335295180024, + "loss": 0.5887, + "step": 65350 + }, + { + "epoch": 15.95, + "learning_rate": 0.0004138801538314441, + "loss": 0.5744, + "step": 65375 + }, + { + "epoch": 15.96, + "learning_rate": 0.00041384695471108796, + "loss": 0.5921, + "step": 65400 + }, + { + "epoch": 15.97, + "learning_rate": 0.00041381375559073187, + "loss": 0.5323, + "step": 65425 + }, + { + "epoch": 15.97, + "learning_rate": 0.0004137805564703758, + "loss": 0.5728, + "step": 65450 + }, + { + "epoch": 15.98, + "learning_rate": 0.00041374735735001965, + "loss": 0.5658, + "step": 65475 + }, + { + "epoch": 15.98, + "learning_rate": 0.00041371415822966356, + "loss": 0.6099, + "step": 65500 + }, + { + "epoch": 15.99, + "learning_rate": 0.0004136809591093075, + "loss": 0.5746, + "step": 65525 + }, + { + "epoch": 16.0, + "learning_rate": 0.00041364775998895133, + "loss": 0.6292, + "step": 65550 + }, + { + "epoch": 16.0, + "learning_rate": 0.00041361456086859525, + "loss": 0.5792, + "step": 65575 + }, + { + "epoch": 16.01, + "learning_rate": 0.0004135813617482391, + "loss": 0.5845, + "step": 65600 + }, + { + "epoch": 16.01, + "learning_rate": 0.000413548162627883, + "loss": 0.5785, + "step": 65625 + }, + { + "epoch": 16.02, + "learning_rate": 0.00041351496350752694, + "loss": 0.5528, + "step": 65650 + }, + { + "epoch": 16.03, + "learning_rate": 0.00041348176438717085, + "loss": 0.5395, + "step": 65675 + }, + { + "epoch": 16.03, + "learning_rate": 0.00041344856526681466, + "loss": 0.5619, + "step": 65700 + }, + { + "epoch": 16.04, + "learning_rate": 0.00041341536614645857, + "loss": 0.5891, + "step": 65725 + }, + { + "epoch": 16.04, + "learning_rate": 0.0004133821670261025, + "loss": 0.5549, + "step": 65750 + }, + { + "epoch": 16.05, + "learning_rate": 0.0004133489679057464, + "loss": 0.5421, + "step": 65775 + }, + { + "epoch": 16.06, + "learning_rate": 0.0004133157687853903, + "loss": 0.5779, + "step": 65800 + }, + { + "epoch": 16.06, + "learning_rate": 0.00041328256966503417, + "loss": 0.5777, + "step": 65825 + }, + { + "epoch": 16.07, + "learning_rate": 0.00041324937054467803, + "loss": 0.5473, + "step": 65850 + }, + { + "epoch": 16.07, + "learning_rate": 0.00041321617142432194, + "loss": 0.5424, + "step": 65875 + }, + { + "epoch": 16.08, + "learning_rate": 0.00041318297230396586, + "loss": 0.5444, + "step": 65900 + }, + { + "epoch": 16.09, + "learning_rate": 0.0004131497731836097, + "loss": 0.5406, + "step": 65925 + }, + { + "epoch": 16.09, + "learning_rate": 0.00041311657406325363, + "loss": 0.5825, + "step": 65950 + }, + { + "epoch": 16.1, + "learning_rate": 0.0004130833749428975, + "loss": 0.5226, + "step": 65975 + }, + { + "epoch": 16.11, + "learning_rate": 0.0004130501758225414, + "loss": 0.5328, + "step": 66000 + }, + { + "epoch": 16.11, + "eval_cer": 0.12461115160724003, + "eval_loss": 0.45345035195350647, + "eval_runtime": 146.1861, + "eval_samples_per_second": 28.683, + "eval_steps_per_second": 7.176, + "eval_wer": 0.5022512234910277, + "step": 66000 + }, + { + "epoch": 16.11, + "learning_rate": 0.0004130169767021853, + "loss": 0.5759, + "step": 66025 + }, + { + "epoch": 16.12, + "learning_rate": 0.0004129837775818292, + "loss": 0.6023, + "step": 66050 + }, + { + "epoch": 16.12, + "learning_rate": 0.0004129505784614731, + "loss": 0.5949, + "step": 66075 + }, + { + "epoch": 16.13, + "learning_rate": 0.000412917379341117, + "loss": 0.5579, + "step": 66100 + }, + { + "epoch": 16.14, + "learning_rate": 0.00041288418022076087, + "loss": 0.5562, + "step": 66125 + }, + { + "epoch": 16.14, + "learning_rate": 0.0004128509811004048, + "loss": 0.5863, + "step": 66150 + }, + { + "epoch": 16.15, + "learning_rate": 0.00041281778198004864, + "loss": 0.5399, + "step": 66175 + }, + { + "epoch": 16.15, + "learning_rate": 0.00041278458285969256, + "loss": 0.5882, + "step": 66200 + }, + { + "epoch": 16.16, + "learning_rate": 0.00041275138373933647, + "loss": 0.5625, + "step": 66225 + }, + { + "epoch": 16.17, + "learning_rate": 0.0004127181846189804, + "loss": 0.5508, + "step": 66250 + }, + { + "epoch": 16.17, + "learning_rate": 0.0004126849854986242, + "loss": 0.5435, + "step": 66275 + }, + { + "epoch": 16.18, + "learning_rate": 0.0004126517863782681, + "loss": 0.5725, + "step": 66300 + }, + { + "epoch": 16.18, + "learning_rate": 0.000412618587257912, + "loss": 0.5654, + "step": 66325 + }, + { + "epoch": 16.19, + "learning_rate": 0.00041258538813755593, + "loss": 0.5876, + "step": 66350 + }, + { + "epoch": 16.2, + "learning_rate": 0.00041255218901719984, + "loss": 0.5763, + "step": 66375 + }, + { + "epoch": 16.2, + "learning_rate": 0.0004125189898968437, + "loss": 0.5609, + "step": 66400 + }, + { + "epoch": 16.21, + "learning_rate": 0.00041248579077648756, + "loss": 0.5789, + "step": 66425 + }, + { + "epoch": 16.22, + "learning_rate": 0.0004124525916561315, + "loss": 0.5859, + "step": 66450 + }, + { + "epoch": 16.22, + "learning_rate": 0.0004124193925357754, + "loss": 0.5816, + "step": 66475 + }, + { + "epoch": 16.23, + "learning_rate": 0.00041238619341541925, + "loss": 0.5813, + "step": 66500 + }, + { + "epoch": 16.23, + "learning_rate": 0.00041235299429506317, + "loss": 0.512, + "step": 66525 + }, + { + "epoch": 16.24, + "learning_rate": 0.0004123197951747071, + "loss": 0.5868, + "step": 66550 + }, + { + "epoch": 16.25, + "learning_rate": 0.00041228659605435094, + "loss": 0.5437, + "step": 66575 + }, + { + "epoch": 16.25, + "learning_rate": 0.00041225339693399485, + "loss": 0.5212, + "step": 66600 + }, + { + "epoch": 16.26, + "learning_rate": 0.0004122201978136387, + "loss": 0.542, + "step": 66625 + }, + { + "epoch": 16.26, + "learning_rate": 0.00041218699869328263, + "loss": 0.5695, + "step": 66650 + }, + { + "epoch": 16.27, + "learning_rate": 0.00041215379957292654, + "loss": 0.5057, + "step": 66675 + }, + { + "epoch": 16.28, + "learning_rate": 0.00041212060045257046, + "loss": 0.5713, + "step": 66700 + }, + { + "epoch": 16.28, + "learning_rate": 0.00041208740133221426, + "loss": 0.5371, + "step": 66725 + }, + { + "epoch": 16.29, + "learning_rate": 0.0004120542022118582, + "loss": 0.5522, + "step": 66750 + }, + { + "epoch": 16.29, + "learning_rate": 0.0004120210030915021, + "loss": 0.5789, + "step": 66775 + }, + { + "epoch": 16.3, + "learning_rate": 0.000411987803971146, + "loss": 0.5469, + "step": 66800 + }, + { + "epoch": 16.31, + "learning_rate": 0.0004119546048507899, + "loss": 0.5718, + "step": 66825 + }, + { + "epoch": 16.31, + "learning_rate": 0.0004119214057304338, + "loss": 0.5656, + "step": 66850 + }, + { + "epoch": 16.32, + "learning_rate": 0.00041188820661007764, + "loss": 0.5515, + "step": 66875 + }, + { + "epoch": 16.33, + "learning_rate": 0.00041185500748972155, + "loss": 0.5725, + "step": 66900 + }, + { + "epoch": 16.33, + "learning_rate": 0.00041182180836936546, + "loss": 0.5504, + "step": 66925 + }, + { + "epoch": 16.34, + "learning_rate": 0.0004117886092490093, + "loss": 0.5304, + "step": 66950 + }, + { + "epoch": 16.34, + "learning_rate": 0.00041175541012865324, + "loss": 0.5575, + "step": 66975 + }, + { + "epoch": 16.35, + "learning_rate": 0.00041172221100829715, + "loss": 0.5828, + "step": 67000 + }, + { + "epoch": 16.36, + "learning_rate": 0.000411689011887941, + "loss": 0.5903, + "step": 67025 + }, + { + "epoch": 16.36, + "learning_rate": 0.0004116558127675849, + "loss": 0.5894, + "step": 67050 + }, + { + "epoch": 16.37, + "learning_rate": 0.0004116226136472288, + "loss": 0.5657, + "step": 67075 + }, + { + "epoch": 16.37, + "learning_rate": 0.0004115894145268727, + "loss": 0.5672, + "step": 67100 + }, + { + "epoch": 16.38, + "learning_rate": 0.0004115562154065166, + "loss": 0.5476, + "step": 67125 + }, + { + "epoch": 16.39, + "learning_rate": 0.00041152301628616053, + "loss": 0.5779, + "step": 67150 + }, + { + "epoch": 16.39, + "learning_rate": 0.00041148981716580433, + "loss": 0.5328, + "step": 67175 + }, + { + "epoch": 16.4, + "learning_rate": 0.00041145661804544825, + "loss": 0.5777, + "step": 67200 + }, + { + "epoch": 16.4, + "learning_rate": 0.00041142341892509216, + "loss": 0.5645, + "step": 67225 + }, + { + "epoch": 16.41, + "learning_rate": 0.0004113902198047361, + "loss": 0.582, + "step": 67250 + }, + { + "epoch": 16.42, + "learning_rate": 0.00041135702068438, + "loss": 0.5448, + "step": 67275 + }, + { + "epoch": 16.42, + "learning_rate": 0.00041132382156402385, + "loss": 0.557, + "step": 67300 + }, + { + "epoch": 16.43, + "learning_rate": 0.0004112906224436677, + "loss": 0.5427, + "step": 67325 + }, + { + "epoch": 16.43, + "learning_rate": 0.0004112574233233116, + "loss": 0.553, + "step": 67350 + }, + { + "epoch": 16.44, + "learning_rate": 0.00041122422420295554, + "loss": 0.5965, + "step": 67375 + }, + { + "epoch": 16.45, + "learning_rate": 0.00041119102508259945, + "loss": 0.5488, + "step": 67400 + }, + { + "epoch": 16.45, + "learning_rate": 0.0004111578259622433, + "loss": 0.5309, + "step": 67425 + }, + { + "epoch": 16.46, + "learning_rate": 0.0004111246268418872, + "loss": 0.599, + "step": 67450 + }, + { + "epoch": 16.47, + "learning_rate": 0.0004110914277215311, + "loss": 0.5384, + "step": 67475 + }, + { + "epoch": 16.47, + "learning_rate": 0.000411058228601175, + "loss": 0.5998, + "step": 67500 + }, + { + "epoch": 16.48, + "learning_rate": 0.00041102502948081886, + "loss": 0.545, + "step": 67525 + }, + { + "epoch": 16.48, + "learning_rate": 0.00041099183036046277, + "loss": 0.5732, + "step": 67550 + }, + { + "epoch": 16.49, + "learning_rate": 0.0004109586312401067, + "loss": 0.5608, + "step": 67575 + }, + { + "epoch": 16.5, + "learning_rate": 0.0004109254321197506, + "loss": 0.5466, + "step": 67600 + }, + { + "epoch": 16.5, + "learning_rate": 0.00041089223299939446, + "loss": 0.5771, + "step": 67625 + }, + { + "epoch": 16.51, + "learning_rate": 0.0004108590338790383, + "loss": 0.5959, + "step": 67650 + }, + { + "epoch": 16.51, + "learning_rate": 0.00041082583475868223, + "loss": 0.5573, + "step": 67675 + }, + { + "epoch": 16.52, + "learning_rate": 0.00041079263563832615, + "loss": 0.5681, + "step": 67700 + }, + { + "epoch": 16.53, + "learning_rate": 0.00041075943651797006, + "loss": 0.5956, + "step": 67725 + }, + { + "epoch": 16.53, + "learning_rate": 0.0004107262373976139, + "loss": 0.5685, + "step": 67750 + }, + { + "epoch": 16.54, + "learning_rate": 0.0004106930382772578, + "loss": 0.5794, + "step": 67775 + }, + { + "epoch": 16.54, + "learning_rate": 0.0004106598391569017, + "loss": 0.5751, + "step": 67800 + }, + { + "epoch": 16.55, + "learning_rate": 0.0004106266400365456, + "loss": 0.5426, + "step": 67825 + }, + { + "epoch": 16.56, + "learning_rate": 0.0004105934409161895, + "loss": 0.5655, + "step": 67850 + }, + { + "epoch": 16.56, + "learning_rate": 0.0004105615697606476, + "loss": 0.5888, + "step": 67875 + }, + { + "epoch": 16.57, + "learning_rate": 0.0004105283706402915, + "loss": 0.5562, + "step": 67900 + }, + { + "epoch": 16.58, + "learning_rate": 0.00041049517151993544, + "loss": 0.5631, + "step": 67925 + }, + { + "epoch": 16.58, + "learning_rate": 0.00041046197239957935, + "loss": 0.563, + "step": 67950 + }, + { + "epoch": 16.59, + "learning_rate": 0.00041042877327922316, + "loss": 0.5945, + "step": 67975 + }, + { + "epoch": 16.59, + "learning_rate": 0.0004103955741588671, + "loss": 0.5984, + "step": 68000 + }, + { + "epoch": 16.6, + "learning_rate": 0.000410362375038511, + "loss": 0.5718, + "step": 68025 + }, + { + "epoch": 16.61, + "learning_rate": 0.0004103291759181549, + "loss": 0.5531, + "step": 68050 + }, + { + "epoch": 16.61, + "learning_rate": 0.00041029597679779876, + "loss": 0.5585, + "step": 68075 + }, + { + "epoch": 16.62, + "learning_rate": 0.0004102627776774427, + "loss": 0.6041, + "step": 68100 + }, + { + "epoch": 16.62, + "learning_rate": 0.00041022957855708654, + "loss": 0.5161, + "step": 68125 + }, + { + "epoch": 16.63, + "learning_rate": 0.00041019637943673045, + "loss": 0.576, + "step": 68150 + }, + { + "epoch": 16.64, + "learning_rate": 0.00041016318031637436, + "loss": 0.5904, + "step": 68175 + }, + { + "epoch": 16.64, + "learning_rate": 0.0004101299811960182, + "loss": 0.5504, + "step": 68200 + }, + { + "epoch": 16.65, + "learning_rate": 0.00041009678207566214, + "loss": 0.5495, + "step": 68225 + }, + { + "epoch": 16.65, + "learning_rate": 0.00041006358295530605, + "loss": 0.5813, + "step": 68250 + }, + { + "epoch": 16.66, + "learning_rate": 0.0004100303838349499, + "loss": 0.5604, + "step": 68275 + }, + { + "epoch": 16.67, + "learning_rate": 0.00040999718471459377, + "loss": 0.5899, + "step": 68300 + }, + { + "epoch": 16.67, + "learning_rate": 0.0004099639855942377, + "loss": 0.5665, + "step": 68325 + }, + { + "epoch": 16.68, + "learning_rate": 0.0004099307864738816, + "loss": 0.5539, + "step": 68350 + }, + { + "epoch": 16.68, + "learning_rate": 0.0004098975873535255, + "loss": 0.5938, + "step": 68375 + }, + { + "epoch": 16.69, + "learning_rate": 0.0004098643882331694, + "loss": 0.5765, + "step": 68400 + }, + { + "epoch": 16.7, + "learning_rate": 0.00040983118911281323, + "loss": 0.5873, + "step": 68425 + }, + { + "epoch": 16.7, + "learning_rate": 0.00040979798999245715, + "loss": 0.5986, + "step": 68450 + }, + { + "epoch": 16.71, + "learning_rate": 0.00040976479087210106, + "loss": 0.5746, + "step": 68475 + }, + { + "epoch": 16.72, + "learning_rate": 0.000409731591751745, + "loss": 0.5931, + "step": 68500 + }, + { + "epoch": 16.72, + "learning_rate": 0.0004096983926313889, + "loss": 0.5582, + "step": 68525 + }, + { + "epoch": 16.73, + "learning_rate": 0.00040966519351103275, + "loss": 0.5683, + "step": 68550 + }, + { + "epoch": 16.73, + "learning_rate": 0.0004096319943906766, + "loss": 0.5985, + "step": 68575 + }, + { + "epoch": 16.74, + "learning_rate": 0.0004095987952703205, + "loss": 0.5949, + "step": 68600 + }, + { + "epoch": 16.75, + "learning_rate": 0.00040956559614996444, + "loss": 0.5495, + "step": 68625 + }, + { + "epoch": 16.75, + "learning_rate": 0.0004095323970296083, + "loss": 0.5408, + "step": 68650 + }, + { + "epoch": 16.76, + "learning_rate": 0.0004094991979092522, + "loss": 0.5318, + "step": 68675 + }, + { + "epoch": 16.76, + "learning_rate": 0.0004094659987888961, + "loss": 0.5701, + "step": 68700 + }, + { + "epoch": 16.77, + "learning_rate": 0.00040943279966854, + "loss": 0.5707, + "step": 68725 + }, + { + "epoch": 16.78, + "learning_rate": 0.0004093996005481839, + "loss": 0.5885, + "step": 68750 + }, + { + "epoch": 16.78, + "learning_rate": 0.00040936640142782776, + "loss": 0.5422, + "step": 68775 + }, + { + "epoch": 16.79, + "learning_rate": 0.00040933320230747167, + "loss": 0.598, + "step": 68800 + }, + { + "epoch": 16.79, + "learning_rate": 0.0004093000031871156, + "loss": 0.5318, + "step": 68825 + }, + { + "epoch": 16.8, + "learning_rate": 0.0004092668040667595, + "loss": 0.5587, + "step": 68850 + }, + { + "epoch": 16.81, + "learning_rate": 0.0004092336049464033, + "loss": 0.5803, + "step": 68875 + }, + { + "epoch": 16.81, + "learning_rate": 0.0004092004058260472, + "loss": 0.5688, + "step": 68900 + }, + { + "epoch": 16.82, + "learning_rate": 0.00040916720670569113, + "loss": 0.5538, + "step": 68925 + }, + { + "epoch": 16.83, + "learning_rate": 0.00040913400758533505, + "loss": 0.58, + "step": 68950 + }, + { + "epoch": 16.83, + "learning_rate": 0.00040910080846497896, + "loss": 0.5765, + "step": 68975 + }, + { + "epoch": 16.84, + "learning_rate": 0.0004090676093446228, + "loss": 0.5743, + "step": 69000 + }, + { + "epoch": 16.84, + "eval_cer": 0.1254632814184368, + "eval_loss": 0.45550015568733215, + "eval_runtime": 147.0347, + "eval_samples_per_second": 28.517, + "eval_steps_per_second": 7.134, + "eval_wer": 0.5069168026101142, + "step": 69000 + }, + { + "epoch": 16.84, + "learning_rate": 0.0004090344102242667, + "loss": 0.518, + "step": 69025 + }, + { + "epoch": 16.85, + "learning_rate": 0.0004090012111039106, + "loss": 0.5542, + "step": 69050 + }, + { + "epoch": 16.86, + "learning_rate": 0.0004089680119835545, + "loss": 0.5315, + "step": 69075 + }, + { + "epoch": 16.86, + "learning_rate": 0.00040893481286319837, + "loss": 0.5702, + "step": 69100 + }, + { + "epoch": 16.87, + "learning_rate": 0.0004089016137428423, + "loss": 0.5372, + "step": 69125 + }, + { + "epoch": 16.87, + "learning_rate": 0.0004088684146224862, + "loss": 0.5451, + "step": 69150 + }, + { + "epoch": 16.88, + "learning_rate": 0.00040883521550213006, + "loss": 0.5251, + "step": 69175 + }, + { + "epoch": 16.89, + "learning_rate": 0.00040880201638177397, + "loss": 0.5762, + "step": 69200 + }, + { + "epoch": 16.89, + "learning_rate": 0.00040876881726141783, + "loss": 0.5446, + "step": 69225 + }, + { + "epoch": 16.9, + "learning_rate": 0.00040873561814106174, + "loss": 0.5725, + "step": 69250 + }, + { + "epoch": 16.9, + "learning_rate": 0.00040870241902070566, + "loss": 0.5888, + "step": 69275 + }, + { + "epoch": 16.91, + "learning_rate": 0.00040866921990034957, + "loss": 0.5712, + "step": 69300 + }, + { + "epoch": 16.92, + "learning_rate": 0.0004086360207799934, + "loss": 0.6126, + "step": 69325 + }, + { + "epoch": 16.92, + "learning_rate": 0.0004086028216596373, + "loss": 0.5406, + "step": 69350 + }, + { + "epoch": 16.93, + "learning_rate": 0.0004085696225392812, + "loss": 0.5716, + "step": 69375 + }, + { + "epoch": 16.94, + "learning_rate": 0.0004085364234189251, + "loss": 0.5786, + "step": 69400 + }, + { + "epoch": 16.94, + "learning_rate": 0.00040850322429856903, + "loss": 0.5627, + "step": 69425 + }, + { + "epoch": 16.95, + "learning_rate": 0.0004084700251782129, + "loss": 0.565, + "step": 69450 + }, + { + "epoch": 16.95, + "learning_rate": 0.00040843682605785675, + "loss": 0.55, + "step": 69475 + }, + { + "epoch": 16.96, + "learning_rate": 0.00040840362693750067, + "loss": 0.591, + "step": 69500 + }, + { + "epoch": 16.97, + "learning_rate": 0.0004083704278171446, + "loss": 0.5239, + "step": 69525 + }, + { + "epoch": 16.97, + "learning_rate": 0.00040833722869678844, + "loss": 0.5663, + "step": 69550 + }, + { + "epoch": 16.98, + "learning_rate": 0.00040830402957643235, + "loss": 0.5758, + "step": 69575 + }, + { + "epoch": 16.98, + "learning_rate": 0.00040827083045607627, + "loss": 0.5516, + "step": 69600 + }, + { + "epoch": 16.99, + "learning_rate": 0.00040823763133572013, + "loss": 0.5874, + "step": 69625 + }, + { + "epoch": 17.0, + "learning_rate": 0.00040820443221536404, + "loss": 0.5773, + "step": 69650 + }, + { + "epoch": 17.0, + "learning_rate": 0.00040817256105982213, + "loss": 0.6173, + "step": 69675 + }, + { + "epoch": 17.01, + "learning_rate": 0.00040813936193946605, + "loss": 0.5685, + "step": 69700 + }, + { + "epoch": 17.01, + "learning_rate": 0.00040810616281910996, + "loss": 0.5947, + "step": 69725 + }, + { + "epoch": 17.02, + "learning_rate": 0.0004080729636987539, + "loss": 0.5506, + "step": 69750 + }, + { + "epoch": 17.03, + "learning_rate": 0.00040803976457839773, + "loss": 0.5246, + "step": 69775 + }, + { + "epoch": 17.03, + "learning_rate": 0.00040800656545804165, + "loss": 0.5586, + "step": 69800 + }, + { + "epoch": 17.04, + "learning_rate": 0.0004079733663376855, + "loss": 0.5482, + "step": 69825 + }, + { + "epoch": 17.04, + "learning_rate": 0.0004079401672173294, + "loss": 0.5213, + "step": 69850 + }, + { + "epoch": 17.05, + "learning_rate": 0.00040790696809697333, + "loss": 0.578, + "step": 69875 + }, + { + "epoch": 17.06, + "learning_rate": 0.0004078737689766172, + "loss": 0.5675, + "step": 69900 + }, + { + "epoch": 17.06, + "learning_rate": 0.0004078405698562611, + "loss": 0.5336, + "step": 69925 + }, + { + "epoch": 17.07, + "learning_rate": 0.000407807370735905, + "loss": 0.549, + "step": 69950 + }, + { + "epoch": 17.08, + "learning_rate": 0.0004077741716155489, + "loss": 0.5888, + "step": 69975 + }, + { + "epoch": 17.08, + "learning_rate": 0.00040774097249519274, + "loss": 0.546, + "step": 70000 + }, + { + "epoch": 17.09, + "learning_rate": 0.00040770777337483666, + "loss": 0.5392, + "step": 70025 + }, + { + "epoch": 17.09, + "learning_rate": 0.00040767457425448057, + "loss": 0.5331, + "step": 70050 + }, + { + "epoch": 17.1, + "learning_rate": 0.0004076413751341245, + "loss": 0.4992, + "step": 70075 + }, + { + "epoch": 17.11, + "learning_rate": 0.0004076081760137684, + "loss": 0.5935, + "step": 70100 + }, + { + "epoch": 17.11, + "learning_rate": 0.0004075749768934122, + "loss": 0.5448, + "step": 70125 + }, + { + "epoch": 17.12, + "learning_rate": 0.0004075417777730561, + "loss": 0.5383, + "step": 70150 + }, + { + "epoch": 17.12, + "learning_rate": 0.00040750857865270003, + "loss": 0.5574, + "step": 70175 + }, + { + "epoch": 17.13, + "learning_rate": 0.00040747537953234395, + "loss": 0.5287, + "step": 70200 + }, + { + "epoch": 17.14, + "learning_rate": 0.0004074421804119878, + "loss": 0.5176, + "step": 70225 + }, + { + "epoch": 17.14, + "learning_rate": 0.0004074089812916317, + "loss": 0.514, + "step": 70250 + }, + { + "epoch": 17.15, + "learning_rate": 0.0004073757821712756, + "loss": 0.5223, + "step": 70275 + }, + { + "epoch": 17.15, + "learning_rate": 0.0004073425830509195, + "loss": 0.5599, + "step": 70300 + }, + { + "epoch": 17.16, + "learning_rate": 0.0004073093839305634, + "loss": 0.5492, + "step": 70325 + }, + { + "epoch": 17.17, + "learning_rate": 0.00040727618481020727, + "loss": 0.5432, + "step": 70350 + }, + { + "epoch": 17.17, + "learning_rate": 0.0004072429856898512, + "loss": 0.5706, + "step": 70375 + }, + { + "epoch": 17.18, + "learning_rate": 0.0004072097865694951, + "loss": 0.5642, + "step": 70400 + }, + { + "epoch": 17.19, + "learning_rate": 0.00040717658744913895, + "loss": 0.5706, + "step": 70425 + }, + { + "epoch": 17.19, + "learning_rate": 0.0004071433883287828, + "loss": 0.4991, + "step": 70450 + }, + { + "epoch": 17.2, + "learning_rate": 0.00040711018920842673, + "loss": 0.5495, + "step": 70475 + }, + { + "epoch": 17.2, + "learning_rate": 0.00040707699008807064, + "loss": 0.5227, + "step": 70500 + }, + { + "epoch": 17.21, + "learning_rate": 0.00040704379096771456, + "loss": 0.5789, + "step": 70525 + }, + { + "epoch": 17.22, + "learning_rate": 0.00040701059184735847, + "loss": 0.5442, + "step": 70550 + }, + { + "epoch": 17.22, + "learning_rate": 0.0004069773927270023, + "loss": 0.5567, + "step": 70575 + }, + { + "epoch": 17.23, + "learning_rate": 0.0004069441936066462, + "loss": 0.5408, + "step": 70600 + }, + { + "epoch": 17.23, + "learning_rate": 0.0004069109944862901, + "loss": 0.557, + "step": 70625 + }, + { + "epoch": 17.24, + "learning_rate": 0.000406877795365934, + "loss": 0.5338, + "step": 70650 + }, + { + "epoch": 17.25, + "learning_rate": 0.0004068445962455779, + "loss": 0.5138, + "step": 70675 + }, + { + "epoch": 17.25, + "learning_rate": 0.0004068113971252218, + "loss": 0.5655, + "step": 70700 + }, + { + "epoch": 17.26, + "learning_rate": 0.00040677819800486565, + "loss": 0.5419, + "step": 70725 + }, + { + "epoch": 17.26, + "learning_rate": 0.00040674499888450956, + "loss": 0.5177, + "step": 70750 + }, + { + "epoch": 17.27, + "learning_rate": 0.0004067117997641535, + "loss": 0.5388, + "step": 70775 + }, + { + "epoch": 17.28, + "learning_rate": 0.00040667860064379734, + "loss": 0.5382, + "step": 70800 + }, + { + "epoch": 17.28, + "learning_rate": 0.00040664540152344125, + "loss": 0.5697, + "step": 70825 + }, + { + "epoch": 17.29, + "learning_rate": 0.00040661220240308517, + "loss": 0.5452, + "step": 70850 + }, + { + "epoch": 17.3, + "learning_rate": 0.000406579003282729, + "loss": 0.5611, + "step": 70875 + }, + { + "epoch": 17.3, + "learning_rate": 0.0004065458041623729, + "loss": 0.5321, + "step": 70900 + }, + { + "epoch": 17.31, + "learning_rate": 0.0004065126050420168, + "loss": 0.546, + "step": 70925 + }, + { + "epoch": 17.31, + "learning_rate": 0.0004064794059216607, + "loss": 0.5901, + "step": 70950 + }, + { + "epoch": 17.32, + "learning_rate": 0.00040644620680130463, + "loss": 0.5018, + "step": 70975 + }, + { + "epoch": 17.33, + "learning_rate": 0.00040641300768094854, + "loss": 0.5433, + "step": 71000 + }, + { + "epoch": 17.33, + "learning_rate": 0.00040637980856059235, + "loss": 0.5856, + "step": 71025 + }, + { + "epoch": 17.34, + "learning_rate": 0.00040634660944023626, + "loss": 0.5445, + "step": 71050 + }, + { + "epoch": 17.34, + "learning_rate": 0.0004063134103198802, + "loss": 0.5376, + "step": 71075 + }, + { + "epoch": 17.35, + "learning_rate": 0.0004062802111995241, + "loss": 0.5303, + "step": 71100 + }, + { + "epoch": 17.36, + "learning_rate": 0.000406247012079168, + "loss": 0.5202, + "step": 71125 + }, + { + "epoch": 17.36, + "learning_rate": 0.00040621381295881186, + "loss": 0.5504, + "step": 71150 + }, + { + "epoch": 17.37, + "learning_rate": 0.0004061806138384557, + "loss": 0.5456, + "step": 71175 + }, + { + "epoch": 17.37, + "learning_rate": 0.00040614741471809964, + "loss": 0.565, + "step": 71200 + }, + { + "epoch": 17.38, + "learning_rate": 0.00040611421559774355, + "loss": 0.5316, + "step": 71225 + }, + { + "epoch": 17.39, + "learning_rate": 0.0004060810164773874, + "loss": 0.5479, + "step": 71250 + }, + { + "epoch": 17.39, + "learning_rate": 0.0004060478173570313, + "loss": 0.5441, + "step": 71275 + }, + { + "epoch": 17.4, + "learning_rate": 0.00040601461823667524, + "loss": 0.5295, + "step": 71300 + }, + { + "epoch": 17.4, + "learning_rate": 0.0004059814191163191, + "loss": 0.5384, + "step": 71325 + }, + { + "epoch": 17.41, + "learning_rate": 0.000405948219995963, + "loss": 0.5691, + "step": 71350 + }, + { + "epoch": 17.42, + "learning_rate": 0.00040591502087560687, + "loss": 0.6323, + "step": 71375 + }, + { + "epoch": 17.42, + "learning_rate": 0.0004058818217552508, + "loss": 0.584, + "step": 71400 + }, + { + "epoch": 17.43, + "learning_rate": 0.0004058486226348947, + "loss": 0.5904, + "step": 71425 + }, + { + "epoch": 17.44, + "learning_rate": 0.00040581542351453856, + "loss": 0.56, + "step": 71450 + }, + { + "epoch": 17.44, + "learning_rate": 0.0004057822243941824, + "loss": 0.5599, + "step": 71475 + }, + { + "epoch": 17.45, + "learning_rate": 0.00040574902527382633, + "loss": 0.5294, + "step": 71500 + }, + { + "epoch": 17.45, + "learning_rate": 0.00040571582615347025, + "loss": 0.5451, + "step": 71525 + }, + { + "epoch": 17.46, + "learning_rate": 0.00040568262703311416, + "loss": 0.5828, + "step": 71550 + }, + { + "epoch": 17.47, + "learning_rate": 0.0004056494279127581, + "loss": 0.5037, + "step": 71575 + }, + { + "epoch": 17.47, + "learning_rate": 0.0004056162287924019, + "loss": 0.5308, + "step": 71600 + }, + { + "epoch": 17.48, + "learning_rate": 0.0004055830296720458, + "loss": 0.5456, + "step": 71625 + }, + { + "epoch": 17.48, + "learning_rate": 0.0004055498305516897, + "loss": 0.5405, + "step": 71650 + }, + { + "epoch": 17.49, + "learning_rate": 0.0004055166314313336, + "loss": 0.5725, + "step": 71675 + }, + { + "epoch": 17.5, + "learning_rate": 0.0004054834323109775, + "loss": 0.5379, + "step": 71700 + }, + { + "epoch": 17.5, + "learning_rate": 0.0004054502331906214, + "loss": 0.5498, + "step": 71725 + }, + { + "epoch": 17.51, + "learning_rate": 0.00040541703407026526, + "loss": 0.5228, + "step": 71750 + }, + { + "epoch": 17.51, + "learning_rate": 0.00040538383494990917, + "loss": 0.5078, + "step": 71775 + }, + { + "epoch": 17.52, + "learning_rate": 0.0004053506358295531, + "loss": 0.5552, + "step": 71800 + }, + { + "epoch": 17.53, + "learning_rate": 0.00040531743670919694, + "loss": 0.574, + "step": 71825 + }, + { + "epoch": 17.53, + "learning_rate": 0.00040528423758884086, + "loss": 0.5456, + "step": 71850 + }, + { + "epoch": 17.54, + "learning_rate": 0.00040525103846848477, + "loss": 0.5166, + "step": 71875 + }, + { + "epoch": 17.55, + "learning_rate": 0.00040521783934812863, + "loss": 0.5637, + "step": 71900 + }, + { + "epoch": 17.55, + "learning_rate": 0.0004051846402277725, + "loss": 0.5762, + "step": 71925 + }, + { + "epoch": 17.56, + "learning_rate": 0.0004051514411074164, + "loss": 0.5937, + "step": 71950 + }, + { + "epoch": 17.56, + "learning_rate": 0.0004051182419870603, + "loss": 0.5883, + "step": 71975 + }, + { + "epoch": 17.57, + "learning_rate": 0.00040508504286670423, + "loss": 0.5363, + "step": 72000 + }, + { + "epoch": 17.57, + "eval_cer": 0.12136176503803785, + "eval_loss": 0.4388948678970337, + "eval_runtime": 147.1784, + "eval_samples_per_second": 28.489, + "eval_steps_per_second": 7.127, + "eval_wer": 0.49148450244698205, + "step": 72000 + }, + { + "epoch": 17.58, + "learning_rate": 0.00040505184374634815, + "loss": 0.532, + "step": 72025 + }, + { + "epoch": 17.58, + "learning_rate": 0.00040501864462599195, + "loss": 0.5279, + "step": 72050 + }, + { + "epoch": 17.59, + "learning_rate": 0.00040498544550563587, + "loss": 0.5578, + "step": 72075 + }, + { + "epoch": 17.59, + "learning_rate": 0.0004049522463852798, + "loss": 0.5357, + "step": 72100 + }, + { + "epoch": 17.6, + "learning_rate": 0.0004049190472649237, + "loss": 0.5405, + "step": 72125 + }, + { + "epoch": 17.61, + "learning_rate": 0.00040488584814456755, + "loss": 0.5273, + "step": 72150 + }, + { + "epoch": 17.61, + "learning_rate": 0.00040485264902421147, + "loss": 0.5772, + "step": 72175 + }, + { + "epoch": 17.62, + "learning_rate": 0.00040481944990385533, + "loss": 0.5308, + "step": 72200 + }, + { + "epoch": 17.62, + "learning_rate": 0.00040478625078349924, + "loss": 0.5678, + "step": 72225 + }, + { + "epoch": 17.63, + "learning_rate": 0.00040475305166314316, + "loss": 0.5161, + "step": 72250 + }, + { + "epoch": 17.64, + "learning_rate": 0.000404719852542787, + "loss": 0.5953, + "step": 72275 + }, + { + "epoch": 17.64, + "learning_rate": 0.00040468665342243093, + "loss": 0.5763, + "step": 72300 + }, + { + "epoch": 17.65, + "learning_rate": 0.00040465345430207484, + "loss": 0.545, + "step": 72325 + }, + { + "epoch": 17.65, + "learning_rate": 0.0004046202551817187, + "loss": 0.5738, + "step": 72350 + }, + { + "epoch": 17.66, + "learning_rate": 0.00040458705606136256, + "loss": 0.5208, + "step": 72375 + }, + { + "epoch": 17.67, + "learning_rate": 0.0004045538569410065, + "loss": 0.538, + "step": 72400 + }, + { + "epoch": 17.67, + "learning_rate": 0.0004045206578206504, + "loss": 0.5776, + "step": 72425 + }, + { + "epoch": 17.68, + "learning_rate": 0.0004044874587002943, + "loss": 0.5831, + "step": 72450 + }, + { + "epoch": 17.69, + "learning_rate": 0.0004044542595799382, + "loss": 0.5136, + "step": 72475 + }, + { + "epoch": 17.69, + "learning_rate": 0.000404421060459582, + "loss": 0.5116, + "step": 72500 + }, + { + "epoch": 17.7, + "learning_rate": 0.00040438786133922594, + "loss": 0.5752, + "step": 72525 + }, + { + "epoch": 17.7, + "learning_rate": 0.00040435466221886985, + "loss": 0.5525, + "step": 72550 + }, + { + "epoch": 17.71, + "learning_rate": 0.00040432146309851377, + "loss": 0.5546, + "step": 72575 + }, + { + "epoch": 17.72, + "learning_rate": 0.0004042882639781577, + "loss": 0.5408, + "step": 72600 + }, + { + "epoch": 17.72, + "learning_rate": 0.00040425506485780154, + "loss": 0.5833, + "step": 72625 + }, + { + "epoch": 17.73, + "learning_rate": 0.0004042218657374454, + "loss": 0.565, + "step": 72650 + }, + { + "epoch": 17.73, + "learning_rate": 0.0004041886666170893, + "loss": 0.5366, + "step": 72675 + }, + { + "epoch": 17.74, + "learning_rate": 0.00040415546749673323, + "loss": 0.5232, + "step": 72700 + }, + { + "epoch": 17.75, + "learning_rate": 0.0004041222683763771, + "loss": 0.5818, + "step": 72725 + }, + { + "epoch": 17.75, + "learning_rate": 0.000404089069256021, + "loss": 0.541, + "step": 72750 + }, + { + "epoch": 17.76, + "learning_rate": 0.0004040558701356649, + "loss": 0.5453, + "step": 72775 + }, + { + "epoch": 17.76, + "learning_rate": 0.0004040226710153088, + "loss": 0.5412, + "step": 72800 + }, + { + "epoch": 17.77, + "learning_rate": 0.0004039894718949527, + "loss": 0.5513, + "step": 72825 + }, + { + "epoch": 17.78, + "learning_rate": 0.00040395627277459655, + "loss": 0.5736, + "step": 72850 + }, + { + "epoch": 17.78, + "learning_rate": 0.00040392307365424046, + "loss": 0.5623, + "step": 72875 + }, + { + "epoch": 17.79, + "learning_rate": 0.0004038898745338844, + "loss": 0.5901, + "step": 72900 + }, + { + "epoch": 17.8, + "learning_rate": 0.0004038566754135283, + "loss": 0.5831, + "step": 72925 + }, + { + "epoch": 17.8, + "learning_rate": 0.0004038234762931721, + "loss": 0.5359, + "step": 72950 + }, + { + "epoch": 17.81, + "learning_rate": 0.000403790277172816, + "loss": 0.6014, + "step": 72975 + }, + { + "epoch": 17.81, + "learning_rate": 0.0004037570780524599, + "loss": 0.5446, + "step": 73000 + }, + { + "epoch": 17.82, + "learning_rate": 0.00040372387893210384, + "loss": 0.4802, + "step": 73025 + }, + { + "epoch": 17.83, + "learning_rate": 0.00040369067981174775, + "loss": 0.5288, + "step": 73050 + }, + { + "epoch": 17.83, + "learning_rate": 0.0004036574806913916, + "loss": 0.5275, + "step": 73075 + }, + { + "epoch": 17.84, + "learning_rate": 0.0004036242815710355, + "loss": 0.5719, + "step": 73100 + }, + { + "epoch": 17.84, + "learning_rate": 0.0004035910824506794, + "loss": 0.5496, + "step": 73125 + }, + { + "epoch": 17.85, + "learning_rate": 0.0004035578833303233, + "loss": 0.5475, + "step": 73150 + }, + { + "epoch": 17.86, + "learning_rate": 0.00040352468420996716, + "loss": 0.5142, + "step": 73175 + }, + { + "epoch": 17.86, + "learning_rate": 0.0004034914850896111, + "loss": 0.5324, + "step": 73200 + }, + { + "epoch": 17.87, + "learning_rate": 0.000403458285969255, + "loss": 0.5521, + "step": 73225 + }, + { + "epoch": 17.87, + "learning_rate": 0.00040342508684889885, + "loss": 0.546, + "step": 73250 + }, + { + "epoch": 17.88, + "learning_rate": 0.00040339188772854276, + "loss": 0.5351, + "step": 73275 + }, + { + "epoch": 17.89, + "learning_rate": 0.0004033586886081866, + "loss": 0.5669, + "step": 73300 + }, + { + "epoch": 17.89, + "learning_rate": 0.00040332548948783054, + "loss": 0.5633, + "step": 73325 + }, + { + "epoch": 17.9, + "learning_rate": 0.00040329229036747445, + "loss": 0.5263, + "step": 73350 + }, + { + "epoch": 17.91, + "learning_rate": 0.00040325909124711836, + "loss": 0.5618, + "step": 73375 + }, + { + "epoch": 17.91, + "learning_rate": 0.00040322589212676217, + "loss": 0.545, + "step": 73400 + }, + { + "epoch": 17.92, + "learning_rate": 0.0004031926930064061, + "loss": 0.5756, + "step": 73425 + }, + { + "epoch": 17.92, + "learning_rate": 0.00040315949388605, + "loss": 0.565, + "step": 73450 + }, + { + "epoch": 17.93, + "learning_rate": 0.0004031262947656939, + "loss": 0.5497, + "step": 73475 + }, + { + "epoch": 17.94, + "learning_rate": 0.0004030930956453378, + "loss": 0.558, + "step": 73500 + }, + { + "epoch": 17.94, + "learning_rate": 0.0004030598965249817, + "loss": 0.5668, + "step": 73525 + }, + { + "epoch": 17.95, + "learning_rate": 0.00040302669740462555, + "loss": 0.5363, + "step": 73550 + }, + { + "epoch": 17.95, + "learning_rate": 0.00040299349828426946, + "loss": 0.5227, + "step": 73575 + }, + { + "epoch": 17.96, + "learning_rate": 0.0004029602991639134, + "loss": 0.5817, + "step": 73600 + }, + { + "epoch": 17.97, + "learning_rate": 0.00040292710004355723, + "loss": 0.557, + "step": 73625 + }, + { + "epoch": 17.97, + "learning_rate": 0.00040289390092320115, + "loss": 0.5853, + "step": 73650 + }, + { + "epoch": 17.98, + "learning_rate": 0.00040286070180284506, + "loss": 0.5487, + "step": 73675 + }, + { + "epoch": 17.98, + "learning_rate": 0.0004028275026824889, + "loss": 0.6219, + "step": 73700 + }, + { + "epoch": 17.99, + "learning_rate": 0.00040279430356213283, + "loss": 0.5515, + "step": 73725 + }, + { + "epoch": 18.0, + "learning_rate": 0.0004027611044417767, + "loss": 0.5403, + "step": 73750 + }, + { + "epoch": 18.0, + "learning_rate": 0.0004027279053214206, + "loss": 0.5723, + "step": 73775 + }, + { + "epoch": 18.01, + "learning_rate": 0.0004026947062010645, + "loss": 0.5326, + "step": 73800 + }, + { + "epoch": 18.01, + "learning_rate": 0.00040266150708070844, + "loss": 0.5321, + "step": 73825 + }, + { + "epoch": 18.02, + "learning_rate": 0.0004026283079603523, + "loss": 0.4971, + "step": 73850 + }, + { + "epoch": 18.03, + "learning_rate": 0.00040259510883999616, + "loss": 0.517, + "step": 73875 + }, + { + "epoch": 18.03, + "learning_rate": 0.00040256190971964007, + "loss": 0.4976, + "step": 73900 + }, + { + "epoch": 18.04, + "learning_rate": 0.000402528710599284, + "loss": 0.5843, + "step": 73925 + }, + { + "epoch": 18.05, + "learning_rate": 0.0004024955114789279, + "loss": 0.5477, + "step": 73950 + }, + { + "epoch": 18.05, + "learning_rate": 0.00040246231235857176, + "loss": 0.5345, + "step": 73975 + }, + { + "epoch": 18.06, + "learning_rate": 0.0004024291132382156, + "loss": 0.5536, + "step": 74000 + }, + { + "epoch": 18.06, + "learning_rate": 0.00040239591411785953, + "loss": 0.5754, + "step": 74025 + }, + { + "epoch": 18.07, + "learning_rate": 0.00040236271499750345, + "loss": 0.5296, + "step": 74050 + }, + { + "epoch": 18.08, + "learning_rate": 0.00040232951587714736, + "loss": 0.5145, + "step": 74075 + }, + { + "epoch": 18.08, + "learning_rate": 0.0004022963167567912, + "loss": 0.5274, + "step": 74100 + }, + { + "epoch": 18.09, + "learning_rate": 0.00040226311763643513, + "loss": 0.5229, + "step": 74125 + }, + { + "epoch": 18.09, + "learning_rate": 0.000402229918516079, + "loss": 0.489, + "step": 74150 + }, + { + "epoch": 18.1, + "learning_rate": 0.0004021967193957229, + "loss": 0.5586, + "step": 74175 + }, + { + "epoch": 18.11, + "learning_rate": 0.00040216352027536677, + "loss": 0.5578, + "step": 74200 + }, + { + "epoch": 18.11, + "learning_rate": 0.0004021303211550107, + "loss": 0.5274, + "step": 74225 + }, + { + "epoch": 18.12, + "learning_rate": 0.0004020971220346546, + "loss": 0.5554, + "step": 74250 + }, + { + "epoch": 18.12, + "learning_rate": 0.0004020639229142985, + "loss": 0.5502, + "step": 74275 + }, + { + "epoch": 18.13, + "learning_rate": 0.00040203072379394237, + "loss": 0.5322, + "step": 74300 + }, + { + "epoch": 18.14, + "learning_rate": 0.00040199752467358623, + "loss": 0.4957, + "step": 74325 + }, + { + "epoch": 18.14, + "learning_rate": 0.00040196432555323014, + "loss": 0.483, + "step": 74350 + }, + { + "epoch": 18.15, + "learning_rate": 0.00040193112643287406, + "loss": 0.5155, + "step": 74375 + }, + { + "epoch": 18.16, + "learning_rate": 0.00040189792731251797, + "loss": 0.5262, + "step": 74400 + }, + { + "epoch": 18.16, + "learning_rate": 0.00040186472819216183, + "loss": 0.5277, + "step": 74425 + }, + { + "epoch": 18.17, + "learning_rate": 0.0004018315290718057, + "loss": 0.5151, + "step": 74450 + }, + { + "epoch": 18.17, + "learning_rate": 0.0004017983299514496, + "loss": 0.5304, + "step": 74475 + }, + { + "epoch": 18.18, + "learning_rate": 0.0004017651308310935, + "loss": 0.5293, + "step": 74500 + }, + { + "epoch": 18.19, + "learning_rate": 0.00040173193171073743, + "loss": 0.5295, + "step": 74525 + }, + { + "epoch": 18.19, + "learning_rate": 0.0004016987325903813, + "loss": 0.537, + "step": 74550 + }, + { + "epoch": 18.2, + "learning_rate": 0.0004016655334700252, + "loss": 0.545, + "step": 74575 + }, + { + "epoch": 18.2, + "learning_rate": 0.00040163233434966906, + "loss": 0.5087, + "step": 74600 + }, + { + "epoch": 18.21, + "learning_rate": 0.000401599135229313, + "loss": 0.4987, + "step": 74625 + }, + { + "epoch": 18.22, + "learning_rate": 0.00040156593610895684, + "loss": 0.5241, + "step": 74650 + }, + { + "epoch": 18.22, + "learning_rate": 0.00040153273698860075, + "loss": 0.5354, + "step": 74675 + }, + { + "epoch": 18.23, + "learning_rate": 0.00040149953786824467, + "loss": 0.5366, + "step": 74700 + }, + { + "epoch": 18.23, + "learning_rate": 0.0004014663387478886, + "loss": 0.5404, + "step": 74725 + }, + { + "epoch": 18.24, + "learning_rate": 0.00040143313962753244, + "loss": 0.5026, + "step": 74750 + }, + { + "epoch": 18.25, + "learning_rate": 0.0004013999405071763, + "loss": 0.5621, + "step": 74775 + }, + { + "epoch": 18.25, + "learning_rate": 0.0004013667413868202, + "loss": 0.5328, + "step": 74800 + }, + { + "epoch": 18.26, + "learning_rate": 0.00040133354226646413, + "loss": 0.5611, + "step": 74825 + }, + { + "epoch": 18.27, + "learning_rate": 0.00040130034314610804, + "loss": 0.521, + "step": 74850 + }, + { + "epoch": 18.27, + "learning_rate": 0.00040126714402575196, + "loss": 0.5469, + "step": 74875 + }, + { + "epoch": 18.28, + "learning_rate": 0.00040123394490539576, + "loss": 0.5093, + "step": 74900 + }, + { + "epoch": 18.28, + "learning_rate": 0.0004012007457850397, + "loss": 0.5601, + "step": 74925 + }, + { + "epoch": 18.29, + "learning_rate": 0.0004011675466646836, + "loss": 0.5073, + "step": 74950 + }, + { + "epoch": 18.3, + "learning_rate": 0.0004011343475443275, + "loss": 0.5758, + "step": 74975 + }, + { + "epoch": 18.3, + "learning_rate": 0.0004011024763887856, + "loss": 0.5078, + "step": 75000 + }, + { + "epoch": 18.3, + "eval_cer": 0.12220362822500333, + "eval_loss": 0.45253750681877136, + "eval_runtime": 147.3668, + "eval_samples_per_second": 28.453, + "eval_steps_per_second": 7.118, + "eval_wer": 0.49151712887438825, + "step": 75000 + }, + { + "epoch": 18.31, + "learning_rate": 0.0004010692772684295, + "loss": 0.5379, + "step": 75025 + }, + { + "epoch": 18.31, + "learning_rate": 0.0004010360781480734, + "loss": 0.5546, + "step": 75050 + }, + { + "epoch": 18.32, + "learning_rate": 0.00040100287902771734, + "loss": 0.5149, + "step": 75075 + }, + { + "epoch": 18.33, + "learning_rate": 0.00040096967990736114, + "loss": 0.5255, + "step": 75100 + }, + { + "epoch": 18.33, + "learning_rate": 0.00040093648078700505, + "loss": 0.5352, + "step": 75125 + }, + { + "epoch": 18.34, + "learning_rate": 0.00040090328166664897, + "loss": 0.4802, + "step": 75150 + }, + { + "epoch": 18.34, + "learning_rate": 0.0004008700825462929, + "loss": 0.5256, + "step": 75175 + }, + { + "epoch": 18.35, + "learning_rate": 0.0004008368834259368, + "loss": 0.5439, + "step": 75200 + }, + { + "epoch": 18.36, + "learning_rate": 0.00040080368430558066, + "loss": 0.516, + "step": 75225 + }, + { + "epoch": 18.36, + "learning_rate": 0.0004007704851852245, + "loss": 0.5687, + "step": 75250 + }, + { + "epoch": 18.37, + "learning_rate": 0.00040073728606486843, + "loss": 0.5459, + "step": 75275 + }, + { + "epoch": 18.37, + "learning_rate": 0.00040070408694451234, + "loss": 0.5233, + "step": 75300 + }, + { + "epoch": 18.38, + "learning_rate": 0.0004006708878241562, + "loss": 0.5328, + "step": 75325 + }, + { + "epoch": 18.39, + "learning_rate": 0.0004006376887038001, + "loss": 0.5247, + "step": 75350 + }, + { + "epoch": 18.39, + "learning_rate": 0.00040060448958344403, + "loss": 0.5751, + "step": 75375 + }, + { + "epoch": 18.4, + "learning_rate": 0.0004005712904630879, + "loss": 0.5215, + "step": 75400 + }, + { + "epoch": 18.41, + "learning_rate": 0.0004005380913427318, + "loss": 0.5242, + "step": 75425 + }, + { + "epoch": 18.41, + "learning_rate": 0.00040050489222237567, + "loss": 0.5205, + "step": 75450 + }, + { + "epoch": 18.42, + "learning_rate": 0.0004004716931020196, + "loss": 0.5528, + "step": 75475 + }, + { + "epoch": 18.42, + "learning_rate": 0.0004004384939816635, + "loss": 0.5264, + "step": 75500 + }, + { + "epoch": 18.43, + "learning_rate": 0.0004004052948613074, + "loss": 0.4788, + "step": 75525 + }, + { + "epoch": 18.44, + "learning_rate": 0.0004003720957409512, + "loss": 0.512, + "step": 75550 + }, + { + "epoch": 18.44, + "learning_rate": 0.0004003388966205951, + "loss": 0.5212, + "step": 75575 + }, + { + "epoch": 18.45, + "learning_rate": 0.00040030569750023904, + "loss": 0.5449, + "step": 75600 + }, + { + "epoch": 18.45, + "learning_rate": 0.00040027249837988295, + "loss": 0.5017, + "step": 75625 + }, + { + "epoch": 18.46, + "learning_rate": 0.00040023929925952687, + "loss": 0.5355, + "step": 75650 + }, + { + "epoch": 18.47, + "learning_rate": 0.00040020610013917073, + "loss": 0.5656, + "step": 75675 + }, + { + "epoch": 18.47, + "learning_rate": 0.0004001729010188146, + "loss": 0.5639, + "step": 75700 + }, + { + "epoch": 18.48, + "learning_rate": 0.0004001397018984585, + "loss": 0.5351, + "step": 75725 + }, + { + "epoch": 18.48, + "learning_rate": 0.0004001065027781024, + "loss": 0.506, + "step": 75750 + }, + { + "epoch": 18.49, + "learning_rate": 0.0004000733036577463, + "loss": 0.5343, + "step": 75775 + }, + { + "epoch": 18.5, + "learning_rate": 0.0004000401045373902, + "loss": 0.5089, + "step": 75800 + }, + { + "epoch": 18.5, + "learning_rate": 0.0004000069054170341, + "loss": 0.565, + "step": 75825 + }, + { + "epoch": 18.51, + "learning_rate": 0.00039997370629667796, + "loss": 0.5275, + "step": 75850 + }, + { + "epoch": 18.52, + "learning_rate": 0.0003999405071763219, + "loss": 0.532, + "step": 75875 + }, + { + "epoch": 18.52, + "learning_rate": 0.00039990730805596574, + "loss": 0.5424, + "step": 75900 + }, + { + "epoch": 18.53, + "learning_rate": 0.0003998754369004239, + "loss": 0.5468, + "step": 75925 + }, + { + "epoch": 18.53, + "learning_rate": 0.0003998422377800678, + "loss": 0.5039, + "step": 75950 + }, + { + "epoch": 18.54, + "learning_rate": 0.0003998090386597117, + "loss": 0.5426, + "step": 75975 + }, + { + "epoch": 18.55, + "learning_rate": 0.00039977583953935557, + "loss": 0.5072, + "step": 76000 + }, + { + "epoch": 18.55, + "learning_rate": 0.0003997426404189995, + "loss": 0.5543, + "step": 76025 + }, + { + "epoch": 18.56, + "learning_rate": 0.00039970944129864334, + "loss": 0.5615, + "step": 76050 + }, + { + "epoch": 18.56, + "learning_rate": 0.00039967624217828726, + "loss": 0.5061, + "step": 76075 + }, + { + "epoch": 18.57, + "learning_rate": 0.0003996430430579311, + "loss": 0.5508, + "step": 76100 + }, + { + "epoch": 18.58, + "learning_rate": 0.00039960984393757503, + "loss": 0.5134, + "step": 76125 + }, + { + "epoch": 18.58, + "learning_rate": 0.00039957664481721895, + "loss": 0.5097, + "step": 76150 + }, + { + "epoch": 18.59, + "learning_rate": 0.00039954344569686286, + "loss": 0.4996, + "step": 76175 + }, + { + "epoch": 18.59, + "learning_rate": 0.0003995102465765067, + "loss": 0.4972, + "step": 76200 + }, + { + "epoch": 18.6, + "learning_rate": 0.0003994770474561506, + "loss": 0.562, + "step": 76225 + }, + { + "epoch": 18.61, + "learning_rate": 0.0003994438483357945, + "loss": 0.5387, + "step": 76250 + }, + { + "epoch": 18.61, + "learning_rate": 0.0003994106492154384, + "loss": 0.5599, + "step": 76275 + }, + { + "epoch": 18.62, + "learning_rate": 0.0003993774500950823, + "loss": 0.533, + "step": 76300 + }, + { + "epoch": 18.62, + "learning_rate": 0.00039934425097472623, + "loss": 0.552, + "step": 76325 + }, + { + "epoch": 18.63, + "learning_rate": 0.00039931105185437004, + "loss": 0.5328, + "step": 76350 + }, + { + "epoch": 18.64, + "learning_rate": 0.00039927785273401395, + "loss": 0.5625, + "step": 76375 + }, + { + "epoch": 18.64, + "learning_rate": 0.00039924465361365787, + "loss": 0.5635, + "step": 76400 + }, + { + "epoch": 18.65, + "learning_rate": 0.0003992114544933018, + "loss": 0.5886, + "step": 76425 + }, + { + "epoch": 18.66, + "learning_rate": 0.00039917825537294564, + "loss": 0.5375, + "step": 76450 + }, + { + "epoch": 18.66, + "learning_rate": 0.00039914505625258956, + "loss": 0.5109, + "step": 76475 + }, + { + "epoch": 18.67, + "learning_rate": 0.0003991118571322334, + "loss": 0.5455, + "step": 76500 + }, + { + "epoch": 18.67, + "learning_rate": 0.00039907865801187733, + "loss": 0.5416, + "step": 76525 + }, + { + "epoch": 18.68, + "learning_rate": 0.00039904545889152124, + "loss": 0.5739, + "step": 76550 + }, + { + "epoch": 18.69, + "learning_rate": 0.0003990122597711651, + "loss": 0.5392, + "step": 76575 + }, + { + "epoch": 18.69, + "learning_rate": 0.000398979060650809, + "loss": 0.5753, + "step": 76600 + }, + { + "epoch": 18.7, + "learning_rate": 0.00039894586153045293, + "loss": 0.5331, + "step": 76625 + }, + { + "epoch": 18.7, + "learning_rate": 0.0003989126624100968, + "loss": 0.5166, + "step": 76650 + }, + { + "epoch": 18.71, + "learning_rate": 0.00039887946328974065, + "loss": 0.5217, + "step": 76675 + }, + { + "epoch": 18.72, + "learning_rate": 0.00039884626416938456, + "loss": 0.5389, + "step": 76700 + }, + { + "epoch": 18.72, + "learning_rate": 0.0003988130650490285, + "loss": 0.5295, + "step": 76725 + }, + { + "epoch": 18.73, + "learning_rate": 0.0003987798659286724, + "loss": 0.5699, + "step": 76750 + }, + { + "epoch": 18.73, + "learning_rate": 0.00039874666680831625, + "loss": 0.5373, + "step": 76775 + }, + { + "epoch": 18.74, + "learning_rate": 0.0003987134676879601, + "loss": 0.498, + "step": 76800 + }, + { + "epoch": 18.75, + "learning_rate": 0.000398680268567604, + "loss": 0.5534, + "step": 76825 + }, + { + "epoch": 18.75, + "learning_rate": 0.00039864706944724794, + "loss": 0.5273, + "step": 76850 + }, + { + "epoch": 18.76, + "learning_rate": 0.00039861387032689185, + "loss": 0.5369, + "step": 76875 + }, + { + "epoch": 18.77, + "learning_rate": 0.0003985806712065357, + "loss": 0.5222, + "step": 76900 + }, + { + "epoch": 18.77, + "learning_rate": 0.0003985474720861796, + "loss": 0.5316, + "step": 76925 + }, + { + "epoch": 18.78, + "learning_rate": 0.0003985142729658235, + "loss": 0.5146, + "step": 76950 + }, + { + "epoch": 18.78, + "learning_rate": 0.0003984810738454674, + "loss": 0.5384, + "step": 76975 + }, + { + "epoch": 18.79, + "learning_rate": 0.0003984478747251113, + "loss": 0.5177, + "step": 77000 + }, + { + "epoch": 18.8, + "learning_rate": 0.0003984146756047552, + "loss": 0.5552, + "step": 77025 + }, + { + "epoch": 18.8, + "learning_rate": 0.0003983814764843991, + "loss": 0.5154, + "step": 77050 + }, + { + "epoch": 18.81, + "learning_rate": 0.00039834827736404295, + "loss": 0.5189, + "step": 77075 + }, + { + "epoch": 18.81, + "learning_rate": 0.00039831507824368686, + "loss": 0.5299, + "step": 77100 + }, + { + "epoch": 18.82, + "learning_rate": 0.0003982818791233307, + "loss": 0.4983, + "step": 77125 + }, + { + "epoch": 18.83, + "learning_rate": 0.00039824868000297464, + "loss": 0.5253, + "step": 77150 + }, + { + "epoch": 18.83, + "learning_rate": 0.00039821548088261855, + "loss": 0.5739, + "step": 77175 + }, + { + "epoch": 18.84, + "learning_rate": 0.00039818228176226246, + "loss": 0.5569, + "step": 77200 + }, + { + "epoch": 18.84, + "learning_rate": 0.0003981490826419063, + "loss": 0.5496, + "step": 77225 + }, + { + "epoch": 18.85, + "learning_rate": 0.0003981158835215502, + "loss": 0.5505, + "step": 77250 + }, + { + "epoch": 18.86, + "learning_rate": 0.0003980826844011941, + "loss": 0.5687, + "step": 77275 + }, + { + "epoch": 18.86, + "learning_rate": 0.000398049485280838, + "loss": 0.556, + "step": 77300 + }, + { + "epoch": 18.87, + "learning_rate": 0.0003980162861604819, + "loss": 0.5188, + "step": 77325 + }, + { + "epoch": 18.88, + "learning_rate": 0.0003979830870401258, + "loss": 0.5799, + "step": 77350 + }, + { + "epoch": 18.88, + "learning_rate": 0.00039794988791976965, + "loss": 0.5696, + "step": 77375 + }, + { + "epoch": 18.89, + "learning_rate": 0.00039791668879941356, + "loss": 0.53, + "step": 77400 + }, + { + "epoch": 18.89, + "learning_rate": 0.0003978834896790575, + "loss": 0.5746, + "step": 77425 + }, + { + "epoch": 18.9, + "learning_rate": 0.0003978502905587014, + "loss": 0.5483, + "step": 77450 + }, + { + "epoch": 18.91, + "learning_rate": 0.00039781709143834525, + "loss": 0.5689, + "step": 77475 + }, + { + "epoch": 18.91, + "learning_rate": 0.00039778389231798916, + "loss": 0.5191, + "step": 77500 + }, + { + "epoch": 18.92, + "learning_rate": 0.000397750693197633, + "loss": 0.5588, + "step": 77525 + }, + { + "epoch": 18.92, + "learning_rate": 0.00039771749407727694, + "loss": 0.5028, + "step": 77550 + }, + { + "epoch": 18.93, + "learning_rate": 0.00039768429495692085, + "loss": 0.5064, + "step": 77575 + }, + { + "epoch": 18.94, + "learning_rate": 0.0003976510958365647, + "loss": 0.5281, + "step": 77600 + }, + { + "epoch": 18.94, + "learning_rate": 0.0003976178967162086, + "loss": 0.5584, + "step": 77625 + }, + { + "epoch": 18.95, + "learning_rate": 0.00039758469759585254, + "loss": 0.5377, + "step": 77650 + }, + { + "epoch": 18.95, + "learning_rate": 0.0003975514984754964, + "loss": 0.494, + "step": 77675 + }, + { + "epoch": 18.96, + "learning_rate": 0.00039751829935514026, + "loss": 0.5384, + "step": 77700 + }, + { + "epoch": 18.97, + "learning_rate": 0.00039748510023478417, + "loss": 0.5086, + "step": 77725 + }, + { + "epoch": 18.97, + "learning_rate": 0.0003974519011144281, + "loss": 0.555, + "step": 77750 + }, + { + "epoch": 18.98, + "learning_rate": 0.000397418701994072, + "loss": 0.5202, + "step": 77775 + }, + { + "epoch": 18.98, + "learning_rate": 0.0003973855028737159, + "loss": 0.5353, + "step": 77800 + }, + { + "epoch": 18.99, + "learning_rate": 0.0003973523037533597, + "loss": 0.5747, + "step": 77825 + }, + { + "epoch": 19.0, + "learning_rate": 0.00039731910463300363, + "loss": 0.4983, + "step": 77850 + }, + { + "epoch": 19.0, + "learning_rate": 0.00039728590551264755, + "loss": 0.5076, + "step": 77875 + }, + { + "epoch": 19.01, + "learning_rate": 0.00039725270639229146, + "loss": 0.5359, + "step": 77900 + }, + { + "epoch": 19.02, + "learning_rate": 0.0003972195072719353, + "loss": 0.5673, + "step": 77925 + }, + { + "epoch": 19.02, + "learning_rate": 0.00039718630815157923, + "loss": 0.5096, + "step": 77950 + }, + { + "epoch": 19.03, + "learning_rate": 0.0003971531090312231, + "loss": 0.5204, + "step": 77975 + }, + { + "epoch": 19.03, + "learning_rate": 0.000397119909910867, + "loss": 0.5075, + "step": 78000 + }, + { + "epoch": 19.03, + "eval_cer": 0.12079710070531709, + "eval_loss": 0.45315462350845337, + "eval_runtime": 146.6782, + "eval_samples_per_second": 28.586, + "eval_steps_per_second": 7.152, + "eval_wer": 0.4871451876019576, + "step": 78000 + }, + { + "epoch": 19.04, + "learning_rate": 0.0003970867107905109, + "loss": 0.5106, + "step": 78025 + }, + { + "epoch": 19.05, + "learning_rate": 0.0003970535116701548, + "loss": 0.4838, + "step": 78050 + }, + { + "epoch": 19.05, + "learning_rate": 0.0003970203125497987, + "loss": 0.5528, + "step": 78075 + }, + { + "epoch": 19.06, + "learning_rate": 0.0003969871134294426, + "loss": 0.469, + "step": 78100 + }, + { + "epoch": 19.06, + "learning_rate": 0.00039695391430908647, + "loss": 0.4894, + "step": 78125 + }, + { + "epoch": 19.07, + "learning_rate": 0.00039692071518873033, + "loss": 0.4993, + "step": 78150 + }, + { + "epoch": 19.08, + "learning_rate": 0.00039688751606837424, + "loss": 0.5519, + "step": 78175 + }, + { + "epoch": 19.08, + "learning_rate": 0.00039685431694801816, + "loss": 0.5083, + "step": 78200 + }, + { + "epoch": 19.09, + "learning_rate": 0.00039682111782766207, + "loss": 0.5324, + "step": 78225 + }, + { + "epoch": 19.09, + "learning_rate": 0.000396787918707306, + "loss": 0.4881, + "step": 78250 + }, + { + "epoch": 19.1, + "learning_rate": 0.0003967547195869498, + "loss": 0.5419, + "step": 78275 + }, + { + "epoch": 19.11, + "learning_rate": 0.0003967215204665937, + "loss": 0.5162, + "step": 78300 + }, + { + "epoch": 19.11, + "learning_rate": 0.0003966883213462376, + "loss": 0.5256, + "step": 78325 + }, + { + "epoch": 19.12, + "learning_rate": 0.00039665512222588153, + "loss": 0.4996, + "step": 78350 + }, + { + "epoch": 19.13, + "learning_rate": 0.0003966219231055254, + "loss": 0.5156, + "step": 78375 + }, + { + "epoch": 19.13, + "learning_rate": 0.0003965887239851693, + "loss": 0.4767, + "step": 78400 + }, + { + "epoch": 19.14, + "learning_rate": 0.00039655552486481317, + "loss": 0.4836, + "step": 78425 + }, + { + "epoch": 19.14, + "learning_rate": 0.0003965223257444571, + "loss": 0.5414, + "step": 78450 + }, + { + "epoch": 19.15, + "learning_rate": 0.000396489126624101, + "loss": 0.4985, + "step": 78475 + }, + { + "epoch": 19.16, + "learning_rate": 0.00039645592750374485, + "loss": 0.5329, + "step": 78500 + }, + { + "epoch": 19.16, + "learning_rate": 0.00039642272838338877, + "loss": 0.5244, + "step": 78525 + }, + { + "epoch": 19.17, + "learning_rate": 0.0003963895292630327, + "loss": 0.4926, + "step": 78550 + }, + { + "epoch": 19.17, + "learning_rate": 0.00039635633014267654, + "loss": 0.4931, + "step": 78575 + }, + { + "epoch": 19.18, + "learning_rate": 0.0003963231310223204, + "loss": 0.5234, + "step": 78600 + }, + { + "epoch": 19.19, + "learning_rate": 0.0003962899319019643, + "loss": 0.5165, + "step": 78625 + }, + { + "epoch": 19.19, + "learning_rate": 0.00039625673278160823, + "loss": 0.5369, + "step": 78650 + }, + { + "epoch": 19.2, + "learning_rate": 0.00039622353366125214, + "loss": 0.4852, + "step": 78675 + }, + { + "epoch": 19.2, + "learning_rate": 0.00039619033454089606, + "loss": 0.4958, + "step": 78700 + }, + { + "epoch": 19.21, + "learning_rate": 0.00039615713542053986, + "loss": 0.4935, + "step": 78725 + }, + { + "epoch": 19.22, + "learning_rate": 0.0003961239363001838, + "loss": 0.5221, + "step": 78750 + }, + { + "epoch": 19.22, + "learning_rate": 0.0003960907371798277, + "loss": 0.5487, + "step": 78775 + }, + { + "epoch": 19.23, + "learning_rate": 0.0003960575380594716, + "loss": 0.5195, + "step": 78800 + }, + { + "epoch": 19.23, + "learning_rate": 0.0003960243389391155, + "loss": 0.5316, + "step": 78825 + }, + { + "epoch": 19.24, + "learning_rate": 0.0003959911398187594, + "loss": 0.5014, + "step": 78850 + }, + { + "epoch": 19.25, + "learning_rate": 0.00039595794069840324, + "loss": 0.5431, + "step": 78875 + }, + { + "epoch": 19.25, + "learning_rate": 0.00039592474157804715, + "loss": 0.5156, + "step": 78900 + }, + { + "epoch": 19.26, + "learning_rate": 0.00039589154245769107, + "loss": 0.5367, + "step": 78925 + }, + { + "epoch": 19.27, + "learning_rate": 0.0003958583433373349, + "loss": 0.4882, + "step": 78950 + }, + { + "epoch": 19.27, + "learning_rate": 0.00039582514421697884, + "loss": 0.51, + "step": 78975 + }, + { + "epoch": 19.28, + "learning_rate": 0.00039579194509662275, + "loss": 0.4833, + "step": 79000 + }, + { + "epoch": 19.28, + "learning_rate": 0.0003957587459762666, + "loss": 0.5326, + "step": 79025 + }, + { + "epoch": 19.29, + "learning_rate": 0.0003957255468559105, + "loss": 0.4977, + "step": 79050 + }, + { + "epoch": 19.3, + "learning_rate": 0.0003956923477355544, + "loss": 0.5499, + "step": 79075 + }, + { + "epoch": 19.3, + "learning_rate": 0.0003956591486151983, + "loss": 0.5187, + "step": 79100 + }, + { + "epoch": 19.31, + "learning_rate": 0.0003956259494948422, + "loss": 0.5257, + "step": 79125 + }, + { + "epoch": 19.31, + "learning_rate": 0.00039559275037448613, + "loss": 0.5253, + "step": 79150 + }, + { + "epoch": 19.32, + "learning_rate": 0.00039555955125412993, + "loss": 0.5119, + "step": 79175 + }, + { + "epoch": 19.33, + "learning_rate": 0.00039552635213377385, + "loss": 0.5149, + "step": 79200 + }, + { + "epoch": 19.33, + "learning_rate": 0.00039549315301341776, + "loss": 0.5461, + "step": 79225 + }, + { + "epoch": 19.34, + "learning_rate": 0.0003954599538930617, + "loss": 0.5465, + "step": 79250 + }, + { + "epoch": 19.34, + "learning_rate": 0.0003954267547727056, + "loss": 0.5702, + "step": 79275 + }, + { + "epoch": 19.35, + "learning_rate": 0.00039539355565234945, + "loss": 0.5334, + "step": 79300 + }, + { + "epoch": 19.36, + "learning_rate": 0.0003953603565319933, + "loss": 0.5379, + "step": 79325 + }, + { + "epoch": 19.36, + "learning_rate": 0.0003953271574116372, + "loss": 0.5165, + "step": 79350 + }, + { + "epoch": 19.37, + "learning_rate": 0.00039529395829128114, + "loss": 0.5178, + "step": 79375 + }, + { + "epoch": 19.38, + "learning_rate": 0.000395260759170925, + "loss": 0.5007, + "step": 79400 + }, + { + "epoch": 19.38, + "learning_rate": 0.0003952275600505689, + "loss": 0.5203, + "step": 79425 + }, + { + "epoch": 19.39, + "learning_rate": 0.0003951943609302128, + "loss": 0.4874, + "step": 79450 + }, + { + "epoch": 19.39, + "learning_rate": 0.0003951611618098567, + "loss": 0.5472, + "step": 79475 + }, + { + "epoch": 19.4, + "learning_rate": 0.0003951279626895006, + "loss": 0.5123, + "step": 79500 + }, + { + "epoch": 19.41, + "learning_rate": 0.00039509476356914446, + "loss": 0.5628, + "step": 79525 + }, + { + "epoch": 19.41, + "learning_rate": 0.00039506156444878837, + "loss": 0.5127, + "step": 79550 + }, + { + "epoch": 19.42, + "learning_rate": 0.0003950283653284323, + "loss": 0.5461, + "step": 79575 + }, + { + "epoch": 19.42, + "learning_rate": 0.0003949951662080762, + "loss": 0.5187, + "step": 79600 + }, + { + "epoch": 19.43, + "learning_rate": 0.00039496196708772, + "loss": 0.559, + "step": 79625 + }, + { + "epoch": 19.44, + "learning_rate": 0.0003949287679673639, + "loss": 0.498, + "step": 79650 + }, + { + "epoch": 19.44, + "learning_rate": 0.00039489556884700783, + "loss": 0.4965, + "step": 79675 + }, + { + "epoch": 19.45, + "learning_rate": 0.00039486236972665175, + "loss": 0.4793, + "step": 79700 + }, + { + "epoch": 19.45, + "learning_rate": 0.00039482917060629566, + "loss": 0.4825, + "step": 79725 + }, + { + "epoch": 19.46, + "learning_rate": 0.0003947959714859395, + "loss": 0.4814, + "step": 79750 + }, + { + "epoch": 19.47, + "learning_rate": 0.0003947627723655834, + "loss": 0.4946, + "step": 79775 + }, + { + "epoch": 19.47, + "learning_rate": 0.0003947295732452273, + "loss": 0.4516, + "step": 79800 + }, + { + "epoch": 19.48, + "learning_rate": 0.0003946963741248712, + "loss": 0.5269, + "step": 79825 + }, + { + "epoch": 19.49, + "learning_rate": 0.00039466317500451507, + "loss": 0.5135, + "step": 79850 + }, + { + "epoch": 19.49, + "learning_rate": 0.000394629975884159, + "loss": 0.5563, + "step": 79875 + }, + { + "epoch": 19.5, + "learning_rate": 0.0003945967767638029, + "loss": 0.5172, + "step": 79900 + }, + { + "epoch": 19.5, + "learning_rate": 0.00039456357764344676, + "loss": 0.528, + "step": 79925 + }, + { + "epoch": 19.51, + "learning_rate": 0.00039453037852309067, + "loss": 0.5158, + "step": 79950 + }, + { + "epoch": 19.52, + "learning_rate": 0.00039449717940273453, + "loss": 0.5197, + "step": 79975 + }, + { + "epoch": 19.52, + "learning_rate": 0.00039446398028237844, + "loss": 0.522, + "step": 80000 + }, + { + "epoch": 19.53, + "learning_rate": 0.00039443078116202236, + "loss": 0.533, + "step": 80025 + }, + { + "epoch": 19.53, + "learning_rate": 0.00039439758204166627, + "loss": 0.5262, + "step": 80050 + }, + { + "epoch": 19.54, + "learning_rate": 0.0003943643829213101, + "loss": 0.5267, + "step": 80075 + }, + { + "epoch": 19.55, + "learning_rate": 0.000394331183800954, + "loss": 0.4881, + "step": 80100 + }, + { + "epoch": 19.55, + "learning_rate": 0.0003942979846805979, + "loss": 0.5977, + "step": 80125 + }, + { + "epoch": 19.56, + "learning_rate": 0.0003942647855602418, + "loss": 0.4507, + "step": 80150 + }, + { + "epoch": 19.56, + "learning_rate": 0.00039423291440469996, + "loss": 0.5734, + "step": 80175 + }, + { + "epoch": 19.57, + "learning_rate": 0.0003941997152843438, + "loss": 0.5274, + "step": 80200 + }, + { + "epoch": 19.58, + "learning_rate": 0.00039416651616398774, + "loss": 0.5174, + "step": 80225 + }, + { + "epoch": 19.58, + "learning_rate": 0.00039413331704363165, + "loss": 0.552, + "step": 80250 + }, + { + "epoch": 19.59, + "learning_rate": 0.0003941001179232755, + "loss": 0.5026, + "step": 80275 + }, + { + "epoch": 19.59, + "learning_rate": 0.00039406691880291937, + "loss": 0.5017, + "step": 80300 + }, + { + "epoch": 19.6, + "learning_rate": 0.0003940337196825633, + "loss": 0.5122, + "step": 80325 + }, + { + "epoch": 19.61, + "learning_rate": 0.0003940005205622072, + "loss": 0.5116, + "step": 80350 + }, + { + "epoch": 19.61, + "learning_rate": 0.0003939673214418511, + "loss": 0.5608, + "step": 80375 + }, + { + "epoch": 19.62, + "learning_rate": 0.00039393412232149503, + "loss": 0.4792, + "step": 80400 + }, + { + "epoch": 19.63, + "learning_rate": 0.00039390092320113883, + "loss": 0.5337, + "step": 80425 + }, + { + "epoch": 19.63, + "learning_rate": 0.00039386772408078275, + "loss": 0.4826, + "step": 80450 + }, + { + "epoch": 19.64, + "learning_rate": 0.00039383452496042666, + "loss": 0.5173, + "step": 80475 + }, + { + "epoch": 19.64, + "learning_rate": 0.0003938013258400706, + "loss": 0.4629, + "step": 80500 + }, + { + "epoch": 19.65, + "learning_rate": 0.00039376812671971444, + "loss": 0.5717, + "step": 80525 + }, + { + "epoch": 19.66, + "learning_rate": 0.00039373492759935835, + "loss": 0.499, + "step": 80550 + }, + { + "epoch": 19.66, + "learning_rate": 0.0003937017284790022, + "loss": 0.5233, + "step": 80575 + }, + { + "epoch": 19.67, + "learning_rate": 0.0003936685293586461, + "loss": 0.5131, + "step": 80600 + }, + { + "epoch": 19.67, + "learning_rate": 0.00039363533023829004, + "loss": 0.5343, + "step": 80625 + }, + { + "epoch": 19.68, + "learning_rate": 0.0003936021311179339, + "loss": 0.4978, + "step": 80650 + }, + { + "epoch": 19.69, + "learning_rate": 0.0003935689319975778, + "loss": 0.559, + "step": 80675 + }, + { + "epoch": 19.69, + "learning_rate": 0.0003935357328772217, + "loss": 0.5288, + "step": 80700 + }, + { + "epoch": 19.7, + "learning_rate": 0.0003935025337568656, + "loss": 0.5782, + "step": 80725 + }, + { + "epoch": 19.7, + "learning_rate": 0.00039346933463650944, + "loss": 0.5151, + "step": 80750 + }, + { + "epoch": 19.71, + "learning_rate": 0.00039343613551615336, + "loss": 0.5044, + "step": 80775 + }, + { + "epoch": 19.72, + "learning_rate": 0.00039340293639579727, + "loss": 0.5323, + "step": 80800 + }, + { + "epoch": 19.72, + "learning_rate": 0.0003933697372754412, + "loss": 0.5365, + "step": 80825 + }, + { + "epoch": 19.73, + "learning_rate": 0.0003933365381550851, + "loss": 0.5024, + "step": 80850 + }, + { + "epoch": 19.74, + "learning_rate": 0.0003933033390347289, + "loss": 0.5234, + "step": 80875 + }, + { + "epoch": 19.74, + "learning_rate": 0.0003932701399143728, + "loss": 0.5135, + "step": 80900 + }, + { + "epoch": 19.75, + "learning_rate": 0.00039323694079401673, + "loss": 0.5403, + "step": 80925 + }, + { + "epoch": 19.75, + "learning_rate": 0.00039320374167366065, + "loss": 0.5468, + "step": 80950 + }, + { + "epoch": 19.76, + "learning_rate": 0.0003931705425533045, + "loss": 0.4975, + "step": 80975 + }, + { + "epoch": 19.77, + "learning_rate": 0.0003931373434329484, + "loss": 0.5461, + "step": 81000 + }, + { + "epoch": 19.77, + "eval_cer": 0.11960617229448785, + "eval_loss": 0.4400729238986969, + "eval_runtime": 146.8938, + "eval_samples_per_second": 28.544, + "eval_steps_per_second": 7.141, + "eval_wer": 0.4812724306688418, + "step": 81000 + }, + { + "epoch": 19.77, + "learning_rate": 0.0003931041443125923, + "loss": 0.5305, + "step": 81025 + }, + { + "epoch": 19.78, + "learning_rate": 0.0003930709451922362, + "loss": 0.4784, + "step": 81050 + }, + { + "epoch": 19.78, + "learning_rate": 0.0003930377460718801, + "loss": 0.545, + "step": 81075 + }, + { + "epoch": 19.79, + "learning_rate": 0.00039300454695152397, + "loss": 0.4795, + "step": 81100 + }, + { + "epoch": 19.8, + "learning_rate": 0.0003929713478311679, + "loss": 0.5511, + "step": 81125 + }, + { + "epoch": 19.8, + "learning_rate": 0.0003929381487108118, + "loss": 0.5314, + "step": 81150 + }, + { + "epoch": 19.81, + "learning_rate": 0.00039290494959045566, + "loss": 0.5912, + "step": 81175 + }, + { + "epoch": 19.81, + "learning_rate": 0.0003928717504700995, + "loss": 0.5392, + "step": 81200 + }, + { + "epoch": 19.82, + "learning_rate": 0.00039283855134974343, + "loss": 0.504, + "step": 81225 + }, + { + "epoch": 19.83, + "learning_rate": 0.00039280535222938734, + "loss": 0.4723, + "step": 81250 + }, + { + "epoch": 19.83, + "learning_rate": 0.00039277215310903126, + "loss": 0.5295, + "step": 81275 + }, + { + "epoch": 19.84, + "learning_rate": 0.00039273895398867517, + "loss": 0.521, + "step": 81300 + }, + { + "epoch": 19.85, + "learning_rate": 0.000392705754868319, + "loss": 0.5833, + "step": 81325 + }, + { + "epoch": 19.85, + "learning_rate": 0.0003926725557479629, + "loss": 0.5042, + "step": 81350 + }, + { + "epoch": 19.86, + "learning_rate": 0.0003926393566276068, + "loss": 0.5365, + "step": 81375 + }, + { + "epoch": 19.86, + "learning_rate": 0.0003926061575072507, + "loss": 0.4939, + "step": 81400 + }, + { + "epoch": 19.87, + "learning_rate": 0.00039257295838689463, + "loss": 0.5449, + "step": 81425 + }, + { + "epoch": 19.88, + "learning_rate": 0.00039253975926653844, + "loss": 0.5452, + "step": 81450 + }, + { + "epoch": 19.88, + "learning_rate": 0.00039250656014618235, + "loss": 0.5635, + "step": 81475 + }, + { + "epoch": 19.89, + "learning_rate": 0.00039247336102582627, + "loss": 0.5344, + "step": 81500 + }, + { + "epoch": 19.89, + "learning_rate": 0.0003924401619054702, + "loss": 0.5103, + "step": 81525 + }, + { + "epoch": 19.9, + "learning_rate": 0.00039240696278511404, + "loss": 0.5035, + "step": 81550 + }, + { + "epoch": 19.91, + "learning_rate": 0.00039237376366475795, + "loss": 0.5693, + "step": 81575 + }, + { + "epoch": 19.91, + "learning_rate": 0.0003923405645444018, + "loss": 0.5482, + "step": 81600 + }, + { + "epoch": 19.92, + "learning_rate": 0.00039230736542404573, + "loss": 0.527, + "step": 81625 + }, + { + "epoch": 19.92, + "learning_rate": 0.00039227416630368964, + "loss": 0.5014, + "step": 81650 + }, + { + "epoch": 19.93, + "learning_rate": 0.0003922409671833335, + "loss": 0.5306, + "step": 81675 + }, + { + "epoch": 19.94, + "learning_rate": 0.0003922077680629774, + "loss": 0.5236, + "step": 81700 + }, + { + "epoch": 19.94, + "learning_rate": 0.00039217456894262133, + "loss": 0.5108, + "step": 81725 + }, + { + "epoch": 19.95, + "learning_rate": 0.0003921413698222652, + "loss": 0.4858, + "step": 81750 + }, + { + "epoch": 19.95, + "learning_rate": 0.00039210817070190905, + "loss": 0.4938, + "step": 81775 + }, + { + "epoch": 19.96, + "learning_rate": 0.00039207497158155296, + "loss": 0.5359, + "step": 81800 + }, + { + "epoch": 19.97, + "learning_rate": 0.0003920417724611969, + "loss": 0.533, + "step": 81825 + }, + { + "epoch": 19.97, + "learning_rate": 0.0003920085733408408, + "loss": 0.5, + "step": 81850 + }, + { + "epoch": 19.98, + "learning_rate": 0.0003919753742204847, + "loss": 0.5306, + "step": 81875 + }, + { + "epoch": 19.99, + "learning_rate": 0.0003919421751001285, + "loss": 0.5, + "step": 81900 + }, + { + "epoch": 19.99, + "learning_rate": 0.0003919089759797724, + "loss": 0.5182, + "step": 81925 + }, + { + "epoch": 20.0, + "learning_rate": 0.00039187577685941634, + "loss": 0.5104, + "step": 81950 + }, + { + "epoch": 20.0, + "learning_rate": 0.00039184257773906025, + "loss": 0.4774, + "step": 81975 + }, + { + "epoch": 20.01, + "learning_rate": 0.0003918093786187041, + "loss": 0.5177, + "step": 82000 + }, + { + "epoch": 20.02, + "learning_rate": 0.000391776179498348, + "loss": 0.5224, + "step": 82025 + }, + { + "epoch": 20.02, + "learning_rate": 0.0003917429803779919, + "loss": 0.4828, + "step": 82050 + }, + { + "epoch": 20.03, + "learning_rate": 0.0003917097812576358, + "loss": 0.5423, + "step": 82075 + }, + { + "epoch": 20.03, + "learning_rate": 0.0003916765821372797, + "loss": 0.443, + "step": 82100 + }, + { + "epoch": 20.04, + "learning_rate": 0.0003916433830169236, + "loss": 0.5223, + "step": 82125 + }, + { + "epoch": 20.05, + "learning_rate": 0.0003916101838965675, + "loss": 0.4703, + "step": 82150 + }, + { + "epoch": 20.05, + "learning_rate": 0.0003915769847762114, + "loss": 0.5051, + "step": 82175 + }, + { + "epoch": 20.06, + "learning_rate": 0.00039154378565585526, + "loss": 0.486, + "step": 82200 + }, + { + "epoch": 20.06, + "learning_rate": 0.0003915105865354991, + "loss": 0.4924, + "step": 82225 + }, + { + "epoch": 20.07, + "learning_rate": 0.00039147738741514304, + "loss": 0.4963, + "step": 82250 + }, + { + "epoch": 20.08, + "learning_rate": 0.00039144418829478695, + "loss": 0.4922, + "step": 82275 + }, + { + "epoch": 20.08, + "learning_rate": 0.00039141098917443086, + "loss": 0.4911, + "step": 82300 + }, + { + "epoch": 20.09, + "learning_rate": 0.0003913777900540748, + "loss": 0.5315, + "step": 82325 + }, + { + "epoch": 20.1, + "learning_rate": 0.0003913445909337186, + "loss": 0.4826, + "step": 82350 + }, + { + "epoch": 20.1, + "learning_rate": 0.0003913113918133625, + "loss": 0.5536, + "step": 82375 + }, + { + "epoch": 20.11, + "learning_rate": 0.0003912781926930064, + "loss": 0.4998, + "step": 82400 + }, + { + "epoch": 20.11, + "learning_rate": 0.0003912449935726503, + "loss": 0.5207, + "step": 82425 + }, + { + "epoch": 20.12, + "learning_rate": 0.0003912117944522942, + "loss": 0.5061, + "step": 82450 + }, + { + "epoch": 20.13, + "learning_rate": 0.0003911785953319381, + "loss": 0.4999, + "step": 82475 + }, + { + "epoch": 20.13, + "learning_rate": 0.00039114539621158196, + "loss": 0.4868, + "step": 82500 + }, + { + "epoch": 20.14, + "learning_rate": 0.00039111219709122587, + "loss": 0.5307, + "step": 82525 + }, + { + "epoch": 20.14, + "learning_rate": 0.0003910789979708698, + "loss": 0.455, + "step": 82550 + }, + { + "epoch": 20.15, + "learning_rate": 0.00039104579885051365, + "loss": 0.4881, + "step": 82575 + }, + { + "epoch": 20.16, + "learning_rate": 0.00039101259973015756, + "loss": 0.5058, + "step": 82600 + }, + { + "epoch": 20.16, + "learning_rate": 0.0003909794006098015, + "loss": 0.5035, + "step": 82625 + }, + { + "epoch": 20.17, + "learning_rate": 0.00039094620148944533, + "loss": 0.5044, + "step": 82650 + }, + { + "epoch": 20.17, + "learning_rate": 0.00039091300236908925, + "loss": 0.5321, + "step": 82675 + }, + { + "epoch": 20.18, + "learning_rate": 0.00039088113121354734, + "loss": 0.4867, + "step": 82700 + }, + { + "epoch": 20.19, + "learning_rate": 0.00039084793209319125, + "loss": 0.487, + "step": 82725 + }, + { + "epoch": 20.19, + "learning_rate": 0.00039081473297283517, + "loss": 0.5071, + "step": 82750 + }, + { + "epoch": 20.2, + "learning_rate": 0.0003907815338524791, + "loss": 0.4933, + "step": 82775 + }, + { + "epoch": 20.2, + "learning_rate": 0.00039074833473212294, + "loss": 0.5347, + "step": 82800 + }, + { + "epoch": 20.21, + "learning_rate": 0.00039071513561176685, + "loss": 0.486, + "step": 82825 + }, + { + "epoch": 20.22, + "learning_rate": 0.0003906819364914107, + "loss": 0.4886, + "step": 82850 + }, + { + "epoch": 20.22, + "learning_rate": 0.00039064873737105463, + "loss": 0.5365, + "step": 82875 + }, + { + "epoch": 20.23, + "learning_rate": 0.0003906155382506985, + "loss": 0.4923, + "step": 82900 + }, + { + "epoch": 20.24, + "learning_rate": 0.0003905823391303424, + "loss": 0.555, + "step": 82925 + }, + { + "epoch": 20.24, + "learning_rate": 0.0003905491400099863, + "loss": 0.5232, + "step": 82950 + }, + { + "epoch": 20.25, + "learning_rate": 0.00039051594088963023, + "loss": 0.5658, + "step": 82975 + }, + { + "epoch": 20.25, + "learning_rate": 0.0003904827417692741, + "loss": 0.5183, + "step": 83000 + }, + { + "epoch": 20.26, + "learning_rate": 0.00039044954264891795, + "loss": 0.5532, + "step": 83025 + }, + { + "epoch": 20.27, + "learning_rate": 0.00039041634352856186, + "loss": 0.4787, + "step": 83050 + }, + { + "epoch": 20.27, + "learning_rate": 0.0003903831444082058, + "loss": 0.5197, + "step": 83075 + }, + { + "epoch": 20.28, + "learning_rate": 0.0003903499452878497, + "loss": 0.4716, + "step": 83100 + }, + { + "epoch": 20.28, + "learning_rate": 0.00039031674616749355, + "loss": 0.5227, + "step": 83125 + }, + { + "epoch": 20.29, + "learning_rate": 0.0003902835470471374, + "loss": 0.4727, + "step": 83150 + }, + { + "epoch": 20.3, + "learning_rate": 0.0003902503479267813, + "loss": 0.5607, + "step": 83175 + }, + { + "epoch": 20.3, + "learning_rate": 0.00039021714880642524, + "loss": 0.5176, + "step": 83200 + }, + { + "epoch": 20.31, + "learning_rate": 0.00039018394968606915, + "loss": 0.5077, + "step": 83225 + }, + { + "epoch": 20.31, + "learning_rate": 0.000390150750565713, + "loss": 0.5003, + "step": 83250 + }, + { + "epoch": 20.32, + "learning_rate": 0.0003901175514453569, + "loss": 0.5059, + "step": 83275 + }, + { + "epoch": 20.33, + "learning_rate": 0.0003900843523250008, + "loss": 0.4917, + "step": 83300 + }, + { + "epoch": 20.33, + "learning_rate": 0.0003900511532046447, + "loss": 0.5032, + "step": 83325 + }, + { + "epoch": 20.34, + "learning_rate": 0.00039001795408428856, + "loss": 0.5251, + "step": 83350 + }, + { + "epoch": 20.35, + "learning_rate": 0.0003899847549639325, + "loss": 0.5191, + "step": 83375 + }, + { + "epoch": 20.35, + "learning_rate": 0.0003899515558435764, + "loss": 0.489, + "step": 83400 + }, + { + "epoch": 20.36, + "learning_rate": 0.0003899183567232203, + "loss": 0.5331, + "step": 83425 + }, + { + "epoch": 20.36, + "learning_rate": 0.00038988515760286416, + "loss": 0.4853, + "step": 83450 + }, + { + "epoch": 20.37, + "learning_rate": 0.000389851958482508, + "loss": 0.5296, + "step": 83475 + }, + { + "epoch": 20.38, + "learning_rate": 0.00038981875936215194, + "loss": 0.5222, + "step": 83500 + }, + { + "epoch": 20.38, + "learning_rate": 0.00038978556024179585, + "loss": 0.5363, + "step": 83525 + }, + { + "epoch": 20.39, + "learning_rate": 0.00038975236112143976, + "loss": 0.4851, + "step": 83550 + }, + { + "epoch": 20.39, + "learning_rate": 0.0003897191620010836, + "loss": 0.5469, + "step": 83575 + }, + { + "epoch": 20.4, + "learning_rate": 0.0003896859628807275, + "loss": 0.4488, + "step": 83600 + }, + { + "epoch": 20.41, + "learning_rate": 0.0003896527637603714, + "loss": 0.5445, + "step": 83625 + }, + { + "epoch": 20.41, + "learning_rate": 0.0003896195646400153, + "loss": 0.4996, + "step": 83650 + }, + { + "epoch": 20.42, + "learning_rate": 0.0003895863655196592, + "loss": 0.5022, + "step": 83675 + }, + { + "epoch": 20.42, + "learning_rate": 0.0003895531663993031, + "loss": 0.4456, + "step": 83700 + }, + { + "epoch": 20.43, + "learning_rate": 0.000389519967278947, + "loss": 0.531, + "step": 83725 + }, + { + "epoch": 20.44, + "learning_rate": 0.00038948676815859086, + "loss": 0.4859, + "step": 83750 + }, + { + "epoch": 20.44, + "learning_rate": 0.00038945356903823477, + "loss": 0.5109, + "step": 83775 + }, + { + "epoch": 20.45, + "learning_rate": 0.00038942036991787863, + "loss": 0.518, + "step": 83800 + }, + { + "epoch": 20.46, + "learning_rate": 0.00038938717079752255, + "loss": 0.5039, + "step": 83825 + }, + { + "epoch": 20.46, + "learning_rate": 0.00038935397167716646, + "loss": 0.4744, + "step": 83850 + }, + { + "epoch": 20.47, + "learning_rate": 0.0003893207725568104, + "loss": 0.5653, + "step": 83875 + }, + { + "epoch": 20.47, + "learning_rate": 0.00038928757343645423, + "loss": 0.5311, + "step": 83900 + }, + { + "epoch": 20.48, + "learning_rate": 0.0003892543743160981, + "loss": 0.5306, + "step": 83925 + }, + { + "epoch": 20.49, + "learning_rate": 0.000389221175195742, + "loss": 0.4814, + "step": 83950 + }, + { + "epoch": 20.49, + "learning_rate": 0.0003891879760753859, + "loss": 0.5273, + "step": 83975 + }, + { + "epoch": 20.5, + "learning_rate": 0.00038915477695502984, + "loss": 0.5044, + "step": 84000 + }, + { + "epoch": 20.5, + "eval_cer": 0.11443179368191944, + "eval_loss": 0.42682546377182007, + "eval_runtime": 146.7255, + "eval_samples_per_second": 28.577, + "eval_steps_per_second": 7.149, + "eval_wer": 0.46541598694942904, + "step": 84000 + }, + { + "epoch": 20.5, + "learning_rate": 0.00038912157783467375, + "loss": 0.522, + "step": 84025 + }, + { + "epoch": 20.51, + "learning_rate": 0.00038908837871431755, + "loss": 0.4838, + "step": 84050 + }, + { + "epoch": 20.52, + "learning_rate": 0.00038905517959396147, + "loss": 0.4854, + "step": 84075 + }, + { + "epoch": 20.52, + "learning_rate": 0.0003890219804736054, + "loss": 0.463, + "step": 84100 + }, + { + "epoch": 20.53, + "learning_rate": 0.0003889887813532493, + "loss": 0.5307, + "step": 84125 + }, + { + "epoch": 20.53, + "learning_rate": 0.00038895558223289316, + "loss": 0.4744, + "step": 84150 + }, + { + "epoch": 20.54, + "learning_rate": 0.00038892238311253707, + "loss": 0.595, + "step": 84175 + }, + { + "epoch": 20.55, + "learning_rate": 0.00038888918399218093, + "loss": 0.4853, + "step": 84200 + }, + { + "epoch": 20.55, + "learning_rate": 0.00038885598487182484, + "loss": 0.5554, + "step": 84225 + }, + { + "epoch": 20.56, + "learning_rate": 0.00038882278575146876, + "loss": 0.4629, + "step": 84250 + }, + { + "epoch": 20.56, + "learning_rate": 0.0003887895866311126, + "loss": 0.5226, + "step": 84275 + }, + { + "epoch": 20.57, + "learning_rate": 0.00038875638751075653, + "loss": 0.482, + "step": 84300 + }, + { + "epoch": 20.58, + "learning_rate": 0.00038872318839040045, + "loss": 0.4873, + "step": 84325 + }, + { + "epoch": 20.58, + "learning_rate": 0.0003886899892700443, + "loss": 0.539, + "step": 84350 + }, + { + "epoch": 20.59, + "learning_rate": 0.00038865679014968817, + "loss": 0.5458, + "step": 84375 + }, + { + "epoch": 20.6, + "learning_rate": 0.0003886235910293321, + "loss": 0.4841, + "step": 84400 + }, + { + "epoch": 20.6, + "learning_rate": 0.000388590391908976, + "loss": 0.5369, + "step": 84425 + }, + { + "epoch": 20.61, + "learning_rate": 0.0003885571927886199, + "loss": 0.4676, + "step": 84450 + }, + { + "epoch": 20.61, + "learning_rate": 0.0003885239936682638, + "loss": 0.5472, + "step": 84475 + }, + { + "epoch": 20.62, + "learning_rate": 0.0003884907945479076, + "loss": 0.4976, + "step": 84500 + }, + { + "epoch": 20.63, + "learning_rate": 0.00038845759542755154, + "loss": 0.5668, + "step": 84525 + }, + { + "epoch": 20.63, + "learning_rate": 0.00038842439630719545, + "loss": 0.5263, + "step": 84550 + }, + { + "epoch": 20.64, + "learning_rate": 0.00038839119718683937, + "loss": 0.5336, + "step": 84575 + }, + { + "epoch": 20.64, + "learning_rate": 0.00038835799806648323, + "loss": 0.5053, + "step": 84600 + }, + { + "epoch": 20.65, + "learning_rate": 0.00038832479894612714, + "loss": 0.5443, + "step": 84625 + }, + { + "epoch": 20.66, + "learning_rate": 0.000388291599825771, + "loss": 0.4887, + "step": 84650 + }, + { + "epoch": 20.66, + "learning_rate": 0.0003882584007054149, + "loss": 0.4999, + "step": 84675 + }, + { + "epoch": 20.67, + "learning_rate": 0.00038822520158505883, + "loss": 0.5104, + "step": 84700 + }, + { + "epoch": 20.67, + "learning_rate": 0.0003881920024647027, + "loss": 0.507, + "step": 84725 + }, + { + "epoch": 20.68, + "learning_rate": 0.00038816013130916083, + "loss": 0.5064, + "step": 84750 + }, + { + "epoch": 20.69, + "learning_rate": 0.00038812693218880475, + "loss": 0.5079, + "step": 84775 + }, + { + "epoch": 20.69, + "learning_rate": 0.00038809373306844866, + "loss": 0.5362, + "step": 84800 + }, + { + "epoch": 20.7, + "learning_rate": 0.0003880605339480925, + "loss": 0.5332, + "step": 84825 + }, + { + "epoch": 20.71, + "learning_rate": 0.0003880273348277364, + "loss": 0.5191, + "step": 84850 + }, + { + "epoch": 20.71, + "learning_rate": 0.0003879941357073803, + "loss": 0.5049, + "step": 84875 + }, + { + "epoch": 20.72, + "learning_rate": 0.0003879609365870242, + "loss": 0.4828, + "step": 84900 + }, + { + "epoch": 20.72, + "learning_rate": 0.00038792773746666807, + "loss": 0.5217, + "step": 84925 + }, + { + "epoch": 20.73, + "learning_rate": 0.000387894538346312, + "loss": 0.4909, + "step": 84950 + }, + { + "epoch": 20.74, + "learning_rate": 0.0003878613392259559, + "loss": 0.5039, + "step": 84975 + }, + { + "epoch": 20.74, + "learning_rate": 0.00038782946807041404, + "loss": 0.5085, + "step": 85000 + }, + { + "epoch": 20.75, + "learning_rate": 0.00038779626895005796, + "loss": 0.523, + "step": 85025 + }, + { + "epoch": 20.75, + "learning_rate": 0.00038776306982970176, + "loss": 0.4847, + "step": 85050 + }, + { + "epoch": 20.76, + "learning_rate": 0.0003877298707093457, + "loss": 0.4847, + "step": 85075 + }, + { + "epoch": 20.77, + "learning_rate": 0.0003876966715889896, + "loss": 0.5074, + "step": 85100 + }, + { + "epoch": 20.77, + "learning_rate": 0.0003876634724686335, + "loss": 0.5074, + "step": 85125 + }, + { + "epoch": 20.78, + "learning_rate": 0.00038763027334827736, + "loss": 0.4648, + "step": 85150 + }, + { + "epoch": 20.78, + "learning_rate": 0.0003875970742279213, + "loss": 0.5161, + "step": 85175 + }, + { + "epoch": 20.79, + "learning_rate": 0.00038756387510756514, + "loss": 0.5005, + "step": 85200 + }, + { + "epoch": 20.8, + "learning_rate": 0.00038753067598720905, + "loss": 0.5217, + "step": 85225 + }, + { + "epoch": 20.8, + "learning_rate": 0.00038749747686685296, + "loss": 0.5532, + "step": 85250 + }, + { + "epoch": 20.81, + "learning_rate": 0.0003874642777464968, + "loss": 0.4865, + "step": 85275 + }, + { + "epoch": 20.82, + "learning_rate": 0.00038743107862614074, + "loss": 0.4943, + "step": 85300 + }, + { + "epoch": 20.82, + "learning_rate": 0.00038739787950578465, + "loss": 0.4968, + "step": 85325 + }, + { + "epoch": 20.83, + "learning_rate": 0.0003873646803854285, + "loss": 0.5108, + "step": 85350 + }, + { + "epoch": 20.83, + "learning_rate": 0.00038733148126507237, + "loss": 0.5166, + "step": 85375 + }, + { + "epoch": 20.84, + "learning_rate": 0.0003872982821447163, + "loss": 0.5059, + "step": 85400 + }, + { + "epoch": 20.85, + "learning_rate": 0.0003872650830243602, + "loss": 0.5448, + "step": 85425 + }, + { + "epoch": 20.85, + "learning_rate": 0.0003872318839040041, + "loss": 0.459, + "step": 85450 + }, + { + "epoch": 20.86, + "learning_rate": 0.00038719868478364803, + "loss": 0.5601, + "step": 85475 + }, + { + "epoch": 20.86, + "learning_rate": 0.00038716548566329183, + "loss": 0.5406, + "step": 85500 + }, + { + "epoch": 20.87, + "learning_rate": 0.00038713228654293575, + "loss": 0.5668, + "step": 85525 + }, + { + "epoch": 20.88, + "learning_rate": 0.00038709908742257966, + "loss": 0.5244, + "step": 85550 + }, + { + "epoch": 20.88, + "learning_rate": 0.0003870658883022236, + "loss": 0.5241, + "step": 85575 + }, + { + "epoch": 20.89, + "learning_rate": 0.00038703268918186744, + "loss": 0.51, + "step": 85600 + }, + { + "epoch": 20.89, + "learning_rate": 0.00038699949006151135, + "loss": 0.5241, + "step": 85625 + }, + { + "epoch": 20.9, + "learning_rate": 0.0003869662909411552, + "loss": 0.4852, + "step": 85650 + }, + { + "epoch": 20.91, + "learning_rate": 0.0003869330918207991, + "loss": 0.4979, + "step": 85675 + }, + { + "epoch": 20.91, + "learning_rate": 0.00038689989270044304, + "loss": 0.5292, + "step": 85700 + }, + { + "epoch": 20.92, + "learning_rate": 0.0003868666935800869, + "loss": 0.5465, + "step": 85725 + }, + { + "epoch": 20.92, + "learning_rate": 0.0003868334944597308, + "loss": 0.4996, + "step": 85750 + }, + { + "epoch": 20.93, + "learning_rate": 0.0003868002953393747, + "loss": 0.5401, + "step": 85775 + }, + { + "epoch": 20.94, + "learning_rate": 0.0003867670962190186, + "loss": 0.51, + "step": 85800 + }, + { + "epoch": 20.94, + "learning_rate": 0.00038673389709866244, + "loss": 0.5461, + "step": 85825 + }, + { + "epoch": 20.95, + "learning_rate": 0.00038670069797830636, + "loss": 0.5363, + "step": 85850 + }, + { + "epoch": 20.96, + "learning_rate": 0.00038666749885795027, + "loss": 0.5452, + "step": 85875 + }, + { + "epoch": 20.96, + "learning_rate": 0.0003866342997375942, + "loss": 0.4922, + "step": 85900 + }, + { + "epoch": 20.97, + "learning_rate": 0.0003866011006172381, + "loss": 0.5316, + "step": 85925 + }, + { + "epoch": 20.97, + "learning_rate": 0.0003865679014968819, + "loss": 0.4887, + "step": 85950 + }, + { + "epoch": 20.98, + "learning_rate": 0.0003865347023765258, + "loss": 0.5274, + "step": 85975 + }, + { + "epoch": 20.99, + "learning_rate": 0.00038650150325616973, + "loss": 0.4773, + "step": 86000 + }, + { + "epoch": 20.99, + "learning_rate": 0.00038646830413581365, + "loss": 0.5313, + "step": 86025 + }, + { + "epoch": 21.0, + "learning_rate": 0.0003864351050154575, + "loss": 0.4961, + "step": 86050 + }, + { + "epoch": 21.0, + "learning_rate": 0.0003864019058951014, + "loss": 0.529, + "step": 86075 + }, + { + "epoch": 21.01, + "learning_rate": 0.0003863687067747453, + "loss": 0.4501, + "step": 86100 + }, + { + "epoch": 21.02, + "learning_rate": 0.0003863355076543892, + "loss": 0.5192, + "step": 86125 + }, + { + "epoch": 21.02, + "learning_rate": 0.0003863023085340331, + "loss": 0.5108, + "step": 86150 + }, + { + "epoch": 21.03, + "learning_rate": 0.00038626910941367697, + "loss": 0.4851, + "step": 86175 + }, + { + "epoch": 21.03, + "learning_rate": 0.0003862359102933209, + "loss": 0.5181, + "step": 86200 + }, + { + "epoch": 21.04, + "learning_rate": 0.0003862027111729648, + "loss": 0.4622, + "step": 86225 + }, + { + "epoch": 21.05, + "learning_rate": 0.00038616951205260866, + "loss": 0.481, + "step": 86250 + }, + { + "epoch": 21.05, + "learning_rate": 0.0003861363129322525, + "loss": 0.5097, + "step": 86275 + }, + { + "epoch": 21.06, + "learning_rate": 0.00038610311381189643, + "loss": 0.4656, + "step": 86300 + }, + { + "epoch": 21.07, + "learning_rate": 0.00038606991469154034, + "loss": 0.538, + "step": 86325 + }, + { + "epoch": 21.07, + "learning_rate": 0.00038603671557118426, + "loss": 0.4742, + "step": 86350 + }, + { + "epoch": 21.08, + "learning_rate": 0.00038600351645082817, + "loss": 0.5154, + "step": 86375 + }, + { + "epoch": 21.08, + "learning_rate": 0.000385970317330472, + "loss": 0.4569, + "step": 86400 + }, + { + "epoch": 21.09, + "learning_rate": 0.0003859371182101159, + "loss": 0.5032, + "step": 86425 + }, + { + "epoch": 21.1, + "learning_rate": 0.0003859039190897598, + "loss": 0.4849, + "step": 86450 + }, + { + "epoch": 21.1, + "learning_rate": 0.0003858707199694037, + "loss": 0.5501, + "step": 86475 + }, + { + "epoch": 21.11, + "learning_rate": 0.00038583752084904763, + "loss": 0.4792, + "step": 86500 + }, + { + "epoch": 21.11, + "learning_rate": 0.0003858043217286915, + "loss": 0.5251, + "step": 86525 + }, + { + "epoch": 21.12, + "learning_rate": 0.00038577112260833535, + "loss": 0.475, + "step": 86550 + }, + { + "epoch": 21.13, + "learning_rate": 0.00038573792348797927, + "loss": 0.5294, + "step": 86575 + }, + { + "epoch": 21.13, + "learning_rate": 0.0003857047243676232, + "loss": 0.4167, + "step": 86600 + }, + { + "epoch": 21.14, + "learning_rate": 0.00038567152524726704, + "loss": 0.5099, + "step": 86625 + }, + { + "epoch": 21.14, + "learning_rate": 0.00038563832612691095, + "loss": 0.4696, + "step": 86650 + }, + { + "epoch": 21.15, + "learning_rate": 0.00038560512700655487, + "loss": 0.5457, + "step": 86675 + }, + { + "epoch": 21.16, + "learning_rate": 0.00038557192788619873, + "loss": 0.4737, + "step": 86700 + }, + { + "epoch": 21.16, + "learning_rate": 0.00038553872876584264, + "loss": 0.5073, + "step": 86725 + }, + { + "epoch": 21.17, + "learning_rate": 0.0003855055296454865, + "loss": 0.4881, + "step": 86750 + }, + { + "epoch": 21.17, + "learning_rate": 0.0003854723305251304, + "loss": 0.5053, + "step": 86775 + }, + { + "epoch": 21.18, + "learning_rate": 0.00038543913140477433, + "loss": 0.48, + "step": 86800 + }, + { + "epoch": 21.19, + "learning_rate": 0.00038540593228441824, + "loss": 0.5247, + "step": 86825 + }, + { + "epoch": 21.19, + "learning_rate": 0.00038537273316406205, + "loss": 0.4993, + "step": 86850 + }, + { + "epoch": 21.2, + "learning_rate": 0.00038533953404370596, + "loss": 0.5142, + "step": 86875 + }, + { + "epoch": 21.21, + "learning_rate": 0.0003853063349233499, + "loss": 0.4572, + "step": 86900 + }, + { + "epoch": 21.21, + "learning_rate": 0.0003852731358029938, + "loss": 0.4832, + "step": 86925 + }, + { + "epoch": 21.22, + "learning_rate": 0.0003852399366826377, + "loss": 0.451, + "step": 86950 + }, + { + "epoch": 21.22, + "learning_rate": 0.00038520673756228157, + "loss": 0.5437, + "step": 86975 + }, + { + "epoch": 21.23, + "learning_rate": 0.0003851735384419254, + "loss": 0.4332, + "step": 87000 + }, + { + "epoch": 21.23, + "eval_cer": 0.11381066291592662, + "eval_loss": 0.4382989704608917, + "eval_runtime": 145.5564, + "eval_samples_per_second": 28.807, + "eval_steps_per_second": 7.207, + "eval_wer": 0.4626101141924959, + "step": 87000 + }, + { + "epoch": 21.24, + "learning_rate": 0.00038514033932156934, + "loss": 0.5451, + "step": 87025 + }, + { + "epoch": 21.24, + "learning_rate": 0.00038510714020121325, + "loss": 0.4974, + "step": 87050 + }, + { + "epoch": 21.25, + "learning_rate": 0.0003850739410808571, + "loss": 0.5291, + "step": 87075 + }, + { + "epoch": 21.25, + "learning_rate": 0.000385040741960501, + "loss": 0.4776, + "step": 87100 + }, + { + "epoch": 21.26, + "learning_rate": 0.00038500754284014494, + "loss": 0.5247, + "step": 87125 + }, + { + "epoch": 21.27, + "learning_rate": 0.0003849743437197888, + "loss": 0.4935, + "step": 87150 + }, + { + "epoch": 21.27, + "learning_rate": 0.0003849411445994327, + "loss": 0.4734, + "step": 87175 + }, + { + "epoch": 21.28, + "learning_rate": 0.0003849079454790766, + "loss": 0.4757, + "step": 87200 + }, + { + "epoch": 21.28, + "learning_rate": 0.0003848747463587205, + "loss": 0.5306, + "step": 87225 + }, + { + "epoch": 21.29, + "learning_rate": 0.0003848415472383644, + "loss": 0.4507, + "step": 87250 + }, + { + "epoch": 21.3, + "learning_rate": 0.0003848083481180083, + "loss": 0.5105, + "step": 87275 + }, + { + "epoch": 21.3, + "learning_rate": 0.0003847751489976521, + "loss": 0.4828, + "step": 87300 + }, + { + "epoch": 21.31, + "learning_rate": 0.00038474194987729604, + "loss": 0.5197, + "step": 87325 + }, + { + "epoch": 21.32, + "learning_rate": 0.00038470875075693995, + "loss": 0.4839, + "step": 87350 + }, + { + "epoch": 21.32, + "learning_rate": 0.00038467555163658386, + "loss": 0.5558, + "step": 87375 + }, + { + "epoch": 21.33, + "learning_rate": 0.0003846423525162278, + "loss": 0.4666, + "step": 87400 + }, + { + "epoch": 21.33, + "learning_rate": 0.00038460915339587164, + "loss": 0.4927, + "step": 87425 + }, + { + "epoch": 21.34, + "learning_rate": 0.0003845759542755155, + "loss": 0.4601, + "step": 87450 + }, + { + "epoch": 21.35, + "learning_rate": 0.0003845427551551594, + "loss": 0.5292, + "step": 87475 + }, + { + "epoch": 21.35, + "learning_rate": 0.0003845095560348033, + "loss": 0.4723, + "step": 87500 + }, + { + "epoch": 21.36, + "learning_rate": 0.0003844763569144472, + "loss": 0.4613, + "step": 87525 + }, + { + "epoch": 21.36, + "learning_rate": 0.0003844431577940911, + "loss": 0.484, + "step": 87550 + }, + { + "epoch": 21.37, + "learning_rate": 0.000384409958673735, + "loss": 0.5306, + "step": 87575 + }, + { + "epoch": 21.38, + "learning_rate": 0.00038437675955337887, + "loss": 0.4712, + "step": 87600 + }, + { + "epoch": 21.38, + "learning_rate": 0.0003843435604330228, + "loss": 0.5464, + "step": 87625 + }, + { + "epoch": 21.39, + "learning_rate": 0.00038431036131266665, + "loss": 0.4775, + "step": 87650 + }, + { + "epoch": 21.39, + "learning_rate": 0.00038427716219231056, + "loss": 0.4835, + "step": 87675 + }, + { + "epoch": 21.4, + "learning_rate": 0.0003842439630719545, + "loss": 0.4547, + "step": 87700 + }, + { + "epoch": 21.41, + "learning_rate": 0.00038421076395159833, + "loss": 0.5336, + "step": 87725 + }, + { + "epoch": 21.41, + "learning_rate": 0.0003841775648312422, + "loss": 0.5115, + "step": 87750 + }, + { + "epoch": 21.42, + "learning_rate": 0.0003841443657108861, + "loss": 0.4953, + "step": 87775 + }, + { + "epoch": 21.43, + "learning_rate": 0.00038411116659053, + "loss": 0.4706, + "step": 87800 + }, + { + "epoch": 21.43, + "learning_rate": 0.00038407796747017394, + "loss": 0.4955, + "step": 87825 + }, + { + "epoch": 21.44, + "learning_rate": 0.00038404476834981785, + "loss": 0.494, + "step": 87850 + }, + { + "epoch": 21.44, + "learning_rate": 0.00038401156922946166, + "loss": 0.5419, + "step": 87875 + }, + { + "epoch": 21.45, + "learning_rate": 0.00038397837010910557, + "loss": 0.4793, + "step": 87900 + }, + { + "epoch": 21.46, + "learning_rate": 0.0003839451709887495, + "loss": 0.4904, + "step": 87925 + }, + { + "epoch": 21.46, + "learning_rate": 0.0003839119718683934, + "loss": 0.4811, + "step": 87950 + }, + { + "epoch": 21.47, + "learning_rate": 0.0003838787727480373, + "loss": 0.5167, + "step": 87975 + }, + { + "epoch": 21.47, + "learning_rate": 0.00038384557362768117, + "loss": 0.4956, + "step": 88000 + }, + { + "epoch": 21.48, + "learning_rate": 0.00038381237450732503, + "loss": 0.5186, + "step": 88025 + }, + { + "epoch": 21.49, + "learning_rate": 0.00038377917538696894, + "loss": 0.4889, + "step": 88050 + }, + { + "epoch": 21.49, + "learning_rate": 0.00038374597626661286, + "loss": 0.5104, + "step": 88075 + }, + { + "epoch": 21.5, + "learning_rate": 0.0003837127771462567, + "loss": 0.457, + "step": 88100 + }, + { + "epoch": 21.5, + "learning_rate": 0.00038367957802590063, + "loss": 0.4604, + "step": 88125 + }, + { + "epoch": 21.51, + "learning_rate": 0.00038364637890554455, + "loss": 0.4942, + "step": 88150 + }, + { + "epoch": 21.52, + "learning_rate": 0.0003836131797851884, + "loss": 0.5411, + "step": 88175 + }, + { + "epoch": 21.52, + "learning_rate": 0.0003835799806648323, + "loss": 0.4869, + "step": 88200 + }, + { + "epoch": 21.53, + "learning_rate": 0.0003835467815444762, + "loss": 0.5289, + "step": 88225 + }, + { + "epoch": 21.53, + "learning_rate": 0.0003835135824241201, + "loss": 0.4726, + "step": 88250 + }, + { + "epoch": 21.54, + "learning_rate": 0.000383480383303764, + "loss": 0.4902, + "step": 88275 + }, + { + "epoch": 21.55, + "learning_rate": 0.0003834471841834079, + "loss": 0.4888, + "step": 88300 + }, + { + "epoch": 21.55, + "learning_rate": 0.00038341398506305173, + "loss": 0.5346, + "step": 88325 + }, + { + "epoch": 21.56, + "learning_rate": 0.00038338078594269564, + "loss": 0.4747, + "step": 88350 + }, + { + "epoch": 21.57, + "learning_rate": 0.00038334758682233956, + "loss": 0.5675, + "step": 88375 + }, + { + "epoch": 21.57, + "learning_rate": 0.00038331438770198347, + "loss": 0.5019, + "step": 88400 + }, + { + "epoch": 21.58, + "learning_rate": 0.0003832811885816274, + "loss": 0.5105, + "step": 88425 + }, + { + "epoch": 21.58, + "learning_rate": 0.00038324798946127124, + "loss": 0.4534, + "step": 88450 + }, + { + "epoch": 21.59, + "learning_rate": 0.0003832147903409151, + "loss": 0.472, + "step": 88475 + }, + { + "epoch": 21.6, + "learning_rate": 0.000383181591220559, + "loss": 0.4931, + "step": 88500 + }, + { + "epoch": 21.6, + "learning_rate": 0.00038314839210020293, + "loss": 0.5198, + "step": 88525 + }, + { + "epoch": 21.61, + "learning_rate": 0.0003831151929798468, + "loss": 0.4678, + "step": 88550 + }, + { + "epoch": 21.61, + "learning_rate": 0.0003830819938594907, + "loss": 0.5238, + "step": 88575 + }, + { + "epoch": 21.62, + "learning_rate": 0.0003830487947391346, + "loss": 0.4967, + "step": 88600 + }, + { + "epoch": 21.63, + "learning_rate": 0.0003830155956187785, + "loss": 0.5125, + "step": 88625 + }, + { + "epoch": 21.63, + "learning_rate": 0.0003829823964984224, + "loss": 0.4883, + "step": 88650 + }, + { + "epoch": 21.64, + "learning_rate": 0.00038294919737806625, + "loss": 0.5136, + "step": 88675 + }, + { + "epoch": 21.64, + "learning_rate": 0.00038291599825771017, + "loss": 0.4898, + "step": 88700 + }, + { + "epoch": 21.65, + "learning_rate": 0.0003828827991373541, + "loss": 0.5451, + "step": 88725 + }, + { + "epoch": 21.66, + "learning_rate": 0.000382849600016998, + "loss": 0.464, + "step": 88750 + }, + { + "epoch": 21.66, + "learning_rate": 0.0003828164008966418, + "loss": 0.5639, + "step": 88775 + }, + { + "epoch": 21.67, + "learning_rate": 0.0003827832017762857, + "loss": 0.4639, + "step": 88800 + }, + { + "epoch": 21.68, + "learning_rate": 0.00038275000265592963, + "loss": 0.5164, + "step": 88825 + }, + { + "epoch": 21.68, + "learning_rate": 0.00038271680353557354, + "loss": 0.5242, + "step": 88850 + }, + { + "epoch": 21.69, + "learning_rate": 0.00038268360441521746, + "loss": 0.532, + "step": 88875 + }, + { + "epoch": 21.69, + "learning_rate": 0.0003826504052948613, + "loss": 0.5124, + "step": 88900 + }, + { + "epoch": 21.7, + "learning_rate": 0.0003826172061745052, + "loss": 0.5157, + "step": 88925 + }, + { + "epoch": 21.71, + "learning_rate": 0.0003825840070541491, + "loss": 0.4771, + "step": 88950 + }, + { + "epoch": 21.71, + "learning_rate": 0.000382550807933793, + "loss": 0.5629, + "step": 88975 + }, + { + "epoch": 21.72, + "learning_rate": 0.0003825176088134369, + "loss": 0.473, + "step": 89000 + }, + { + "epoch": 21.72, + "learning_rate": 0.0003824844096930808, + "loss": 0.5363, + "step": 89025 + }, + { + "epoch": 21.73, + "learning_rate": 0.0003824512105727247, + "loss": 0.5015, + "step": 89050 + }, + { + "epoch": 21.74, + "learning_rate": 0.00038241801145236855, + "loss": 0.5072, + "step": 89075 + }, + { + "epoch": 21.74, + "learning_rate": 0.00038238481233201246, + "loss": 0.451, + "step": 89100 + }, + { + "epoch": 21.75, + "learning_rate": 0.0003823516132116563, + "loss": 0.5009, + "step": 89125 + }, + { + "epoch": 21.75, + "learning_rate": 0.00038231841409130024, + "loss": 0.5052, + "step": 89150 + }, + { + "epoch": 21.76, + "learning_rate": 0.00038228521497094415, + "loss": 0.5099, + "step": 89175 + }, + { + "epoch": 21.77, + "learning_rate": 0.00038225201585058807, + "loss": 0.4809, + "step": 89200 + }, + { + "epoch": 21.77, + "learning_rate": 0.0003822188167302319, + "loss": 0.5133, + "step": 89225 + }, + { + "epoch": 21.78, + "learning_rate": 0.0003821856176098758, + "loss": 0.4826, + "step": 89250 + }, + { + "epoch": 21.79, + "learning_rate": 0.0003821524184895197, + "loss": 0.5309, + "step": 89275 + }, + { + "epoch": 21.79, + "learning_rate": 0.0003821192193691636, + "loss": 0.4787, + "step": 89300 + }, + { + "epoch": 21.8, + "learning_rate": 0.00038208602024880753, + "loss": 0.5302, + "step": 89325 + }, + { + "epoch": 21.8, + "learning_rate": 0.0003820528211284514, + "loss": 0.4527, + "step": 89350 + }, + { + "epoch": 21.81, + "learning_rate": 0.00038201962200809525, + "loss": 0.5046, + "step": 89375 + }, + { + "epoch": 21.82, + "learning_rate": 0.00038198642288773916, + "loss": 0.4953, + "step": 89400 + }, + { + "epoch": 21.82, + "learning_rate": 0.0003819532237673831, + "loss": 0.552, + "step": 89425 + }, + { + "epoch": 21.83, + "learning_rate": 0.000381920024647027, + "loss": 0.5051, + "step": 89450 + }, + { + "epoch": 21.83, + "learning_rate": 0.00038188682552667085, + "loss": 0.5126, + "step": 89475 + }, + { + "epoch": 21.84, + "learning_rate": 0.00038185362640631476, + "loss": 0.4988, + "step": 89500 + }, + { + "epoch": 21.85, + "learning_rate": 0.0003912863425360371, + "loss": 0.53, + "step": 89525 + }, + { + "epoch": 21.85, + "learning_rate": 0.0003912570241876374, + "loss": 0.4469, + "step": 89550 + }, + { + "epoch": 21.86, + "learning_rate": 0.00039122648424138776, + "loss": 0.5172, + "step": 89575 + }, + { + "epoch": 21.86, + "learning_rate": 0.00039119594429513807, + "loss": 0.5424, + "step": 89600 + }, + { + "epoch": 21.87, + "learning_rate": 0.00039116540434888837, + "loss": 0.5237, + "step": 89625 + }, + { + "epoch": 21.88, + "learning_rate": 0.0003911348644026387, + "loss": 0.4864, + "step": 89650 + }, + { + "epoch": 21.88, + "learning_rate": 0.0003911043244563889, + "loss": 0.5272, + "step": 89675 + }, + { + "epoch": 21.89, + "learning_rate": 0.0003910737845101392, + "loss": 0.4576, + "step": 89700 + }, + { + "epoch": 21.89, + "learning_rate": 0.0003910432445638896, + "loss": 0.5364, + "step": 89725 + }, + { + "epoch": 21.9, + "learning_rate": 0.0003910127046176399, + "loss": 0.5269, + "step": 89750 + }, + { + "epoch": 21.91, + "learning_rate": 0.0003909821646713902, + "loss": 0.523, + "step": 89775 + }, + { + "epoch": 21.91, + "learning_rate": 0.0003909516247251405, + "loss": 0.444, + "step": 89800 + }, + { + "epoch": 21.92, + "learning_rate": 0.0003909210847788908, + "loss": 0.5496, + "step": 89825 + }, + { + "epoch": 21.93, + "learning_rate": 0.0003908905448326411, + "loss": 0.4531, + "step": 89850 + }, + { + "epoch": 21.93, + "learning_rate": 0.0003908600048863914, + "loss": 0.492, + "step": 89875 + }, + { + "epoch": 21.94, + "learning_rate": 0.0003908294649401417, + "loss": 0.4916, + "step": 89900 + }, + { + "epoch": 21.94, + "learning_rate": 0.000390798924993892, + "loss": 0.5314, + "step": 89925 + }, + { + "epoch": 21.95, + "learning_rate": 0.0003907683850476423, + "loss": 0.469, + "step": 89950 + }, + { + "epoch": 21.96, + "learning_rate": 0.00039073784510139267, + "loss": 0.5014, + "step": 89975 + }, + { + "epoch": 21.96, + "learning_rate": 0.0003907073051551429, + "loss": 0.4671, + "step": 90000 + }, + { + "epoch": 21.96, + "eval_cer": 0.11175220475755367, + "eval_loss": 0.4197826087474823, + "eval_runtime": 144.9411, + "eval_samples_per_second": 28.929, + "eval_steps_per_second": 7.237, + "eval_wer": 0.45471451876019575, + "step": 90000 + }, + { + "epoch": 21.97, + "learning_rate": 0.0003906767652088932, + "loss": 0.5545, + "step": 90025 + }, + { + "epoch": 21.97, + "learning_rate": 0.0003906462252626435, + "loss": 0.4985, + "step": 90050 + }, + { + "epoch": 21.98, + "learning_rate": 0.00039061568531639383, + "loss": 0.5421, + "step": 90075 + }, + { + "epoch": 21.99, + "learning_rate": 0.0003905851453701442, + "loss": 0.4719, + "step": 90100 + }, + { + "epoch": 21.99, + "learning_rate": 0.0003905546054238945, + "loss": 0.4999, + "step": 90125 + }, + { + "epoch": 22.0, + "learning_rate": 0.00039052406547764474, + "loss": 0.4586, + "step": 90150 + }, + { + "epoch": 22.0, + "learning_rate": 0.00039049352553139504, + "loss": 0.5135, + "step": 90175 + }, + { + "epoch": 22.01, + "learning_rate": 0.00039046298558514535, + "loss": 0.4611, + "step": 90200 + }, + { + "epoch": 22.02, + "learning_rate": 0.0003904324456388957, + "loss": 0.4822, + "step": 90225 + }, + { + "epoch": 22.02, + "learning_rate": 0.000390401905692646, + "loss": 0.4451, + "step": 90250 + }, + { + "epoch": 22.03, + "learning_rate": 0.0003903713657463963, + "loss": 0.5283, + "step": 90275 + }, + { + "epoch": 22.04, + "learning_rate": 0.0003903408258001466, + "loss": 0.4192, + "step": 90300 + }, + { + "epoch": 22.04, + "learning_rate": 0.00039031028585389686, + "loss": 0.5237, + "step": 90325 + }, + { + "epoch": 22.05, + "learning_rate": 0.0003902797459076472, + "loss": 0.4501, + "step": 90350 + }, + { + "epoch": 22.05, + "learning_rate": 0.0003902492059613975, + "loss": 0.4873, + "step": 90375 + }, + { + "epoch": 22.06, + "learning_rate": 0.00039021866601514783, + "loss": 0.4595, + "step": 90400 + }, + { + "epoch": 22.07, + "learning_rate": 0.00039018812606889813, + "loss": 0.517, + "step": 90425 + }, + { + "epoch": 22.07, + "learning_rate": 0.00039015758612264843, + "loss": 0.455, + "step": 90450 + }, + { + "epoch": 22.08, + "learning_rate": 0.00039012704617639874, + "loss": 0.5074, + "step": 90475 + }, + { + "epoch": 22.08, + "learning_rate": 0.00039009650623014904, + "loss": 0.4544, + "step": 90500 + }, + { + "epoch": 22.09, + "learning_rate": 0.00039006596628389934, + "loss": 0.4933, + "step": 90525 + }, + { + "epoch": 22.1, + "learning_rate": 0.00039003542633764965, + "loss": 0.4465, + "step": 90550 + }, + { + "epoch": 22.1, + "learning_rate": 0.00039000488639139995, + "loss": 0.4574, + "step": 90575 + }, + { + "epoch": 22.11, + "learning_rate": 0.0003899743464451503, + "loss": 0.4509, + "step": 90600 + }, + { + "epoch": 22.11, + "learning_rate": 0.00038994380649890056, + "loss": 0.5082, + "step": 90625 + }, + { + "epoch": 22.12, + "learning_rate": 0.00038991326655265086, + "loss": 0.4783, + "step": 90650 + }, + { + "epoch": 22.13, + "learning_rate": 0.00038988272660640116, + "loss": 0.4925, + "step": 90675 + }, + { + "epoch": 22.13, + "learning_rate": 0.00038985218666015147, + "loss": 0.4301, + "step": 90700 + }, + { + "epoch": 22.14, + "learning_rate": 0.0003898216467139018, + "loss": 0.5307, + "step": 90725 + }, + { + "epoch": 22.14, + "learning_rate": 0.00038979110676765213, + "loss": 0.4506, + "step": 90750 + }, + { + "epoch": 22.15, + "learning_rate": 0.00038976056682140243, + "loss": 0.4787, + "step": 90775 + }, + { + "epoch": 22.16, + "learning_rate": 0.0003897300268751527, + "loss": 0.4733, + "step": 90800 + }, + { + "epoch": 22.16, + "learning_rate": 0.000389699486928903, + "loss": 0.5464, + "step": 90825 + }, + { + "epoch": 22.17, + "learning_rate": 0.00038966894698265334, + "loss": 0.4397, + "step": 90850 + }, + { + "epoch": 22.18, + "learning_rate": 0.00038963840703640365, + "loss": 0.4903, + "step": 90875 + }, + { + "epoch": 22.18, + "learning_rate": 0.00038960786709015395, + "loss": 0.4126, + "step": 90900 + }, + { + "epoch": 22.19, + "learning_rate": 0.00038957732714390425, + "loss": 0.5237, + "step": 90925 + }, + { + "epoch": 22.19, + "learning_rate": 0.0003895467871976545, + "loss": 0.5362, + "step": 90950 + }, + { + "epoch": 22.2, + "learning_rate": 0.00038951624725140486, + "loss": 0.5327, + "step": 90975 + }, + { + "epoch": 22.21, + "learning_rate": 0.00038948570730515516, + "loss": 0.4644, + "step": 91000 + }, + { + "epoch": 22.21, + "learning_rate": 0.00038945516735890547, + "loss": 0.5763, + "step": 91025 + }, + { + "epoch": 22.22, + "learning_rate": 0.00038942462741265577, + "loss": 0.4837, + "step": 91050 + }, + { + "epoch": 22.22, + "learning_rate": 0.00038939408746640607, + "loss": 0.5277, + "step": 91075 + }, + { + "epoch": 22.23, + "learning_rate": 0.0003893635475201563, + "loss": 0.4429, + "step": 91100 + }, + { + "epoch": 22.24, + "learning_rate": 0.0003893330075739067, + "loss": 0.5015, + "step": 91125 + }, + { + "epoch": 22.24, + "learning_rate": 0.000389302467627657, + "loss": 0.4684, + "step": 91150 + }, + { + "epoch": 22.25, + "learning_rate": 0.0003892719276814073, + "loss": 0.5632, + "step": 91175 + }, + { + "epoch": 22.25, + "learning_rate": 0.0003892413877351576, + "loss": 0.4923, + "step": 91200 + }, + { + "epoch": 22.26, + "learning_rate": 0.0003892108477889079, + "loss": 0.5177, + "step": 91225 + }, + { + "epoch": 22.27, + "learning_rate": 0.00038918030784265825, + "loss": 0.4963, + "step": 91250 + }, + { + "epoch": 22.27, + "learning_rate": 0.0003891497678964085, + "loss": 0.4868, + "step": 91275 + }, + { + "epoch": 22.28, + "learning_rate": 0.0003891192279501588, + "loss": 0.4688, + "step": 91300 + }, + { + "epoch": 22.29, + "learning_rate": 0.0003890886880039091, + "loss": 0.495, + "step": 91325 + }, + { + "epoch": 22.29, + "learning_rate": 0.0003890581480576594, + "loss": 0.4599, + "step": 91350 + }, + { + "epoch": 22.3, + "learning_rate": 0.00038902760811140977, + "loss": 0.4995, + "step": 91375 + }, + { + "epoch": 22.3, + "learning_rate": 0.00038899706816516007, + "loss": 0.4644, + "step": 91400 + }, + { + "epoch": 22.31, + "learning_rate": 0.0003889665282189103, + "loss": 0.5083, + "step": 91425 + }, + { + "epoch": 22.32, + "learning_rate": 0.0003889359882726606, + "loss": 0.4402, + "step": 91450 + }, + { + "epoch": 22.32, + "learning_rate": 0.0003889054483264109, + "loss": 0.4883, + "step": 91475 + }, + { + "epoch": 22.33, + "learning_rate": 0.0003888749083801613, + "loss": 0.4897, + "step": 91500 + }, + { + "epoch": 22.33, + "learning_rate": 0.0003888443684339116, + "loss": 0.5078, + "step": 91525 + }, + { + "epoch": 22.34, + "learning_rate": 0.0003888138284876619, + "loss": 0.4662, + "step": 91550 + }, + { + "epoch": 22.35, + "learning_rate": 0.00038878451013926214, + "loss": 0.5353, + "step": 91575 + }, + { + "epoch": 22.35, + "learning_rate": 0.00038875397019301245, + "loss": 0.4879, + "step": 91600 + }, + { + "epoch": 22.36, + "learning_rate": 0.00038872343024676275, + "loss": 0.5197, + "step": 91625 + }, + { + "epoch": 22.36, + "learning_rate": 0.0003886928903005131, + "loss": 0.4503, + "step": 91650 + }, + { + "epoch": 22.37, + "learning_rate": 0.0003886623503542634, + "loss": 0.5222, + "step": 91675 + }, + { + "epoch": 22.38, + "learning_rate": 0.0003886318104080137, + "loss": 0.4813, + "step": 91700 + }, + { + "epoch": 22.38, + "learning_rate": 0.000388601270461764, + "loss": 0.5059, + "step": 91725 + }, + { + "epoch": 22.39, + "learning_rate": 0.00038857073051551427, + "loss": 0.4764, + "step": 91750 + }, + { + "epoch": 22.4, + "learning_rate": 0.00038854019056926457, + "loss": 0.5375, + "step": 91775 + }, + { + "epoch": 22.4, + "learning_rate": 0.0003885096506230149, + "loss": 0.4988, + "step": 91800 + }, + { + "epoch": 22.41, + "learning_rate": 0.00038847911067676523, + "loss": 0.4746, + "step": 91825 + }, + { + "epoch": 22.41, + "learning_rate": 0.00038844857073051553, + "loss": 0.5125, + "step": 91850 + }, + { + "epoch": 22.42, + "learning_rate": 0.00038841803078426584, + "loss": 0.5544, + "step": 91875 + }, + { + "epoch": 22.43, + "learning_rate": 0.0003883874908380161, + "loss": 0.4323, + "step": 91900 + }, + { + "epoch": 22.43, + "learning_rate": 0.00038835695089176644, + "loss": 0.4781, + "step": 91925 + }, + { + "epoch": 22.44, + "learning_rate": 0.00038832641094551675, + "loss": 0.5042, + "step": 91950 + }, + { + "epoch": 22.44, + "learning_rate": 0.00038829587099926705, + "loss": 0.5044, + "step": 91975 + }, + { + "epoch": 22.45, + "learning_rate": 0.00038826533105301735, + "loss": 0.4864, + "step": 92000 + }, + { + "epoch": 22.46, + "learning_rate": 0.00038823479110676766, + "loss": 0.561, + "step": 92025 + }, + { + "epoch": 22.46, + "learning_rate": 0.00038820425116051796, + "loss": 0.4371, + "step": 92050 + }, + { + "epoch": 22.47, + "learning_rate": 0.00038817371121426826, + "loss": 0.4977, + "step": 92075 + }, + { + "epoch": 22.47, + "learning_rate": 0.00038814317126801857, + "loss": 0.4416, + "step": 92100 + }, + { + "epoch": 22.48, + "learning_rate": 0.00038811263132176887, + "loss": 0.5439, + "step": 92125 + }, + { + "epoch": 22.49, + "learning_rate": 0.0003880820913755192, + "loss": 0.443, + "step": 92150 + }, + { + "epoch": 22.49, + "learning_rate": 0.00038805155142926953, + "loss": 0.533, + "step": 92175 + }, + { + "epoch": 22.5, + "learning_rate": 0.00038802101148301983, + "loss": 0.4652, + "step": 92200 + }, + { + "epoch": 22.5, + "learning_rate": 0.0003879904715367701, + "loss": 0.5629, + "step": 92225 + }, + { + "epoch": 22.51, + "learning_rate": 0.0003879599315905204, + "loss": 0.4605, + "step": 92250 + }, + { + "epoch": 22.52, + "learning_rate": 0.0003879293916442707, + "loss": 0.5329, + "step": 92275 + }, + { + "epoch": 22.52, + "learning_rate": 0.00038789885169802105, + "loss": 0.4571, + "step": 92300 + }, + { + "epoch": 22.53, + "learning_rate": 0.00038786831175177135, + "loss": 0.4795, + "step": 92325 + }, + { + "epoch": 22.54, + "learning_rate": 0.00038783777180552165, + "loss": 0.4904, + "step": 92350 + }, + { + "epoch": 22.54, + "learning_rate": 0.0003878072318592719, + "loss": 0.5605, + "step": 92375 + }, + { + "epoch": 22.55, + "learning_rate": 0.0003877766919130222, + "loss": 0.4585, + "step": 92400 + }, + { + "epoch": 22.55, + "learning_rate": 0.00038774615196677256, + "loss": 0.5349, + "step": 92425 + }, + { + "epoch": 22.56, + "learning_rate": 0.00038771561202052287, + "loss": 0.4769, + "step": 92450 + }, + { + "epoch": 22.57, + "learning_rate": 0.00038768507207427317, + "loss": 0.491, + "step": 92475 + }, + { + "epoch": 22.57, + "learning_rate": 0.0003876545321280235, + "loss": 0.4512, + "step": 92500 + }, + { + "epoch": 22.58, + "learning_rate": 0.0003876239921817737, + "loss": 0.5088, + "step": 92525 + }, + { + "epoch": 22.58, + "learning_rate": 0.0003875934522355241, + "loss": 0.4509, + "step": 92550 + }, + { + "epoch": 22.59, + "learning_rate": 0.0003875629122892744, + "loss": 0.5303, + "step": 92575 + }, + { + "epoch": 22.6, + "learning_rate": 0.0003875323723430247, + "loss": 0.4676, + "step": 92600 + }, + { + "epoch": 22.6, + "learning_rate": 0.000387501832396775, + "loss": 0.4776, + "step": 92625 + }, + { + "epoch": 22.61, + "learning_rate": 0.0003874712924505253, + "loss": 0.4843, + "step": 92650 + }, + { + "epoch": 22.61, + "learning_rate": 0.0003874407525042756, + "loss": 0.504, + "step": 92675 + }, + { + "epoch": 22.62, + "learning_rate": 0.0003874102125580259, + "loss": 0.4525, + "step": 92700 + }, + { + "epoch": 22.63, + "learning_rate": 0.0003873796726117762, + "loss": 0.4874, + "step": 92725 + }, + { + "epoch": 22.63, + "learning_rate": 0.0003873491326655265, + "loss": 0.5024, + "step": 92750 + }, + { + "epoch": 22.64, + "learning_rate": 0.0003873185927192768, + "loss": 0.5104, + "step": 92775 + }, + { + "epoch": 22.65, + "learning_rate": 0.00038728805277302717, + "loss": 0.4292, + "step": 92800 + }, + { + "epoch": 22.65, + "learning_rate": 0.00038725751282677747, + "loss": 0.4798, + "step": 92825 + }, + { + "epoch": 22.66, + "learning_rate": 0.0003872269728805277, + "loss": 0.4755, + "step": 92850 + }, + { + "epoch": 22.66, + "learning_rate": 0.000387196432934278, + "loss": 0.5197, + "step": 92875 + }, + { + "epoch": 22.67, + "learning_rate": 0.00038716589298802833, + "loss": 0.4345, + "step": 92900 + }, + { + "epoch": 22.68, + "learning_rate": 0.0003871353530417787, + "loss": 0.5431, + "step": 92925 + }, + { + "epoch": 22.68, + "learning_rate": 0.000387104813095529, + "loss": 0.4644, + "step": 92950 + }, + { + "epoch": 22.69, + "learning_rate": 0.0003870742731492793, + "loss": 0.4992, + "step": 92975 + }, + { + "epoch": 22.69, + "learning_rate": 0.00038704373320302954, + "loss": 0.4451, + "step": 93000 + }, + { + "epoch": 22.69, + "eval_cer": 0.11186000431198218, + "eval_loss": 0.44263726472854614, + "eval_runtime": 146.1403, + "eval_samples_per_second": 28.692, + "eval_steps_per_second": 7.178, + "eval_wer": 0.4508646003262643, + "step": 93000 + }, + { + "epoch": 22.7, + "learning_rate": 0.00038701319325677984, + "loss": 0.4674, + "step": 93025 + }, + { + "epoch": 22.71, + "learning_rate": 0.0003869826533105302, + "loss": 0.4967, + "step": 93050 + }, + { + "epoch": 22.71, + "learning_rate": 0.0003869521133642805, + "loss": 0.5561, + "step": 93075 + }, + { + "epoch": 22.72, + "learning_rate": 0.0003869215734180308, + "loss": 0.5109, + "step": 93100 + }, + { + "epoch": 22.72, + "learning_rate": 0.0003868910334717811, + "loss": 0.494, + "step": 93125 + }, + { + "epoch": 22.73, + "learning_rate": 0.00038686049352553136, + "loss": 0.4803, + "step": 93150 + }, + { + "epoch": 22.74, + "learning_rate": 0.00038682995357928166, + "loss": 0.523, + "step": 93175 + }, + { + "epoch": 22.74, + "learning_rate": 0.000386799413633032, + "loss": 0.4682, + "step": 93200 + }, + { + "epoch": 22.75, + "learning_rate": 0.0003867688736867823, + "loss": 0.4921, + "step": 93225 + }, + { + "epoch": 22.76, + "learning_rate": 0.00038673833374053263, + "loss": 0.4338, + "step": 93250 + }, + { + "epoch": 22.76, + "learning_rate": 0.00038670779379428293, + "loss": 0.5046, + "step": 93275 + }, + { + "epoch": 22.77, + "learning_rate": 0.00038667725384803324, + "loss": 0.4381, + "step": 93300 + }, + { + "epoch": 22.77, + "learning_rate": 0.00038664671390178354, + "loss": 0.5095, + "step": 93325 + }, + { + "epoch": 22.78, + "learning_rate": 0.00038661617395553384, + "loss": 0.4569, + "step": 93350 + }, + { + "epoch": 22.79, + "learning_rate": 0.00038658563400928415, + "loss": 0.5539, + "step": 93375 + }, + { + "epoch": 22.79, + "learning_rate": 0.00038655509406303445, + "loss": 0.4506, + "step": 93400 + }, + { + "epoch": 22.8, + "learning_rate": 0.00038652455411678475, + "loss": 0.4904, + "step": 93425 + }, + { + "epoch": 22.8, + "learning_rate": 0.0003864940141705351, + "loss": 0.4195, + "step": 93450 + }, + { + "epoch": 22.81, + "learning_rate": 0.00038646347422428536, + "loss": 0.5241, + "step": 93475 + }, + { + "epoch": 22.82, + "learning_rate": 0.00038643293427803566, + "loss": 0.5006, + "step": 93500 + }, + { + "epoch": 22.82, + "learning_rate": 0.00038640239433178597, + "loss": 0.5539, + "step": 93525 + }, + { + "epoch": 22.83, + "learning_rate": 0.00038637185438553627, + "loss": 0.4748, + "step": 93550 + }, + { + "epoch": 22.83, + "learning_rate": 0.0003863413144392866, + "loss": 0.5467, + "step": 93575 + }, + { + "epoch": 22.84, + "learning_rate": 0.00038631077449303693, + "loss": 0.4706, + "step": 93600 + }, + { + "epoch": 22.85, + "learning_rate": 0.0003862802345467872, + "loss": 0.5325, + "step": 93625 + }, + { + "epoch": 22.85, + "learning_rate": 0.0003862496946005375, + "loss": 0.4695, + "step": 93650 + }, + { + "epoch": 22.86, + "learning_rate": 0.0003862191546542878, + "loss": 0.4782, + "step": 93675 + }, + { + "epoch": 22.86, + "learning_rate": 0.00038618861470803814, + "loss": 0.4095, + "step": 93700 + }, + { + "epoch": 22.87, + "learning_rate": 0.00038615807476178845, + "loss": 0.51, + "step": 93725 + }, + { + "epoch": 22.88, + "learning_rate": 0.00038612753481553875, + "loss": 0.4564, + "step": 93750 + }, + { + "epoch": 22.88, + "learning_rate": 0.00038609699486928905, + "loss": 0.5336, + "step": 93775 + }, + { + "epoch": 22.89, + "learning_rate": 0.0003860664549230393, + "loss": 0.5094, + "step": 93800 + }, + { + "epoch": 22.9, + "learning_rate": 0.00038603591497678966, + "loss": 0.5279, + "step": 93825 + }, + { + "epoch": 22.9, + "learning_rate": 0.00038600537503053996, + "loss": 0.5133, + "step": 93850 + }, + { + "epoch": 22.91, + "learning_rate": 0.00038597483508429027, + "loss": 0.4836, + "step": 93875 + }, + { + "epoch": 22.91, + "learning_rate": 0.00038594429513804057, + "loss": 0.4918, + "step": 93900 + }, + { + "epoch": 22.92, + "learning_rate": 0.0003859137551917909, + "loss": 0.5372, + "step": 93925 + }, + { + "epoch": 22.93, + "learning_rate": 0.0003858832152455412, + "loss": 0.4791, + "step": 93950 + }, + { + "epoch": 22.93, + "learning_rate": 0.0003858526752992915, + "loss": 0.5199, + "step": 93975 + }, + { + "epoch": 22.94, + "learning_rate": 0.0003858233569508918, + "loss": 0.4629, + "step": 94000 + }, + { + "epoch": 22.94, + "learning_rate": 0.0003857928170046421, + "loss": 0.5178, + "step": 94025 + }, + { + "epoch": 22.95, + "learning_rate": 0.0003857622770583924, + "loss": 0.5132, + "step": 94050 + }, + { + "epoch": 22.96, + "learning_rate": 0.0003857317371121427, + "loss": 0.5321, + "step": 94075 + }, + { + "epoch": 22.96, + "learning_rate": 0.00038570119716589295, + "loss": 0.4338, + "step": 94100 + }, + { + "epoch": 22.97, + "learning_rate": 0.0003856706572196433, + "loss": 0.4782, + "step": 94125 + }, + { + "epoch": 22.97, + "learning_rate": 0.0003856401172733936, + "loss": 0.5093, + "step": 94150 + }, + { + "epoch": 22.98, + "learning_rate": 0.0003856095773271439, + "loss": 0.4996, + "step": 94175 + }, + { + "epoch": 22.99, + "learning_rate": 0.0003855790373808942, + "loss": 0.4576, + "step": 94200 + }, + { + "epoch": 22.99, + "learning_rate": 0.0003855484974346445, + "loss": 0.5363, + "step": 94225 + }, + { + "epoch": 23.0, + "learning_rate": 0.0003855179574883949, + "loss": 0.4586, + "step": 94250 + }, + { + "epoch": 23.01, + "learning_rate": 0.0003854874175421451, + "loss": 0.5103, + "step": 94275 + }, + { + "epoch": 23.01, + "learning_rate": 0.0003854568775958954, + "loss": 0.4995, + "step": 94300 + }, + { + "epoch": 23.02, + "learning_rate": 0.00038542633764964573, + "loss": 0.4858, + "step": 94325 + }, + { + "epoch": 23.02, + "learning_rate": 0.00038539579770339603, + "loss": 0.4616, + "step": 94350 + }, + { + "epoch": 23.03, + "learning_rate": 0.0003853652577571464, + "loss": 0.4772, + "step": 94375 + }, + { + "epoch": 23.04, + "learning_rate": 0.0003853347178108967, + "loss": 0.4242, + "step": 94400 + }, + { + "epoch": 23.04, + "learning_rate": 0.00038530417786464694, + "loss": 0.4551, + "step": 94425 + }, + { + "epoch": 23.05, + "learning_rate": 0.00038527363791839725, + "loss": 0.4337, + "step": 94450 + }, + { + "epoch": 23.05, + "learning_rate": 0.00038524309797214755, + "loss": 0.5081, + "step": 94475 + }, + { + "epoch": 23.06, + "learning_rate": 0.0003852125580258979, + "loss": 0.4795, + "step": 94500 + }, + { + "epoch": 23.07, + "learning_rate": 0.0003851820180796482, + "loss": 0.4721, + "step": 94525 + }, + { + "epoch": 23.07, + "learning_rate": 0.0003851514781333985, + "loss": 0.4625, + "step": 94550 + }, + { + "epoch": 23.08, + "learning_rate": 0.00038512093818714876, + "loss": 0.5091, + "step": 94575 + }, + { + "epoch": 23.08, + "learning_rate": 0.00038509039824089907, + "loss": 0.4679, + "step": 94600 + }, + { + "epoch": 23.09, + "learning_rate": 0.0003850598582946494, + "loss": 0.4813, + "step": 94625 + }, + { + "epoch": 23.1, + "learning_rate": 0.00038502931834839973, + "loss": 0.4172, + "step": 94650 + }, + { + "epoch": 23.1, + "learning_rate": 0.00038499877840215003, + "loss": 0.4948, + "step": 94675 + }, + { + "epoch": 23.11, + "learning_rate": 0.00038496823845590033, + "loss": 0.4403, + "step": 94700 + }, + { + "epoch": 23.11, + "learning_rate": 0.00038493769850965064, + "loss": 0.4947, + "step": 94725 + }, + { + "epoch": 23.12, + "learning_rate": 0.00038490715856340094, + "loss": 0.44, + "step": 94750 + }, + { + "epoch": 23.13, + "learning_rate": 0.00038487661861715124, + "loss": 0.5244, + "step": 94775 + }, + { + "epoch": 23.13, + "learning_rate": 0.00038484607867090155, + "loss": 0.4809, + "step": 94800 + }, + { + "epoch": 23.14, + "learning_rate": 0.00038481553872465185, + "loss": 0.4803, + "step": 94825 + }, + { + "epoch": 23.15, + "learning_rate": 0.00038478499877840215, + "loss": 0.4412, + "step": 94850 + }, + { + "epoch": 23.15, + "learning_rate": 0.0003847544588321525, + "loss": 0.5365, + "step": 94875 + }, + { + "epoch": 23.16, + "learning_rate": 0.00038472391888590276, + "loss": 0.4305, + "step": 94900 + }, + { + "epoch": 23.16, + "learning_rate": 0.00038469337893965306, + "loss": 0.5242, + "step": 94925 + }, + { + "epoch": 23.17, + "learning_rate": 0.00038466283899340337, + "loss": 0.4683, + "step": 94950 + }, + { + "epoch": 23.18, + "learning_rate": 0.00038463229904715367, + "loss": 0.5065, + "step": 94975 + }, + { + "epoch": 23.18, + "learning_rate": 0.00038460175910090403, + "loss": 0.4666, + "step": 95000 + }, + { + "epoch": 23.19, + "learning_rate": 0.00038457121915465433, + "loss": 0.4901, + "step": 95025 + }, + { + "epoch": 23.19, + "learning_rate": 0.0003845406792084046, + "loss": 0.461, + "step": 95050 + }, + { + "epoch": 23.2, + "learning_rate": 0.0003845101392621549, + "loss": 0.4689, + "step": 95075 + }, + { + "epoch": 23.21, + "learning_rate": 0.0003844795993159052, + "loss": 0.4183, + "step": 95100 + }, + { + "epoch": 23.21, + "learning_rate": 0.0003844490593696555, + "loss": 0.4992, + "step": 95125 + }, + { + "epoch": 23.22, + "learning_rate": 0.00038441851942340585, + "loss": 0.4255, + "step": 95150 + }, + { + "epoch": 23.22, + "learning_rate": 0.00038438797947715615, + "loss": 0.4857, + "step": 95175 + }, + { + "epoch": 23.23, + "learning_rate": 0.00038435743953090646, + "loss": 0.474, + "step": 95200 + }, + { + "epoch": 23.24, + "learning_rate": 0.0003843268995846567, + "loss": 0.4662, + "step": 95225 + }, + { + "epoch": 23.24, + "learning_rate": 0.000384296359638407, + "loss": 0.4002, + "step": 95250 + }, + { + "epoch": 23.25, + "learning_rate": 0.00038426581969215737, + "loss": 0.4931, + "step": 95275 + }, + { + "epoch": 23.26, + "learning_rate": 0.00038423527974590767, + "loss": 0.4502, + "step": 95300 + }, + { + "epoch": 23.26, + "learning_rate": 0.00038420473979965797, + "loss": 0.4826, + "step": 95325 + }, + { + "epoch": 23.27, + "learning_rate": 0.0003841741998534083, + "loss": 0.4563, + "step": 95350 + }, + { + "epoch": 23.27, + "learning_rate": 0.0003841436599071585, + "loss": 0.4959, + "step": 95375 + }, + { + "epoch": 23.28, + "learning_rate": 0.0003841131199609089, + "loss": 0.4783, + "step": 95400 + }, + { + "epoch": 23.29, + "learning_rate": 0.0003840825800146592, + "loss": 0.5152, + "step": 95425 + }, + { + "epoch": 23.29, + "learning_rate": 0.0003840520400684095, + "loss": 0.473, + "step": 95450 + }, + { + "epoch": 23.3, + "learning_rate": 0.0003840215001221598, + "loss": 0.495, + "step": 95475 + }, + { + "epoch": 23.3, + "learning_rate": 0.0003839909601759101, + "loss": 0.4423, + "step": 95500 + }, + { + "epoch": 23.31, + "learning_rate": 0.0003839604202296604, + "loss": 0.5382, + "step": 95525 + }, + { + "epoch": 23.32, + "learning_rate": 0.0003839298802834107, + "loss": 0.4199, + "step": 95550 + }, + { + "epoch": 23.32, + "learning_rate": 0.000383899340337161, + "loss": 0.4925, + "step": 95575 + }, + { + "epoch": 23.33, + "learning_rate": 0.0003838688003909113, + "loss": 0.4474, + "step": 95600 + }, + { + "epoch": 23.33, + "learning_rate": 0.0003838382604446616, + "loss": 0.5181, + "step": 95625 + }, + { + "epoch": 23.34, + "learning_rate": 0.00038380772049841197, + "loss": 0.4751, + "step": 95650 + }, + { + "epoch": 23.35, + "learning_rate": 0.0003837771805521623, + "loss": 0.4907, + "step": 95675 + }, + { + "epoch": 23.35, + "learning_rate": 0.0003837466406059125, + "loss": 0.4483, + "step": 95700 + }, + { + "epoch": 23.36, + "learning_rate": 0.0003837161006596628, + "loss": 0.5041, + "step": 95725 + }, + { + "epoch": 23.37, + "learning_rate": 0.00038368556071341313, + "loss": 0.4663, + "step": 95750 + }, + { + "epoch": 23.37, + "learning_rate": 0.0003836550207671635, + "loss": 0.5671, + "step": 95775 + }, + { + "epoch": 23.38, + "learning_rate": 0.0003836244808209138, + "loss": 0.4279, + "step": 95800 + }, + { + "epoch": 23.38, + "learning_rate": 0.0003835939408746641, + "loss": 0.4945, + "step": 95825 + }, + { + "epoch": 23.39, + "learning_rate": 0.00038356340092841434, + "loss": 0.4691, + "step": 95850 + }, + { + "epoch": 23.4, + "learning_rate": 0.00038353286098216465, + "loss": 0.5027, + "step": 95875 + }, + { + "epoch": 23.4, + "learning_rate": 0.000383502321035915, + "loss": 0.4723, + "step": 95900 + }, + { + "epoch": 23.41, + "learning_rate": 0.0003834717810896653, + "loss": 0.5334, + "step": 95925 + }, + { + "epoch": 23.41, + "learning_rate": 0.0003834412411434156, + "loss": 0.437, + "step": 95950 + }, + { + "epoch": 23.42, + "learning_rate": 0.0003834107011971659, + "loss": 0.4901, + "step": 95975 + }, + { + "epoch": 23.43, + "learning_rate": 0.00038338016125091616, + "loss": 0.4319, + "step": 96000 + }, + { + "epoch": 23.43, + "eval_cer": 0.10958081373263658, + "eval_loss": 0.4272046983242035, + "eval_runtime": 149.2388, + "eval_samples_per_second": 28.096, + "eval_steps_per_second": 7.029, + "eval_wer": 0.4472430668841762, + "step": 96000 + }, + { + "epoch": 23.43, + "learning_rate": 0.0003833496213046665, + "loss": 0.5031, + "step": 96025 + }, + { + "epoch": 23.44, + "learning_rate": 0.0003833190813584168, + "loss": 0.4644, + "step": 96050 + }, + { + "epoch": 23.44, + "learning_rate": 0.0003832885414121671, + "loss": 0.5066, + "step": 96075 + }, + { + "epoch": 23.45, + "learning_rate": 0.00038325800146591743, + "loss": 0.4638, + "step": 96100 + }, + { + "epoch": 23.46, + "learning_rate": 0.00038322746151966773, + "loss": 0.4751, + "step": 96125 + }, + { + "epoch": 23.46, + "learning_rate": 0.00038319692157341804, + "loss": 0.4367, + "step": 96150 + }, + { + "epoch": 23.47, + "learning_rate": 0.0003831676032250183, + "loss": 0.5076, + "step": 96175 + }, + { + "epoch": 23.47, + "learning_rate": 0.00038313706327876865, + "loss": 0.3962, + "step": 96200 + }, + { + "epoch": 23.48, + "learning_rate": 0.00038310652333251895, + "loss": 0.5018, + "step": 96225 + }, + { + "epoch": 23.49, + "learning_rate": 0.00038307598338626925, + "loss": 0.4345, + "step": 96250 + }, + { + "epoch": 23.49, + "learning_rate": 0.00038304544344001956, + "loss": 0.5086, + "step": 96275 + }, + { + "epoch": 23.5, + "learning_rate": 0.00038301490349376986, + "loss": 0.4465, + "step": 96300 + }, + { + "epoch": 23.51, + "learning_rate": 0.00038298436354752016, + "loss": 0.5403, + "step": 96325 + }, + { + "epoch": 23.51, + "learning_rate": 0.00038295382360127047, + "loss": 0.4466, + "step": 96350 + }, + { + "epoch": 23.52, + "learning_rate": 0.00038292328365502077, + "loss": 0.5121, + "step": 96375 + }, + { + "epoch": 23.52, + "learning_rate": 0.0003828927437087711, + "loss": 0.4536, + "step": 96400 + }, + { + "epoch": 23.53, + "learning_rate": 0.0003828622037625214, + "loss": 0.4811, + "step": 96425 + }, + { + "epoch": 23.54, + "learning_rate": 0.00038283166381627173, + "loss": 0.4512, + "step": 96450 + }, + { + "epoch": 23.54, + "learning_rate": 0.000382801123870022, + "loss": 0.5013, + "step": 96475 + }, + { + "epoch": 23.55, + "learning_rate": 0.0003827705839237723, + "loss": 0.4513, + "step": 96500 + }, + { + "epoch": 23.55, + "learning_rate": 0.0003827400439775226, + "loss": 0.4703, + "step": 96525 + }, + { + "epoch": 23.56, + "learning_rate": 0.0003827095040312729, + "loss": 0.4889, + "step": 96550 + }, + { + "epoch": 23.57, + "learning_rate": 0.00038267896408502325, + "loss": 0.4766, + "step": 96575 + }, + { + "epoch": 23.57, + "learning_rate": 0.00038264842413877355, + "loss": 0.4529, + "step": 96600 + }, + { + "epoch": 23.58, + "learning_rate": 0.0003826178841925238, + "loss": 0.493, + "step": 96625 + }, + { + "epoch": 23.58, + "learning_rate": 0.0003825873442462741, + "loss": 0.4478, + "step": 96650 + }, + { + "epoch": 23.59, + "learning_rate": 0.0003825568043000244, + "loss": 0.5043, + "step": 96675 + }, + { + "epoch": 23.6, + "learning_rate": 0.00038252626435377477, + "loss": 0.4583, + "step": 96700 + }, + { + "epoch": 23.6, + "learning_rate": 0.00038249572440752507, + "loss": 0.5067, + "step": 96725 + }, + { + "epoch": 23.61, + "learning_rate": 0.0003824651844612754, + "loss": 0.4689, + "step": 96750 + }, + { + "epoch": 23.62, + "learning_rate": 0.0003824346445150257, + "loss": 0.5348, + "step": 96775 + }, + { + "epoch": 23.62, + "learning_rate": 0.0003824041045687759, + "loss": 0.4366, + "step": 96800 + }, + { + "epoch": 23.63, + "learning_rate": 0.0003823735646225263, + "loss": 0.508, + "step": 96825 + }, + { + "epoch": 23.63, + "learning_rate": 0.0003823430246762766, + "loss": 0.4352, + "step": 96850 + }, + { + "epoch": 23.64, + "learning_rate": 0.0003823124847300269, + "loss": 0.5385, + "step": 96875 + }, + { + "epoch": 23.65, + "learning_rate": 0.0003822819447837772, + "loss": 0.4585, + "step": 96900 + }, + { + "epoch": 23.65, + "learning_rate": 0.0003822514048375275, + "loss": 0.5147, + "step": 96925 + }, + { + "epoch": 23.66, + "learning_rate": 0.0003822208648912778, + "loss": 0.4456, + "step": 96950 + }, + { + "epoch": 23.66, + "learning_rate": 0.0003821903249450281, + "loss": 0.4983, + "step": 96975 + }, + { + "epoch": 23.67, + "learning_rate": 0.0003821597849987784, + "loss": 0.4749, + "step": 97000 + }, + { + "epoch": 23.68, + "learning_rate": 0.0003821292450525287, + "loss": 0.5113, + "step": 97025 + }, + { + "epoch": 23.68, + "learning_rate": 0.000382098705106279, + "loss": 0.5146, + "step": 97050 + }, + { + "epoch": 23.69, + "learning_rate": 0.00038206816516002937, + "loss": 0.495, + "step": 97075 + }, + { + "epoch": 23.69, + "learning_rate": 0.0003820376252137796, + "loss": 0.4706, + "step": 97100 + }, + { + "epoch": 23.7, + "learning_rate": 0.0003820070852675299, + "loss": 0.5337, + "step": 97125 + }, + { + "epoch": 23.71, + "learning_rate": 0.00038197654532128023, + "loss": 0.4133, + "step": 97150 + }, + { + "epoch": 23.71, + "learning_rate": 0.00038194600537503053, + "loss": 0.502, + "step": 97175 + }, + { + "epoch": 23.72, + "learning_rate": 0.00038191546542878083, + "loss": 0.4532, + "step": 97200 + }, + { + "epoch": 23.72, + "learning_rate": 0.0003818849254825312, + "loss": 0.5145, + "step": 97225 + }, + { + "epoch": 23.73, + "learning_rate": 0.0003818543855362815, + "loss": 0.4581, + "step": 97250 + }, + { + "epoch": 23.74, + "learning_rate": 0.00038182384559003174, + "loss": 0.5038, + "step": 97275 + }, + { + "epoch": 23.74, + "learning_rate": 0.00038179330564378205, + "loss": 0.4292, + "step": 97300 + }, + { + "epoch": 23.75, + "learning_rate": 0.00038176276569753235, + "loss": 0.5076, + "step": 97325 + }, + { + "epoch": 23.76, + "learning_rate": 0.0003817322257512827, + "loss": 0.4406, + "step": 97350 + }, + { + "epoch": 23.76, + "learning_rate": 0.000381701685805033, + "loss": 0.5133, + "step": 97375 + }, + { + "epoch": 23.77, + "learning_rate": 0.0003816711458587833, + "loss": 0.4, + "step": 97400 + }, + { + "epoch": 23.77, + "learning_rate": 0.00038164060591253356, + "loss": 0.4934, + "step": 97425 + }, + { + "epoch": 23.78, + "learning_rate": 0.00038161006596628387, + "loss": 0.4434, + "step": 97450 + }, + { + "epoch": 23.79, + "learning_rate": 0.0003815795260200342, + "loss": 0.5085, + "step": 97475 + }, + { + "epoch": 23.79, + "learning_rate": 0.00038154898607378453, + "loss": 0.4546, + "step": 97500 + }, + { + "epoch": 23.8, + "learning_rate": 0.00038151844612753483, + "loss": 0.499, + "step": 97525 + }, + { + "epoch": 23.8, + "learning_rate": 0.00038148790618128514, + "loss": 0.4719, + "step": 97550 + }, + { + "epoch": 23.81, + "learning_rate": 0.0003814573662350354, + "loss": 0.5191, + "step": 97575 + }, + { + "epoch": 23.82, + "learning_rate": 0.00038142682628878574, + "loss": 0.4995, + "step": 97600 + }, + { + "epoch": 23.82, + "learning_rate": 0.00038139628634253605, + "loss": 0.5225, + "step": 97625 + }, + { + "epoch": 23.83, + "learning_rate": 0.00038136574639628635, + "loss": 0.4468, + "step": 97650 + }, + { + "epoch": 23.83, + "learning_rate": 0.00038133520645003665, + "loss": 0.5187, + "step": 97675 + }, + { + "epoch": 23.84, + "learning_rate": 0.00038130466650378696, + "loss": 0.426, + "step": 97700 + }, + { + "epoch": 23.85, + "learning_rate": 0.0003812741265575373, + "loss": 0.486, + "step": 97725 + }, + { + "epoch": 23.85, + "learning_rate": 0.00038124358661128756, + "loss": 0.5055, + "step": 97750 + }, + { + "epoch": 23.86, + "learning_rate": 0.00038121304666503787, + "loss": 0.5072, + "step": 97775 + }, + { + "epoch": 23.87, + "learning_rate": 0.00038118250671878817, + "loss": 0.4402, + "step": 97800 + }, + { + "epoch": 23.87, + "learning_rate": 0.00038115196677253847, + "loss": 0.4967, + "step": 97825 + }, + { + "epoch": 23.88, + "learning_rate": 0.00038112142682628883, + "loss": 0.4496, + "step": 97850 + }, + { + "epoch": 23.88, + "learning_rate": 0.00038109088688003913, + "loss": 0.5174, + "step": 97875 + }, + { + "epoch": 23.89, + "learning_rate": 0.0003810603469337894, + "loss": 0.4629, + "step": 97900 + }, + { + "epoch": 23.9, + "learning_rate": 0.0003810298069875397, + "loss": 0.4647, + "step": 97925 + }, + { + "epoch": 23.9, + "learning_rate": 0.00038099926704129, + "loss": 0.4622, + "step": 97950 + }, + { + "epoch": 23.91, + "learning_rate": 0.00038096872709504035, + "loss": 0.4721, + "step": 97975 + }, + { + "epoch": 23.91, + "learning_rate": 0.00038093818714879065, + "loss": 0.4376, + "step": 98000 + }, + { + "epoch": 23.92, + "learning_rate": 0.00038090764720254095, + "loss": 0.5157, + "step": 98025 + }, + { + "epoch": 23.93, + "learning_rate": 0.0003808771072562912, + "loss": 0.4177, + "step": 98050 + }, + { + "epoch": 23.93, + "learning_rate": 0.0003808465673100415, + "loss": 0.4717, + "step": 98075 + }, + { + "epoch": 23.94, + "learning_rate": 0.00038081602736379186, + "loss": 0.434, + "step": 98100 + }, + { + "epoch": 23.94, + "learning_rate": 0.00038078548741754217, + "loss": 0.4996, + "step": 98125 + }, + { + "epoch": 23.95, + "learning_rate": 0.00038075494747129247, + "loss": 0.4659, + "step": 98150 + }, + { + "epoch": 23.96, + "learning_rate": 0.0003807244075250428, + "loss": 0.5177, + "step": 98175 + }, + { + "epoch": 23.96, + "learning_rate": 0.0003806938675787931, + "loss": 0.4773, + "step": 98200 + }, + { + "epoch": 23.97, + "learning_rate": 0.0003806633276325434, + "loss": 0.5166, + "step": 98225 + }, + { + "epoch": 23.98, + "learning_rate": 0.0003806327876862937, + "loss": 0.4357, + "step": 98250 + }, + { + "epoch": 23.98, + "learning_rate": 0.000380602247740044, + "loss": 0.5099, + "step": 98275 + }, + { + "epoch": 23.99, + "learning_rate": 0.0003805717077937943, + "loss": 0.4399, + "step": 98300 + }, + { + "epoch": 23.99, + "learning_rate": 0.0003805411678475446, + "loss": 0.4911, + "step": 98325 + }, + { + "epoch": 24.0, + "learning_rate": 0.00038051062790129495, + "loss": 0.4196, + "step": 98350 + }, + { + "epoch": 24.01, + "learning_rate": 0.0003804800879550452, + "loss": 0.5231, + "step": 98375 + }, + { + "epoch": 24.01, + "learning_rate": 0.0003804495480087955, + "loss": 0.4501, + "step": 98400 + }, + { + "epoch": 24.02, + "learning_rate": 0.0003804190080625458, + "loss": 0.4743, + "step": 98425 + }, + { + "epoch": 24.02, + "learning_rate": 0.0003803884681162961, + "loss": 0.4069, + "step": 98450 + }, + { + "epoch": 24.03, + "learning_rate": 0.00038035792817004647, + "loss": 0.4805, + "step": 98475 + }, + { + "epoch": 24.04, + "learning_rate": 0.00038032738822379677, + "loss": 0.4623, + "step": 98500 + }, + { + "epoch": 24.04, + "learning_rate": 0.000380296848277547, + "loss": 0.5046, + "step": 98525 + }, + { + "epoch": 24.05, + "learning_rate": 0.0003802663083312973, + "loss": 0.4241, + "step": 98550 + }, + { + "epoch": 24.05, + "learning_rate": 0.0003802357683850476, + "loss": 0.4994, + "step": 98575 + }, + { + "epoch": 24.06, + "learning_rate": 0.00038020522843879793, + "loss": 0.4444, + "step": 98600 + }, + { + "epoch": 24.07, + "learning_rate": 0.0003801746884925483, + "loss": 0.495, + "step": 98625 + }, + { + "epoch": 24.07, + "learning_rate": 0.0003801441485462986, + "loss": 0.4386, + "step": 98650 + }, + { + "epoch": 24.08, + "learning_rate": 0.0003801136086000489, + "loss": 0.4757, + "step": 98675 + }, + { + "epoch": 24.08, + "learning_rate": 0.00038008306865379914, + "loss": 0.4466, + "step": 98700 + }, + { + "epoch": 24.09, + "learning_rate": 0.00038005252870754945, + "loss": 0.4837, + "step": 98725 + }, + { + "epoch": 24.1, + "learning_rate": 0.0003800219887612998, + "loss": 0.4318, + "step": 98750 + }, + { + "epoch": 24.1, + "learning_rate": 0.0003799914488150501, + "loss": 0.4878, + "step": 98775 + }, + { + "epoch": 24.11, + "learning_rate": 0.0003799621304666504, + "loss": 0.4346, + "step": 98800 + }, + { + "epoch": 24.12, + "learning_rate": 0.0003799315905204007, + "loss": 0.5095, + "step": 98825 + }, + { + "epoch": 24.12, + "learning_rate": 0.00037990105057415097, + "loss": 0.4116, + "step": 98850 + }, + { + "epoch": 24.13, + "learning_rate": 0.00037987051062790127, + "loss": 0.4906, + "step": 98875 + }, + { + "epoch": 24.13, + "learning_rate": 0.00037983997068165163, + "loss": 0.4252, + "step": 98900 + }, + { + "epoch": 24.14, + "learning_rate": 0.00037980943073540193, + "loss": 0.5012, + "step": 98925 + }, + { + "epoch": 24.15, + "learning_rate": 0.00037977889078915223, + "loss": 0.4239, + "step": 98950 + }, + { + "epoch": 24.15, + "learning_rate": 0.00037974835084290254, + "loss": 0.4926, + "step": 98975 + }, + { + "epoch": 24.16, + "learning_rate": 0.0003797178108966528, + "loss": 0.3624, + "step": 99000 + }, + { + "epoch": 24.16, + "eval_cer": 0.10784575423754915, + "eval_loss": 0.4347018301486969, + "eval_runtime": 148.8009, + "eval_samples_per_second": 28.179, + "eval_steps_per_second": 7.05, + "eval_wer": 0.4436541598694943, + "step": 99000 + }, + { + "epoch": 24.16, + "learning_rate": 0.00037968727095040314, + "loss": 0.5116, + "step": 99025 + }, + { + "epoch": 24.17, + "learning_rate": 0.00037965673100415345, + "loss": 0.4564, + "step": 99050 + }, + { + "epoch": 24.18, + "learning_rate": 0.00037962619105790375, + "loss": 0.4854, + "step": 99075 + }, + { + "epoch": 24.18, + "learning_rate": 0.00037959565111165405, + "loss": 0.4459, + "step": 99100 + }, + { + "epoch": 24.19, + "learning_rate": 0.00037956511116540436, + "loss": 0.5061, + "step": 99125 + }, + { + "epoch": 24.19, + "learning_rate": 0.0003795345712191547, + "loss": 0.4437, + "step": 99150 + }, + { + "epoch": 24.2, + "learning_rate": 0.00037950403127290496, + "loss": 0.4884, + "step": 99175 + }, + { + "epoch": 24.21, + "learning_rate": 0.00037947349132665527, + "loss": 0.4645, + "step": 99200 + }, + { + "epoch": 24.21, + "learning_rate": 0.00037944295138040557, + "loss": 0.4735, + "step": 99225 + }, + { + "epoch": 24.22, + "learning_rate": 0.0003794124114341559, + "loss": 0.4911, + "step": 99250 + }, + { + "epoch": 24.23, + "learning_rate": 0.0003793818714879062, + "loss": 0.5021, + "step": 99275 + }, + { + "epoch": 24.23, + "learning_rate": 0.00037935133154165654, + "loss": 0.4534, + "step": 99300 + }, + { + "epoch": 24.24, + "learning_rate": 0.0003793207915954068, + "loss": 0.4726, + "step": 99325 + }, + { + "epoch": 24.24, + "learning_rate": 0.0003792902516491571, + "loss": 0.4014, + "step": 99350 + }, + { + "epoch": 24.25, + "learning_rate": 0.0003792597117029074, + "loss": 0.4678, + "step": 99375 + }, + { + "epoch": 24.26, + "learning_rate": 0.0003792291717566577, + "loss": 0.3988, + "step": 99400 + }, + { + "epoch": 24.26, + "learning_rate": 0.00037919863181040805, + "loss": 0.4794, + "step": 99425 + }, + { + "epoch": 24.27, + "learning_rate": 0.00037916809186415836, + "loss": 0.4524, + "step": 99450 + }, + { + "epoch": 24.27, + "learning_rate": 0.0003791375519179086, + "loss": 0.4803, + "step": 99475 + }, + { + "epoch": 24.28, + "learning_rate": 0.0003791070119716589, + "loss": 0.4655, + "step": 99500 + }, + { + "epoch": 24.29, + "learning_rate": 0.0003790764720254092, + "loss": 0.4993, + "step": 99525 + }, + { + "epoch": 24.29, + "learning_rate": 0.00037904593207915957, + "loss": 0.4255, + "step": 99550 + }, + { + "epoch": 24.3, + "learning_rate": 0.00037901539213290987, + "loss": 0.4846, + "step": 99575 + }, + { + "epoch": 24.3, + "learning_rate": 0.0003789848521866602, + "loss": 0.4249, + "step": 99600 + }, + { + "epoch": 24.31, + "learning_rate": 0.0003789543122404104, + "loss": 0.5019, + "step": 99625 + }, + { + "epoch": 24.32, + "learning_rate": 0.00037892377229416073, + "loss": 0.4535, + "step": 99650 + }, + { + "epoch": 24.32, + "learning_rate": 0.0003788932323479111, + "loss": 0.4661, + "step": 99675 + }, + { + "epoch": 24.33, + "learning_rate": 0.0003788626924016614, + "loss": 0.4599, + "step": 99700 + }, + { + "epoch": 24.34, + "learning_rate": 0.0003788321524554117, + "loss": 0.4824, + "step": 99725 + }, + { + "epoch": 24.34, + "learning_rate": 0.000378801612509162, + "loss": 0.4772, + "step": 99750 + }, + { + "epoch": 24.35, + "learning_rate": 0.0003787710725629123, + "loss": 0.5119, + "step": 99775 + }, + { + "epoch": 24.35, + "learning_rate": 0.0003787405326166626, + "loss": 0.4115, + "step": 99800 + }, + { + "epoch": 24.36, + "learning_rate": 0.0003787099926704129, + "loss": 0.4619, + "step": 99825 + }, + { + "epoch": 24.37, + "learning_rate": 0.0003786794527241632, + "loss": 0.4373, + "step": 99850 + }, + { + "epoch": 24.37, + "learning_rate": 0.0003786489127779135, + "loss": 0.473, + "step": 99875 + }, + { + "epoch": 24.38, + "learning_rate": 0.0003786183728316638, + "loss": 0.4698, + "step": 99900 + }, + { + "epoch": 24.38, + "learning_rate": 0.0003785878328854142, + "loss": 0.5249, + "step": 99925 + }, + { + "epoch": 24.39, + "learning_rate": 0.0003785572929391644, + "loss": 0.4278, + "step": 99950 + }, + { + "epoch": 24.4, + "learning_rate": 0.0003785267529929147, + "loss": 0.5147, + "step": 99975 + }, + { + "epoch": 24.4, + "learning_rate": 0.00037849621304666503, + "loss": 0.4447, + "step": 100000 + }, + { + "epoch": 24.41, + "learning_rate": 0.00037846567310041533, + "loss": 0.4606, + "step": 100025 + }, + { + "epoch": 24.41, + "learning_rate": 0.0003784351331541657, + "loss": 0.4419, + "step": 100050 + }, + { + "epoch": 24.42, + "learning_rate": 0.000378404593207916, + "loss": 0.5273, + "step": 100075 + }, + { + "epoch": 24.43, + "learning_rate": 0.00037837405326166624, + "loss": 0.4586, + "step": 100100 + }, + { + "epoch": 24.43, + "learning_rate": 0.00037834351331541655, + "loss": 0.4693, + "step": 100125 + }, + { + "epoch": 24.44, + "learning_rate": 0.00037831297336916685, + "loss": 0.4369, + "step": 100150 + }, + { + "epoch": 24.44, + "learning_rate": 0.0003782824334229172, + "loss": 0.4678, + "step": 100175 + }, + { + "epoch": 24.45, + "learning_rate": 0.0003782518934766675, + "loss": 0.4281, + "step": 100200 + }, + { + "epoch": 24.46, + "learning_rate": 0.0003782213535304178, + "loss": 0.5052, + "step": 100225 + }, + { + "epoch": 24.46, + "learning_rate": 0.0003781908135841681, + "loss": 0.4302, + "step": 100250 + }, + { + "epoch": 24.47, + "learning_rate": 0.00037816027363791837, + "loss": 0.5099, + "step": 100275 + }, + { + "epoch": 24.48, + "learning_rate": 0.0003781297336916687, + "loss": 0.4803, + "step": 100300 + }, + { + "epoch": 24.48, + "learning_rate": 0.000378099193745419, + "loss": 0.465, + "step": 100325 + }, + { + "epoch": 24.49, + "learning_rate": 0.00037806865379916933, + "loss": 0.4174, + "step": 100350 + }, + { + "epoch": 24.49, + "learning_rate": 0.00037803811385291963, + "loss": 0.4863, + "step": 100375 + }, + { + "epoch": 24.5, + "learning_rate": 0.00037800757390666994, + "loss": 0.4603, + "step": 100400 + }, + { + "epoch": 24.51, + "learning_rate": 0.00037797703396042024, + "loss": 0.4693, + "step": 100425 + }, + { + "epoch": 24.51, + "learning_rate": 0.00037794649401417054, + "loss": 0.4687, + "step": 100450 + }, + { + "epoch": 24.52, + "learning_rate": 0.00037791595406792085, + "loss": 0.4858, + "step": 100475 + }, + { + "epoch": 24.52, + "learning_rate": 0.00037788541412167115, + "loss": 0.4145, + "step": 100500 + }, + { + "epoch": 24.53, + "learning_rate": 0.00037785487417542145, + "loss": 0.5032, + "step": 100525 + }, + { + "epoch": 24.54, + "learning_rate": 0.0003778243342291718, + "loss": 0.4617, + "step": 100550 + }, + { + "epoch": 24.54, + "learning_rate": 0.00037779379428292206, + "loss": 0.479, + "step": 100575 + }, + { + "epoch": 24.55, + "learning_rate": 0.00037776325433667236, + "loss": 0.4391, + "step": 100600 + }, + { + "epoch": 24.55, + "learning_rate": 0.00037773271439042267, + "loss": 0.4667, + "step": 100625 + }, + { + "epoch": 24.56, + "learning_rate": 0.00037770217444417297, + "loss": 0.4343, + "step": 100650 + }, + { + "epoch": 24.57, + "learning_rate": 0.0003776716344979233, + "loss": 0.5094, + "step": 100675 + }, + { + "epoch": 24.57, + "learning_rate": 0.00037764109455167363, + "loss": 0.4378, + "step": 100700 + }, + { + "epoch": 24.58, + "learning_rate": 0.00037761055460542393, + "loss": 0.4847, + "step": 100725 + }, + { + "epoch": 24.59, + "learning_rate": 0.0003775800146591742, + "loss": 0.486, + "step": 100750 + }, + { + "epoch": 24.59, + "learning_rate": 0.0003775494747129245, + "loss": 0.4984, + "step": 100775 + }, + { + "epoch": 24.6, + "learning_rate": 0.0003775189347666748, + "loss": 0.4548, + "step": 100800 + }, + { + "epoch": 24.6, + "learning_rate": 0.00037748839482042515, + "loss": 0.4844, + "step": 100825 + }, + { + "epoch": 24.61, + "learning_rate": 0.00037745785487417545, + "loss": 0.4017, + "step": 100850 + }, + { + "epoch": 24.62, + "learning_rate": 0.00037742731492792575, + "loss": 0.5021, + "step": 100875 + }, + { + "epoch": 24.62, + "learning_rate": 0.000377396774981676, + "loss": 0.4189, + "step": 100900 + }, + { + "epoch": 24.63, + "learning_rate": 0.0003773662350354263, + "loss": 0.4647, + "step": 100925 + }, + { + "epoch": 24.63, + "learning_rate": 0.00037733569508917666, + "loss": 0.4269, + "step": 100950 + }, + { + "epoch": 24.64, + "learning_rate": 0.00037730515514292697, + "loss": 0.5024, + "step": 100975 + }, + { + "epoch": 24.65, + "learning_rate": 0.00037727461519667727, + "loss": 0.4887, + "step": 101000 + }, + { + "epoch": 24.65, + "learning_rate": 0.0003772440752504276, + "loss": 0.5028, + "step": 101025 + }, + { + "epoch": 24.66, + "learning_rate": 0.0003772135353041778, + "loss": 0.4119, + "step": 101050 + }, + { + "epoch": 24.66, + "learning_rate": 0.0003771829953579282, + "loss": 0.5086, + "step": 101075 + }, + { + "epoch": 24.67, + "learning_rate": 0.0003771524554116785, + "loss": 0.4606, + "step": 101100 + }, + { + "epoch": 24.68, + "learning_rate": 0.0003771219154654288, + "loss": 0.5296, + "step": 101125 + }, + { + "epoch": 24.68, + "learning_rate": 0.0003770913755191791, + "loss": 0.4198, + "step": 101150 + }, + { + "epoch": 24.69, + "learning_rate": 0.0003770608355729294, + "loss": 0.5104, + "step": 101175 + }, + { + "epoch": 24.69, + "learning_rate": 0.00037703029562667975, + "loss": 0.4763, + "step": 101200 + }, + { + "epoch": 24.7, + "learning_rate": 0.00037699975568043, + "loss": 0.4919, + "step": 101225 + }, + { + "epoch": 24.71, + "learning_rate": 0.0003769692157341803, + "loss": 0.4559, + "step": 101250 + }, + { + "epoch": 24.71, + "learning_rate": 0.0003769386757879306, + "loss": 0.4789, + "step": 101275 + }, + { + "epoch": 24.72, + "learning_rate": 0.0003769081358416809, + "loss": 0.3941, + "step": 101300 + }, + { + "epoch": 24.73, + "learning_rate": 0.00037687759589543127, + "loss": 0.4652, + "step": 101325 + }, + { + "epoch": 24.73, + "learning_rate": 0.00037684705594918157, + "loss": 0.4512, + "step": 101350 + }, + { + "epoch": 24.74, + "learning_rate": 0.0003768165160029318, + "loss": 0.5269, + "step": 101375 + }, + { + "epoch": 24.74, + "learning_rate": 0.0003767859760566821, + "loss": 0.4127, + "step": 101400 + }, + { + "epoch": 24.75, + "learning_rate": 0.00037675543611043243, + "loss": 0.5224, + "step": 101425 + }, + { + "epoch": 24.76, + "learning_rate": 0.0003767248961641828, + "loss": 0.4827, + "step": 101450 + }, + { + "epoch": 24.76, + "learning_rate": 0.0003766943562179331, + "loss": 0.5129, + "step": 101475 + }, + { + "epoch": 24.77, + "learning_rate": 0.0003766638162716834, + "loss": 0.4572, + "step": 101500 + }, + { + "epoch": 24.77, + "learning_rate": 0.00037663327632543364, + "loss": 0.4873, + "step": 101525 + }, + { + "epoch": 24.78, + "learning_rate": 0.00037660273637918395, + "loss": 0.4274, + "step": 101550 + }, + { + "epoch": 24.79, + "learning_rate": 0.0003765721964329343, + "loss": 0.4658, + "step": 101575 + }, + { + "epoch": 24.79, + "learning_rate": 0.0003765416564866846, + "loss": 0.4689, + "step": 101600 + }, + { + "epoch": 24.8, + "learning_rate": 0.0003765111165404349, + "loss": 0.4879, + "step": 101625 + }, + { + "epoch": 24.8, + "learning_rate": 0.0003764805765941852, + "loss": 0.452, + "step": 101650 + }, + { + "epoch": 24.81, + "learning_rate": 0.0003764500366479355, + "loss": 0.5189, + "step": 101675 + }, + { + "epoch": 24.82, + "learning_rate": 0.0003764194967016858, + "loss": 0.4351, + "step": 101700 + }, + { + "epoch": 24.82, + "learning_rate": 0.0003763889567554361, + "loss": 0.5103, + "step": 101725 + }, + { + "epoch": 24.83, + "learning_rate": 0.0003763584168091864, + "loss": 0.4763, + "step": 101750 + }, + { + "epoch": 24.84, + "learning_rate": 0.00037632787686293673, + "loss": 0.4859, + "step": 101775 + }, + { + "epoch": 24.84, + "learning_rate": 0.00037629733691668703, + "loss": 0.4515, + "step": 101800 + }, + { + "epoch": 24.85, + "learning_rate": 0.0003762667969704374, + "loss": 0.5135, + "step": 101825 + }, + { + "epoch": 24.85, + "learning_rate": 0.00037623625702418764, + "loss": 0.4947, + "step": 101850 + }, + { + "epoch": 24.86, + "learning_rate": 0.00037620571707793794, + "loss": 0.5274, + "step": 101875 + }, + { + "epoch": 24.87, + "learning_rate": 0.00037617517713168825, + "loss": 0.4772, + "step": 101900 + }, + { + "epoch": 24.87, + "learning_rate": 0.00037614463718543855, + "loss": 0.4879, + "step": 101925 + }, + { + "epoch": 24.88, + "learning_rate": 0.00037611531883703886, + "loss": 0.3944, + "step": 101950 + }, + { + "epoch": 24.88, + "learning_rate": 0.00037608477889078916, + "loss": 0.4763, + "step": 101975 + }, + { + "epoch": 24.89, + "learning_rate": 0.00037605423894453946, + "loss": 0.4512, + "step": 102000 + }, + { + "epoch": 24.89, + "eval_cer": 0.1102122111228607, + "eval_loss": 0.4270845651626587, + "eval_runtime": 147.9389, + "eval_samples_per_second": 28.343, + "eval_steps_per_second": 7.091, + "eval_wer": 0.4470799347471452, + "step": 102000 + }, + { + "epoch": 24.9, + "learning_rate": 0.00037602369899828977, + "loss": 0.475, + "step": 102025 + }, + { + "epoch": 24.9, + "learning_rate": 0.00037599315905204007, + "loss": 0.4679, + "step": 102050 + }, + { + "epoch": 24.91, + "learning_rate": 0.00037596261910579037, + "loss": 0.4831, + "step": 102075 + }, + { + "epoch": 24.91, + "learning_rate": 0.0003759320791595407, + "loss": 0.4822, + "step": 102100 + }, + { + "epoch": 24.92, + "learning_rate": 0.00037590153921329103, + "loss": 0.4793, + "step": 102125 + }, + { + "epoch": 24.93, + "learning_rate": 0.00037587099926704134, + "loss": 0.4366, + "step": 102150 + }, + { + "epoch": 24.93, + "learning_rate": 0.0003758404593207916, + "loss": 0.4796, + "step": 102175 + }, + { + "epoch": 24.94, + "learning_rate": 0.0003758099193745419, + "loss": 0.4369, + "step": 102200 + }, + { + "epoch": 24.95, + "learning_rate": 0.0003757793794282922, + "loss": 0.4931, + "step": 102225 + }, + { + "epoch": 24.95, + "learning_rate": 0.00037574883948204255, + "loss": 0.446, + "step": 102250 + }, + { + "epoch": 24.96, + "learning_rate": 0.00037571829953579285, + "loss": 0.5142, + "step": 102275 + }, + { + "epoch": 24.96, + "learning_rate": 0.00037568775958954316, + "loss": 0.4343, + "step": 102300 + }, + { + "epoch": 24.97, + "learning_rate": 0.0003756572196432934, + "loss": 0.4518, + "step": 102325 + }, + { + "epoch": 24.98, + "learning_rate": 0.0003756266796970437, + "loss": 0.4916, + "step": 102350 + }, + { + "epoch": 24.98, + "learning_rate": 0.00037559613975079407, + "loss": 0.494, + "step": 102375 + }, + { + "epoch": 24.99, + "learning_rate": 0.00037556559980454437, + "loss": 0.4307, + "step": 102400 + }, + { + "epoch": 24.99, + "learning_rate": 0.0003755350598582947, + "loss": 0.4706, + "step": 102425 + }, + { + "epoch": 25.0, + "learning_rate": 0.000375504519912045, + "loss": 0.4222, + "step": 102450 + }, + { + "epoch": 25.01, + "learning_rate": 0.0003754739799657952, + "loss": 0.4631, + "step": 102475 + }, + { + "epoch": 25.01, + "learning_rate": 0.0003754434400195456, + "loss": 0.4621, + "step": 102500 + }, + { + "epoch": 25.02, + "learning_rate": 0.0003754129000732959, + "loss": 0.4992, + "step": 102525 + }, + { + "epoch": 25.02, + "learning_rate": 0.0003753823601270462, + "loss": 0.3952, + "step": 102550 + }, + { + "epoch": 25.03, + "learning_rate": 0.0003753518201807965, + "loss": 0.4637, + "step": 102575 + }, + { + "epoch": 25.04, + "learning_rate": 0.0003753212802345468, + "loss": 0.4229, + "step": 102600 + }, + { + "epoch": 25.04, + "learning_rate": 0.00037529074028829715, + "loss": 0.4872, + "step": 102625 + }, + { + "epoch": 25.05, + "learning_rate": 0.0003752602003420474, + "loss": 0.4627, + "step": 102650 + }, + { + "epoch": 25.05, + "learning_rate": 0.0003752296603957977, + "loss": 0.4823, + "step": 102675 + }, + { + "epoch": 25.06, + "learning_rate": 0.000375199120449548, + "loss": 0.4422, + "step": 102700 + }, + { + "epoch": 25.07, + "learning_rate": 0.0003751685805032983, + "loss": 0.4868, + "step": 102725 + }, + { + "epoch": 25.07, + "learning_rate": 0.0003751380405570486, + "loss": 0.4075, + "step": 102750 + }, + { + "epoch": 25.08, + "learning_rate": 0.000375107500610799, + "loss": 0.5041, + "step": 102775 + }, + { + "epoch": 25.09, + "learning_rate": 0.0003750769606645492, + "loss": 0.4685, + "step": 102800 + }, + { + "epoch": 25.09, + "learning_rate": 0.00037504642071829953, + "loss": 0.424, + "step": 102825 + }, + { + "epoch": 25.1, + "learning_rate": 0.00037501588077204983, + "loss": 0.4336, + "step": 102850 + }, + { + "epoch": 25.1, + "learning_rate": 0.00037498534082580013, + "loss": 0.4604, + "step": 102875 + }, + { + "epoch": 25.11, + "learning_rate": 0.0003749548008795505, + "loss": 0.4349, + "step": 102900 + }, + { + "epoch": 25.12, + "learning_rate": 0.0003749242609333008, + "loss": 0.4693, + "step": 102925 + }, + { + "epoch": 25.12, + "learning_rate": 0.00037489372098705104, + "loss": 0.4401, + "step": 102950 + }, + { + "epoch": 25.13, + "learning_rate": 0.00037486318104080135, + "loss": 0.4709, + "step": 102975 + }, + { + "epoch": 25.13, + "learning_rate": 0.00037483264109455165, + "loss": 0.4279, + "step": 103000 + }, + { + "epoch": 25.14, + "learning_rate": 0.000374802101148302, + "loss": 0.4952, + "step": 103025 + }, + { + "epoch": 25.15, + "learning_rate": 0.0003747715612020523, + "loss": 0.4015, + "step": 103050 + }, + { + "epoch": 25.15, + "learning_rate": 0.0003747410212558026, + "loss": 0.4887, + "step": 103075 + }, + { + "epoch": 25.16, + "learning_rate": 0.00037471048130955286, + "loss": 0.4545, + "step": 103100 + }, + { + "epoch": 25.16, + "learning_rate": 0.00037467994136330317, + "loss": 0.4596, + "step": 103125 + }, + { + "epoch": 25.17, + "learning_rate": 0.0003746494014170535, + "loss": 0.4146, + "step": 103150 + }, + { + "epoch": 25.18, + "learning_rate": 0.00037461886147080383, + "loss": 0.4797, + "step": 103175 + }, + { + "epoch": 25.18, + "learning_rate": 0.00037458832152455413, + "loss": 0.4724, + "step": 103200 + }, + { + "epoch": 25.19, + "learning_rate": 0.00037455778157830443, + "loss": 0.5207, + "step": 103225 + }, + { + "epoch": 25.2, + "learning_rate": 0.00037452724163205474, + "loss": 0.4235, + "step": 103250 + }, + { + "epoch": 25.2, + "learning_rate": 0.00037449670168580504, + "loss": 0.5035, + "step": 103275 + }, + { + "epoch": 25.21, + "learning_rate": 0.00037446616173955534, + "loss": 0.4209, + "step": 103300 + }, + { + "epoch": 25.21, + "learning_rate": 0.00037443562179330565, + "loss": 0.4922, + "step": 103325 + }, + { + "epoch": 25.22, + "learning_rate": 0.00037440508184705595, + "loss": 0.4448, + "step": 103350 + }, + { + "epoch": 25.23, + "learning_rate": 0.00037437454190080626, + "loss": 0.473, + "step": 103375 + }, + { + "epoch": 25.23, + "learning_rate": 0.0003743440019545566, + "loss": 0.4392, + "step": 103400 + }, + { + "epoch": 25.24, + "learning_rate": 0.00037431346200830686, + "loss": 0.466, + "step": 103425 + }, + { + "epoch": 25.24, + "learning_rate": 0.00037428292206205717, + "loss": 0.4162, + "step": 103450 + }, + { + "epoch": 25.25, + "learning_rate": 0.00037425238211580747, + "loss": 0.472, + "step": 103475 + }, + { + "epoch": 25.26, + "learning_rate": 0.00037422184216955777, + "loss": 0.4314, + "step": 103500 + }, + { + "epoch": 25.26, + "learning_rate": 0.00037419130222330813, + "loss": 0.4779, + "step": 103525 + }, + { + "epoch": 25.27, + "learning_rate": 0.00037416076227705843, + "loss": 0.4327, + "step": 103550 + }, + { + "epoch": 25.27, + "learning_rate": 0.0003741302223308087, + "loss": 0.4718, + "step": 103575 + }, + { + "epoch": 25.28, + "learning_rate": 0.000374099682384559, + "loss": 0.4607, + "step": 103600 + }, + { + "epoch": 25.29, + "learning_rate": 0.0003740691424383093, + "loss": 0.4718, + "step": 103625 + }, + { + "epoch": 25.29, + "learning_rate": 0.00037403860249205965, + "loss": 0.385, + "step": 103650 + }, + { + "epoch": 25.3, + "learning_rate": 0.00037400806254580995, + "loss": 0.448, + "step": 103675 + }, + { + "epoch": 25.31, + "learning_rate": 0.00037397752259956025, + "loss": 0.4499, + "step": 103700 + }, + { + "epoch": 25.31, + "learning_rate": 0.00037394698265331056, + "loss": 0.481, + "step": 103725 + }, + { + "epoch": 25.32, + "learning_rate": 0.0003739164427070608, + "loss": 0.3851, + "step": 103750 + }, + { + "epoch": 25.32, + "learning_rate": 0.00037388590276081116, + "loss": 0.4922, + "step": 103775 + }, + { + "epoch": 25.33, + "learning_rate": 0.0003738565844124114, + "loss": 0.4214, + "step": 103800 + }, + { + "epoch": 25.34, + "learning_rate": 0.00037382604446616177, + "loss": 0.4982, + "step": 103825 + }, + { + "epoch": 25.34, + "learning_rate": 0.0003737955045199121, + "loss": 0.4485, + "step": 103850 + }, + { + "epoch": 25.35, + "learning_rate": 0.0003737649645736624, + "loss": 0.4842, + "step": 103875 + }, + { + "epoch": 25.35, + "learning_rate": 0.00037373442462741263, + "loss": 0.4432, + "step": 103900 + }, + { + "epoch": 25.36, + "learning_rate": 0.00037370388468116293, + "loss": 0.4599, + "step": 103925 + }, + { + "epoch": 25.37, + "learning_rate": 0.0003736733447349133, + "loss": 0.456, + "step": 103950 + }, + { + "epoch": 25.37, + "learning_rate": 0.0003736428047886636, + "loss": 0.4892, + "step": 103975 + }, + { + "epoch": 25.38, + "learning_rate": 0.0003736122648424139, + "loss": 0.428, + "step": 104000 + }, + { + "epoch": 25.38, + "learning_rate": 0.0003735817248961642, + "loss": 0.4879, + "step": 104025 + }, + { + "epoch": 25.39, + "learning_rate": 0.00037355118494991445, + "loss": 0.4605, + "step": 104050 + }, + { + "epoch": 25.4, + "learning_rate": 0.0003735206450036648, + "loss": 0.4768, + "step": 104075 + }, + { + "epoch": 25.4, + "learning_rate": 0.0003734901050574151, + "loss": 0.4498, + "step": 104100 + }, + { + "epoch": 25.41, + "learning_rate": 0.0003734595651111654, + "loss": 0.4897, + "step": 104125 + }, + { + "epoch": 25.41, + "learning_rate": 0.0003734290251649157, + "loss": 0.4544, + "step": 104150 + }, + { + "epoch": 25.42, + "learning_rate": 0.000373398485218666, + "loss": 0.5028, + "step": 104175 + }, + { + "epoch": 25.43, + "learning_rate": 0.0003733679452724164, + "loss": 0.3967, + "step": 104200 + }, + { + "epoch": 25.43, + "learning_rate": 0.0003733374053261666, + "loss": 0.4598, + "step": 104225 + }, + { + "epoch": 25.44, + "learning_rate": 0.00037330686537991693, + "loss": 0.4726, + "step": 104250 + }, + { + "epoch": 25.45, + "learning_rate": 0.00037327632543366723, + "loss": 0.4783, + "step": 104275 + }, + { + "epoch": 25.45, + "learning_rate": 0.00037324578548741754, + "loss": 0.3883, + "step": 104300 + }, + { + "epoch": 25.46, + "learning_rate": 0.0003732152455411679, + "loss": 0.4943, + "step": 104325 + }, + { + "epoch": 25.46, + "learning_rate": 0.0003731847055949182, + "loss": 0.4262, + "step": 104350 + }, + { + "epoch": 25.47, + "learning_rate": 0.00037315416564866845, + "loss": 0.5044, + "step": 104375 + }, + { + "epoch": 25.48, + "learning_rate": 0.00037312362570241875, + "loss": 0.4264, + "step": 104400 + }, + { + "epoch": 25.48, + "learning_rate": 0.00037309308575616905, + "loss": 0.4692, + "step": 104425 + }, + { + "epoch": 25.49, + "learning_rate": 0.0003730625458099194, + "loss": 0.4578, + "step": 104450 + }, + { + "epoch": 25.49, + "learning_rate": 0.0003730320058636697, + "loss": 0.4825, + "step": 104475 + }, + { + "epoch": 25.5, + "learning_rate": 0.00037300146591742, + "loss": 0.472, + "step": 104500 + }, + { + "epoch": 25.51, + "learning_rate": 0.00037297092597117027, + "loss": 0.5078, + "step": 104525 + }, + { + "epoch": 25.51, + "learning_rate": 0.00037294038602492057, + "loss": 0.38, + "step": 104550 + }, + { + "epoch": 25.52, + "learning_rate": 0.0003729098460786709, + "loss": 0.4674, + "step": 104575 + }, + { + "epoch": 25.52, + "learning_rate": 0.00037287930613242123, + "loss": 0.428, + "step": 104600 + }, + { + "epoch": 25.53, + "learning_rate": 0.00037284876618617153, + "loss": 0.47, + "step": 104625 + }, + { + "epoch": 25.54, + "learning_rate": 0.00037281822623992184, + "loss": 0.403, + "step": 104650 + }, + { + "epoch": 25.54, + "learning_rate": 0.00037278768629367214, + "loss": 0.476, + "step": 104675 + }, + { + "epoch": 25.55, + "learning_rate": 0.0003727571463474224, + "loss": 0.433, + "step": 104700 + }, + { + "epoch": 25.56, + "learning_rate": 0.00037272660640117275, + "loss": 0.4434, + "step": 104725 + }, + { + "epoch": 25.56, + "learning_rate": 0.00037269606645492305, + "loss": 0.4667, + "step": 104750 + }, + { + "epoch": 25.57, + "learning_rate": 0.00037266552650867335, + "loss": 0.4814, + "step": 104775 + }, + { + "epoch": 25.57, + "learning_rate": 0.00037263498656242366, + "loss": 0.4665, + "step": 104800 + }, + { + "epoch": 25.58, + "learning_rate": 0.00037260444661617396, + "loss": 0.475, + "step": 104825 + }, + { + "epoch": 25.59, + "learning_rate": 0.00037257390666992426, + "loss": 0.4225, + "step": 104850 + }, + { + "epoch": 25.59, + "learning_rate": 0.00037254336672367457, + "loss": 0.5022, + "step": 104875 + }, + { + "epoch": 25.6, + "learning_rate": 0.00037251282677742487, + "loss": 0.396, + "step": 104900 + }, + { + "epoch": 25.6, + "learning_rate": 0.0003724822868311752, + "loss": 0.4856, + "step": 104925 + }, + { + "epoch": 25.61, + "learning_rate": 0.0003724517468849255, + "loss": 0.4229, + "step": 104950 + }, + { + "epoch": 25.62, + "learning_rate": 0.00037242120693867583, + "loss": 0.4621, + "step": 104975 + }, + { + "epoch": 25.62, + "learning_rate": 0.0003723906669924261, + "loss": 0.4049, + "step": 105000 + }, + { + "epoch": 25.62, + "eval_cer": 0.10712195722924345, + "eval_loss": 0.42072468996047974, + "eval_runtime": 147.7106, + "eval_samples_per_second": 28.387, + "eval_steps_per_second": 7.102, + "eval_wer": 0.43494290375203915, + "step": 105000 + }, + { + "epoch": 25.63, + "learning_rate": 0.0003723601270461764, + "loss": 0.465, + "step": 105025 + }, + { + "epoch": 25.63, + "learning_rate": 0.0003723295870999267, + "loss": 0.4088, + "step": 105050 + }, + { + "epoch": 25.64, + "learning_rate": 0.000372299047153677, + "loss": 0.4739, + "step": 105075 + }, + { + "epoch": 25.65, + "learning_rate": 0.00037226850720742735, + "loss": 0.4535, + "step": 105100 + }, + { + "epoch": 25.65, + "learning_rate": 0.00037223796726117765, + "loss": 0.4836, + "step": 105125 + }, + { + "epoch": 25.66, + "learning_rate": 0.00037220742731492796, + "loss": 0.4339, + "step": 105150 + }, + { + "epoch": 25.66, + "learning_rate": 0.0003721768873686782, + "loss": 0.4807, + "step": 105175 + }, + { + "epoch": 25.67, + "learning_rate": 0.0003721463474224285, + "loss": 0.3848, + "step": 105200 + }, + { + "epoch": 25.68, + "learning_rate": 0.00037211580747617887, + "loss": 0.488, + "step": 105225 + }, + { + "epoch": 25.68, + "learning_rate": 0.00037208526752992917, + "loss": 0.4458, + "step": 105250 + }, + { + "epoch": 25.69, + "learning_rate": 0.0003720547275836795, + "loss": 0.4587, + "step": 105275 + }, + { + "epoch": 25.7, + "learning_rate": 0.0003720241876374298, + "loss": 0.4346, + "step": 105300 + }, + { + "epoch": 25.7, + "learning_rate": 0.00037199364769118003, + "loss": 0.505, + "step": 105325 + }, + { + "epoch": 25.71, + "learning_rate": 0.0003719631077449304, + "loss": 0.4108, + "step": 105350 + }, + { + "epoch": 25.71, + "learning_rate": 0.0003719325677986807, + "loss": 0.4868, + "step": 105375 + }, + { + "epoch": 25.72, + "learning_rate": 0.000371902027852431, + "loss": 0.4004, + "step": 105400 + }, + { + "epoch": 25.73, + "learning_rate": 0.0003718714879061813, + "loss": 0.4812, + "step": 105425 + }, + { + "epoch": 25.73, + "learning_rate": 0.0003718409479599316, + "loss": 0.4186, + "step": 105450 + }, + { + "epoch": 25.74, + "learning_rate": 0.0003718104080136819, + "loss": 0.4643, + "step": 105475 + }, + { + "epoch": 25.74, + "learning_rate": 0.0003717798680674322, + "loss": 0.4142, + "step": 105500 + }, + { + "epoch": 25.75, + "learning_rate": 0.0003717493281211825, + "loss": 0.4678, + "step": 105525 + }, + { + "epoch": 25.76, + "learning_rate": 0.0003717187881749328, + "loss": 0.4754, + "step": 105550 + }, + { + "epoch": 25.76, + "learning_rate": 0.0003716882482286831, + "loss": 0.4888, + "step": 105575 + }, + { + "epoch": 25.77, + "learning_rate": 0.00037165770828243347, + "loss": 0.4401, + "step": 105600 + }, + { + "epoch": 25.77, + "learning_rate": 0.0003716271683361838, + "loss": 0.4438, + "step": 105625 + }, + { + "epoch": 25.78, + "learning_rate": 0.000371596628389934, + "loss": 0.3972, + "step": 105650 + }, + { + "epoch": 25.79, + "learning_rate": 0.00037156608844368433, + "loss": 0.5188, + "step": 105675 + }, + { + "epoch": 25.79, + "learning_rate": 0.00037153554849743463, + "loss": 0.433, + "step": 105700 + }, + { + "epoch": 25.8, + "learning_rate": 0.000371505008551185, + "loss": 0.4854, + "step": 105725 + }, + { + "epoch": 25.81, + "learning_rate": 0.0003714744686049353, + "loss": 0.4058, + "step": 105750 + }, + { + "epoch": 25.81, + "learning_rate": 0.0003714439286586856, + "loss": 0.4883, + "step": 105775 + }, + { + "epoch": 25.82, + "learning_rate": 0.00037141338871243585, + "loss": 0.45, + "step": 105800 + }, + { + "epoch": 25.82, + "learning_rate": 0.00037138284876618615, + "loss": 0.4894, + "step": 105825 + }, + { + "epoch": 25.83, + "learning_rate": 0.0003713523088199365, + "loss": 0.4054, + "step": 105850 + }, + { + "epoch": 25.84, + "learning_rate": 0.0003713217688736868, + "loss": 0.484, + "step": 105875 + }, + { + "epoch": 25.84, + "learning_rate": 0.0003712912289274371, + "loss": 0.4124, + "step": 105900 + }, + { + "epoch": 25.85, + "learning_rate": 0.0003712606889811874, + "loss": 0.446, + "step": 105925 + }, + { + "epoch": 25.85, + "learning_rate": 0.00037123014903493767, + "loss": 0.4206, + "step": 105950 + }, + { + "epoch": 25.86, + "learning_rate": 0.00037119960908868797, + "loss": 0.4667, + "step": 105975 + }, + { + "epoch": 25.87, + "learning_rate": 0.0003711690691424383, + "loss": 0.4795, + "step": 106000 + }, + { + "epoch": 25.87, + "learning_rate": 0.00037113852919618863, + "loss": 0.4763, + "step": 106025 + }, + { + "epoch": 25.88, + "learning_rate": 0.00037110798924993893, + "loss": 0.4272, + "step": 106050 + }, + { + "epoch": 25.88, + "learning_rate": 0.00037107744930368924, + "loss": 0.4659, + "step": 106075 + }, + { + "epoch": 25.89, + "learning_rate": 0.00037104690935743954, + "loss": 0.439, + "step": 106100 + }, + { + "epoch": 25.9, + "learning_rate": 0.00037101636941118984, + "loss": 0.4927, + "step": 106125 + }, + { + "epoch": 25.9, + "learning_rate": 0.00037098582946494015, + "loss": 0.4184, + "step": 106150 + }, + { + "epoch": 25.91, + "learning_rate": 0.00037095528951869045, + "loss": 0.4802, + "step": 106175 + }, + { + "epoch": 25.92, + "learning_rate": 0.00037092474957244075, + "loss": 0.412, + "step": 106200 + }, + { + "epoch": 25.92, + "learning_rate": 0.00037089420962619106, + "loss": 0.5181, + "step": 106225 + }, + { + "epoch": 25.93, + "learning_rate": 0.0003708636696799414, + "loss": 0.4222, + "step": 106250 + }, + { + "epoch": 25.93, + "learning_rate": 0.00037083312973369166, + "loss": 0.4779, + "step": 106275 + }, + { + "epoch": 25.94, + "learning_rate": 0.00037080258978744197, + "loss": 0.4188, + "step": 106300 + }, + { + "epoch": 25.95, + "learning_rate": 0.00037077204984119227, + "loss": 0.4708, + "step": 106325 + }, + { + "epoch": 25.95, + "learning_rate": 0.0003707415098949426, + "loss": 0.4742, + "step": 106350 + }, + { + "epoch": 25.96, + "learning_rate": 0.00037071096994869293, + "loss": 0.4712, + "step": 106375 + }, + { + "epoch": 25.96, + "learning_rate": 0.00037068043000244323, + "loss": 0.4305, + "step": 106400 + }, + { + "epoch": 25.97, + "learning_rate": 0.0003706498900561935, + "loss": 0.4821, + "step": 106425 + }, + { + "epoch": 25.98, + "learning_rate": 0.0003706193501099438, + "loss": 0.4488, + "step": 106450 + }, + { + "epoch": 25.98, + "learning_rate": 0.0003705888101636941, + "loss": 0.4867, + "step": 106475 + }, + { + "epoch": 25.99, + "learning_rate": 0.00037055827021744445, + "loss": 0.3886, + "step": 106500 + }, + { + "epoch": 25.99, + "learning_rate": 0.00037052773027119475, + "loss": 0.4734, + "step": 106525 + }, + { + "epoch": 26.0, + "learning_rate": 0.00037049719032494505, + "loss": 0.4751, + "step": 106550 + }, + { + "epoch": 26.01, + "learning_rate": 0.0003704666503786953, + "loss": 0.4749, + "step": 106575 + }, + { + "epoch": 26.01, + "learning_rate": 0.0003704361104324456, + "loss": 0.4585, + "step": 106600 + }, + { + "epoch": 26.02, + "learning_rate": 0.00037040557048619596, + "loss": 0.4786, + "step": 106625 + }, + { + "epoch": 26.02, + "learning_rate": 0.00037037503053994627, + "loss": 0.4364, + "step": 106650 + }, + { + "epoch": 26.03, + "learning_rate": 0.00037034449059369657, + "loss": 0.4331, + "step": 106675 + }, + { + "epoch": 26.04, + "learning_rate": 0.0003703139506474469, + "loss": 0.4266, + "step": 106700 + }, + { + "epoch": 26.04, + "learning_rate": 0.0003702834107011972, + "loss": 0.4936, + "step": 106725 + }, + { + "epoch": 26.05, + "learning_rate": 0.0003702528707549475, + "loss": 0.3865, + "step": 106750 + }, + { + "epoch": 26.06, + "learning_rate": 0.0003702223308086978, + "loss": 0.4762, + "step": 106775 + }, + { + "epoch": 26.06, + "learning_rate": 0.0003701917908624481, + "loss": 0.4166, + "step": 106800 + }, + { + "epoch": 26.07, + "learning_rate": 0.0003701612509161984, + "loss": 0.4492, + "step": 106825 + }, + { + "epoch": 26.07, + "learning_rate": 0.0003701307109699487, + "loss": 0.4309, + "step": 106850 + }, + { + "epoch": 26.08, + "learning_rate": 0.00037010017102369905, + "loss": 0.4462, + "step": 106875 + }, + { + "epoch": 26.09, + "learning_rate": 0.0003700696310774493, + "loss": 0.4186, + "step": 106900 + }, + { + "epoch": 26.09, + "learning_rate": 0.0003700390911311996, + "loss": 0.4786, + "step": 106925 + }, + { + "epoch": 26.1, + "learning_rate": 0.0003700085511849499, + "loss": 0.4521, + "step": 106950 + }, + { + "epoch": 26.1, + "learning_rate": 0.0003699780112387002, + "loss": 0.466, + "step": 106975 + }, + { + "epoch": 26.11, + "learning_rate": 0.00036994747129245057, + "loss": 0.4263, + "step": 107000 + }, + { + "epoch": 26.12, + "learning_rate": 0.00036991693134620087, + "loss": 0.4895, + "step": 107025 + }, + { + "epoch": 26.12, + "learning_rate": 0.0003698863913999511, + "loss": 0.4347, + "step": 107050 + }, + { + "epoch": 26.13, + "learning_rate": 0.0003698558514537014, + "loss": 0.4321, + "step": 107075 + }, + { + "epoch": 26.13, + "learning_rate": 0.00036982531150745173, + "loss": 0.4198, + "step": 107100 + }, + { + "epoch": 26.14, + "learning_rate": 0.0003697947715612021, + "loss": 0.4793, + "step": 107125 + }, + { + "epoch": 26.15, + "learning_rate": 0.0003697642316149524, + "loss": 0.4299, + "step": 107150 + }, + { + "epoch": 26.15, + "learning_rate": 0.0003697336916687027, + "loss": 0.4252, + "step": 107175 + }, + { + "epoch": 26.16, + "learning_rate": 0.000369703151722453, + "loss": 0.4794, + "step": 107200 + }, + { + "epoch": 26.17, + "learning_rate": 0.00036967261177620324, + "loss": 0.4622, + "step": 107225 + }, + { + "epoch": 26.17, + "learning_rate": 0.00036964207182995355, + "loss": 0.3999, + "step": 107250 + }, + { + "epoch": 26.18, + "learning_rate": 0.0003696115318837039, + "loss": 0.4948, + "step": 107275 + }, + { + "epoch": 26.18, + "learning_rate": 0.0003695809919374542, + "loss": 0.4358, + "step": 107300 + }, + { + "epoch": 26.19, + "learning_rate": 0.0003695504519912045, + "loss": 0.4585, + "step": 107325 + }, + { + "epoch": 26.2, + "learning_rate": 0.0003695199120449548, + "loss": 0.4442, + "step": 107350 + }, + { + "epoch": 26.2, + "learning_rate": 0.00036948937209870506, + "loss": 0.457, + "step": 107375 + }, + { + "epoch": 26.21, + "learning_rate": 0.0003694588321524554, + "loss": 0.4335, + "step": 107400 + }, + { + "epoch": 26.21, + "learning_rate": 0.0003694282922062057, + "loss": 0.4654, + "step": 107425 + }, + { + "epoch": 26.22, + "learning_rate": 0.00036939775225995603, + "loss": 0.4224, + "step": 107450 + }, + { + "epoch": 26.23, + "learning_rate": 0.00036936721231370633, + "loss": 0.4256, + "step": 107475 + }, + { + "epoch": 26.23, + "learning_rate": 0.00036933667236745664, + "loss": 0.4323, + "step": 107500 + }, + { + "epoch": 26.24, + "learning_rate": 0.00036930613242120694, + "loss": 0.485, + "step": 107525 + }, + { + "epoch": 26.24, + "learning_rate": 0.00036927559247495724, + "loss": 0.3872, + "step": 107550 + }, + { + "epoch": 26.25, + "learning_rate": 0.00036924505252870755, + "loss": 0.4637, + "step": 107575 + }, + { + "epoch": 26.26, + "learning_rate": 0.00036921451258245785, + "loss": 0.4406, + "step": 107600 + }, + { + "epoch": 26.26, + "learning_rate": 0.00036918397263620815, + "loss": 0.4668, + "step": 107625 + }, + { + "epoch": 26.27, + "learning_rate": 0.0003691534326899585, + "loss": 0.4599, + "step": 107650 + }, + { + "epoch": 26.28, + "learning_rate": 0.0003691228927437088, + "loss": 0.4629, + "step": 107675 + }, + { + "epoch": 26.28, + "learning_rate": 0.00036909235279745906, + "loss": 0.427, + "step": 107700 + }, + { + "epoch": 26.29, + "learning_rate": 0.00036906181285120937, + "loss": 0.4687, + "step": 107725 + }, + { + "epoch": 26.29, + "learning_rate": 0.00036903127290495967, + "loss": 0.4723, + "step": 107750 + }, + { + "epoch": 26.3, + "learning_rate": 0.00036900073295871, + "loss": 0.4637, + "step": 107775 + }, + { + "epoch": 26.31, + "learning_rate": 0.00036897019301246033, + "loss": 0.3946, + "step": 107800 + }, + { + "epoch": 26.31, + "learning_rate": 0.00036893965306621063, + "loss": 0.5078, + "step": 107825 + }, + { + "epoch": 26.32, + "learning_rate": 0.0003689091131199609, + "loss": 0.4029, + "step": 107850 + }, + { + "epoch": 26.32, + "learning_rate": 0.0003688785731737112, + "loss": 0.4586, + "step": 107875 + }, + { + "epoch": 26.33, + "learning_rate": 0.00036884803322746154, + "loss": 0.4345, + "step": 107900 + }, + { + "epoch": 26.34, + "learning_rate": 0.00036881749328121185, + "loss": 0.4809, + "step": 107925 + }, + { + "epoch": 26.34, + "learning_rate": 0.00036878695333496215, + "loss": 0.4448, + "step": 107950 + }, + { + "epoch": 26.35, + "learning_rate": 0.00036875641338871245, + "loss": 0.4703, + "step": 107975 + }, + { + "epoch": 26.35, + "learning_rate": 0.0003687258734424627, + "loss": 0.4134, + "step": 108000 + }, + { + "epoch": 26.35, + "eval_cer": 0.1060593616213053, + "eval_loss": 0.43024691939353943, + "eval_runtime": 147.9221, + "eval_samples_per_second": 28.346, + "eval_steps_per_second": 7.092, + "eval_wer": 0.43507340946166395, + "step": 108000 + }, + { + "epoch": 26.36, + "learning_rate": 0.00036869533349621306, + "loss": 0.4485, + "step": 108025 + }, + { + "epoch": 26.37, + "learning_rate": 0.00036866479354996336, + "loss": 0.4284, + "step": 108050 + }, + { + "epoch": 26.37, + "learning_rate": 0.00036863425360371367, + "loss": 0.462, + "step": 108075 + }, + { + "epoch": 26.38, + "learning_rate": 0.000368604935255314, + "loss": 0.4297, + "step": 108100 + }, + { + "epoch": 26.38, + "learning_rate": 0.0003685743953090643, + "loss": 0.4739, + "step": 108125 + }, + { + "epoch": 26.39, + "learning_rate": 0.0003685438553628146, + "loss": 0.4459, + "step": 108150 + }, + { + "epoch": 26.4, + "learning_rate": 0.00036851331541656483, + "loss": 0.4728, + "step": 108175 + }, + { + "epoch": 26.4, + "learning_rate": 0.0003684827754703152, + "loss": 0.3765, + "step": 108200 + }, + { + "epoch": 26.41, + "learning_rate": 0.0003684522355240655, + "loss": 0.4611, + "step": 108225 + }, + { + "epoch": 26.42, + "learning_rate": 0.0003684216955778158, + "loss": 0.4038, + "step": 108250 + }, + { + "epoch": 26.42, + "learning_rate": 0.0003683911556315661, + "loss": 0.4677, + "step": 108275 + }, + { + "epoch": 26.43, + "learning_rate": 0.0003683606156853164, + "loss": 0.4224, + "step": 108300 + }, + { + "epoch": 26.43, + "learning_rate": 0.0003683300757390667, + "loss": 0.4738, + "step": 108325 + }, + { + "epoch": 26.44, + "learning_rate": 0.000368299535792817, + "loss": 0.4373, + "step": 108350 + }, + { + "epoch": 26.45, + "learning_rate": 0.0003682689958465673, + "loss": 0.4712, + "step": 108375 + }, + { + "epoch": 26.45, + "learning_rate": 0.0003682384559003176, + "loss": 0.4267, + "step": 108400 + }, + { + "epoch": 26.46, + "learning_rate": 0.0003682079159540679, + "loss": 0.4353, + "step": 108425 + }, + { + "epoch": 26.46, + "learning_rate": 0.0003681773760078183, + "loss": 0.4254, + "step": 108450 + }, + { + "epoch": 26.47, + "learning_rate": 0.0003681468360615685, + "loss": 0.4527, + "step": 108475 + }, + { + "epoch": 26.48, + "learning_rate": 0.0003681162961153188, + "loss": 0.4297, + "step": 108500 + }, + { + "epoch": 26.48, + "learning_rate": 0.00036808575616906913, + "loss": 0.4702, + "step": 108525 + }, + { + "epoch": 26.49, + "learning_rate": 0.00036805521622281943, + "loss": 0.4419, + "step": 108550 + }, + { + "epoch": 26.49, + "learning_rate": 0.0003680246762765698, + "loss": 0.4729, + "step": 108575 + }, + { + "epoch": 26.5, + "learning_rate": 0.0003679941363303201, + "loss": 0.4453, + "step": 108600 + }, + { + "epoch": 26.51, + "learning_rate": 0.0003679635963840704, + "loss": 0.4262, + "step": 108625 + }, + { + "epoch": 26.51, + "learning_rate": 0.00036793305643782065, + "loss": 0.4974, + "step": 108650 + }, + { + "epoch": 26.52, + "learning_rate": 0.00036790251649157095, + "loss": 0.4659, + "step": 108675 + }, + { + "epoch": 26.53, + "learning_rate": 0.0003678719765453213, + "loss": 0.4658, + "step": 108700 + }, + { + "epoch": 26.53, + "learning_rate": 0.0003678414365990716, + "loss": 0.4668, + "step": 108725 + }, + { + "epoch": 26.54, + "learning_rate": 0.0003678108966528219, + "loss": 0.4197, + "step": 108750 + }, + { + "epoch": 26.54, + "learning_rate": 0.0003677803567065722, + "loss": 0.4794, + "step": 108775 + }, + { + "epoch": 26.55, + "learning_rate": 0.00036774981676032247, + "loss": 0.413, + "step": 108800 + }, + { + "epoch": 26.56, + "learning_rate": 0.0003677192768140728, + "loss": 0.4852, + "step": 108825 + }, + { + "epoch": 26.56, + "learning_rate": 0.00036768873686782313, + "loss": 0.4619, + "step": 108850 + }, + { + "epoch": 26.57, + "learning_rate": 0.00036765819692157343, + "loss": 0.4534, + "step": 108875 + }, + { + "epoch": 26.57, + "learning_rate": 0.00036762765697532373, + "loss": 0.4627, + "step": 108900 + }, + { + "epoch": 26.58, + "learning_rate": 0.00036759711702907404, + "loss": 0.4897, + "step": 108925 + }, + { + "epoch": 26.59, + "learning_rate": 0.00036756657708282434, + "loss": 0.3912, + "step": 108950 + }, + { + "epoch": 26.59, + "learning_rate": 0.00036753603713657464, + "loss": 0.4565, + "step": 108975 + }, + { + "epoch": 26.6, + "learning_rate": 0.00036750549719032495, + "loss": 0.3951, + "step": 109000 + }, + { + "epoch": 26.6, + "learning_rate": 0.00036747495724407525, + "loss": 0.4592, + "step": 109025 + }, + { + "epoch": 26.61, + "learning_rate": 0.00036744441729782555, + "loss": 0.4158, + "step": 109050 + }, + { + "epoch": 26.62, + "learning_rate": 0.0003674138773515759, + "loss": 0.4869, + "step": 109075 + }, + { + "epoch": 26.62, + "learning_rate": 0.0003673833374053262, + "loss": 0.4344, + "step": 109100 + }, + { + "epoch": 26.63, + "learning_rate": 0.00036735279745907646, + "loss": 0.477, + "step": 109125 + }, + { + "epoch": 26.63, + "learning_rate": 0.00036732225751282677, + "loss": 0.4105, + "step": 109150 + }, + { + "epoch": 26.64, + "learning_rate": 0.00036729171756657707, + "loss": 0.4881, + "step": 109175 + }, + { + "epoch": 26.65, + "learning_rate": 0.00036726117762032743, + "loss": 0.4537, + "step": 109200 + }, + { + "epoch": 26.65, + "learning_rate": 0.00036723063767407773, + "loss": 0.4819, + "step": 109225 + }, + { + "epoch": 26.66, + "learning_rate": 0.00036720009772782804, + "loss": 0.4284, + "step": 109250 + }, + { + "epoch": 26.67, + "learning_rate": 0.0003671695577815783, + "loss": 0.4793, + "step": 109275 + }, + { + "epoch": 26.67, + "learning_rate": 0.0003671390178353286, + "loss": 0.3908, + "step": 109300 + }, + { + "epoch": 26.68, + "learning_rate": 0.0003671084778890789, + "loss": 0.4925, + "step": 109325 + }, + { + "epoch": 26.68, + "learning_rate": 0.00036707793794282925, + "loss": 0.4475, + "step": 109350 + }, + { + "epoch": 26.69, + "learning_rate": 0.00036704739799657955, + "loss": 0.446, + "step": 109375 + }, + { + "epoch": 26.7, + "learning_rate": 0.00036701685805032986, + "loss": 0.4149, + "step": 109400 + }, + { + "epoch": 26.7, + "learning_rate": 0.0003669863181040801, + "loss": 0.4352, + "step": 109425 + }, + { + "epoch": 26.71, + "learning_rate": 0.0003669557781578304, + "loss": 0.4381, + "step": 109450 + }, + { + "epoch": 26.71, + "learning_rate": 0.00036692523821158077, + "loss": 0.5132, + "step": 109475 + }, + { + "epoch": 26.72, + "learning_rate": 0.00036689469826533107, + "loss": 0.4933, + "step": 109500 + }, + { + "epoch": 26.73, + "learning_rate": 0.00036686415831908137, + "loss": 0.4786, + "step": 109525 + }, + { + "epoch": 26.73, + "learning_rate": 0.0003668336183728317, + "loss": 0.4435, + "step": 109550 + }, + { + "epoch": 26.74, + "learning_rate": 0.000366803078426582, + "loss": 0.4473, + "step": 109575 + }, + { + "epoch": 26.74, + "learning_rate": 0.0003667725384803323, + "loss": 0.433, + "step": 109600 + }, + { + "epoch": 26.75, + "learning_rate": 0.0003667419985340826, + "loss": 0.516, + "step": 109625 + }, + { + "epoch": 26.76, + "learning_rate": 0.0003667114585878329, + "loss": 0.4701, + "step": 109650 + }, + { + "epoch": 26.76, + "learning_rate": 0.0003666809186415832, + "loss": 0.4402, + "step": 109675 + }, + { + "epoch": 26.77, + "learning_rate": 0.0003666503786953335, + "loss": 0.438, + "step": 109700 + }, + { + "epoch": 26.78, + "learning_rate": 0.00036661983874908385, + "loss": 0.4546, + "step": 109725 + }, + { + "epoch": 26.78, + "learning_rate": 0.0003665892988028341, + "loss": 0.4501, + "step": 109750 + }, + { + "epoch": 26.79, + "learning_rate": 0.0003665587588565844, + "loss": 0.4646, + "step": 109775 + }, + { + "epoch": 26.79, + "learning_rate": 0.0003665282189103347, + "loss": 0.4086, + "step": 109800 + }, + { + "epoch": 26.8, + "learning_rate": 0.000366497678964085, + "loss": 0.4808, + "step": 109825 + }, + { + "epoch": 26.81, + "learning_rate": 0.00036646713901783537, + "loss": 0.4235, + "step": 109850 + }, + { + "epoch": 26.81, + "learning_rate": 0.0003664365990715857, + "loss": 0.4595, + "step": 109875 + }, + { + "epoch": 26.82, + "learning_rate": 0.0003664060591253359, + "loss": 0.4173, + "step": 109900 + }, + { + "epoch": 26.82, + "learning_rate": 0.0003663755191790862, + "loss": 0.4892, + "step": 109925 + }, + { + "epoch": 26.83, + "learning_rate": 0.00036634497923283653, + "loss": 0.4327, + "step": 109950 + }, + { + "epoch": 26.84, + "learning_rate": 0.0003663144392865869, + "loss": 0.4168, + "step": 109975 + }, + { + "epoch": 26.84, + "learning_rate": 0.0003662838993403372, + "loss": 0.4306, + "step": 110000 + }, + { + "epoch": 26.85, + "learning_rate": 0.0003662533593940875, + "loss": 0.4481, + "step": 110025 + }, + { + "epoch": 26.85, + "learning_rate": 0.00036622281944783774, + "loss": 0.4577, + "step": 110050 + }, + { + "epoch": 26.86, + "learning_rate": 0.00036619227950158805, + "loss": 0.4434, + "step": 110075 + }, + { + "epoch": 26.87, + "learning_rate": 0.0003661617395553384, + "loss": 0.3799, + "step": 110100 + }, + { + "epoch": 26.87, + "learning_rate": 0.0003661311996090887, + "loss": 0.4699, + "step": 110125 + }, + { + "epoch": 26.88, + "learning_rate": 0.000366100659662839, + "loss": 0.4373, + "step": 110150 + }, + { + "epoch": 26.89, + "learning_rate": 0.0003660701197165893, + "loss": 0.4765, + "step": 110175 + }, + { + "epoch": 26.89, + "learning_rate": 0.0003660395797703396, + "loss": 0.3899, + "step": 110200 + }, + { + "epoch": 26.9, + "learning_rate": 0.0003660090398240899, + "loss": 0.4409, + "step": 110225 + }, + { + "epoch": 26.9, + "learning_rate": 0.0003659784998778402, + "loss": 0.3785, + "step": 110250 + }, + { + "epoch": 26.91, + "learning_rate": 0.0003659479599315905, + "loss": 0.441, + "step": 110275 + }, + { + "epoch": 26.92, + "learning_rate": 0.00036591741998534083, + "loss": 0.4695, + "step": 110300 + }, + { + "epoch": 26.92, + "learning_rate": 0.00036588688003909113, + "loss": 0.4657, + "step": 110325 + }, + { + "epoch": 26.93, + "learning_rate": 0.00036585756169069144, + "loss": 0.4103, + "step": 110350 + }, + { + "epoch": 26.93, + "learning_rate": 0.0003658270217444417, + "loss": 0.4654, + "step": 110375 + }, + { + "epoch": 26.94, + "learning_rate": 0.00036579648179819205, + "loss": 0.4098, + "step": 110400 + }, + { + "epoch": 26.95, + "learning_rate": 0.00036576594185194235, + "loss": 0.4484, + "step": 110425 + }, + { + "epoch": 26.95, + "learning_rate": 0.00036573540190569265, + "loss": 0.4432, + "step": 110450 + }, + { + "epoch": 26.96, + "learning_rate": 0.00036570486195944296, + "loss": 0.4621, + "step": 110475 + }, + { + "epoch": 26.96, + "learning_rate": 0.00036567432201319326, + "loss": 0.4394, + "step": 110500 + }, + { + "epoch": 26.97, + "learning_rate": 0.00036564378206694356, + "loss": 0.4914, + "step": 110525 + }, + { + "epoch": 26.98, + "learning_rate": 0.00036561324212069387, + "loss": 0.4076, + "step": 110550 + }, + { + "epoch": 26.98, + "learning_rate": 0.00036558270217444417, + "loss": 0.4726, + "step": 110575 + }, + { + "epoch": 26.99, + "learning_rate": 0.0003655521622281945, + "loss": 0.4478, + "step": 110600 + }, + { + "epoch": 26.99, + "learning_rate": 0.0003655216222819448, + "loss": 0.4744, + "step": 110625 + }, + { + "epoch": 27.0, + "learning_rate": 0.00036549108233569513, + "loss": 0.4539, + "step": 110650 + }, + { + "epoch": 27.01, + "learning_rate": 0.00036546054238944544, + "loss": 0.4507, + "step": 110675 + }, + { + "epoch": 27.01, + "learning_rate": 0.0003654300024431957, + "loss": 0.3868, + "step": 110700 + }, + { + "epoch": 27.02, + "learning_rate": 0.000365399462496946, + "loss": 0.4459, + "step": 110725 + }, + { + "epoch": 27.03, + "learning_rate": 0.0003653689225506963, + "loss": 0.4198, + "step": 110750 + }, + { + "epoch": 27.03, + "learning_rate": 0.00036533838260444665, + "loss": 0.4551, + "step": 110775 + }, + { + "epoch": 27.04, + "learning_rate": 0.00036530784265819695, + "loss": 0.4359, + "step": 110800 + }, + { + "epoch": 27.04, + "learning_rate": 0.00036527730271194726, + "loss": 0.4391, + "step": 110825 + }, + { + "epoch": 27.05, + "learning_rate": 0.0003652467627656975, + "loss": 0.3863, + "step": 110850 + }, + { + "epoch": 27.06, + "learning_rate": 0.0003652162228194478, + "loss": 0.4541, + "step": 110875 + }, + { + "epoch": 27.06, + "learning_rate": 0.00036518568287319817, + "loss": 0.4366, + "step": 110900 + }, + { + "epoch": 27.07, + "learning_rate": 0.00036515514292694847, + "loss": 0.4762, + "step": 110925 + }, + { + "epoch": 27.07, + "learning_rate": 0.0003651246029806988, + "loss": 0.448, + "step": 110950 + }, + { + "epoch": 27.08, + "learning_rate": 0.0003650940630344491, + "loss": 0.4342, + "step": 110975 + }, + { + "epoch": 27.09, + "learning_rate": 0.0003650635230881993, + "loss": 0.4083, + "step": 111000 + }, + { + "epoch": 27.09, + "eval_cer": 0.10622876092112153, + "eval_loss": 0.45828574895858765, + "eval_runtime": 148.8526, + "eval_samples_per_second": 28.169, + "eval_steps_per_second": 7.047, + "eval_wer": 0.4320065252854812, + "step": 111000 + }, + { + "epoch": 27.09, + "learning_rate": 0.0003650329831419497, + "loss": 0.4351, + "step": 111025 + }, + { + "epoch": 27.1, + "learning_rate": 0.0003650024431957, + "loss": 0.3727, + "step": 111050 + }, + { + "epoch": 27.1, + "learning_rate": 0.0003649719032494503, + "loss": 0.4853, + "step": 111075 + }, + { + "epoch": 27.11, + "learning_rate": 0.0003649413633032006, + "loss": 0.4361, + "step": 111100 + }, + { + "epoch": 27.12, + "learning_rate": 0.0003649108233569509, + "loss": 0.4412, + "step": 111125 + }, + { + "epoch": 27.12, + "learning_rate": 0.00036488028341070126, + "loss": 0.3631, + "step": 111150 + }, + { + "epoch": 27.13, + "learning_rate": 0.0003648497434644515, + "loss": 0.4637, + "step": 111175 + }, + { + "epoch": 27.14, + "learning_rate": 0.0003648192035182018, + "loss": 0.3881, + "step": 111200 + }, + { + "epoch": 27.14, + "learning_rate": 0.0003647886635719521, + "loss": 0.4586, + "step": 111225 + }, + { + "epoch": 27.15, + "learning_rate": 0.0003647581236257024, + "loss": 0.4445, + "step": 111250 + }, + { + "epoch": 27.15, + "learning_rate": 0.00036472758367945277, + "loss": 0.4346, + "step": 111275 + }, + { + "epoch": 27.16, + "learning_rate": 0.0003646970437332031, + "loss": 0.3992, + "step": 111300 + }, + { + "epoch": 27.17, + "learning_rate": 0.0003646665037869533, + "loss": 0.4515, + "step": 111325 + }, + { + "epoch": 27.17, + "learning_rate": 0.00036463596384070363, + "loss": 0.3972, + "step": 111350 + }, + { + "epoch": 27.18, + "learning_rate": 0.00036460542389445393, + "loss": 0.4142, + "step": 111375 + }, + { + "epoch": 27.18, + "learning_rate": 0.00036457488394820423, + "loss": 0.3766, + "step": 111400 + }, + { + "epoch": 27.19, + "learning_rate": 0.0003645443440019546, + "loss": 0.4359, + "step": 111425 + }, + { + "epoch": 27.2, + "learning_rate": 0.0003645138040557049, + "loss": 0.3852, + "step": 111450 + }, + { + "epoch": 27.2, + "learning_rate": 0.00036448326410945514, + "loss": 0.4507, + "step": 111475 + }, + { + "epoch": 27.21, + "learning_rate": 0.00036445272416320545, + "loss": 0.4212, + "step": 111500 + }, + { + "epoch": 27.21, + "learning_rate": 0.00036442218421695575, + "loss": 0.4715, + "step": 111525 + }, + { + "epoch": 27.22, + "learning_rate": 0.0003643916442707061, + "loss": 0.4006, + "step": 111550 + }, + { + "epoch": 27.23, + "learning_rate": 0.0003643611043244564, + "loss": 0.4579, + "step": 111575 + }, + { + "epoch": 27.23, + "learning_rate": 0.0003643305643782067, + "loss": 0.4084, + "step": 111600 + }, + { + "epoch": 27.24, + "learning_rate": 0.000364300024431957, + "loss": 0.4738, + "step": 111625 + }, + { + "epoch": 27.24, + "learning_rate": 0.00036426948448570727, + "loss": 0.472, + "step": 111650 + }, + { + "epoch": 27.25, + "learning_rate": 0.0003642389445394576, + "loss": 0.4421, + "step": 111675 + }, + { + "epoch": 27.26, + "learning_rate": 0.00036420840459320793, + "loss": 0.4112, + "step": 111700 + }, + { + "epoch": 27.26, + "learning_rate": 0.00036417786464695823, + "loss": 0.457, + "step": 111725 + }, + { + "epoch": 27.27, + "learning_rate": 0.00036414732470070854, + "loss": 0.4342, + "step": 111750 + }, + { + "epoch": 27.28, + "learning_rate": 0.00036411678475445884, + "loss": 0.4509, + "step": 111775 + }, + { + "epoch": 27.28, + "learning_rate": 0.00036408624480820914, + "loss": 0.3766, + "step": 111800 + }, + { + "epoch": 27.29, + "learning_rate": 0.00036405570486195945, + "loss": 0.4579, + "step": 111825 + }, + { + "epoch": 27.29, + "learning_rate": 0.00036402638651355975, + "loss": 0.4228, + "step": 111850 + }, + { + "epoch": 27.3, + "learning_rate": 0.00036399584656731006, + "loss": 0.4387, + "step": 111875 + }, + { + "epoch": 27.31, + "learning_rate": 0.00036396530662106036, + "loss": 0.407, + "step": 111900 + }, + { + "epoch": 27.31, + "learning_rate": 0.00036393476667481066, + "loss": 0.4576, + "step": 111925 + }, + { + "epoch": 27.32, + "learning_rate": 0.00036390422672856097, + "loss": 0.3912, + "step": 111950 + }, + { + "epoch": 27.32, + "learning_rate": 0.00036387368678231127, + "loss": 0.4313, + "step": 111975 + }, + { + "epoch": 27.33, + "learning_rate": 0.00036384314683606157, + "loss": 0.4289, + "step": 112000 + }, + { + "epoch": 27.34, + "learning_rate": 0.0003638126068898119, + "loss": 0.4334, + "step": 112025 + }, + { + "epoch": 27.34, + "learning_rate": 0.0003637820669435622, + "loss": 0.4155, + "step": 112050 + }, + { + "epoch": 27.35, + "learning_rate": 0.00036375152699731254, + "loss": 0.4347, + "step": 112075 + }, + { + "epoch": 27.35, + "learning_rate": 0.00036372098705106284, + "loss": 0.4325, + "step": 112100 + }, + { + "epoch": 27.36, + "learning_rate": 0.0003636904471048131, + "loss": 0.4639, + "step": 112125 + }, + { + "epoch": 27.37, + "learning_rate": 0.0003636599071585634, + "loss": 0.4588, + "step": 112150 + }, + { + "epoch": 27.37, + "learning_rate": 0.0003636293672123137, + "loss": 0.4401, + "step": 112175 + }, + { + "epoch": 27.38, + "learning_rate": 0.000363598827266064, + "loss": 0.4654, + "step": 112200 + }, + { + "epoch": 27.39, + "learning_rate": 0.00036356828731981436, + "loss": 0.4443, + "step": 112225 + }, + { + "epoch": 27.39, + "learning_rate": 0.00036353774737356466, + "loss": 0.4255, + "step": 112250 + }, + { + "epoch": 27.4, + "learning_rate": 0.0003635072074273149, + "loss": 0.4641, + "step": 112275 + }, + { + "epoch": 27.4, + "learning_rate": 0.0003634766674810652, + "loss": 0.4369, + "step": 112300 + }, + { + "epoch": 27.41, + "learning_rate": 0.0003634461275348155, + "loss": 0.446, + "step": 112325 + }, + { + "epoch": 27.42, + "learning_rate": 0.0003634155875885659, + "loss": 0.4385, + "step": 112350 + }, + { + "epoch": 27.42, + "learning_rate": 0.0003633850476423162, + "loss": 0.4708, + "step": 112375 + }, + { + "epoch": 27.43, + "learning_rate": 0.0003633545076960665, + "loss": 0.4086, + "step": 112400 + }, + { + "epoch": 27.43, + "learning_rate": 0.00036332396774981673, + "loss": 0.4416, + "step": 112425 + }, + { + "epoch": 27.44, + "learning_rate": 0.00036329342780356703, + "loss": 0.4096, + "step": 112450 + }, + { + "epoch": 27.45, + "learning_rate": 0.0003632628878573174, + "loss": 0.4395, + "step": 112475 + }, + { + "epoch": 27.45, + "learning_rate": 0.0003632323479110677, + "loss": 0.4392, + "step": 112500 + }, + { + "epoch": 27.46, + "learning_rate": 0.000363201807964818, + "loss": 0.4743, + "step": 112525 + }, + { + "epoch": 27.46, + "learning_rate": 0.0003631712680185683, + "loss": 0.4474, + "step": 112550 + }, + { + "epoch": 27.47, + "learning_rate": 0.0003631407280723186, + "loss": 0.4738, + "step": 112575 + }, + { + "epoch": 27.48, + "learning_rate": 0.0003631101881260689, + "loss": 0.3719, + "step": 112600 + }, + { + "epoch": 27.48, + "learning_rate": 0.0003630796481798192, + "loss": 0.4503, + "step": 112625 + }, + { + "epoch": 27.49, + "learning_rate": 0.0003630491082335695, + "loss": 0.4223, + "step": 112650 + }, + { + "epoch": 27.5, + "learning_rate": 0.0003630185682873198, + "loss": 0.4613, + "step": 112675 + }, + { + "epoch": 27.5, + "learning_rate": 0.0003629880283410701, + "loss": 0.4107, + "step": 112700 + }, + { + "epoch": 27.51, + "learning_rate": 0.0003629574883948205, + "loss": 0.4359, + "step": 112725 + }, + { + "epoch": 27.51, + "learning_rate": 0.0003629269484485707, + "loss": 0.3979, + "step": 112750 + }, + { + "epoch": 27.52, + "learning_rate": 0.00036289640850232103, + "loss": 0.481, + "step": 112775 + }, + { + "epoch": 27.53, + "learning_rate": 0.00036286586855607133, + "loss": 0.4453, + "step": 112800 + }, + { + "epoch": 27.53, + "learning_rate": 0.00036283532860982164, + "loss": 0.4792, + "step": 112825 + }, + { + "epoch": 27.54, + "learning_rate": 0.000362804788663572, + "loss": 0.4001, + "step": 112850 + }, + { + "epoch": 27.54, + "learning_rate": 0.0003627742487173223, + "loss": 0.43, + "step": 112875 + }, + { + "epoch": 27.55, + "learning_rate": 0.00036274370877107255, + "loss": 0.3869, + "step": 112900 + }, + { + "epoch": 27.56, + "learning_rate": 0.00036271316882482285, + "loss": 0.4596, + "step": 112925 + }, + { + "epoch": 27.56, + "learning_rate": 0.00036268262887857315, + "loss": 0.4507, + "step": 112950 + }, + { + "epoch": 27.57, + "learning_rate": 0.0003626520889323235, + "loss": 0.4765, + "step": 112975 + }, + { + "epoch": 27.57, + "learning_rate": 0.0003626215489860738, + "loss": 0.4441, + "step": 113000 + }, + { + "epoch": 27.58, + "learning_rate": 0.0003625910090398241, + "loss": 0.4576, + "step": 113025 + }, + { + "epoch": 27.59, + "learning_rate": 0.0003625604690935744, + "loss": 0.4279, + "step": 113050 + }, + { + "epoch": 27.59, + "learning_rate": 0.00036252992914732467, + "loss": 0.4251, + "step": 113075 + }, + { + "epoch": 27.6, + "learning_rate": 0.00036249938920107503, + "loss": 0.4277, + "step": 113100 + }, + { + "epoch": 27.6, + "learning_rate": 0.00036246884925482533, + "loss": 0.4642, + "step": 113125 + }, + { + "epoch": 27.61, + "learning_rate": 0.00036243830930857563, + "loss": 0.3901, + "step": 113150 + }, + { + "epoch": 27.62, + "learning_rate": 0.00036240776936232594, + "loss": 0.4645, + "step": 113175 + }, + { + "epoch": 27.62, + "learning_rate": 0.00036237722941607624, + "loss": 0.4778, + "step": 113200 + }, + { + "epoch": 27.63, + "learning_rate": 0.00036234668946982654, + "loss": 0.4684, + "step": 113225 + }, + { + "epoch": 27.64, + "learning_rate": 0.00036231614952357685, + "loss": 0.4339, + "step": 113250 + }, + { + "epoch": 27.64, + "learning_rate": 0.00036228560957732715, + "loss": 0.4372, + "step": 113275 + }, + { + "epoch": 27.65, + "learning_rate": 0.00036225506963107745, + "loss": 0.4579, + "step": 113300 + }, + { + "epoch": 27.65, + "learning_rate": 0.00036222452968482776, + "loss": 0.4499, + "step": 113325 + }, + { + "epoch": 27.66, + "learning_rate": 0.0003621939897385781, + "loss": 0.4247, + "step": 113350 + }, + { + "epoch": 27.67, + "learning_rate": 0.00036216344979232836, + "loss": 0.4518, + "step": 113375 + }, + { + "epoch": 27.67, + "learning_rate": 0.00036213290984607867, + "loss": 0.4446, + "step": 113400 + }, + { + "epoch": 27.68, + "learning_rate": 0.00036210236989982897, + "loss": 0.4472, + "step": 113425 + }, + { + "epoch": 27.68, + "learning_rate": 0.0003620718299535793, + "loss": 0.3938, + "step": 113450 + }, + { + "epoch": 27.69, + "learning_rate": 0.0003620412900073296, + "loss": 0.4338, + "step": 113475 + }, + { + "epoch": 27.7, + "learning_rate": 0.00036201075006107994, + "loss": 0.3876, + "step": 113500 + }, + { + "epoch": 27.7, + "learning_rate": 0.00036198021011483024, + "loss": 0.4739, + "step": 113525 + }, + { + "epoch": 27.71, + "learning_rate": 0.0003619496701685805, + "loss": 0.4749, + "step": 113550 + }, + { + "epoch": 27.71, + "learning_rate": 0.0003619191302223308, + "loss": 0.4201, + "step": 113575 + }, + { + "epoch": 27.72, + "learning_rate": 0.0003618885902760811, + "loss": 0.4033, + "step": 113600 + }, + { + "epoch": 27.73, + "learning_rate": 0.00036185805032983145, + "loss": 0.4496, + "step": 113625 + }, + { + "epoch": 27.73, + "learning_rate": 0.00036182751038358176, + "loss": 0.4209, + "step": 113650 + }, + { + "epoch": 27.74, + "learning_rate": 0.00036179697043733206, + "loss": 0.4398, + "step": 113675 + }, + { + "epoch": 27.75, + "learning_rate": 0.0003617664304910823, + "loss": 0.4328, + "step": 113700 + }, + { + "epoch": 27.75, + "learning_rate": 0.0003617358905448326, + "loss": 0.4169, + "step": 113725 + }, + { + "epoch": 27.76, + "learning_rate": 0.00036170535059858297, + "loss": 0.4463, + "step": 113750 + }, + { + "epoch": 27.76, + "learning_rate": 0.00036167481065233327, + "loss": 0.4666, + "step": 113775 + }, + { + "epoch": 27.77, + "learning_rate": 0.0003616442707060836, + "loss": 0.4087, + "step": 113800 + }, + { + "epoch": 27.78, + "learning_rate": 0.0003616137307598339, + "loss": 0.4208, + "step": 113825 + }, + { + "epoch": 27.78, + "learning_rate": 0.00036158319081358413, + "loss": 0.4215, + "step": 113850 + }, + { + "epoch": 27.79, + "learning_rate": 0.0003615526508673345, + "loss": 0.4414, + "step": 113875 + }, + { + "epoch": 27.79, + "learning_rate": 0.0003615221109210848, + "loss": 0.4207, + "step": 113900 + }, + { + "epoch": 27.8, + "learning_rate": 0.0003614915709748351, + "loss": 0.4305, + "step": 113925 + }, + { + "epoch": 27.81, + "learning_rate": 0.0003614610310285854, + "loss": 0.3685, + "step": 113950 + }, + { + "epoch": 27.81, + "learning_rate": 0.0003614304910823357, + "loss": 0.4715, + "step": 113975 + }, + { + "epoch": 27.82, + "learning_rate": 0.000361399951136086, + "loss": 0.4618, + "step": 114000 + }, + { + "epoch": 27.82, + "eval_cer": 0.10462203422892519, + "eval_loss": 0.42293429374694824, + "eval_runtime": 148.9045, + "eval_samples_per_second": 28.159, + "eval_steps_per_second": 7.045, + "eval_wer": 0.42812398042414357, + "step": 114000 + }, + { + "epoch": 27.82, + "learning_rate": 0.0003613694111898363, + "loss": 0.4892, + "step": 114025 + }, + { + "epoch": 27.83, + "learning_rate": 0.0003613388712435866, + "loss": 0.4525, + "step": 114050 + }, + { + "epoch": 27.84, + "learning_rate": 0.0003613083312973369, + "loss": 0.443, + "step": 114075 + }, + { + "epoch": 27.84, + "learning_rate": 0.0003612777913510872, + "loss": 0.4399, + "step": 114100 + }, + { + "epoch": 27.85, + "learning_rate": 0.0003612472514048376, + "loss": 0.4276, + "step": 114125 + }, + { + "epoch": 27.86, + "learning_rate": 0.0003612167114585879, + "loss": 0.3892, + "step": 114150 + }, + { + "epoch": 27.86, + "learning_rate": 0.0003611861715123381, + "loss": 0.4562, + "step": 114175 + }, + { + "epoch": 27.87, + "learning_rate": 0.00036115563156608843, + "loss": 0.4128, + "step": 114200 + }, + { + "epoch": 27.87, + "learning_rate": 0.00036112509161983873, + "loss": 0.4409, + "step": 114225 + }, + { + "epoch": 27.88, + "learning_rate": 0.0003610945516735891, + "loss": 0.4134, + "step": 114250 + }, + { + "epoch": 27.89, + "learning_rate": 0.0003610640117273394, + "loss": 0.4426, + "step": 114275 + }, + { + "epoch": 27.89, + "learning_rate": 0.0003610334717810897, + "loss": 0.4581, + "step": 114300 + }, + { + "epoch": 27.9, + "learning_rate": 0.00036100293183483995, + "loss": 0.445, + "step": 114325 + }, + { + "epoch": 27.9, + "learning_rate": 0.00036097239188859025, + "loss": 0.4231, + "step": 114350 + }, + { + "epoch": 27.91, + "learning_rate": 0.0003609418519423406, + "loss": 0.4608, + "step": 114375 + }, + { + "epoch": 27.92, + "learning_rate": 0.0003609113119960909, + "loss": 0.4112, + "step": 114400 + }, + { + "epoch": 27.92, + "learning_rate": 0.0003608807720498412, + "loss": 0.4675, + "step": 114425 + }, + { + "epoch": 27.93, + "learning_rate": 0.0003608502321035915, + "loss": 0.4105, + "step": 114450 + }, + { + "epoch": 27.93, + "learning_rate": 0.00036081969215734177, + "loss": 0.4548, + "step": 114475 + }, + { + "epoch": 27.94, + "learning_rate": 0.0003607891522110921, + "loss": 0.471, + "step": 114500 + }, + { + "epoch": 27.95, + "learning_rate": 0.0003607586122648424, + "loss": 0.4264, + "step": 114525 + }, + { + "epoch": 27.95, + "learning_rate": 0.00036072807231859273, + "loss": 0.418, + "step": 114550 + }, + { + "epoch": 27.96, + "learning_rate": 0.00036069753237234303, + "loss": 0.4569, + "step": 114575 + }, + { + "epoch": 27.96, + "learning_rate": 0.00036066699242609334, + "loss": 0.4326, + "step": 114600 + }, + { + "epoch": 27.97, + "learning_rate": 0.0003606364524798437, + "loss": 0.4641, + "step": 114625 + }, + { + "epoch": 27.98, + "learning_rate": 0.00036060591253359394, + "loss": 0.4108, + "step": 114650 + }, + { + "epoch": 27.98, + "learning_rate": 0.00036057537258734425, + "loss": 0.4225, + "step": 114675 + }, + { + "epoch": 27.99, + "learning_rate": 0.00036054483264109455, + "loss": 0.45, + "step": 114700 + }, + { + "epoch": 28.0, + "learning_rate": 0.00036051429269484485, + "loss": 0.4469, + "step": 114725 + }, + { + "epoch": 28.0, + "learning_rate": 0.00036048375274859516, + "loss": 0.3933, + "step": 114750 + }, + { + "epoch": 28.01, + "learning_rate": 0.0003604532128023455, + "loss": 0.4146, + "step": 114775 + }, + { + "epoch": 28.01, + "learning_rate": 0.00036042267285609576, + "loss": 0.4307, + "step": 114800 + }, + { + "epoch": 28.02, + "learning_rate": 0.00036039213290984607, + "loss": 0.4348, + "step": 114825 + }, + { + "epoch": 28.03, + "learning_rate": 0.00036036159296359637, + "loss": 0.499, + "step": 114850 + }, + { + "epoch": 28.03, + "learning_rate": 0.0003603310530173467, + "loss": 0.441, + "step": 114875 + }, + { + "epoch": 28.04, + "learning_rate": 0.00036030051307109703, + "loss": 0.4065, + "step": 114900 + }, + { + "epoch": 28.04, + "learning_rate": 0.00036026997312484733, + "loss": 0.4322, + "step": 114925 + }, + { + "epoch": 28.05, + "learning_rate": 0.0003602394331785976, + "loss": 0.4002, + "step": 114950 + }, + { + "epoch": 28.06, + "learning_rate": 0.0003602088932323479, + "loss": 0.4478, + "step": 114975 + }, + { + "epoch": 28.06, + "learning_rate": 0.0003601783532860982, + "loss": 0.3767, + "step": 115000 + }, + { + "epoch": 28.07, + "learning_rate": 0.00036014781333984855, + "loss": 0.4317, + "step": 115025 + }, + { + "epoch": 28.07, + "learning_rate": 0.00036011727339359885, + "loss": 0.451, + "step": 115050 + }, + { + "epoch": 28.08, + "learning_rate": 0.00036008673344734915, + "loss": 0.4586, + "step": 115075 + }, + { + "epoch": 28.09, + "learning_rate": 0.00036005619350109946, + "loss": 0.4371, + "step": 115100 + }, + { + "epoch": 28.09, + "learning_rate": 0.0003600256535548497, + "loss": 0.4382, + "step": 115125 + }, + { + "epoch": 28.1, + "learning_rate": 0.00035999511360860006, + "loss": 0.3706, + "step": 115150 + }, + { + "epoch": 28.11, + "learning_rate": 0.00035996457366235037, + "loss": 0.4424, + "step": 115175 + }, + { + "epoch": 28.11, + "learning_rate": 0.00035993403371610067, + "loss": 0.4072, + "step": 115200 + }, + { + "epoch": 28.12, + "learning_rate": 0.000359903493769851, + "loss": 0.4112, + "step": 115225 + }, + { + "epoch": 28.12, + "learning_rate": 0.0003598729538236013, + "loss": 0.3865, + "step": 115250 + }, + { + "epoch": 28.13, + "learning_rate": 0.0003598424138773516, + "loss": 0.4749, + "step": 115275 + }, + { + "epoch": 28.14, + "learning_rate": 0.0003598118739311019, + "loss": 0.416, + "step": 115300 + }, + { + "epoch": 28.14, + "learning_rate": 0.0003597813339848522, + "loss": 0.4019, + "step": 115325 + }, + { + "epoch": 28.15, + "learning_rate": 0.0003597507940386025, + "loss": 0.4413, + "step": 115350 + }, + { + "epoch": 28.15, + "learning_rate": 0.0003597202540923528, + "loss": 0.427, + "step": 115375 + }, + { + "epoch": 28.16, + "learning_rate": 0.00035968971414610315, + "loss": 0.3767, + "step": 115400 + }, + { + "epoch": 28.17, + "learning_rate": 0.0003596591741998534, + "loss": 0.4356, + "step": 115425 + }, + { + "epoch": 28.17, + "learning_rate": 0.0003596286342536037, + "loss": 0.4551, + "step": 115450 + }, + { + "epoch": 28.18, + "learning_rate": 0.000359598094307354, + "loss": 0.446, + "step": 115475 + }, + { + "epoch": 28.18, + "learning_rate": 0.0003595675543611043, + "loss": 0.4216, + "step": 115500 + }, + { + "epoch": 28.19, + "learning_rate": 0.00035953701441485467, + "loss": 0.4307, + "step": 115525 + }, + { + "epoch": 28.2, + "learning_rate": 0.00035950647446860497, + "loss": 0.4476, + "step": 115550 + }, + { + "epoch": 28.2, + "learning_rate": 0.0003594759345223553, + "loss": 0.4522, + "step": 115575 + }, + { + "epoch": 28.21, + "learning_rate": 0.0003594453945761055, + "loss": 0.398, + "step": 115600 + }, + { + "epoch": 28.21, + "learning_rate": 0.00035941485462985583, + "loss": 0.4434, + "step": 115625 + }, + { + "epoch": 28.22, + "learning_rate": 0.0003593843146836062, + "loss": 0.4161, + "step": 115650 + }, + { + "epoch": 28.23, + "learning_rate": 0.0003593537747373565, + "loss": 0.4172, + "step": 115675 + }, + { + "epoch": 28.23, + "learning_rate": 0.0003593232347911068, + "loss": 0.4633, + "step": 115700 + }, + { + "epoch": 28.24, + "learning_rate": 0.0003592926948448571, + "loss": 0.4339, + "step": 115725 + }, + { + "epoch": 28.25, + "learning_rate": 0.00035926215489860735, + "loss": 0.4266, + "step": 115750 + }, + { + "epoch": 28.25, + "learning_rate": 0.0003592316149523577, + "loss": 0.4322, + "step": 115775 + }, + { + "epoch": 28.26, + "learning_rate": 0.000359201075006108, + "loss": 0.4352, + "step": 115800 + }, + { + "epoch": 28.26, + "learning_rate": 0.0003591705350598583, + "loss": 0.4283, + "step": 115825 + }, + { + "epoch": 28.27, + "learning_rate": 0.0003591399951136086, + "loss": 0.4588, + "step": 115850 + }, + { + "epoch": 28.28, + "learning_rate": 0.0003591094551673589, + "loss": 0.4461, + "step": 115875 + }, + { + "epoch": 28.28, + "learning_rate": 0.0003590789152211092, + "loss": 0.3807, + "step": 115900 + }, + { + "epoch": 28.29, + "learning_rate": 0.0003590483752748595, + "loss": 0.4291, + "step": 115925 + }, + { + "epoch": 28.29, + "learning_rate": 0.0003590178353286098, + "loss": 0.4416, + "step": 115950 + }, + { + "epoch": 28.3, + "learning_rate": 0.00035898729538236013, + "loss": 0.4219, + "step": 115975 + }, + { + "epoch": 28.31, + "learning_rate": 0.00035895675543611043, + "loss": 0.4263, + "step": 116000 + }, + { + "epoch": 28.31, + "learning_rate": 0.0003589262154898608, + "loss": 0.4394, + "step": 116025 + }, + { + "epoch": 28.32, + "learning_rate": 0.0003588956755436111, + "loss": 0.4312, + "step": 116050 + }, + { + "epoch": 28.32, + "learning_rate": 0.00035886513559736134, + "loss": 0.4249, + "step": 116075 + }, + { + "epoch": 28.33, + "learning_rate": 0.00035883459565111165, + "loss": 0.4145, + "step": 116100 + }, + { + "epoch": 28.34, + "learning_rate": 0.00035880405570486195, + "loss": 0.4173, + "step": 116125 + }, + { + "epoch": 28.34, + "learning_rate": 0.00035877351575861225, + "loss": 0.4505, + "step": 116150 + }, + { + "epoch": 28.35, + "learning_rate": 0.0003587429758123626, + "loss": 0.4273, + "step": 116175 + }, + { + "epoch": 28.36, + "learning_rate": 0.0003587124358661129, + "loss": 0.3887, + "step": 116200 + }, + { + "epoch": 28.36, + "learning_rate": 0.00035868189591986316, + "loss": 0.416, + "step": 116225 + }, + { + "epoch": 28.37, + "learning_rate": 0.00035865135597361347, + "loss": 0.4085, + "step": 116250 + }, + { + "epoch": 28.37, + "learning_rate": 0.00035862081602736377, + "loss": 0.4551, + "step": 116275 + }, + { + "epoch": 28.38, + "learning_rate": 0.0003585914976789641, + "loss": 0.42, + "step": 116300 + }, + { + "epoch": 28.39, + "learning_rate": 0.00035856095773271443, + "loss": 0.4185, + "step": 116325 + }, + { + "epoch": 28.39, + "learning_rate": 0.00035853041778646474, + "loss": 0.4174, + "step": 116350 + }, + { + "epoch": 28.4, + "learning_rate": 0.000358499877840215, + "loss": 0.4303, + "step": 116375 + }, + { + "epoch": 28.4, + "learning_rate": 0.0003584693378939653, + "loss": 0.4787, + "step": 116400 + }, + { + "epoch": 28.41, + "learning_rate": 0.0003584387979477156, + "loss": 0.4276, + "step": 116425 + }, + { + "epoch": 28.42, + "learning_rate": 0.00035840825800146595, + "loss": 0.4364, + "step": 116450 + }, + { + "epoch": 28.42, + "learning_rate": 0.00035837771805521625, + "loss": 0.4598, + "step": 116475 + }, + { + "epoch": 28.43, + "learning_rate": 0.00035834717810896656, + "loss": 0.4465, + "step": 116500 + }, + { + "epoch": 28.43, + "learning_rate": 0.00035831663816271686, + "loss": 0.4561, + "step": 116525 + }, + { + "epoch": 28.44, + "learning_rate": 0.0003582860982164671, + "loss": 0.3765, + "step": 116550 + }, + { + "epoch": 28.45, + "learning_rate": 0.00035825555827021747, + "loss": 0.3965, + "step": 116575 + }, + { + "epoch": 28.45, + "learning_rate": 0.00035822501832396777, + "loss": 0.4291, + "step": 116600 + }, + { + "epoch": 28.46, + "learning_rate": 0.0003581944783777181, + "loss": 0.4005, + "step": 116625 + }, + { + "epoch": 28.47, + "learning_rate": 0.0003581639384314684, + "loss": 0.4187, + "step": 116650 + }, + { + "epoch": 28.47, + "learning_rate": 0.0003581333984852187, + "loss": 0.4803, + "step": 116675 + }, + { + "epoch": 28.48, + "learning_rate": 0.00035810285853896893, + "loss": 0.4358, + "step": 116700 + }, + { + "epoch": 28.48, + "learning_rate": 0.0003580723185927193, + "loss": 0.4248, + "step": 116725 + }, + { + "epoch": 28.49, + "learning_rate": 0.0003580417786464696, + "loss": 0.4353, + "step": 116750 + }, + { + "epoch": 28.5, + "learning_rate": 0.0003580112387002199, + "loss": 0.4402, + "step": 116775 + }, + { + "epoch": 28.5, + "learning_rate": 0.0003579806987539702, + "loss": 0.4198, + "step": 116800 + }, + { + "epoch": 28.51, + "learning_rate": 0.0003579501588077205, + "loss": 0.4321, + "step": 116825 + }, + { + "epoch": 28.51, + "learning_rate": 0.0003579196188614708, + "loss": 0.4073, + "step": 116850 + }, + { + "epoch": 28.52, + "learning_rate": 0.0003578890789152211, + "loss": 0.4597, + "step": 116875 + }, + { + "epoch": 28.53, + "learning_rate": 0.0003578585389689714, + "loss": 0.43, + "step": 116900 + }, + { + "epoch": 28.53, + "learning_rate": 0.0003578279990227217, + "loss": 0.454, + "step": 116925 + }, + { + "epoch": 28.54, + "learning_rate": 0.000357797459076472, + "loss": 0.3605, + "step": 116950 + }, + { + "epoch": 28.54, + "learning_rate": 0.0003577669191302224, + "loss": 0.4225, + "step": 116975 + }, + { + "epoch": 28.55, + "learning_rate": 0.0003577363791839727, + "loss": 0.4538, + "step": 117000 + }, + { + "epoch": 28.55, + "eval_cer": 0.10224531071938237, + "eval_loss": 0.4060422480106354, + "eval_runtime": 148.9547, + "eval_samples_per_second": 28.149, + "eval_steps_per_second": 7.042, + "eval_wer": 0.42, + "step": 117000 + }, + { + "epoch": 28.56, + "learning_rate": 0.00035770583923772293, + "loss": 0.4308, + "step": 117025 + }, + { + "epoch": 28.56, + "learning_rate": 0.00035767529929147323, + "loss": 0.4009, + "step": 117050 + }, + { + "epoch": 28.57, + "learning_rate": 0.00035764475934522353, + "loss": 0.4436, + "step": 117075 + }, + { + "epoch": 28.57, + "learning_rate": 0.0003576142193989739, + "loss": 0.383, + "step": 117100 + }, + { + "epoch": 28.58, + "learning_rate": 0.0003575836794527242, + "loss": 0.4641, + "step": 117125 + }, + { + "epoch": 28.59, + "learning_rate": 0.0003575531395064745, + "loss": 0.4427, + "step": 117150 + }, + { + "epoch": 28.59, + "learning_rate": 0.00035752259956022475, + "loss": 0.4591, + "step": 117175 + }, + { + "epoch": 28.6, + "learning_rate": 0.00035749205961397505, + "loss": 0.4661, + "step": 117200 + }, + { + "epoch": 28.61, + "learning_rate": 0.0003574615196677254, + "loss": 0.5024, + "step": 117225 + }, + { + "epoch": 28.61, + "learning_rate": 0.0003574309797214757, + "loss": 0.457, + "step": 117250 + }, + { + "epoch": 28.62, + "learning_rate": 0.000357400439775226, + "loss": 0.4456, + "step": 117275 + }, + { + "epoch": 28.62, + "learning_rate": 0.0003573698998289763, + "loss": 0.4282, + "step": 117300 + }, + { + "epoch": 28.63, + "learning_rate": 0.00035733935988272657, + "loss": 0.457, + "step": 117325 + }, + { + "epoch": 28.64, + "learning_rate": 0.0003573088199364769, + "loss": 0.3939, + "step": 117350 + }, + { + "epoch": 28.64, + "learning_rate": 0.00035727827999022723, + "loss": 0.4394, + "step": 117375 + }, + { + "epoch": 28.65, + "learning_rate": 0.00035724774004397753, + "loss": 0.4435, + "step": 117400 + }, + { + "epoch": 28.65, + "learning_rate": 0.00035721720009772783, + "loss": 0.4603, + "step": 117425 + }, + { + "epoch": 28.66, + "learning_rate": 0.00035718666015147814, + "loss": 0.4088, + "step": 117450 + }, + { + "epoch": 28.67, + "learning_rate": 0.00035715612020522844, + "loss": 0.4357, + "step": 117475 + }, + { + "epoch": 28.67, + "learning_rate": 0.00035712558025897874, + "loss": 0.3844, + "step": 117500 + }, + { + "epoch": 28.68, + "learning_rate": 0.00035709504031272905, + "loss": 0.4333, + "step": 117525 + }, + { + "epoch": 28.68, + "learning_rate": 0.00035706450036647935, + "loss": 0.4354, + "step": 117550 + }, + { + "epoch": 28.69, + "learning_rate": 0.00035703396042022965, + "loss": 0.4478, + "step": 117575 + }, + { + "epoch": 28.7, + "learning_rate": 0.00035700342047398, + "loss": 0.44, + "step": 117600 + }, + { + "epoch": 28.7, + "learning_rate": 0.0003569728805277303, + "loss": 0.4312, + "step": 117625 + }, + { + "epoch": 28.71, + "learning_rate": 0.00035694234058148056, + "loss": 0.3937, + "step": 117650 + }, + { + "epoch": 28.72, + "learning_rate": 0.00035691180063523087, + "loss": 0.4529, + "step": 117675 + }, + { + "epoch": 28.72, + "learning_rate": 0.00035688126068898117, + "loss": 0.4707, + "step": 117700 + }, + { + "epoch": 28.73, + "learning_rate": 0.00035685072074273153, + "loss": 0.4158, + "step": 117725 + }, + { + "epoch": 28.73, + "learning_rate": 0.00035682018079648183, + "loss": 0.4417, + "step": 117750 + }, + { + "epoch": 28.74, + "learning_rate": 0.00035678964085023214, + "loss": 0.4441, + "step": 117775 + }, + { + "epoch": 28.75, + "learning_rate": 0.0003567591009039824, + "loss": 0.4552, + "step": 117800 + }, + { + "epoch": 28.75, + "learning_rate": 0.0003567285609577327, + "loss": 0.4226, + "step": 117825 + }, + { + "epoch": 28.76, + "learning_rate": 0.00035669802101148305, + "loss": 0.4139, + "step": 117850 + }, + { + "epoch": 28.76, + "learning_rate": 0.00035666748106523335, + "loss": 0.4315, + "step": 117875 + }, + { + "epoch": 28.77, + "learning_rate": 0.00035663694111898365, + "loss": 0.4402, + "step": 117900 + }, + { + "epoch": 28.78, + "learning_rate": 0.00035660640117273396, + "loss": 0.4528, + "step": 117925 + }, + { + "epoch": 28.78, + "learning_rate": 0.0003565758612264842, + "loss": 0.3793, + "step": 117950 + }, + { + "epoch": 28.79, + "learning_rate": 0.00035654532128023456, + "loss": 0.424, + "step": 117975 + }, + { + "epoch": 28.79, + "learning_rate": 0.00035651478133398487, + "loss": 0.4328, + "step": 118000 + }, + { + "epoch": 28.8, + "learning_rate": 0.00035648424138773517, + "loss": 0.4264, + "step": 118025 + }, + { + "epoch": 28.81, + "learning_rate": 0.00035645370144148547, + "loss": 0.4129, + "step": 118050 + }, + { + "epoch": 28.81, + "learning_rate": 0.0003564231614952358, + "loss": 0.4328, + "step": 118075 + }, + { + "epoch": 28.82, + "learning_rate": 0.00035639262154898613, + "loss": 0.3993, + "step": 118100 + }, + { + "epoch": 28.83, + "learning_rate": 0.0003563620816027364, + "loss": 0.4388, + "step": 118125 + }, + { + "epoch": 28.83, + "learning_rate": 0.0003563315416564867, + "loss": 0.4482, + "step": 118150 + }, + { + "epoch": 28.84, + "learning_rate": 0.000356301001710237, + "loss": 0.4477, + "step": 118175 + }, + { + "epoch": 28.84, + "learning_rate": 0.0003562704617639873, + "loss": 0.3916, + "step": 118200 + }, + { + "epoch": 28.85, + "learning_rate": 0.0003562399218177376, + "loss": 0.4721, + "step": 118225 + }, + { + "epoch": 28.86, + "learning_rate": 0.00035620938187148795, + "loss": 0.3895, + "step": 118250 + }, + { + "epoch": 28.86, + "learning_rate": 0.0003561788419252382, + "loss": 0.4329, + "step": 118275 + }, + { + "epoch": 28.87, + "learning_rate": 0.0003561483019789885, + "loss": 0.4063, + "step": 118300 + }, + { + "epoch": 28.87, + "learning_rate": 0.0003561177620327388, + "loss": 0.4025, + "step": 118325 + }, + { + "epoch": 28.88, + "learning_rate": 0.0003560872220864891, + "loss": 0.4194, + "step": 118350 + }, + { + "epoch": 28.89, + "learning_rate": 0.00035605668214023947, + "loss": 0.4511, + "step": 118375 + }, + { + "epoch": 28.89, + "learning_rate": 0.0003560261421939898, + "loss": 0.3908, + "step": 118400 + }, + { + "epoch": 28.9, + "learning_rate": 0.00035599560224774, + "loss": 0.449, + "step": 118425 + }, + { + "epoch": 28.9, + "learning_rate": 0.0003559650623014903, + "loss": 0.391, + "step": 118450 + }, + { + "epoch": 28.91, + "learning_rate": 0.00035593452235524063, + "loss": 0.4691, + "step": 118475 + }, + { + "epoch": 28.92, + "learning_rate": 0.000355903982408991, + "loss": 0.4369, + "step": 118500 + }, + { + "epoch": 28.92, + "learning_rate": 0.0003558734424627413, + "loss": 0.4306, + "step": 118525 + }, + { + "epoch": 28.93, + "learning_rate": 0.0003558429025164916, + "loss": 0.4192, + "step": 118550 + }, + { + "epoch": 28.93, + "learning_rate": 0.0003558123625702419, + "loss": 0.4288, + "step": 118575 + }, + { + "epoch": 28.94, + "learning_rate": 0.00035578182262399215, + "loss": 0.4263, + "step": 118600 + }, + { + "epoch": 28.95, + "learning_rate": 0.0003557512826777425, + "loss": 0.4425, + "step": 118625 + }, + { + "epoch": 28.95, + "learning_rate": 0.0003557207427314928, + "loss": 0.425, + "step": 118650 + }, + { + "epoch": 28.96, + "learning_rate": 0.0003556902027852431, + "loss": 0.4438, + "step": 118675 + }, + { + "epoch": 28.97, + "learning_rate": 0.0003556608844368434, + "loss": 0.4005, + "step": 118700 + }, + { + "epoch": 28.97, + "learning_rate": 0.0003556303444905937, + "loss": 0.4537, + "step": 118725 + }, + { + "epoch": 28.98, + "learning_rate": 0.00035559980454434397, + "loss": 0.4252, + "step": 118750 + }, + { + "epoch": 28.98, + "learning_rate": 0.00035556926459809427, + "loss": 0.4506, + "step": 118775 + }, + { + "epoch": 28.99, + "learning_rate": 0.00035553872465184463, + "loss": 0.403, + "step": 118800 + }, + { + "epoch": 29.0, + "learning_rate": 0.00035550818470559493, + "loss": 0.4524, + "step": 118825 + }, + { + "epoch": 29.0, + "learning_rate": 0.00035547886635719524, + "loss": 0.4421, + "step": 118850 + }, + { + "epoch": 29.01, + "learning_rate": 0.00035544832641094554, + "loss": 0.4191, + "step": 118875 + }, + { + "epoch": 29.01, + "learning_rate": 0.0003554177864646958, + "loss": 0.3572, + "step": 118900 + }, + { + "epoch": 29.02, + "learning_rate": 0.0003553872465184461, + "loss": 0.4421, + "step": 118925 + }, + { + "epoch": 29.03, + "learning_rate": 0.00035535670657219645, + "loss": 0.4118, + "step": 118950 + }, + { + "epoch": 29.03, + "learning_rate": 0.00035532616662594676, + "loss": 0.4155, + "step": 118975 + }, + { + "epoch": 29.04, + "learning_rate": 0.00035529562667969706, + "loss": 0.3973, + "step": 119000 + }, + { + "epoch": 29.04, + "learning_rate": 0.00035526508673344736, + "loss": 0.3976, + "step": 119025 + }, + { + "epoch": 29.05, + "learning_rate": 0.00035523454678719767, + "loss": 0.401, + "step": 119050 + }, + { + "epoch": 29.06, + "learning_rate": 0.00035520400684094797, + "loss": 0.4373, + "step": 119075 + }, + { + "epoch": 29.06, + "learning_rate": 0.0003551734668946983, + "loss": 0.4238, + "step": 119100 + }, + { + "epoch": 29.07, + "learning_rate": 0.0003551429269484486, + "loss": 0.4185, + "step": 119125 + }, + { + "epoch": 29.08, + "learning_rate": 0.0003551123870021989, + "loss": 0.4378, + "step": 119150 + }, + { + "epoch": 29.08, + "learning_rate": 0.0003550818470559492, + "loss": 0.4117, + "step": 119175 + }, + { + "epoch": 29.09, + "learning_rate": 0.00035505130710969954, + "loss": 0.3991, + "step": 119200 + }, + { + "epoch": 29.09, + "learning_rate": 0.0003550207671634498, + "loss": 0.4033, + "step": 119225 + }, + { + "epoch": 29.1, + "learning_rate": 0.0003549902272172001, + "loss": 0.4718, + "step": 119250 + }, + { + "epoch": 29.11, + "learning_rate": 0.0003549596872709504, + "loss": 0.4167, + "step": 119275 + }, + { + "epoch": 29.11, + "learning_rate": 0.0003549291473247007, + "loss": 0.3826, + "step": 119300 + }, + { + "epoch": 29.12, + "learning_rate": 0.00035489860737845106, + "loss": 0.396, + "step": 119325 + }, + { + "epoch": 29.12, + "learning_rate": 0.00035486806743220136, + "loss": 0.4078, + "step": 119350 + }, + { + "epoch": 29.13, + "learning_rate": 0.0003548375274859516, + "loss": 0.4355, + "step": 119375 + }, + { + "epoch": 29.14, + "learning_rate": 0.0003548069875397019, + "loss": 0.4185, + "step": 119400 + }, + { + "epoch": 29.14, + "learning_rate": 0.0003547764475934522, + "loss": 0.4028, + "step": 119425 + }, + { + "epoch": 29.15, + "learning_rate": 0.0003547459076472026, + "loss": 0.4133, + "step": 119450 + }, + { + "epoch": 29.15, + "learning_rate": 0.0003547153677009529, + "loss": 0.4119, + "step": 119475 + }, + { + "epoch": 29.16, + "learning_rate": 0.0003546848277547032, + "loss": 0.4123, + "step": 119500 + }, + { + "epoch": 29.17, + "learning_rate": 0.0003546542878084535, + "loss": 0.4062, + "step": 119525 + }, + { + "epoch": 29.17, + "learning_rate": 0.00035462374786220373, + "loss": 0.3728, + "step": 119550 + }, + { + "epoch": 29.18, + "learning_rate": 0.00035459320791595404, + "loss": 0.4246, + "step": 119575 + }, + { + "epoch": 29.18, + "learning_rate": 0.0003545626679697044, + "loss": 0.4404, + "step": 119600 + }, + { + "epoch": 29.19, + "learning_rate": 0.0003545321280234547, + "loss": 0.3943, + "step": 119625 + }, + { + "epoch": 29.2, + "learning_rate": 0.000354501588077205, + "loss": 0.3738, + "step": 119650 + }, + { + "epoch": 29.2, + "learning_rate": 0.0003544710481309553, + "loss": 0.4253, + "step": 119675 + }, + { + "epoch": 29.21, + "learning_rate": 0.00035444050818470555, + "loss": 0.395, + "step": 119700 + }, + { + "epoch": 29.22, + "learning_rate": 0.0003544099682384559, + "loss": 0.4025, + "step": 119725 + }, + { + "epoch": 29.22, + "learning_rate": 0.0003543794282922062, + "loss": 0.3931, + "step": 119750 + }, + { + "epoch": 29.23, + "learning_rate": 0.0003543488883459565, + "loss": 0.4414, + "step": 119775 + }, + { + "epoch": 29.23, + "learning_rate": 0.0003543183483997068, + "loss": 0.4295, + "step": 119800 + }, + { + "epoch": 29.24, + "learning_rate": 0.0003542878084534571, + "loss": 0.4193, + "step": 119825 + }, + { + "epoch": 29.25, + "learning_rate": 0.00035425726850720743, + "loss": 0.43, + "step": 119850 + }, + { + "epoch": 29.25, + "learning_rate": 0.00035422672856095773, + "loss": 0.4229, + "step": 119875 + }, + { + "epoch": 29.26, + "learning_rate": 0.00035419618861470803, + "loss": 0.4609, + "step": 119900 + }, + { + "epoch": 29.26, + "learning_rate": 0.00035416564866845834, + "loss": 0.4193, + "step": 119925 + }, + { + "epoch": 29.27, + "learning_rate": 0.00035413510872220864, + "loss": 0.3949, + "step": 119950 + }, + { + "epoch": 29.28, + "learning_rate": 0.000354104568775959, + "loss": 0.441, + "step": 119975 + }, + { + "epoch": 29.28, + "learning_rate": 0.0003540740288297093, + "loss": 0.4378, + "step": 120000 + }, + { + "epoch": 29.28, + "eval_cer": 0.10296397441557241, + "eval_loss": 0.4238515794277191, + "eval_runtime": 148.9169, + "eval_samples_per_second": 28.157, + "eval_steps_per_second": 7.044, + "eval_wer": 0.4160522022838499, + "step": 120000 + }, + { + "epoch": 29.29, + "learning_rate": 0.00035404348888345955, + "loss": 0.4231, + "step": 120025 + }, + { + "epoch": 29.29, + "learning_rate": 0.00035401294893720985, + "loss": 0.4101, + "step": 120050 + }, + { + "epoch": 29.3, + "learning_rate": 0.00035398240899096016, + "loss": 0.4088, + "step": 120075 + }, + { + "epoch": 29.31, + "learning_rate": 0.0003539518690447105, + "loss": 0.3619, + "step": 120100 + }, + { + "epoch": 29.31, + "learning_rate": 0.0003539213290984608, + "loss": 0.4457, + "step": 120125 + }, + { + "epoch": 29.32, + "learning_rate": 0.0003538907891522111, + "loss": 0.3938, + "step": 120150 + }, + { + "epoch": 29.33, + "learning_rate": 0.00035386024920596137, + "loss": 0.4105, + "step": 120175 + }, + { + "epoch": 29.33, + "learning_rate": 0.0003538297092597117, + "loss": 0.371, + "step": 120200 + }, + { + "epoch": 29.34, + "learning_rate": 0.00035379916931346203, + "loss": 0.4368, + "step": 120225 + }, + { + "epoch": 29.34, + "learning_rate": 0.00035376862936721234, + "loss": 0.3776, + "step": 120250 + }, + { + "epoch": 29.35, + "learning_rate": 0.00035373808942096264, + "loss": 0.43, + "step": 120275 + }, + { + "epoch": 29.36, + "learning_rate": 0.00035370754947471294, + "loss": 0.3932, + "step": 120300 + }, + { + "epoch": 29.36, + "learning_rate": 0.0003536770095284632, + "loss": 0.4435, + "step": 120325 + }, + { + "epoch": 29.37, + "learning_rate": 0.00035364646958221355, + "loss": 0.3809, + "step": 120350 + }, + { + "epoch": 29.37, + "learning_rate": 0.00035361592963596385, + "loss": 0.4235, + "step": 120375 + }, + { + "epoch": 29.38, + "learning_rate": 0.00035358538968971416, + "loss": 0.4317, + "step": 120400 + }, + { + "epoch": 29.39, + "learning_rate": 0.00035355484974346446, + "loss": 0.4346, + "step": 120425 + }, + { + "epoch": 29.39, + "learning_rate": 0.00035352430979721476, + "loss": 0.4661, + "step": 120450 + }, + { + "epoch": 29.4, + "learning_rate": 0.0003534937698509651, + "loss": 0.4154, + "step": 120475 + }, + { + "epoch": 29.4, + "learning_rate": 0.00035346322990471537, + "loss": 0.4087, + "step": 120500 + }, + { + "epoch": 29.41, + "learning_rate": 0.00035343268995846567, + "loss": 0.4124, + "step": 120525 + }, + { + "epoch": 29.42, + "learning_rate": 0.000353402150012216, + "loss": 0.3801, + "step": 120550 + }, + { + "epoch": 29.42, + "learning_rate": 0.0003533716100659663, + "loss": 0.4197, + "step": 120575 + }, + { + "epoch": 29.43, + "learning_rate": 0.00035334107011971664, + "loss": 0.4203, + "step": 120600 + }, + { + "epoch": 29.44, + "learning_rate": 0.00035331053017346694, + "loss": 0.4267, + "step": 120625 + }, + { + "epoch": 29.44, + "learning_rate": 0.0003532799902272172, + "loss": 0.4088, + "step": 120650 + }, + { + "epoch": 29.45, + "learning_rate": 0.0003532494502809675, + "loss": 0.4504, + "step": 120675 + }, + { + "epoch": 29.45, + "learning_rate": 0.0003532189103347178, + "loss": 0.3981, + "step": 120700 + }, + { + "epoch": 29.46, + "learning_rate": 0.00035318837038846815, + "loss": 0.4532, + "step": 120725 + }, + { + "epoch": 29.47, + "learning_rate": 0.00035315783044221846, + "loss": 0.4276, + "step": 120750 + }, + { + "epoch": 29.47, + "learning_rate": 0.00035312729049596876, + "loss": 0.4059, + "step": 120775 + }, + { + "epoch": 29.48, + "learning_rate": 0.000353096750549719, + "loss": 0.376, + "step": 120800 + }, + { + "epoch": 29.48, + "learning_rate": 0.0003530662106034693, + "loss": 0.3947, + "step": 120825 + }, + { + "epoch": 29.49, + "learning_rate": 0.0003530356706572196, + "loss": 0.4219, + "step": 120850 + }, + { + "epoch": 29.5, + "learning_rate": 0.00035300513071097, + "loss": 0.3965, + "step": 120875 + }, + { + "epoch": 29.5, + "learning_rate": 0.0003529745907647203, + "loss": 0.426, + "step": 120900 + }, + { + "epoch": 29.51, + "learning_rate": 0.0003529440508184706, + "loss": 0.3877, + "step": 120925 + }, + { + "epoch": 29.51, + "learning_rate": 0.0003529135108722209, + "loss": 0.4478, + "step": 120950 + }, + { + "epoch": 29.52, + "learning_rate": 0.00035288297092597113, + "loss": 0.3986, + "step": 120975 + }, + { + "epoch": 29.53, + "learning_rate": 0.0003528524309797215, + "loss": 0.3896, + "step": 121000 + }, + { + "epoch": 29.53, + "learning_rate": 0.0003528218910334718, + "loss": 0.4218, + "step": 121025 + }, + { + "epoch": 29.54, + "learning_rate": 0.0003527913510872221, + "loss": 0.4153, + "step": 121050 + }, + { + "epoch": 29.54, + "learning_rate": 0.0003527608111409724, + "loss": 0.4367, + "step": 121075 + }, + { + "epoch": 29.55, + "learning_rate": 0.0003527302711947227, + "loss": 0.3787, + "step": 121100 + }, + { + "epoch": 29.56, + "learning_rate": 0.000352699731248473, + "loss": 0.4276, + "step": 121125 + }, + { + "epoch": 29.56, + "learning_rate": 0.0003526691913022233, + "loss": 0.4234, + "step": 121150 + }, + { + "epoch": 29.57, + "learning_rate": 0.0003526386513559736, + "loss": 0.4023, + "step": 121175 + }, + { + "epoch": 29.58, + "learning_rate": 0.0003526081114097239, + "loss": 0.4466, + "step": 121200 + }, + { + "epoch": 29.58, + "learning_rate": 0.0003525775714634742, + "loss": 0.421, + "step": 121225 + }, + { + "epoch": 29.59, + "learning_rate": 0.0003525470315172246, + "loss": 0.3944, + "step": 121250 + }, + { + "epoch": 29.59, + "learning_rate": 0.00035251649157097483, + "loss": 0.4337, + "step": 121275 + }, + { + "epoch": 29.6, + "learning_rate": 0.00035248595162472513, + "loss": 0.4379, + "step": 121300 + }, + { + "epoch": 29.61, + "learning_rate": 0.00035245541167847543, + "loss": 0.4306, + "step": 121325 + }, + { + "epoch": 29.61, + "learning_rate": 0.00035242487173222574, + "loss": 0.4094, + "step": 121350 + }, + { + "epoch": 29.62, + "learning_rate": 0.0003523943317859761, + "loss": 0.4306, + "step": 121375 + }, + { + "epoch": 29.62, + "learning_rate": 0.0003523637918397264, + "loss": 0.4026, + "step": 121400 + }, + { + "epoch": 29.63, + "learning_rate": 0.00035233325189347665, + "loss": 0.3812, + "step": 121425 + }, + { + "epoch": 29.64, + "learning_rate": 0.00035230271194722695, + "loss": 0.4086, + "step": 121450 + }, + { + "epoch": 29.64, + "learning_rate": 0.00035227217200097725, + "loss": 0.4389, + "step": 121475 + }, + { + "epoch": 29.65, + "learning_rate": 0.0003522416320547276, + "loss": 0.436, + "step": 121500 + }, + { + "epoch": 29.65, + "learning_rate": 0.0003522110921084779, + "loss": 0.4004, + "step": 121525 + }, + { + "epoch": 29.66, + "learning_rate": 0.0003521805521622282, + "loss": 0.4273, + "step": 121550 + }, + { + "epoch": 29.67, + "learning_rate": 0.0003521500122159785, + "loss": 0.3943, + "step": 121575 + }, + { + "epoch": 29.67, + "learning_rate": 0.00035211947226972877, + "loss": 0.4429, + "step": 121600 + }, + { + "epoch": 29.68, + "learning_rate": 0.00035208893232347913, + "loss": 0.424, + "step": 121625 + }, + { + "epoch": 29.69, + "learning_rate": 0.00035205839237722943, + "loss": 0.3805, + "step": 121650 + }, + { + "epoch": 29.69, + "learning_rate": 0.00035202785243097974, + "loss": 0.439, + "step": 121675 + }, + { + "epoch": 29.7, + "learning_rate": 0.00035199731248473004, + "loss": 0.4186, + "step": 121700 + }, + { + "epoch": 29.7, + "learning_rate": 0.00035196677253848034, + "loss": 0.4109, + "step": 121725 + }, + { + "epoch": 29.71, + "learning_rate": 0.00035193623259223065, + "loss": 0.4328, + "step": 121750 + }, + { + "epoch": 29.72, + "learning_rate": 0.00035190569264598095, + "loss": 0.4071, + "step": 121775 + }, + { + "epoch": 29.72, + "learning_rate": 0.00035187515269973125, + "loss": 0.4389, + "step": 121800 + }, + { + "epoch": 29.73, + "learning_rate": 0.00035184461275348156, + "loss": 0.418, + "step": 121825 + }, + { + "epoch": 29.73, + "learning_rate": 0.00035181407280723186, + "loss": 0.4152, + "step": 121850 + }, + { + "epoch": 29.74, + "learning_rate": 0.0003517835328609822, + "loss": 0.4223, + "step": 121875 + }, + { + "epoch": 29.75, + "learning_rate": 0.00035175299291473247, + "loss": 0.3847, + "step": 121900 + }, + { + "epoch": 29.75, + "learning_rate": 0.00035172245296848277, + "loss": 0.4277, + "step": 121925 + }, + { + "epoch": 29.76, + "learning_rate": 0.00035169191302223307, + "loss": 0.4348, + "step": 121950 + }, + { + "epoch": 29.76, + "learning_rate": 0.0003516613730759834, + "loss": 0.4434, + "step": 121975 + }, + { + "epoch": 29.77, + "learning_rate": 0.00035163083312973373, + "loss": 0.3893, + "step": 122000 + }, + { + "epoch": 29.78, + "learning_rate": 0.00035160029318348404, + "loss": 0.4229, + "step": 122025 + }, + { + "epoch": 29.78, + "learning_rate": 0.00035156975323723434, + "loss": 0.4222, + "step": 122050 + }, + { + "epoch": 29.79, + "learning_rate": 0.0003515392132909846, + "loss": 0.4246, + "step": 122075 + }, + { + "epoch": 29.8, + "learning_rate": 0.0003515086733447349, + "loss": 0.4318, + "step": 122100 + }, + { + "epoch": 29.8, + "learning_rate": 0.00035147813339848525, + "loss": 0.4136, + "step": 122125 + }, + { + "epoch": 29.81, + "learning_rate": 0.00035144759345223555, + "loss": 0.438, + "step": 122150 + }, + { + "epoch": 29.81, + "learning_rate": 0.00035141705350598586, + "loss": 0.4111, + "step": 122175 + }, + { + "epoch": 29.82, + "learning_rate": 0.00035138651355973616, + "loss": 0.449, + "step": 122200 + }, + { + "epoch": 29.83, + "learning_rate": 0.0003513559736134864, + "loss": 0.4086, + "step": 122225 + }, + { + "epoch": 29.83, + "learning_rate": 0.0003513254336672367, + "loss": 0.4543, + "step": 122250 + }, + { + "epoch": 29.84, + "learning_rate": 0.00035129489372098707, + "loss": 0.4528, + "step": 122275 + }, + { + "epoch": 29.84, + "learning_rate": 0.00035126435377473737, + "loss": 0.4258, + "step": 122300 + }, + { + "epoch": 29.85, + "learning_rate": 0.0003512338138284877, + "loss": 0.4424, + "step": 122325 + }, + { + "epoch": 29.86, + "learning_rate": 0.000351203273882238, + "loss": 0.4306, + "step": 122350 + }, + { + "epoch": 29.86, + "learning_rate": 0.00035117273393598823, + "loss": 0.4086, + "step": 122375 + }, + { + "epoch": 29.87, + "learning_rate": 0.0003511421939897386, + "loss": 0.4361, + "step": 122400 + }, + { + "epoch": 29.87, + "learning_rate": 0.0003511116540434889, + "loss": 0.4252, + "step": 122425 + }, + { + "epoch": 29.88, + "learning_rate": 0.0003510811140972392, + "loss": 0.4612, + "step": 122450 + }, + { + "epoch": 29.89, + "learning_rate": 0.0003510505741509895, + "loss": 0.4051, + "step": 122475 + }, + { + "epoch": 29.89, + "learning_rate": 0.0003510200342047398, + "loss": 0.4299, + "step": 122500 + }, + { + "epoch": 29.9, + "learning_rate": 0.00035098949425849016, + "loss": 0.4407, + "step": 122525 + }, + { + "epoch": 29.9, + "learning_rate": 0.0003509589543122404, + "loss": 0.3986, + "step": 122550 + }, + { + "epoch": 29.91, + "learning_rate": 0.0003509284143659907, + "loss": 0.4274, + "step": 122575 + }, + { + "epoch": 29.92, + "learning_rate": 0.000350897874419741, + "loss": 0.4169, + "step": 122600 + }, + { + "epoch": 29.92, + "learning_rate": 0.0003508673344734913, + "loss": 0.4529, + "step": 122625 + }, + { + "epoch": 29.93, + "learning_rate": 0.0003508367945272417, + "loss": 0.3713, + "step": 122650 + }, + { + "epoch": 29.94, + "learning_rate": 0.000350806254580992, + "loss": 0.4434, + "step": 122675 + }, + { + "epoch": 29.94, + "learning_rate": 0.0003507757146347422, + "loss": 0.4097, + "step": 122700 + }, + { + "epoch": 29.95, + "learning_rate": 0.00035074517468849253, + "loss": 0.4375, + "step": 122725 + }, + { + "epoch": 29.95, + "learning_rate": 0.00035071463474224283, + "loss": 0.4445, + "step": 122750 + }, + { + "epoch": 29.96, + "learning_rate": 0.0003506840947959932, + "loss": 0.4342, + "step": 122775 + }, + { + "epoch": 29.97, + "learning_rate": 0.0003506535548497435, + "loss": 0.3904, + "step": 122800 + }, + { + "epoch": 29.97, + "learning_rate": 0.0003506230149034938, + "loss": 0.409, + "step": 122825 + }, + { + "epoch": 29.98, + "learning_rate": 0.00035059247495724405, + "loss": 0.4287, + "step": 122850 + }, + { + "epoch": 29.98, + "learning_rate": 0.00035056193501099435, + "loss": 0.4229, + "step": 122875 + }, + { + "epoch": 29.99, + "learning_rate": 0.0003505313950647447, + "loss": 0.3857, + "step": 122900 + }, + { + "epoch": 30.0, + "learning_rate": 0.000350500855118495, + "loss": 0.4666, + "step": 122925 + }, + { + "epoch": 30.0, + "learning_rate": 0.0003504703151722453, + "loss": 0.4071, + "step": 122950 + }, + { + "epoch": 30.01, + "learning_rate": 0.0003504397752259956, + "loss": 0.4184, + "step": 122975 + }, + { + "epoch": 30.01, + "learning_rate": 0.0003504104568775959, + "loss": 0.4062, + "step": 123000 + }, + { + "epoch": 30.01, + "eval_cer": 0.10116218186298163, + "eval_loss": 0.41296249628067017, + "eval_runtime": 148.9733, + "eval_samples_per_second": 28.146, + "eval_steps_per_second": 7.042, + "eval_wer": 0.41706362153344206, + "step": 123000 + }, + { + "epoch": 30.02, + "learning_rate": 0.0003503799169313462, + "loss": 0.4304, + "step": 123025 + }, + { + "epoch": 30.03, + "learning_rate": 0.0003503493769850965, + "loss": 0.4434, + "step": 123050 + }, + { + "epoch": 30.03, + "learning_rate": 0.00035031883703884683, + "loss": 0.408, + "step": 123075 + }, + { + "epoch": 30.04, + "learning_rate": 0.00035028951869044714, + "loss": 0.4147, + "step": 123100 + }, + { + "epoch": 30.05, + "learning_rate": 0.00035025897874419744, + "loss": 0.3929, + "step": 123125 + }, + { + "epoch": 30.05, + "learning_rate": 0.00035022843879794775, + "loss": 0.4164, + "step": 123150 + }, + { + "epoch": 30.06, + "learning_rate": 0.000350197898851698, + "loss": 0.4251, + "step": 123175 + }, + { + "epoch": 30.06, + "learning_rate": 0.0003501673589054483, + "loss": 0.3855, + "step": 123200 + }, + { + "epoch": 30.07, + "learning_rate": 0.00035013681895919866, + "loss": 0.4134, + "step": 123225 + }, + { + "epoch": 30.08, + "learning_rate": 0.00035010627901294896, + "loss": 0.4397, + "step": 123250 + }, + { + "epoch": 30.08, + "learning_rate": 0.00035007573906669926, + "loss": 0.4235, + "step": 123275 + }, + { + "epoch": 30.09, + "learning_rate": 0.00035004519912044957, + "loss": 0.3841, + "step": 123300 + }, + { + "epoch": 30.09, + "learning_rate": 0.0003500146591741998, + "loss": 0.402, + "step": 123325 + }, + { + "epoch": 30.1, + "learning_rate": 0.0003499841192279502, + "loss": 0.4278, + "step": 123350 + }, + { + "epoch": 30.11, + "learning_rate": 0.0003499535792817005, + "loss": 0.4193, + "step": 123375 + }, + { + "epoch": 30.11, + "learning_rate": 0.0003499230393354508, + "loss": 0.3789, + "step": 123400 + }, + { + "epoch": 30.12, + "learning_rate": 0.0003498924993892011, + "loss": 0.4279, + "step": 123425 + }, + { + "epoch": 30.12, + "learning_rate": 0.0003498619594429514, + "loss": 0.3855, + "step": 123450 + }, + { + "epoch": 30.13, + "learning_rate": 0.00034983141949670174, + "loss": 0.4093, + "step": 123475 + }, + { + "epoch": 30.14, + "learning_rate": 0.000349800879550452, + "loss": 0.3989, + "step": 123500 + }, + { + "epoch": 30.14, + "learning_rate": 0.0003497703396042023, + "loss": 0.412, + "step": 123525 + }, + { + "epoch": 30.15, + "learning_rate": 0.0003497397996579526, + "loss": 0.4134, + "step": 123550 + }, + { + "epoch": 30.15, + "learning_rate": 0.0003497092597117029, + "loss": 0.4041, + "step": 123575 + }, + { + "epoch": 30.16, + "learning_rate": 0.00034967871976545326, + "loss": 0.4094, + "step": 123600 + }, + { + "epoch": 30.17, + "learning_rate": 0.00034964817981920356, + "loss": 0.4239, + "step": 123625 + }, + { + "epoch": 30.17, + "learning_rate": 0.0003496176398729538, + "loss": 0.3698, + "step": 123650 + }, + { + "epoch": 30.18, + "learning_rate": 0.0003495870999267041, + "loss": 0.3939, + "step": 123675 + }, + { + "epoch": 30.19, + "learning_rate": 0.0003495565599804544, + "loss": 0.4228, + "step": 123700 + }, + { + "epoch": 30.19, + "learning_rate": 0.0003495260200342047, + "loss": 0.4043, + "step": 123725 + }, + { + "epoch": 30.2, + "learning_rate": 0.0003494954800879551, + "loss": 0.401, + "step": 123750 + }, + { + "epoch": 30.2, + "learning_rate": 0.0003494649401417054, + "loss": 0.3792, + "step": 123775 + }, + { + "epoch": 30.21, + "learning_rate": 0.00034943440019545563, + "loss": 0.3988, + "step": 123800 + }, + { + "epoch": 30.22, + "learning_rate": 0.00034940386024920594, + "loss": 0.432, + "step": 123825 + }, + { + "epoch": 30.22, + "learning_rate": 0.00034937332030295624, + "loss": 0.4485, + "step": 123850 + }, + { + "epoch": 30.23, + "learning_rate": 0.0003493427803567066, + "loss": 0.4091, + "step": 123875 + }, + { + "epoch": 30.23, + "learning_rate": 0.0003493122404104569, + "loss": 0.3819, + "step": 123900 + }, + { + "epoch": 30.24, + "learning_rate": 0.0003492817004642072, + "loss": 0.4148, + "step": 123925 + }, + { + "epoch": 30.25, + "learning_rate": 0.0003492511605179575, + "loss": 0.4096, + "step": 123950 + }, + { + "epoch": 30.25, + "learning_rate": 0.00034922062057170776, + "loss": 0.3938, + "step": 123975 + }, + { + "epoch": 30.26, + "learning_rate": 0.0003491900806254581, + "loss": 0.4216, + "step": 124000 + }, + { + "epoch": 30.26, + "learning_rate": 0.0003491595406792084, + "loss": 0.4014, + "step": 124025 + }, + { + "epoch": 30.27, + "learning_rate": 0.0003491290007329587, + "loss": 0.4154, + "step": 124050 + }, + { + "epoch": 30.28, + "learning_rate": 0.000349098460786709, + "loss": 0.426, + "step": 124075 + }, + { + "epoch": 30.28, + "learning_rate": 0.00034906792084045933, + "loss": 0.4188, + "step": 124100 + }, + { + "epoch": 30.29, + "learning_rate": 0.00034903738089420963, + "loss": 0.3845, + "step": 124125 + }, + { + "epoch": 30.3, + "learning_rate": 0.00034900684094795993, + "loss": 0.4222, + "step": 124150 + }, + { + "epoch": 30.3, + "learning_rate": 0.00034897630100171024, + "loss": 0.411, + "step": 124175 + }, + { + "epoch": 30.31, + "learning_rate": 0.00034894576105546054, + "loss": 0.4288, + "step": 124200 + }, + { + "epoch": 30.31, + "learning_rate": 0.00034891522110921085, + "loss": 0.4252, + "step": 124225 + }, + { + "epoch": 30.32, + "learning_rate": 0.0003488846811629612, + "loss": 0.4216, + "step": 124250 + }, + { + "epoch": 30.33, + "learning_rate": 0.00034885414121671145, + "loss": 0.4033, + "step": 124275 + }, + { + "epoch": 30.33, + "learning_rate": 0.00034882360127046176, + "loss": 0.4382, + "step": 124300 + }, + { + "epoch": 30.34, + "learning_rate": 0.00034879306132421206, + "loss": 0.4194, + "step": 124325 + }, + { + "epoch": 30.34, + "learning_rate": 0.00034876252137796236, + "loss": 0.3948, + "step": 124350 + }, + { + "epoch": 30.35, + "learning_rate": 0.0003487319814317127, + "loss": 0.4072, + "step": 124375 + }, + { + "epoch": 30.36, + "learning_rate": 0.000348701441485463, + "loss": 0.3921, + "step": 124400 + }, + { + "epoch": 30.36, + "learning_rate": 0.0003486709015392133, + "loss": 0.3927, + "step": 124425 + }, + { + "epoch": 30.37, + "learning_rate": 0.0003486403615929636, + "loss": 0.3803, + "step": 124450 + }, + { + "epoch": 30.37, + "learning_rate": 0.0003486098216467139, + "loss": 0.4021, + "step": 124475 + }, + { + "epoch": 30.38, + "learning_rate": 0.00034857928170046424, + "loss": 0.4273, + "step": 124500 + }, + { + "epoch": 30.39, + "learning_rate": 0.00034854874175421454, + "loss": 0.421, + "step": 124525 + }, + { + "epoch": 30.39, + "learning_rate": 0.00034851820180796484, + "loss": 0.4059, + "step": 124550 + }, + { + "epoch": 30.4, + "learning_rate": 0.00034848766186171515, + "loss": 0.4006, + "step": 124575 + }, + { + "epoch": 30.41, + "learning_rate": 0.0003484571219154654, + "loss": 0.4126, + "step": 124600 + }, + { + "epoch": 30.41, + "learning_rate": 0.00034842658196921575, + "loss": 0.4117, + "step": 124625 + }, + { + "epoch": 30.42, + "learning_rate": 0.00034839604202296606, + "loss": 0.4357, + "step": 124650 + }, + { + "epoch": 30.42, + "learning_rate": 0.00034836550207671636, + "loss": 0.3873, + "step": 124675 + }, + { + "epoch": 30.43, + "learning_rate": 0.00034833496213046666, + "loss": 0.383, + "step": 124700 + }, + { + "epoch": 30.44, + "learning_rate": 0.00034830442218421697, + "loss": 0.3809, + "step": 124725 + }, + { + "epoch": 30.44, + "learning_rate": 0.00034827388223796727, + "loss": 0.3976, + "step": 124750 + }, + { + "epoch": 30.45, + "learning_rate": 0.00034824334229171757, + "loss": 0.3906, + "step": 124775 + }, + { + "epoch": 30.45, + "learning_rate": 0.0003482128023454679, + "loss": 0.3888, + "step": 124800 + }, + { + "epoch": 30.46, + "learning_rate": 0.0003481822623992182, + "loss": 0.4004, + "step": 124825 + }, + { + "epoch": 30.47, + "learning_rate": 0.0003481517224529685, + "loss": 0.4036, + "step": 124850 + }, + { + "epoch": 30.47, + "learning_rate": 0.00034812118250671884, + "loss": 0.4037, + "step": 124875 + }, + { + "epoch": 30.48, + "learning_rate": 0.00034809064256046914, + "loss": 0.396, + "step": 124900 + }, + { + "epoch": 30.48, + "learning_rate": 0.0003480601026142194, + "loss": 0.4076, + "step": 124925 + }, + { + "epoch": 30.49, + "learning_rate": 0.0003480295626679697, + "loss": 0.4193, + "step": 124950 + }, + { + "epoch": 30.5, + "learning_rate": 0.00034799902272172, + "loss": 0.4146, + "step": 124975 + }, + { + "epoch": 30.5, + "learning_rate": 0.0003479684827754703, + "loss": 0.4226, + "step": 125000 + }, + { + "epoch": 30.51, + "learning_rate": 0.00034793794282922066, + "loss": 0.3734, + "step": 125025 + }, + { + "epoch": 30.51, + "learning_rate": 0.00034790740288297096, + "loss": 0.3793, + "step": 125050 + }, + { + "epoch": 30.52, + "learning_rate": 0.0003478768629367212, + "loss": 0.4013, + "step": 125075 + }, + { + "epoch": 30.53, + "learning_rate": 0.0003478463229904715, + "loss": 0.4157, + "step": 125100 + }, + { + "epoch": 30.53, + "learning_rate": 0.0003478157830442218, + "loss": 0.4507, + "step": 125125 + }, + { + "epoch": 30.54, + "learning_rate": 0.0003477852430979722, + "loss": 0.4108, + "step": 125150 + }, + { + "epoch": 30.55, + "learning_rate": 0.0003477547031517225, + "loss": 0.4143, + "step": 125175 + }, + { + "epoch": 30.55, + "learning_rate": 0.0003477241632054728, + "loss": 0.4348, + "step": 125200 + }, + { + "epoch": 30.56, + "learning_rate": 0.00034769362325922303, + "loss": 0.4, + "step": 125225 + }, + { + "epoch": 30.56, + "learning_rate": 0.00034766308331297334, + "loss": 0.4353, + "step": 125250 + }, + { + "epoch": 30.57, + "learning_rate": 0.0003476325433667237, + "loss": 0.4229, + "step": 125275 + }, + { + "epoch": 30.58, + "learning_rate": 0.000347602003420474, + "loss": 0.3911, + "step": 125300 + }, + { + "epoch": 30.58, + "learning_rate": 0.0003475714634742243, + "loss": 0.3888, + "step": 125325 + }, + { + "epoch": 30.59, + "learning_rate": 0.0003475409235279746, + "loss": 0.4081, + "step": 125350 + }, + { + "epoch": 30.59, + "learning_rate": 0.00034751038358172485, + "loss": 0.3961, + "step": 125375 + }, + { + "epoch": 30.6, + "learning_rate": 0.0003474798436354752, + "loss": 0.3993, + "step": 125400 + }, + { + "epoch": 30.61, + "learning_rate": 0.0003474493036892255, + "loss": 0.3694, + "step": 125425 + }, + { + "epoch": 30.61, + "learning_rate": 0.0003474187637429758, + "loss": 0.4185, + "step": 125450 + }, + { + "epoch": 30.62, + "learning_rate": 0.0003473882237967261, + "loss": 0.3864, + "step": 125475 + }, + { + "epoch": 30.62, + "learning_rate": 0.0003473576838504764, + "loss": 0.408, + "step": 125500 + }, + { + "epoch": 30.63, + "learning_rate": 0.0003473271439042268, + "loss": 0.4256, + "step": 125525 + }, + { + "epoch": 30.64, + "learning_rate": 0.00034729660395797703, + "loss": 0.4471, + "step": 125550 + }, + { + "epoch": 30.64, + "learning_rate": 0.00034726606401172733, + "loss": 0.422, + "step": 125575 + }, + { + "epoch": 30.65, + "learning_rate": 0.00034723552406547764, + "loss": 0.4016, + "step": 125600 + }, + { + "epoch": 30.66, + "learning_rate": 0.00034720498411922794, + "loss": 0.3924, + "step": 125625 + }, + { + "epoch": 30.66, + "learning_rate": 0.0003471744441729783, + "loss": 0.3669, + "step": 125650 + }, + { + "epoch": 30.67, + "learning_rate": 0.0003471439042267286, + "loss": 0.4027, + "step": 125675 + }, + { + "epoch": 30.67, + "learning_rate": 0.00034711336428047885, + "loss": 0.4206, + "step": 125700 + }, + { + "epoch": 30.68, + "learning_rate": 0.00034708282433422915, + "loss": 0.4272, + "step": 125725 + }, + { + "epoch": 30.69, + "learning_rate": 0.00034705228438797946, + "loss": 0.3985, + "step": 125750 + }, + { + "epoch": 30.69, + "learning_rate": 0.0003470217444417298, + "loss": 0.4368, + "step": 125775 + }, + { + "epoch": 30.7, + "learning_rate": 0.0003469912044954801, + "loss": 0.4344, + "step": 125800 + }, + { + "epoch": 30.7, + "learning_rate": 0.0003469606645492304, + "loss": 0.399, + "step": 125825 + }, + { + "epoch": 30.71, + "learning_rate": 0.00034693012460298067, + "loss": 0.3887, + "step": 125850 + }, + { + "epoch": 30.72, + "learning_rate": 0.000346899584656731, + "loss": 0.4529, + "step": 125875 + }, + { + "epoch": 30.72, + "learning_rate": 0.00034686904471048133, + "loss": 0.4415, + "step": 125900 + }, + { + "epoch": 30.73, + "learning_rate": 0.00034683850476423164, + "loss": 0.4205, + "step": 125925 + }, + { + "epoch": 30.73, + "learning_rate": 0.00034680796481798194, + "loss": 0.4042, + "step": 125950 + }, + { + "epoch": 30.74, + "learning_rate": 0.00034677742487173224, + "loss": 0.4339, + "step": 125975 + }, + { + "epoch": 30.75, + "learning_rate": 0.00034674688492548255, + "loss": 0.3903, + "step": 126000 + }, + { + "epoch": 30.75, + "eval_cer": 0.10059751753026087, + "eval_loss": 0.41336575150489807, + "eval_runtime": 149.0037, + "eval_samples_per_second": 28.14, + "eval_steps_per_second": 7.04, + "eval_wer": 0.4123654159869494, + "step": 126000 + }, + { + "epoch": 30.75, + "learning_rate": 0.00034671634497923285, + "loss": 0.4048, + "step": 126025 + }, + { + "epoch": 30.76, + "learning_rate": 0.00034668580503298315, + "loss": 0.4314, + "step": 126050 + }, + { + "epoch": 30.77, + "learning_rate": 0.00034665526508673346, + "loss": 0.4407, + "step": 126075 + }, + { + "epoch": 30.77, + "learning_rate": 0.00034662472514048376, + "loss": 0.4225, + "step": 126100 + }, + { + "epoch": 30.78, + "learning_rate": 0.00034659418519423406, + "loss": 0.4267, + "step": 126125 + }, + { + "epoch": 30.78, + "learning_rate": 0.0003465636452479844, + "loss": 0.3801, + "step": 126150 + }, + { + "epoch": 30.79, + "learning_rate": 0.00034653310530173467, + "loss": 0.4037, + "step": 126175 + }, + { + "epoch": 30.8, + "learning_rate": 0.00034650256535548497, + "loss": 0.4098, + "step": 126200 + }, + { + "epoch": 30.8, + "learning_rate": 0.0003464720254092353, + "loss": 0.3993, + "step": 126225 + }, + { + "epoch": 30.81, + "learning_rate": 0.0003464414854629856, + "loss": 0.4666, + "step": 126250 + }, + { + "epoch": 30.81, + "learning_rate": 0.00034641094551673594, + "loss": 0.4039, + "step": 126275 + }, + { + "epoch": 30.82, + "learning_rate": 0.00034638040557048624, + "loss": 0.4366, + "step": 126300 + }, + { + "epoch": 30.83, + "learning_rate": 0.0003463498656242365, + "loss": 0.3941, + "step": 126325 + }, + { + "epoch": 30.83, + "learning_rate": 0.0003463193256779868, + "loss": 0.3714, + "step": 126350 + }, + { + "epoch": 30.84, + "learning_rate": 0.0003462887857317371, + "loss": 0.437, + "step": 126375 + }, + { + "epoch": 30.84, + "learning_rate": 0.0003462582457854874, + "loss": 0.4148, + "step": 126400 + }, + { + "epoch": 30.85, + "learning_rate": 0.00034622770583923776, + "loss": 0.4434, + "step": 126425 + }, + { + "epoch": 30.86, + "learning_rate": 0.00034619716589298806, + "loss": 0.4539, + "step": 126450 + }, + { + "epoch": 30.86, + "learning_rate": 0.00034616662594673836, + "loss": 0.4064, + "step": 126475 + }, + { + "epoch": 30.87, + "learning_rate": 0.0003461360860004886, + "loss": 0.4261, + "step": 126500 + }, + { + "epoch": 30.87, + "learning_rate": 0.0003461055460542389, + "loss": 0.4017, + "step": 126525 + }, + { + "epoch": 30.88, + "learning_rate": 0.0003460750061079893, + "loss": 0.4168, + "step": 126550 + }, + { + "epoch": 30.89, + "learning_rate": 0.0003460444661617396, + "loss": 0.4056, + "step": 126575 + }, + { + "epoch": 30.89, + "learning_rate": 0.0003460139262154899, + "loss": 0.3872, + "step": 126600 + }, + { + "epoch": 30.9, + "learning_rate": 0.0003459833862692402, + "loss": 0.4327, + "step": 126625 + }, + { + "epoch": 30.91, + "learning_rate": 0.00034595284632299043, + "loss": 0.4261, + "step": 126650 + }, + { + "epoch": 30.91, + "learning_rate": 0.0003459223063767408, + "loss": 0.3929, + "step": 126675 + }, + { + "epoch": 30.92, + "learning_rate": 0.0003458917664304911, + "loss": 0.3899, + "step": 126700 + }, + { + "epoch": 30.92, + "learning_rate": 0.0003458612264842414, + "loss": 0.4076, + "step": 126725 + }, + { + "epoch": 30.93, + "learning_rate": 0.0003458306865379917, + "loss": 0.3944, + "step": 126750 + }, + { + "epoch": 30.94, + "learning_rate": 0.000345800146591742, + "loss": 0.4055, + "step": 126775 + }, + { + "epoch": 30.94, + "learning_rate": 0.0003457696066454923, + "loss": 0.4143, + "step": 126800 + }, + { + "epoch": 30.95, + "learning_rate": 0.0003457390666992426, + "loss": 0.4015, + "step": 126825 + }, + { + "epoch": 30.95, + "learning_rate": 0.0003457085267529929, + "loss": 0.4083, + "step": 126850 + }, + { + "epoch": 30.96, + "learning_rate": 0.0003456779868067432, + "loss": 0.4116, + "step": 126875 + }, + { + "epoch": 30.97, + "learning_rate": 0.0003456474468604935, + "loss": 0.4026, + "step": 126900 + }, + { + "epoch": 30.97, + "learning_rate": 0.0003456169069142439, + "loss": 0.3899, + "step": 126925 + }, + { + "epoch": 30.98, + "learning_rate": 0.0003455863669679942, + "loss": 0.427, + "step": 126950 + }, + { + "epoch": 30.98, + "learning_rate": 0.00034555582702174443, + "loss": 0.4051, + "step": 126975 + }, + { + "epoch": 30.99, + "learning_rate": 0.00034552528707549473, + "loss": 0.444, + "step": 127000 + }, + { + "epoch": 31.0, + "learning_rate": 0.00034549474712924504, + "loss": 0.3934, + "step": 127025 + }, + { + "epoch": 31.0, + "learning_rate": 0.0003454642071829954, + "loss": 0.394, + "step": 127050 + }, + { + "epoch": 31.01, + "learning_rate": 0.0003454336672367457, + "loss": 0.3947, + "step": 127075 + }, + { + "epoch": 31.02, + "learning_rate": 0.000345403127290496, + "loss": 0.4078, + "step": 127100 + }, + { + "epoch": 31.02, + "learning_rate": 0.00034537258734424625, + "loss": 0.4122, + "step": 127125 + }, + { + "epoch": 31.03, + "learning_rate": 0.00034534204739799655, + "loss": 0.424, + "step": 127150 + }, + { + "epoch": 31.03, + "learning_rate": 0.0003453115074517469, + "loss": 0.3971, + "step": 127175 + }, + { + "epoch": 31.04, + "learning_rate": 0.0003452809675054972, + "loss": 0.3677, + "step": 127200 + }, + { + "epoch": 31.05, + "learning_rate": 0.0003452504275592475, + "loss": 0.3823, + "step": 127225 + }, + { + "epoch": 31.05, + "learning_rate": 0.0003452198876129978, + "loss": 0.389, + "step": 127250 + }, + { + "epoch": 31.06, + "learning_rate": 0.00034518934766674807, + "loss": 0.4075, + "step": 127275 + }, + { + "epoch": 31.06, + "learning_rate": 0.00034515880772049843, + "loss": 0.4156, + "step": 127300 + }, + { + "epoch": 31.07, + "learning_rate": 0.00034512826777424873, + "loss": 0.402, + "step": 127325 + }, + { + "epoch": 31.08, + "learning_rate": 0.00034509772782799903, + "loss": 0.4084, + "step": 127350 + }, + { + "epoch": 31.08, + "learning_rate": 0.00034506718788174934, + "loss": 0.3867, + "step": 127375 + }, + { + "epoch": 31.09, + "learning_rate": 0.00034503664793549964, + "loss": 0.4277, + "step": 127400 + }, + { + "epoch": 31.09, + "learning_rate": 0.00034500610798925, + "loss": 0.372, + "step": 127425 + }, + { + "epoch": 31.1, + "learning_rate": 0.00034497556804300025, + "loss": 0.4244, + "step": 127450 + }, + { + "epoch": 31.11, + "learning_rate": 0.00034494502809675055, + "loss": 0.3852, + "step": 127475 + }, + { + "epoch": 31.11, + "learning_rate": 0.00034491448815050085, + "loss": 0.4092, + "step": 127500 + }, + { + "epoch": 31.12, + "learning_rate": 0.00034488394820425116, + "loss": 0.3903, + "step": 127525 + }, + { + "epoch": 31.12, + "learning_rate": 0.0003448534082580015, + "loss": 0.4273, + "step": 127550 + }, + { + "epoch": 31.13, + "learning_rate": 0.0003448228683117518, + "loss": 0.3588, + "step": 127575 + }, + { + "epoch": 31.14, + "learning_rate": 0.00034479232836550207, + "loss": 0.416, + "step": 127600 + }, + { + "epoch": 31.14, + "learning_rate": 0.00034476178841925237, + "loss": 0.4172, + "step": 127625 + }, + { + "epoch": 31.15, + "learning_rate": 0.0003447312484730027, + "loss": 0.424, + "step": 127650 + }, + { + "epoch": 31.16, + "learning_rate": 0.000344700708526753, + "loss": 0.3827, + "step": 127675 + }, + { + "epoch": 31.16, + "learning_rate": 0.00034467016858050334, + "loss": 0.4112, + "step": 127700 + }, + { + "epoch": 31.17, + "learning_rate": 0.00034463962863425364, + "loss": 0.3899, + "step": 127725 + }, + { + "epoch": 31.17, + "learning_rate": 0.0003446090886880039, + "loss": 0.4096, + "step": 127750 + }, + { + "epoch": 31.18, + "learning_rate": 0.0003445785487417542, + "loss": 0.3704, + "step": 127775 + }, + { + "epoch": 31.19, + "learning_rate": 0.0003445480087955045, + "loss": 0.3892, + "step": 127800 + }, + { + "epoch": 31.19, + "learning_rate": 0.00034451746884925485, + "loss": 0.4285, + "step": 127825 + }, + { + "epoch": 31.2, + "learning_rate": 0.00034448692890300516, + "loss": 0.3989, + "step": 127850 + }, + { + "epoch": 31.2, + "learning_rate": 0.00034445638895675546, + "loss": 0.3909, + "step": 127875 + }, + { + "epoch": 31.21, + "learning_rate": 0.00034442584901050576, + "loss": 0.3992, + "step": 127900 + }, + { + "epoch": 31.22, + "learning_rate": 0.000344395309064256, + "loss": 0.4138, + "step": 127925 + }, + { + "epoch": 31.22, + "learning_rate": 0.00034436476911800637, + "loss": 0.396, + "step": 127950 + }, + { + "epoch": 31.23, + "learning_rate": 0.00034433422917175667, + "loss": 0.3903, + "step": 127975 + }, + { + "epoch": 31.23, + "learning_rate": 0.000344303689225507, + "loss": 0.424, + "step": 128000 + }, + { + "epoch": 31.24, + "learning_rate": 0.0003442731492792573, + "loss": 0.415, + "step": 128025 + }, + { + "epoch": 31.25, + "learning_rate": 0.0003442426093330076, + "loss": 0.3974, + "step": 128050 + }, + { + "epoch": 31.25, + "learning_rate": 0.0003442120693867579, + "loss": 0.3778, + "step": 128075 + }, + { + "epoch": 31.26, + "learning_rate": 0.0003441815294405082, + "loss": 0.3974, + "step": 128100 + }, + { + "epoch": 31.27, + "learning_rate": 0.0003441509894942585, + "loss": 0.3574, + "step": 128125 + }, + { + "epoch": 31.27, + "learning_rate": 0.0003441204495480088, + "loss": 0.3975, + "step": 128150 + }, + { + "epoch": 31.28, + "learning_rate": 0.0003440899096017591, + "loss": 0.4121, + "step": 128175 + }, + { + "epoch": 31.28, + "learning_rate": 0.00034405936965550946, + "loss": 0.3711, + "step": 128200 + }, + { + "epoch": 31.29, + "learning_rate": 0.0003440288297092597, + "loss": 0.3926, + "step": 128225 + }, + { + "epoch": 31.3, + "learning_rate": 0.00034399828976301, + "loss": 0.3966, + "step": 128250 + }, + { + "epoch": 31.3, + "learning_rate": 0.0003439677498167603, + "loss": 0.3844, + "step": 128275 + }, + { + "epoch": 31.31, + "learning_rate": 0.0003439372098705106, + "loss": 0.4343, + "step": 128300 + }, + { + "epoch": 31.31, + "learning_rate": 0.000343906669924261, + "loss": 0.3874, + "step": 128325 + }, + { + "epoch": 31.32, + "learning_rate": 0.0003438761299780113, + "loss": 0.4114, + "step": 128350 + }, + { + "epoch": 31.33, + "learning_rate": 0.0003438455900317615, + "loss": 0.3896, + "step": 128375 + }, + { + "epoch": 31.33, + "learning_rate": 0.00034381505008551183, + "loss": 0.4045, + "step": 128400 + }, + { + "epoch": 31.34, + "learning_rate": 0.00034378451013926213, + "loss": 0.3992, + "step": 128425 + }, + { + "epoch": 31.34, + "learning_rate": 0.0003437539701930125, + "loss": 0.3824, + "step": 128450 + }, + { + "epoch": 31.35, + "learning_rate": 0.0003437234302467628, + "loss": 0.3524, + "step": 128475 + }, + { + "epoch": 31.36, + "learning_rate": 0.0003436928903005131, + "loss": 0.4461, + "step": 128500 + }, + { + "epoch": 31.36, + "learning_rate": 0.0003436623503542634, + "loss": 0.394, + "step": 128525 + }, + { + "epoch": 31.37, + "learning_rate": 0.00034363181040801365, + "loss": 0.4214, + "step": 128550 + }, + { + "epoch": 31.38, + "learning_rate": 0.000343601270461764, + "loss": 0.392, + "step": 128575 + }, + { + "epoch": 31.38, + "learning_rate": 0.0003435707305155143, + "loss": 0.4457, + "step": 128600 + }, + { + "epoch": 31.39, + "learning_rate": 0.0003435401905692646, + "loss": 0.3787, + "step": 128625 + }, + { + "epoch": 31.39, + "learning_rate": 0.0003435096506230149, + "loss": 0.3963, + "step": 128650 + }, + { + "epoch": 31.4, + "learning_rate": 0.0003434791106767652, + "loss": 0.4293, + "step": 128675 + }, + { + "epoch": 31.41, + "learning_rate": 0.00034344979232836547, + "loss": 0.4412, + "step": 128700 + }, + { + "epoch": 31.41, + "learning_rate": 0.0003434192523821158, + "loss": 0.4166, + "step": 128725 + }, + { + "epoch": 31.42, + "learning_rate": 0.00034338871243586613, + "loss": 0.3929, + "step": 128750 + }, + { + "epoch": 31.42, + "learning_rate": 0.00034335817248961644, + "loss": 0.3735, + "step": 128775 + }, + { + "epoch": 31.43, + "learning_rate": 0.00034332763254336674, + "loss": 0.3691, + "step": 128800 + }, + { + "epoch": 31.44, + "learning_rate": 0.00034329709259711704, + "loss": 0.4261, + "step": 128825 + }, + { + "epoch": 31.44, + "learning_rate": 0.0003432665526508673, + "loss": 0.398, + "step": 128850 + }, + { + "epoch": 31.45, + "learning_rate": 0.00034323601270461765, + "loss": 0.4245, + "step": 128875 + }, + { + "epoch": 31.45, + "learning_rate": 0.00034320547275836795, + "loss": 0.3894, + "step": 128900 + }, + { + "epoch": 31.46, + "learning_rate": 0.00034317493281211826, + "loss": 0.3963, + "step": 128925 + }, + { + "epoch": 31.47, + "learning_rate": 0.00034314439286586856, + "loss": 0.4036, + "step": 128950 + }, + { + "epoch": 31.47, + "learning_rate": 0.00034311385291961886, + "loss": 0.3902, + "step": 128975 + }, + { + "epoch": 31.48, + "learning_rate": 0.0003430833129733692, + "loss": 0.369, + "step": 129000 + }, + { + "epoch": 31.48, + "eval_cer": 0.09760479656684086, + "eval_loss": 0.41631850600242615, + "eval_runtime": 148.2037, + "eval_samples_per_second": 28.292, + "eval_steps_per_second": 7.078, + "eval_wer": 0.400652528548124, + "step": 129000 + }, + { + "epoch": 31.48, + "learning_rate": 0.00034305277302711947, + "loss": 0.3934, + "step": 129025 + }, + { + "epoch": 31.49, + "learning_rate": 0.0003430222330808698, + "loss": 0.4278, + "step": 129050 + }, + { + "epoch": 31.5, + "learning_rate": 0.0003429916931346201, + "loss": 0.3735, + "step": 129075 + }, + { + "epoch": 31.5, + "learning_rate": 0.0003429611531883704, + "loss": 0.4241, + "step": 129100 + }, + { + "epoch": 31.51, + "learning_rate": 0.00034293061324212074, + "loss": 0.3702, + "step": 129125 + }, + { + "epoch": 31.52, + "learning_rate": 0.00034290007329587104, + "loss": 0.4194, + "step": 129150 + }, + { + "epoch": 31.52, + "learning_rate": 0.0003428695333496213, + "loss": 0.3937, + "step": 129175 + }, + { + "epoch": 31.53, + "learning_rate": 0.0003428389934033716, + "loss": 0.4219, + "step": 129200 + }, + { + "epoch": 31.53, + "learning_rate": 0.0003428084534571219, + "loss": 0.407, + "step": 129225 + }, + { + "epoch": 31.54, + "learning_rate": 0.00034277791351087225, + "loss": 0.4078, + "step": 129250 + }, + { + "epoch": 31.55, + "learning_rate": 0.00034274737356462256, + "loss": 0.383, + "step": 129275 + }, + { + "epoch": 31.55, + "learning_rate": 0.00034271683361837286, + "loss": 0.3647, + "step": 129300 + }, + { + "epoch": 31.56, + "learning_rate": 0.0003426862936721231, + "loss": 0.4133, + "step": 129325 + }, + { + "epoch": 31.56, + "learning_rate": 0.0003426557537258734, + "loss": 0.4432, + "step": 129350 + }, + { + "epoch": 31.57, + "learning_rate": 0.00034262521377962377, + "loss": 0.3944, + "step": 129375 + }, + { + "epoch": 31.58, + "learning_rate": 0.0003425946738333741, + "loss": 0.4371, + "step": 129400 + }, + { + "epoch": 31.58, + "learning_rate": 0.0003425641338871244, + "loss": 0.3852, + "step": 129425 + }, + { + "epoch": 31.59, + "learning_rate": 0.0003425335939408747, + "loss": 0.4615, + "step": 129450 + }, + { + "epoch": 31.59, + "learning_rate": 0.000342503053994625, + "loss": 0.3881, + "step": 129475 + }, + { + "epoch": 31.6, + "learning_rate": 0.0003424725140483753, + "loss": 0.3749, + "step": 129500 + }, + { + "epoch": 31.61, + "learning_rate": 0.0003424419741021256, + "loss": 0.3825, + "step": 129525 + }, + { + "epoch": 31.61, + "learning_rate": 0.0003424114341558759, + "loss": 0.3886, + "step": 129550 + }, + { + "epoch": 31.62, + "learning_rate": 0.0003423808942096262, + "loss": 0.3683, + "step": 129575 + }, + { + "epoch": 31.63, + "learning_rate": 0.0003423503542633765, + "loss": 0.3867, + "step": 129600 + }, + { + "epoch": 31.63, + "learning_rate": 0.00034231981431712686, + "loss": 0.347, + "step": 129625 + }, + { + "epoch": 31.64, + "learning_rate": 0.0003422892743708771, + "loss": 0.4264, + "step": 129650 + }, + { + "epoch": 31.64, + "learning_rate": 0.0003422587344246274, + "loss": 0.3993, + "step": 129675 + }, + { + "epoch": 31.65, + "learning_rate": 0.0003422281944783777, + "loss": 0.402, + "step": 129700 + }, + { + "epoch": 31.66, + "learning_rate": 0.000342197654532128, + "loss": 0.3996, + "step": 129725 + }, + { + "epoch": 31.66, + "learning_rate": 0.0003421671145858783, + "loss": 0.3943, + "step": 129750 + }, + { + "epoch": 31.67, + "learning_rate": 0.0003421365746396287, + "loss": 0.3863, + "step": 129775 + }, + { + "epoch": 31.67, + "learning_rate": 0.00034210603469337893, + "loss": 0.3994, + "step": 129800 + }, + { + "epoch": 31.68, + "learning_rate": 0.00034207549474712923, + "loss": 0.4143, + "step": 129825 + }, + { + "epoch": 31.69, + "learning_rate": 0.00034204495480087953, + "loss": 0.3848, + "step": 129850 + }, + { + "epoch": 31.69, + "learning_rate": 0.00034201441485462984, + "loss": 0.3981, + "step": 129875 + }, + { + "epoch": 31.7, + "learning_rate": 0.0003419838749083802, + "loss": 0.421, + "step": 129900 + }, + { + "epoch": 31.7, + "learning_rate": 0.0003419533349621305, + "loss": 0.4067, + "step": 129925 + }, + { + "epoch": 31.71, + "learning_rate": 0.0003419227950158808, + "loss": 0.4321, + "step": 129950 + }, + { + "epoch": 31.72, + "learning_rate": 0.00034189225506963105, + "loss": 0.4127, + "step": 129975 + }, + { + "epoch": 31.72, + "learning_rate": 0.00034186171512338135, + "loss": 0.3806, + "step": 130000 + }, + { + "epoch": 31.73, + "learning_rate": 0.0003418311751771317, + "loss": 0.3789, + "step": 130025 + }, + { + "epoch": 31.73, + "learning_rate": 0.000341800635230882, + "loss": 0.4416, + "step": 130050 + }, + { + "epoch": 31.74, + "learning_rate": 0.0003417700952846323, + "loss": 0.407, + "step": 130075 + }, + { + "epoch": 31.75, + "learning_rate": 0.0003417395553383826, + "loss": 0.3916, + "step": 130100 + }, + { + "epoch": 31.75, + "learning_rate": 0.00034170901539213287, + "loss": 0.3883, + "step": 130125 + }, + { + "epoch": 31.76, + "learning_rate": 0.00034167847544588323, + "loss": 0.4128, + "step": 130150 + }, + { + "epoch": 31.77, + "learning_rate": 0.00034164793549963353, + "loss": 0.354, + "step": 130175 + }, + { + "epoch": 31.77, + "learning_rate": 0.00034161739555338384, + "loss": 0.4558, + "step": 130200 + }, + { + "epoch": 31.78, + "learning_rate": 0.00034158685560713414, + "loss": 0.3599, + "step": 130225 + }, + { + "epoch": 31.78, + "learning_rate": 0.00034155631566088444, + "loss": 0.429, + "step": 130250 + }, + { + "epoch": 31.79, + "learning_rate": 0.00034152577571463475, + "loss": 0.4128, + "step": 130275 + }, + { + "epoch": 31.8, + "learning_rate": 0.00034149523576838505, + "loss": 0.3966, + "step": 130300 + }, + { + "epoch": 31.8, + "learning_rate": 0.00034146469582213535, + "loss": 0.4003, + "step": 130325 + }, + { + "epoch": 31.81, + "learning_rate": 0.00034143415587588566, + "loss": 0.4447, + "step": 130350 + }, + { + "epoch": 31.81, + "learning_rate": 0.00034140361592963596, + "loss": 0.415, + "step": 130375 + }, + { + "epoch": 31.82, + "learning_rate": 0.0003413730759833863, + "loss": 0.4079, + "step": 130400 + }, + { + "epoch": 31.83, + "learning_rate": 0.0003413425360371366, + "loss": 0.4208, + "step": 130425 + }, + { + "epoch": 31.83, + "learning_rate": 0.00034131199609088687, + "loss": 0.4153, + "step": 130450 + }, + { + "epoch": 31.84, + "learning_rate": 0.00034128145614463717, + "loss": 0.3969, + "step": 130475 + }, + { + "epoch": 31.84, + "learning_rate": 0.0003412509161983875, + "loss": 0.4011, + "step": 130500 + }, + { + "epoch": 31.85, + "learning_rate": 0.00034122037625213783, + "loss": 0.3993, + "step": 130525 + }, + { + "epoch": 31.86, + "learning_rate": 0.00034118983630588814, + "loss": 0.444, + "step": 130550 + }, + { + "epoch": 31.86, + "learning_rate": 0.00034115929635963844, + "loss": 0.3871, + "step": 130575 + }, + { + "epoch": 31.87, + "learning_rate": 0.0003411287564133887, + "loss": 0.4001, + "step": 130600 + }, + { + "epoch": 31.88, + "learning_rate": 0.000341098216467139, + "loss": 0.4194, + "step": 130625 + }, + { + "epoch": 31.88, + "learning_rate": 0.00034106767652088935, + "loss": 0.4222, + "step": 130650 + }, + { + "epoch": 31.89, + "learning_rate": 0.00034103713657463965, + "loss": 0.3895, + "step": 130675 + }, + { + "epoch": 31.89, + "learning_rate": 0.00034100659662838996, + "loss": 0.3912, + "step": 130700 + }, + { + "epoch": 31.9, + "learning_rate": 0.00034097605668214026, + "loss": 0.4115, + "step": 130725 + }, + { + "epoch": 31.91, + "learning_rate": 0.0003409455167358905, + "loss": 0.4227, + "step": 130750 + }, + { + "epoch": 31.91, + "learning_rate": 0.00034091497678964087, + "loss": 0.3779, + "step": 130775 + }, + { + "epoch": 31.92, + "learning_rate": 0.00034088443684339117, + "loss": 0.4378, + "step": 130800 + }, + { + "epoch": 31.92, + "learning_rate": 0.0003408538968971415, + "loss": 0.3913, + "step": 130825 + }, + { + "epoch": 31.93, + "learning_rate": 0.0003408233569508918, + "loss": 0.4057, + "step": 130850 + }, + { + "epoch": 31.94, + "learning_rate": 0.0003407928170046421, + "loss": 0.4101, + "step": 130875 + }, + { + "epoch": 31.94, + "learning_rate": 0.00034076227705839244, + "loss": 0.4316, + "step": 130900 + }, + { + "epoch": 31.95, + "learning_rate": 0.0003407317371121427, + "loss": 0.4223, + "step": 130925 + }, + { + "epoch": 31.95, + "learning_rate": 0.000340701197165893, + "loss": 0.4274, + "step": 130950 + }, + { + "epoch": 31.96, + "learning_rate": 0.0003406706572196433, + "loss": 0.3901, + "step": 130975 + }, + { + "epoch": 31.97, + "learning_rate": 0.0003406401172733936, + "loss": 0.4463, + "step": 131000 + }, + { + "epoch": 31.97, + "learning_rate": 0.0003406095773271439, + "loss": 0.4061, + "step": 131025 + }, + { + "epoch": 31.98, + "learning_rate": 0.00034057903738089426, + "loss": 0.4125, + "step": 131050 + }, + { + "epoch": 31.99, + "learning_rate": 0.0003405484974346445, + "loss": 0.3804, + "step": 131075 + }, + { + "epoch": 31.99, + "learning_rate": 0.0003405179574883948, + "loss": 0.4336, + "step": 131100 + }, + { + "epoch": 32.0, + "learning_rate": 0.0003404874175421451, + "loss": 0.3988, + "step": 131125 + }, + { + "epoch": 32.0, + "learning_rate": 0.0003404568775958954, + "loss": 0.4117, + "step": 131150 + }, + { + "epoch": 32.01, + "learning_rate": 0.0003404263376496458, + "loss": 0.3902, + "step": 131175 + }, + { + "epoch": 32.02, + "learning_rate": 0.0003403957977033961, + "loss": 0.4209, + "step": 131200 + }, + { + "epoch": 32.02, + "learning_rate": 0.0003403652577571463, + "loss": 0.3716, + "step": 131225 + }, + { + "epoch": 32.03, + "learning_rate": 0.00034033471781089663, + "loss": 0.3839, + "step": 131250 + }, + { + "epoch": 32.03, + "learning_rate": 0.00034030417786464693, + "loss": 0.3534, + "step": 131275 + }, + { + "epoch": 32.04, + "learning_rate": 0.0003402736379183973, + "loss": 0.4128, + "step": 131300 + }, + { + "epoch": 32.05, + "learning_rate": 0.0003402430979721476, + "loss": 0.384, + "step": 131325 + }, + { + "epoch": 32.05, + "learning_rate": 0.0003402125580258979, + "loss": 0.4055, + "step": 131350 + }, + { + "epoch": 32.06, + "learning_rate": 0.0003401820180796482, + "loss": 0.3563, + "step": 131375 + }, + { + "epoch": 32.06, + "learning_rate": 0.00034015147813339845, + "loss": 0.3818, + "step": 131400 + }, + { + "epoch": 32.07, + "learning_rate": 0.0003401209381871488, + "loss": 0.4055, + "step": 131425 + }, + { + "epoch": 32.08, + "learning_rate": 0.0003400903982408991, + "loss": 0.3967, + "step": 131450 + }, + { + "epoch": 32.08, + "learning_rate": 0.0003400598582946494, + "loss": 0.4005, + "step": 131475 + }, + { + "epoch": 32.09, + "learning_rate": 0.0003400293183483997, + "loss": 0.37, + "step": 131500 + }, + { + "epoch": 32.09, + "learning_rate": 0.00033999877840215, + "loss": 0.3949, + "step": 131525 + }, + { + "epoch": 32.1, + "learning_rate": 0.0003399682384559003, + "loss": 0.3711, + "step": 131550 + }, + { + "epoch": 32.11, + "learning_rate": 0.00033993769850965063, + "loss": 0.3992, + "step": 131575 + }, + { + "epoch": 32.11, + "learning_rate": 0.00033990715856340093, + "loss": 0.3856, + "step": 131600 + }, + { + "epoch": 32.12, + "learning_rate": 0.00033987661861715123, + "loss": 0.3252, + "step": 131625 + }, + { + "epoch": 32.13, + "learning_rate": 0.00033984607867090154, + "loss": 0.3804, + "step": 131650 + }, + { + "epoch": 32.13, + "learning_rate": 0.0003398155387246519, + "loss": 0.3609, + "step": 131675 + }, + { + "epoch": 32.14, + "learning_rate": 0.00033978499877840214, + "loss": 0.4174, + "step": 131700 + }, + { + "epoch": 32.14, + "learning_rate": 0.00033975445883215245, + "loss": 0.3768, + "step": 131725 + }, + { + "epoch": 32.15, + "learning_rate": 0.00033972391888590275, + "loss": 0.3697, + "step": 131750 + }, + { + "epoch": 32.16, + "learning_rate": 0.00033969337893965305, + "loss": 0.3717, + "step": 131775 + }, + { + "epoch": 32.16, + "learning_rate": 0.0003396628389934034, + "loss": 0.4154, + "step": 131800 + }, + { + "epoch": 32.17, + "learning_rate": 0.0003396322990471537, + "loss": 0.3912, + "step": 131825 + }, + { + "epoch": 32.17, + "learning_rate": 0.00033960175910090396, + "loss": 0.4041, + "step": 131850 + }, + { + "epoch": 32.18, + "learning_rate": 0.00033957121915465427, + "loss": 0.3556, + "step": 131875 + }, + { + "epoch": 32.19, + "learning_rate": 0.00033954067920840457, + "loss": 0.3875, + "step": 131900 + }, + { + "epoch": 32.19, + "learning_rate": 0.00033951013926215493, + "loss": 0.3835, + "step": 131925 + }, + { + "epoch": 32.2, + "learning_rate": 0.00033947959931590523, + "loss": 0.4374, + "step": 131950 + }, + { + "epoch": 32.2, + "learning_rate": 0.00033944905936965554, + "loss": 0.3955, + "step": 131975 + }, + { + "epoch": 32.21, + "learning_rate": 0.00033941851942340584, + "loss": 0.3896, + "step": 132000 + }, + { + "epoch": 32.21, + "eval_cer": 0.09856472593246615, + "eval_loss": 0.3984539806842804, + "eval_runtime": 149.0532, + "eval_samples_per_second": 28.131, + "eval_steps_per_second": 7.038, + "eval_wer": 0.40153344208809133, + "step": 132000 + }, + { + "epoch": 32.22, + "learning_rate": 0.0003393879794771561, + "loss": 0.3759, + "step": 132025 + }, + { + "epoch": 32.22, + "learning_rate": 0.00033935743953090645, + "loss": 0.4199, + "step": 132050 + }, + { + "epoch": 32.23, + "learning_rate": 0.00033932689958465675, + "loss": 0.3597, + "step": 132075 + }, + { + "epoch": 32.24, + "learning_rate": 0.00033929635963840705, + "loss": 0.3833, + "step": 132100 + }, + { + "epoch": 32.24, + "learning_rate": 0.00033926581969215736, + "loss": 0.3782, + "step": 132125 + }, + { + "epoch": 32.25, + "learning_rate": 0.00033923527974590766, + "loss": 0.386, + "step": 132150 + }, + { + "epoch": 32.25, + "learning_rate": 0.0003392047397996579, + "loss": 0.3654, + "step": 132175 + }, + { + "epoch": 32.26, + "learning_rate": 0.00033917419985340827, + "loss": 0.3989, + "step": 132200 + }, + { + "epoch": 32.27, + "learning_rate": 0.00033914365990715857, + "loss": 0.3849, + "step": 132225 + }, + { + "epoch": 32.27, + "learning_rate": 0.00033911311996090887, + "loss": 0.3937, + "step": 132250 + }, + { + "epoch": 32.28, + "learning_rate": 0.0003390825800146592, + "loss": 0.3615, + "step": 132275 + }, + { + "epoch": 32.28, + "learning_rate": 0.0003390520400684095, + "loss": 0.3982, + "step": 132300 + }, + { + "epoch": 32.29, + "learning_rate": 0.0003390215001221598, + "loss": 0.3963, + "step": 132325 + }, + { + "epoch": 32.3, + "learning_rate": 0.0003389909601759101, + "loss": 0.4259, + "step": 132350 + }, + { + "epoch": 32.3, + "learning_rate": 0.0003389604202296604, + "loss": 0.3623, + "step": 132375 + }, + { + "epoch": 32.31, + "learning_rate": 0.0003389298802834107, + "loss": 0.3697, + "step": 132400 + }, + { + "epoch": 32.31, + "learning_rate": 0.000338899340337161, + "loss": 0.4037, + "step": 132425 + }, + { + "epoch": 32.32, + "learning_rate": 0.00033886880039091135, + "loss": 0.408, + "step": 132450 + }, + { + "epoch": 32.33, + "learning_rate": 0.00033883826044466166, + "loss": 0.4025, + "step": 132475 + }, + { + "epoch": 32.33, + "learning_rate": 0.0003388077204984119, + "loss": 0.3843, + "step": 132500 + }, + { + "epoch": 32.34, + "learning_rate": 0.0003387771805521622, + "loss": 0.4237, + "step": 132525 + }, + { + "epoch": 32.35, + "learning_rate": 0.0003387466406059125, + "loss": 0.3798, + "step": 132550 + }, + { + "epoch": 32.35, + "learning_rate": 0.0003387173222575128, + "loss": 0.3831, + "step": 132575 + }, + { + "epoch": 32.36, + "learning_rate": 0.0003386867823112632, + "loss": 0.4441, + "step": 132600 + }, + { + "epoch": 32.36, + "learning_rate": 0.0003386562423650135, + "loss": 0.3923, + "step": 132625 + }, + { + "epoch": 32.37, + "learning_rate": 0.00033862570241876373, + "loss": 0.4167, + "step": 132650 + }, + { + "epoch": 32.38, + "learning_rate": 0.00033859516247251403, + "loss": 0.3875, + "step": 132675 + }, + { + "epoch": 32.38, + "learning_rate": 0.00033856462252626434, + "loss": 0.4144, + "step": 132700 + }, + { + "epoch": 32.39, + "learning_rate": 0.0003385340825800147, + "loss": 0.4159, + "step": 132725 + }, + { + "epoch": 32.39, + "learning_rate": 0.000338503542633765, + "loss": 0.3833, + "step": 132750 + }, + { + "epoch": 32.4, + "learning_rate": 0.0003384730026875153, + "loss": 0.4222, + "step": 132775 + }, + { + "epoch": 32.41, + "learning_rate": 0.00033844246274126555, + "loss": 0.3666, + "step": 132800 + }, + { + "epoch": 32.41, + "learning_rate": 0.00033841192279501585, + "loss": 0.3791, + "step": 132825 + }, + { + "epoch": 32.42, + "learning_rate": 0.0003383813828487662, + "loss": 0.3982, + "step": 132850 + }, + { + "epoch": 32.42, + "learning_rate": 0.0003383508429025165, + "loss": 0.3673, + "step": 132875 + }, + { + "epoch": 32.43, + "learning_rate": 0.0003383203029562668, + "loss": 0.3804, + "step": 132900 + }, + { + "epoch": 32.44, + "learning_rate": 0.0003382897630100171, + "loss": 0.3506, + "step": 132925 + }, + { + "epoch": 32.44, + "learning_rate": 0.0003382592230637674, + "loss": 0.4107, + "step": 132950 + }, + { + "epoch": 32.45, + "learning_rate": 0.00033822868311751767, + "loss": 0.3897, + "step": 132975 + }, + { + "epoch": 32.45, + "learning_rate": 0.00033819814317126803, + "loss": 0.3825, + "step": 133000 + }, + { + "epoch": 32.46, + "learning_rate": 0.00033816760322501833, + "loss": 0.408, + "step": 133025 + }, + { + "epoch": 32.47, + "learning_rate": 0.00033813706327876864, + "loss": 0.4054, + "step": 133050 + }, + { + "epoch": 32.47, + "learning_rate": 0.00033810652333251894, + "loss": 0.3952, + "step": 133075 + }, + { + "epoch": 32.48, + "learning_rate": 0.00033807598338626924, + "loss": 0.4028, + "step": 133100 + }, + { + "epoch": 32.49, + "learning_rate": 0.00033804544344001955, + "loss": 0.3898, + "step": 133125 + }, + { + "epoch": 32.49, + "learning_rate": 0.00033801490349376985, + "loss": 0.4198, + "step": 133150 + }, + { + "epoch": 32.5, + "learning_rate": 0.00033798436354752015, + "loss": 0.3762, + "step": 133175 + }, + { + "epoch": 32.5, + "learning_rate": 0.00033795382360127046, + "loss": 0.4403, + "step": 133200 + }, + { + "epoch": 32.51, + "learning_rate": 0.00033792328365502076, + "loss": 0.3825, + "step": 133225 + }, + { + "epoch": 32.52, + "learning_rate": 0.0003378927437087711, + "loss": 0.404, + "step": 133250 + }, + { + "epoch": 32.52, + "learning_rate": 0.00033786220376252137, + "loss": 0.3803, + "step": 133275 + }, + { + "epoch": 32.53, + "learning_rate": 0.00033783166381627167, + "loss": 0.4274, + "step": 133300 + }, + { + "epoch": 32.53, + "learning_rate": 0.000337801123870022, + "loss": 0.3633, + "step": 133325 + }, + { + "epoch": 32.54, + "learning_rate": 0.0003377705839237723, + "loss": 0.4178, + "step": 133350 + }, + { + "epoch": 32.55, + "learning_rate": 0.00033774004397752263, + "loss": 0.386, + "step": 133375 + }, + { + "epoch": 32.55, + "learning_rate": 0.00033770950403127294, + "loss": 0.3567, + "step": 133400 + }, + { + "epoch": 32.56, + "learning_rate": 0.00033767896408502324, + "loss": 0.3817, + "step": 133425 + }, + { + "epoch": 32.56, + "learning_rate": 0.0003376484241387735, + "loss": 0.4123, + "step": 133450 + }, + { + "epoch": 32.57, + "learning_rate": 0.0003376178841925238, + "loss": 0.3853, + "step": 133475 + }, + { + "epoch": 32.58, + "learning_rate": 0.00033758734424627415, + "loss": 0.3949, + "step": 133500 + }, + { + "epoch": 32.58, + "learning_rate": 0.00033755680430002445, + "loss": 0.3601, + "step": 133525 + }, + { + "epoch": 32.59, + "learning_rate": 0.00033752626435377476, + "loss": 0.3768, + "step": 133550 + }, + { + "epoch": 32.6, + "learning_rate": 0.00033749572440752506, + "loss": 0.3772, + "step": 133575 + }, + { + "epoch": 32.6, + "learning_rate": 0.0003374651844612753, + "loss": 0.4496, + "step": 133600 + }, + { + "epoch": 32.61, + "learning_rate": 0.00033743464451502567, + "loss": 0.3942, + "step": 133625 + }, + { + "epoch": 32.61, + "learning_rate": 0.00033740410456877597, + "loss": 0.3922, + "step": 133650 + }, + { + "epoch": 32.62, + "learning_rate": 0.0003373735646225263, + "loss": 0.4161, + "step": 133675 + }, + { + "epoch": 32.63, + "learning_rate": 0.0003373430246762766, + "loss": 0.416, + "step": 133700 + }, + { + "epoch": 32.63, + "learning_rate": 0.0003373124847300269, + "loss": 0.3627, + "step": 133725 + }, + { + "epoch": 32.64, + "learning_rate": 0.0003372819447837772, + "loss": 0.3978, + "step": 133750 + }, + { + "epoch": 32.64, + "learning_rate": 0.0003372514048375275, + "loss": 0.352, + "step": 133775 + }, + { + "epoch": 32.65, + "learning_rate": 0.0003372208648912778, + "loss": 0.3799, + "step": 133800 + }, + { + "epoch": 32.66, + "learning_rate": 0.0003371903249450281, + "loss": 0.3868, + "step": 133825 + }, + { + "epoch": 32.66, + "learning_rate": 0.0003371597849987784, + "loss": 0.4069, + "step": 133850 + }, + { + "epoch": 32.67, + "learning_rate": 0.00033712924505252876, + "loss": 0.358, + "step": 133875 + }, + { + "epoch": 32.67, + "learning_rate": 0.00033709870510627906, + "loss": 0.4397, + "step": 133900 + }, + { + "epoch": 32.68, + "learning_rate": 0.0003370681651600293, + "loss": 0.4316, + "step": 133925 + }, + { + "epoch": 32.69, + "learning_rate": 0.0003370376252137796, + "loss": 0.3767, + "step": 133950 + }, + { + "epoch": 32.69, + "learning_rate": 0.0003370070852675299, + "loss": 0.4035, + "step": 133975 + }, + { + "epoch": 32.7, + "learning_rate": 0.00033697654532128027, + "loss": 0.4051, + "step": 134000 + }, + { + "epoch": 32.7, + "learning_rate": 0.0003369460053750306, + "loss": 0.4183, + "step": 134025 + }, + { + "epoch": 32.71, + "learning_rate": 0.0003369154654287809, + "loss": 0.4046, + "step": 134050 + }, + { + "epoch": 32.72, + "learning_rate": 0.00033688492548253113, + "loss": 0.388, + "step": 134075 + }, + { + "epoch": 32.72, + "learning_rate": 0.00033685438553628143, + "loss": 0.3803, + "step": 134100 + }, + { + "epoch": 32.73, + "learning_rate": 0.0003368238455900318, + "loss": 0.3721, + "step": 134125 + }, + { + "epoch": 32.74, + "learning_rate": 0.0003367933056437821, + "loss": 0.422, + "step": 134150 + }, + { + "epoch": 32.74, + "learning_rate": 0.0003367627656975324, + "loss": 0.3928, + "step": 134175 + }, + { + "epoch": 32.75, + "learning_rate": 0.0003367322257512827, + "loss": 0.4004, + "step": 134200 + }, + { + "epoch": 32.75, + "learning_rate": 0.00033670168580503295, + "loss": 0.3687, + "step": 134225 + }, + { + "epoch": 32.76, + "learning_rate": 0.00033667114585878325, + "loss": 0.3852, + "step": 134250 + }, + { + "epoch": 32.77, + "learning_rate": 0.0003366406059125336, + "loss": 0.3816, + "step": 134275 + }, + { + "epoch": 32.77, + "learning_rate": 0.0003366100659662839, + "loss": 0.4021, + "step": 134300 + }, + { + "epoch": 32.78, + "learning_rate": 0.0003365795260200342, + "loss": 0.3976, + "step": 134325 + }, + { + "epoch": 32.78, + "learning_rate": 0.0003365489860737845, + "loss": 0.4478, + "step": 134350 + }, + { + "epoch": 32.79, + "learning_rate": 0.0003365184461275348, + "loss": 0.3553, + "step": 134375 + }, + { + "epoch": 32.8, + "learning_rate": 0.0003364879061812851, + "loss": 0.4167, + "step": 134400 + }, + { + "epoch": 32.8, + "learning_rate": 0.00033645736623503543, + "loss": 0.3895, + "step": 134425 + }, + { + "epoch": 32.81, + "learning_rate": 0.00033642682628878573, + "loss": 0.3975, + "step": 134450 + }, + { + "epoch": 32.81, + "learning_rate": 0.00033639628634253604, + "loss": 0.3731, + "step": 134475 + }, + { + "epoch": 32.82, + "learning_rate": 0.00033636574639628634, + "loss": 0.4234, + "step": 134500 + }, + { + "epoch": 32.83, + "learning_rate": 0.0003363352064500367, + "loss": 0.3793, + "step": 134525 + }, + { + "epoch": 32.83, + "learning_rate": 0.00033630466650378695, + "loss": 0.4039, + "step": 134550 + }, + { + "epoch": 32.84, + "learning_rate": 0.00033627412655753725, + "loss": 0.3617, + "step": 134575 + }, + { + "epoch": 32.85, + "learning_rate": 0.00033624358661128755, + "loss": 0.4011, + "step": 134600 + }, + { + "epoch": 32.85, + "learning_rate": 0.00033621304666503786, + "loss": 0.3912, + "step": 134625 + }, + { + "epoch": 32.86, + "learning_rate": 0.0003361825067187882, + "loss": 0.3734, + "step": 134650 + }, + { + "epoch": 32.86, + "learning_rate": 0.0003361519667725385, + "loss": 0.3806, + "step": 134675 + }, + { + "epoch": 32.87, + "learning_rate": 0.00033612142682628877, + "loss": 0.3725, + "step": 134700 + }, + { + "epoch": 32.88, + "learning_rate": 0.00033609088688003907, + "loss": 0.4062, + "step": 134725 + }, + { + "epoch": 32.88, + "learning_rate": 0.00033606034693378937, + "loss": 0.4138, + "step": 134750 + }, + { + "epoch": 32.89, + "learning_rate": 0.00033602980698753973, + "loss": 0.3759, + "step": 134775 + }, + { + "epoch": 32.89, + "learning_rate": 0.00033599926704129003, + "loss": 0.3783, + "step": 134800 + }, + { + "epoch": 32.9, + "learning_rate": 0.00033596872709504034, + "loss": 0.367, + "step": 134825 + }, + { + "epoch": 32.91, + "learning_rate": 0.00033593818714879064, + "loss": 0.3837, + "step": 134850 + }, + { + "epoch": 32.91, + "learning_rate": 0.0003359076472025409, + "loss": 0.3679, + "step": 134875 + }, + { + "epoch": 32.92, + "learning_rate": 0.00033587710725629125, + "loss": 0.3842, + "step": 134900 + }, + { + "epoch": 32.92, + "learning_rate": 0.00033584656731004155, + "loss": 0.395, + "step": 134925 + }, + { + "epoch": 32.93, + "learning_rate": 0.00033581602736379185, + "loss": 0.3838, + "step": 134950 + }, + { + "epoch": 32.94, + "learning_rate": 0.00033578548741754216, + "loss": 0.3935, + "step": 134975 + }, + { + "epoch": 32.94, + "learning_rate": 0.00033575494747129246, + "loss": 0.3912, + "step": 135000 + }, + { + "epoch": 32.94, + "eval_cer": 0.09640360153178033, + "eval_loss": 0.41029471158981323, + "eval_runtime": 149.2123, + "eval_samples_per_second": 28.101, + "eval_steps_per_second": 7.03, + "eval_wer": 0.39477977161500816, + "step": 135000 + }, + { + "epoch": 32.95, + "learning_rate": 0.00033572440752504276, + "loss": 0.378, + "step": 135025 + }, + { + "epoch": 32.96, + "learning_rate": 0.00033569386757879307, + "loss": 0.4405, + "step": 135050 + }, + { + "epoch": 32.96, + "learning_rate": 0.00033566332763254337, + "loss": 0.3973, + "step": 135075 + }, + { + "epoch": 32.97, + "learning_rate": 0.0003356327876862937, + "loss": 0.4042, + "step": 135100 + }, + { + "epoch": 32.97, + "learning_rate": 0.000335602247740044, + "loss": 0.3579, + "step": 135125 + }, + { + "epoch": 32.98, + "learning_rate": 0.00033557170779379433, + "loss": 0.3996, + "step": 135150 + }, + { + "epoch": 32.99, + "learning_rate": 0.0003355411678475446, + "loss": 0.3573, + "step": 135175 + }, + { + "epoch": 32.99, + "learning_rate": 0.0003355106279012949, + "loss": 0.4172, + "step": 135200 + }, + { + "epoch": 33.0, + "learning_rate": 0.0003354800879550452, + "loss": 0.3616, + "step": 135225 + }, + { + "epoch": 33.0, + "learning_rate": 0.0003354495480087955, + "loss": 0.3836, + "step": 135250 + }, + { + "epoch": 33.01, + "learning_rate": 0.00033541900806254585, + "loss": 0.3581, + "step": 135275 + }, + { + "epoch": 33.02, + "learning_rate": 0.00033538846811629615, + "loss": 0.3902, + "step": 135300 + }, + { + "epoch": 33.02, + "learning_rate": 0.0003353579281700464, + "loss": 0.3405, + "step": 135325 + }, + { + "epoch": 33.03, + "learning_rate": 0.0003353273882237967, + "loss": 0.368, + "step": 135350 + }, + { + "epoch": 33.03, + "learning_rate": 0.000335296848277547, + "loss": 0.3399, + "step": 135375 + }, + { + "epoch": 33.04, + "learning_rate": 0.00033526630833129737, + "loss": 0.3927, + "step": 135400 + }, + { + "epoch": 33.05, + "learning_rate": 0.00033523576838504767, + "loss": 0.3737, + "step": 135425 + }, + { + "epoch": 33.05, + "learning_rate": 0.000335206450036648, + "loss": 0.3907, + "step": 135450 + }, + { + "epoch": 33.06, + "learning_rate": 0.0003351759100903983, + "loss": 0.3661, + "step": 135475 + }, + { + "epoch": 33.06, + "learning_rate": 0.00033514537014414853, + "loss": 0.3812, + "step": 135500 + }, + { + "epoch": 33.07, + "learning_rate": 0.00033511483019789883, + "loss": 0.3496, + "step": 135525 + }, + { + "epoch": 33.08, + "learning_rate": 0.00033508429025164914, + "loss": 0.3888, + "step": 135550 + }, + { + "epoch": 33.08, + "learning_rate": 0.0003350537503053995, + "loss": 0.3772, + "step": 135575 + }, + { + "epoch": 33.09, + "learning_rate": 0.0003350232103591498, + "loss": 0.4225, + "step": 135600 + }, + { + "epoch": 33.1, + "learning_rate": 0.0003349926704129001, + "loss": 0.3996, + "step": 135625 + }, + { + "epoch": 33.1, + "learning_rate": 0.00033496213046665035, + "loss": 0.3857, + "step": 135650 + }, + { + "epoch": 33.11, + "learning_rate": 0.00033493159052040065, + "loss": 0.3734, + "step": 135675 + }, + { + "epoch": 33.11, + "learning_rate": 0.000334901050574151, + "loss": 0.3788, + "step": 135700 + }, + { + "epoch": 33.12, + "learning_rate": 0.0003348705106279013, + "loss": 0.352, + "step": 135725 + }, + { + "epoch": 33.13, + "learning_rate": 0.0003348399706816516, + "loss": 0.356, + "step": 135750 + }, + { + "epoch": 33.13, + "learning_rate": 0.0003348094307354019, + "loss": 0.355, + "step": 135775 + }, + { + "epoch": 33.14, + "learning_rate": 0.00033477889078915217, + "loss": 0.4078, + "step": 135800 + }, + { + "epoch": 33.14, + "learning_rate": 0.00033474835084290253, + "loss": 0.3636, + "step": 135825 + }, + { + "epoch": 33.15, + "learning_rate": 0.00033471781089665283, + "loss": 0.3836, + "step": 135850 + }, + { + "epoch": 33.16, + "learning_rate": 0.00033468727095040313, + "loss": 0.3747, + "step": 135875 + }, + { + "epoch": 33.16, + "learning_rate": 0.00033465673100415344, + "loss": 0.3978, + "step": 135900 + }, + { + "epoch": 33.17, + "learning_rate": 0.00033462619105790374, + "loss": 0.3753, + "step": 135925 + }, + { + "epoch": 33.17, + "learning_rate": 0.0003345956511116541, + "loss": 0.3733, + "step": 135950 + }, + { + "epoch": 33.18, + "learning_rate": 0.00033456511116540435, + "loss": 0.3348, + "step": 135975 + }, + { + "epoch": 33.19, + "learning_rate": 0.00033453457121915465, + "loss": 0.3901, + "step": 136000 + }, + { + "epoch": 33.19, + "learning_rate": 0.00033450403127290495, + "loss": 0.3628, + "step": 136025 + }, + { + "epoch": 33.2, + "learning_rate": 0.00033447349132665526, + "loss": 0.398, + "step": 136050 + }, + { + "epoch": 33.21, + "learning_rate": 0.0003344429513804056, + "loss": 0.3426, + "step": 136075 + }, + { + "epoch": 33.21, + "learning_rate": 0.0003344124114341559, + "loss": 0.3727, + "step": 136100 + }, + { + "epoch": 33.22, + "learning_rate": 0.00033438187148790617, + "loss": 0.3642, + "step": 136125 + }, + { + "epoch": 33.22, + "learning_rate": 0.00033435133154165647, + "loss": 0.3884, + "step": 136150 + }, + { + "epoch": 33.23, + "learning_rate": 0.0003343220131932568, + "loss": 0.3307, + "step": 136175 + }, + { + "epoch": 33.24, + "learning_rate": 0.0003342914732470071, + "loss": 0.3864, + "step": 136200 + }, + { + "epoch": 33.24, + "learning_rate": 0.0003342609333007574, + "loss": 0.3317, + "step": 136225 + }, + { + "epoch": 33.25, + "learning_rate": 0.00033423039335450774, + "loss": 0.3878, + "step": 136250 + }, + { + "epoch": 33.25, + "learning_rate": 0.000334199853408258, + "loss": 0.3866, + "step": 136275 + }, + { + "epoch": 33.26, + "learning_rate": 0.0003341693134620083, + "loss": 0.3796, + "step": 136300 + }, + { + "epoch": 33.27, + "learning_rate": 0.0003341387735157586, + "loss": 0.336, + "step": 136325 + }, + { + "epoch": 33.27, + "learning_rate": 0.0003341082335695089, + "loss": 0.3943, + "step": 136350 + }, + { + "epoch": 33.28, + "learning_rate": 0.00033407769362325926, + "loss": 0.3875, + "step": 136375 + }, + { + "epoch": 33.28, + "learning_rate": 0.00033404715367700956, + "loss": 0.3827, + "step": 136400 + }, + { + "epoch": 33.29, + "learning_rate": 0.00033401661373075987, + "loss": 0.3293, + "step": 136425 + }, + { + "epoch": 33.3, + "learning_rate": 0.0003339860737845101, + "loss": 0.4467, + "step": 136450 + }, + { + "epoch": 33.3, + "learning_rate": 0.0003339555338382604, + "loss": 0.395, + "step": 136475 + }, + { + "epoch": 33.31, + "learning_rate": 0.0003339249938920108, + "loss": 0.4032, + "step": 136500 + }, + { + "epoch": 33.32, + "learning_rate": 0.0003338944539457611, + "loss": 0.353, + "step": 136525 + }, + { + "epoch": 33.32, + "learning_rate": 0.0003338639139995114, + "loss": 0.401, + "step": 136550 + }, + { + "epoch": 33.33, + "learning_rate": 0.0003338333740532617, + "loss": 0.3823, + "step": 136575 + }, + { + "epoch": 33.33, + "learning_rate": 0.00033380283410701193, + "loss": 0.3959, + "step": 136600 + }, + { + "epoch": 33.34, + "learning_rate": 0.0003337722941607623, + "loss": 0.3629, + "step": 136625 + }, + { + "epoch": 33.35, + "learning_rate": 0.0003337417542145126, + "loss": 0.4072, + "step": 136650 + }, + { + "epoch": 33.35, + "learning_rate": 0.0003337112142682629, + "loss": 0.3992, + "step": 136675 + }, + { + "epoch": 33.36, + "learning_rate": 0.0003336806743220132, + "loss": 0.4557, + "step": 136700 + }, + { + "epoch": 33.36, + "learning_rate": 0.0003336501343757635, + "loss": 0.349, + "step": 136725 + }, + { + "epoch": 33.37, + "learning_rate": 0.0003336195944295138, + "loss": 0.3946, + "step": 136750 + }, + { + "epoch": 33.38, + "learning_rate": 0.0003335890544832641, + "loss": 0.3782, + "step": 136775 + }, + { + "epoch": 33.38, + "learning_rate": 0.0003335585145370144, + "loss": 0.4219, + "step": 136800 + }, + { + "epoch": 33.39, + "learning_rate": 0.0003335279745907647, + "loss": 0.3675, + "step": 136825 + }, + { + "epoch": 33.39, + "learning_rate": 0.000333497434644515, + "loss": 0.3896, + "step": 136850 + }, + { + "epoch": 33.4, + "learning_rate": 0.0003334668946982654, + "loss": 0.3443, + "step": 136875 + }, + { + "epoch": 33.41, + "learning_rate": 0.0003334363547520157, + "loss": 0.3815, + "step": 136900 + }, + { + "epoch": 33.41, + "learning_rate": 0.00033340581480576593, + "loss": 0.4201, + "step": 136925 + }, + { + "epoch": 33.42, + "learning_rate": 0.00033337527485951624, + "loss": 0.3761, + "step": 136950 + }, + { + "epoch": 33.42, + "learning_rate": 0.00033334473491326654, + "loss": 0.3522, + "step": 136975 + }, + { + "epoch": 33.43, + "learning_rate": 0.0003333141949670169, + "loss": 0.424, + "step": 137000 + }, + { + "epoch": 33.44, + "learning_rate": 0.0003332836550207672, + "loss": 0.3266, + "step": 137025 + }, + { + "epoch": 33.44, + "learning_rate": 0.0003332531150745175, + "loss": 0.3849, + "step": 137050 + }, + { + "epoch": 33.45, + "learning_rate": 0.00033322257512826775, + "loss": 0.3785, + "step": 137075 + }, + { + "epoch": 33.46, + "learning_rate": 0.00033319203518201806, + "loss": 0.3789, + "step": 137100 + }, + { + "epoch": 33.46, + "learning_rate": 0.00033316149523576836, + "loss": 0.3665, + "step": 137125 + }, + { + "epoch": 33.47, + "learning_rate": 0.0003331309552895187, + "loss": 0.4229, + "step": 137150 + }, + { + "epoch": 33.47, + "learning_rate": 0.000333100415343269, + "loss": 0.3616, + "step": 137175 + }, + { + "epoch": 33.48, + "learning_rate": 0.0003330698753970193, + "loss": 0.3846, + "step": 137200 + }, + { + "epoch": 33.49, + "learning_rate": 0.00033303933545076957, + "loss": 0.3729, + "step": 137225 + }, + { + "epoch": 33.49, + "learning_rate": 0.0003330087955045199, + "loss": 0.4188, + "step": 137250 + }, + { + "epoch": 33.5, + "learning_rate": 0.00033297825555827023, + "loss": 0.3823, + "step": 137275 + }, + { + "epoch": 33.5, + "learning_rate": 0.00033294771561202054, + "loss": 0.4614, + "step": 137300 + }, + { + "epoch": 33.51, + "learning_rate": 0.00033291717566577084, + "loss": 0.3309, + "step": 137325 + }, + { + "epoch": 33.52, + "learning_rate": 0.00033288663571952114, + "loss": 0.3966, + "step": 137350 + }, + { + "epoch": 33.52, + "learning_rate": 0.00033285609577327145, + "loss": 0.3856, + "step": 137375 + }, + { + "epoch": 33.53, + "learning_rate": 0.00033282555582702175, + "loss": 0.4269, + "step": 137400 + }, + { + "epoch": 33.53, + "learning_rate": 0.00033279501588077205, + "loss": 0.3844, + "step": 137425 + }, + { + "epoch": 33.54, + "learning_rate": 0.00033276447593452236, + "loss": 0.4249, + "step": 137450 + }, + { + "epoch": 33.55, + "learning_rate": 0.00033273393598827266, + "loss": 0.3647, + "step": 137475 + }, + { + "epoch": 33.55, + "learning_rate": 0.00033270339604202296, + "loss": 0.414, + "step": 137500 + }, + { + "epoch": 33.56, + "learning_rate": 0.0003326728560957733, + "loss": 0.389, + "step": 137525 + }, + { + "epoch": 33.57, + "learning_rate": 0.00033264231614952357, + "loss": 0.4292, + "step": 137550 + }, + { + "epoch": 33.57, + "learning_rate": 0.0003326117762032739, + "loss": 0.3596, + "step": 137575 + }, + { + "epoch": 33.58, + "learning_rate": 0.0003325812362570242, + "loss": 0.3767, + "step": 137600 + }, + { + "epoch": 33.58, + "learning_rate": 0.0003325506963107745, + "loss": 0.4002, + "step": 137625 + }, + { + "epoch": 33.59, + "learning_rate": 0.00033252015636452484, + "loss": 0.4151, + "step": 137650 + }, + { + "epoch": 33.6, + "learning_rate": 0.00033248961641827514, + "loss": 0.3565, + "step": 137675 + }, + { + "epoch": 33.6, + "learning_rate": 0.0003324590764720254, + "loss": 0.448, + "step": 137700 + }, + { + "epoch": 33.61, + "learning_rate": 0.0003324285365257757, + "loss": 0.3663, + "step": 137725 + }, + { + "epoch": 33.61, + "learning_rate": 0.000332397996579526, + "loss": 0.4024, + "step": 137750 + }, + { + "epoch": 33.62, + "learning_rate": 0.00033236745663327635, + "loss": 0.3953, + "step": 137775 + }, + { + "epoch": 33.63, + "learning_rate": 0.00033233691668702666, + "loss": 0.4102, + "step": 137800 + }, + { + "epoch": 33.63, + "learning_rate": 0.00033230637674077696, + "loss": 0.3611, + "step": 137825 + }, + { + "epoch": 33.64, + "learning_rate": 0.00033227583679452726, + "loss": 0.4133, + "step": 137850 + }, + { + "epoch": 33.64, + "learning_rate": 0.0003322452968482775, + "loss": 0.4016, + "step": 137875 + }, + { + "epoch": 33.65, + "learning_rate": 0.00033221475690202787, + "loss": 0.4489, + "step": 137900 + }, + { + "epoch": 33.66, + "learning_rate": 0.0003321842169557782, + "loss": 0.4036, + "step": 137925 + }, + { + "epoch": 33.66, + "learning_rate": 0.0003321536770095285, + "loss": 0.4298, + "step": 137950 + }, + { + "epoch": 33.67, + "learning_rate": 0.0003321231370632788, + "loss": 0.3659, + "step": 137975 + }, + { + "epoch": 33.67, + "learning_rate": 0.0003320925971170291, + "loss": 0.3995, + "step": 138000 + }, + { + "epoch": 33.67, + "eval_cer": 0.09747646376394978, + "eval_loss": 0.39622190594673157, + "eval_runtime": 149.4561, + "eval_samples_per_second": 28.055, + "eval_steps_per_second": 7.019, + "eval_wer": 0.4024143556280587, + "step": 138000 + }, + { + "epoch": 33.68, + "learning_rate": 0.0003320620571707794, + "loss": 0.3921, + "step": 138025 + }, + { + "epoch": 33.69, + "learning_rate": 0.0003320315172245297, + "loss": 0.4156, + "step": 138050 + }, + { + "epoch": 33.69, + "learning_rate": 0.00033200097727828, + "loss": 0.3502, + "step": 138075 + }, + { + "epoch": 33.7, + "learning_rate": 0.0003319704373320303, + "loss": 0.3947, + "step": 138100 + }, + { + "epoch": 33.71, + "learning_rate": 0.0003319398973857806, + "loss": 0.3597, + "step": 138125 + }, + { + "epoch": 33.71, + "learning_rate": 0.00033190935743953096, + "loss": 0.3832, + "step": 138150 + }, + { + "epoch": 33.72, + "learning_rate": 0.0003318788174932812, + "loss": 0.3484, + "step": 138175 + }, + { + "epoch": 33.72, + "learning_rate": 0.0003318482775470315, + "loss": 0.3769, + "step": 138200 + }, + { + "epoch": 33.73, + "learning_rate": 0.0003318177376007818, + "loss": 0.3096, + "step": 138225 + }, + { + "epoch": 33.74, + "learning_rate": 0.0003317871976545321, + "loss": 0.3672, + "step": 138250 + }, + { + "epoch": 33.74, + "learning_rate": 0.0003317566577082825, + "loss": 0.3853, + "step": 138275 + }, + { + "epoch": 33.75, + "learning_rate": 0.0003317261177620328, + "loss": 0.3725, + "step": 138300 + }, + { + "epoch": 33.75, + "learning_rate": 0.0003316955778157831, + "loss": 0.3425, + "step": 138325 + }, + { + "epoch": 33.76, + "learning_rate": 0.00033166503786953333, + "loss": 0.3924, + "step": 138350 + }, + { + "epoch": 33.77, + "learning_rate": 0.00033163449792328364, + "loss": 0.3541, + "step": 138375 + }, + { + "epoch": 33.77, + "learning_rate": 0.00033160395797703394, + "loss": 0.4236, + "step": 138400 + }, + { + "epoch": 33.78, + "learning_rate": 0.0003315734180307843, + "loss": 0.3396, + "step": 138425 + }, + { + "epoch": 33.78, + "learning_rate": 0.0003315428780845346, + "loss": 0.4243, + "step": 138450 + }, + { + "epoch": 33.79, + "learning_rate": 0.0003315123381382849, + "loss": 0.3928, + "step": 138475 + }, + { + "epoch": 33.8, + "learning_rate": 0.00033148179819203515, + "loss": 0.4071, + "step": 138500 + }, + { + "epoch": 33.8, + "learning_rate": 0.00033145125824578546, + "loss": 0.3414, + "step": 138525 + }, + { + "epoch": 33.81, + "learning_rate": 0.0003314207182995358, + "loss": 0.4381, + "step": 138550 + }, + { + "epoch": 33.82, + "learning_rate": 0.0003313901783532861, + "loss": 0.3973, + "step": 138575 + }, + { + "epoch": 33.82, + "learning_rate": 0.0003313596384070364, + "loss": 0.361, + "step": 138600 + }, + { + "epoch": 33.83, + "learning_rate": 0.0003313290984607867, + "loss": 0.3328, + "step": 138625 + }, + { + "epoch": 33.83, + "learning_rate": 0.00033129855851453697, + "loss": 0.4502, + "step": 138650 + }, + { + "epoch": 33.84, + "learning_rate": 0.00033126801856828733, + "loss": 0.3692, + "step": 138675 + }, + { + "epoch": 33.85, + "learning_rate": 0.00033123747862203763, + "loss": 0.4154, + "step": 138700 + }, + { + "epoch": 33.85, + "learning_rate": 0.00033120693867578794, + "loss": 0.3633, + "step": 138725 + }, + { + "epoch": 33.86, + "learning_rate": 0.00033117639872953824, + "loss": 0.3845, + "step": 138750 + }, + { + "epoch": 33.86, + "learning_rate": 0.00033114585878328854, + "loss": 0.3683, + "step": 138775 + }, + { + "epoch": 33.87, + "learning_rate": 0.0003311153188370389, + "loss": 0.408, + "step": 138800 + }, + { + "epoch": 33.88, + "learning_rate": 0.00033108477889078915, + "loss": 0.3941, + "step": 138825 + }, + { + "epoch": 33.88, + "learning_rate": 0.00033105423894453945, + "loss": 0.4312, + "step": 138850 + }, + { + "epoch": 33.89, + "learning_rate": 0.00033102369899828976, + "loss": 0.3557, + "step": 138875 + }, + { + "epoch": 33.89, + "learning_rate": 0.00033099315905204006, + "loss": 0.3747, + "step": 138900 + }, + { + "epoch": 33.9, + "learning_rate": 0.0003309626191057904, + "loss": 0.3835, + "step": 138925 + }, + { + "epoch": 33.91, + "learning_rate": 0.0003309320791595407, + "loss": 0.3986, + "step": 138950 + }, + { + "epoch": 33.91, + "learning_rate": 0.00033090153921329097, + "loss": 0.398, + "step": 138975 + }, + { + "epoch": 33.92, + "learning_rate": 0.0003308709992670413, + "loss": 0.4076, + "step": 139000 + }, + { + "epoch": 33.93, + "learning_rate": 0.0003308404593207916, + "loss": 0.3694, + "step": 139025 + }, + { + "epoch": 33.93, + "learning_rate": 0.00033080991937454193, + "loss": 0.3785, + "step": 139050 + }, + { + "epoch": 33.94, + "learning_rate": 0.00033077937942829224, + "loss": 0.3693, + "step": 139075 + }, + { + "epoch": 33.94, + "learning_rate": 0.00033074883948204254, + "loss": 0.4153, + "step": 139100 + }, + { + "epoch": 33.95, + "learning_rate": 0.0003307182995357928, + "loss": 0.3817, + "step": 139125 + }, + { + "epoch": 33.96, + "learning_rate": 0.0003306877595895431, + "loss": 0.3992, + "step": 139150 + }, + { + "epoch": 33.96, + "learning_rate": 0.00033065721964329345, + "loss": 0.3649, + "step": 139175 + }, + { + "epoch": 33.97, + "learning_rate": 0.00033062667969704375, + "loss": 0.3947, + "step": 139200 + }, + { + "epoch": 33.97, + "learning_rate": 0.00033059613975079406, + "loss": 0.3397, + "step": 139225 + }, + { + "epoch": 33.98, + "learning_rate": 0.00033056559980454436, + "loss": 0.4038, + "step": 139250 + }, + { + "epoch": 33.99, + "learning_rate": 0.0003305350598582946, + "loss": 0.373, + "step": 139275 + }, + { + "epoch": 33.99, + "learning_rate": 0.00033050451991204497, + "loss": 0.4479, + "step": 139300 + }, + { + "epoch": 34.0, + "learning_rate": 0.00033047397996579527, + "loss": 0.3613, + "step": 139325 + }, + { + "epoch": 34.0, + "learning_rate": 0.0003304434400195456, + "loss": 0.3761, + "step": 139350 + }, + { + "epoch": 34.01, + "learning_rate": 0.0003304141216711459, + "loss": 0.3521, + "step": 139375 + }, + { + "epoch": 34.02, + "learning_rate": 0.0003303835817248962, + "loss": 0.4, + "step": 139400 + }, + { + "epoch": 34.02, + "learning_rate": 0.0003303530417786465, + "loss": 0.3164, + "step": 139425 + }, + { + "epoch": 34.03, + "learning_rate": 0.00033032250183239674, + "loss": 0.41, + "step": 139450 + }, + { + "epoch": 34.03, + "learning_rate": 0.0003302919618861471, + "loss": 0.3421, + "step": 139475 + }, + { + "epoch": 34.04, + "learning_rate": 0.0003302614219398974, + "loss": 0.3995, + "step": 139500 + }, + { + "epoch": 34.05, + "learning_rate": 0.0003302308819936477, + "loss": 0.3304, + "step": 139525 + }, + { + "epoch": 34.05, + "learning_rate": 0.000330200342047398, + "loss": 0.4101, + "step": 139550 + }, + { + "epoch": 34.06, + "learning_rate": 0.0003301698021011483, + "loss": 0.359, + "step": 139575 + }, + { + "epoch": 34.07, + "learning_rate": 0.0003301392621548986, + "loss": 0.3792, + "step": 139600 + }, + { + "epoch": 34.07, + "learning_rate": 0.0003301087222086489, + "loss": 0.3731, + "step": 139625 + }, + { + "epoch": 34.08, + "learning_rate": 0.0003300781822623992, + "loss": 0.4143, + "step": 139650 + }, + { + "epoch": 34.08, + "learning_rate": 0.0003300476423161495, + "loss": 0.3613, + "step": 139675 + }, + { + "epoch": 34.09, + "learning_rate": 0.0003300171023698998, + "loss": 0.3947, + "step": 139700 + }, + { + "epoch": 34.1, + "learning_rate": 0.0003299865624236502, + "loss": 0.3607, + "step": 139725 + }, + { + "epoch": 34.1, + "learning_rate": 0.00032995602247740043, + "loss": 0.3652, + "step": 139750 + }, + { + "epoch": 34.11, + "learning_rate": 0.00032992548253115073, + "loss": 0.3911, + "step": 139775 + }, + { + "epoch": 34.11, + "learning_rate": 0.00032989494258490104, + "loss": 0.4495, + "step": 139800 + }, + { + "epoch": 34.12, + "learning_rate": 0.00032986440263865134, + "loss": 0.3491, + "step": 139825 + }, + { + "epoch": 34.13, + "learning_rate": 0.0003298338626924017, + "loss": 0.3611, + "step": 139850 + }, + { + "epoch": 34.13, + "learning_rate": 0.000329803322746152, + "loss": 0.3669, + "step": 139875 + }, + { + "epoch": 34.14, + "learning_rate": 0.0003297727827999023, + "loss": 0.3968, + "step": 139900 + }, + { + "epoch": 34.14, + "learning_rate": 0.00032974224285365255, + "loss": 0.341, + "step": 139925 + }, + { + "epoch": 34.15, + "learning_rate": 0.00032971170290740286, + "loss": 0.3937, + "step": 139950 + }, + { + "epoch": 34.16, + "learning_rate": 0.0003296811629611532, + "loss": 0.3728, + "step": 139975 + }, + { + "epoch": 34.16, + "learning_rate": 0.0003296506230149035, + "loss": 0.3908, + "step": 140000 + }, + { + "epoch": 34.17, + "learning_rate": 0.0003296200830686538, + "loss": 0.3814, + "step": 140025 + }, + { + "epoch": 34.18, + "learning_rate": 0.0003295895431224041, + "loss": 0.3616, + "step": 140050 + }, + { + "epoch": 34.18, + "learning_rate": 0.0003295590031761544, + "loss": 0.3442, + "step": 140075 + }, + { + "epoch": 34.19, + "learning_rate": 0.00032952846322990473, + "loss": 0.3822, + "step": 140100 + }, + { + "epoch": 34.19, + "learning_rate": 0.00032949792328365504, + "loss": 0.3766, + "step": 140125 + }, + { + "epoch": 34.2, + "learning_rate": 0.00032946738333740534, + "loss": 0.4176, + "step": 140150 + }, + { + "epoch": 34.21, + "learning_rate": 0.00032943684339115564, + "loss": 0.3375, + "step": 140175 + }, + { + "epoch": 34.21, + "learning_rate": 0.00032940630344490595, + "loss": 0.3641, + "step": 140200 + }, + { + "epoch": 34.22, + "learning_rate": 0.00032937576349865625, + "loss": 0.3556, + "step": 140225 + }, + { + "epoch": 34.22, + "learning_rate": 0.00032934522355240655, + "loss": 0.3915, + "step": 140250 + }, + { + "epoch": 34.23, + "learning_rate": 0.00032931468360615686, + "loss": 0.348, + "step": 140275 + }, + { + "epoch": 34.24, + "learning_rate": 0.00032928414365990716, + "loss": 0.4115, + "step": 140300 + }, + { + "epoch": 34.24, + "learning_rate": 0.00032925360371365746, + "loss": 0.3459, + "step": 140325 + }, + { + "epoch": 34.25, + "learning_rate": 0.0003292230637674078, + "loss": 0.3965, + "step": 140350 + }, + { + "epoch": 34.25, + "learning_rate": 0.0003291925238211581, + "loss": 0.3507, + "step": 140375 + }, + { + "epoch": 34.26, + "learning_rate": 0.00032916198387490837, + "loss": 0.3652, + "step": 140400 + }, + { + "epoch": 34.27, + "learning_rate": 0.0003291314439286587, + "loss": 0.3429, + "step": 140425 + }, + { + "epoch": 34.27, + "learning_rate": 0.000329100903982409, + "loss": 0.3728, + "step": 140450 + }, + { + "epoch": 34.28, + "learning_rate": 0.0003290703640361593, + "loss": 0.3313, + "step": 140475 + }, + { + "epoch": 34.29, + "learning_rate": 0.00032903982408990964, + "loss": 0.4086, + "step": 140500 + }, + { + "epoch": 34.29, + "learning_rate": 0.00032900928414365994, + "loss": 0.3098, + "step": 140525 + }, + { + "epoch": 34.3, + "learning_rate": 0.0003289787441974102, + "loss": 0.3866, + "step": 140550 + }, + { + "epoch": 34.3, + "learning_rate": 0.0003289482042511605, + "loss": 0.3918, + "step": 140575 + }, + { + "epoch": 34.31, + "learning_rate": 0.0003289176643049108, + "loss": 0.3939, + "step": 140600 + }, + { + "epoch": 34.32, + "learning_rate": 0.00032888712435866116, + "loss": 0.3689, + "step": 140625 + }, + { + "epoch": 34.32, + "learning_rate": 0.00032885658441241146, + "loss": 0.4102, + "step": 140650 + }, + { + "epoch": 34.33, + "learning_rate": 0.00032882604446616176, + "loss": 0.4044, + "step": 140675 + }, + { + "epoch": 34.33, + "learning_rate": 0.000328795504519912, + "loss": 0.3637, + "step": 140700 + }, + { + "epoch": 34.34, + "learning_rate": 0.0003287649645736623, + "loss": 0.3501, + "step": 140725 + }, + { + "epoch": 34.35, + "learning_rate": 0.0003287344246274127, + "loss": 0.376, + "step": 140750 + }, + { + "epoch": 34.35, + "learning_rate": 0.000328703884681163, + "loss": 0.3654, + "step": 140775 + }, + { + "epoch": 34.36, + "learning_rate": 0.0003286733447349133, + "loss": 0.3961, + "step": 140800 + }, + { + "epoch": 34.36, + "learning_rate": 0.0003286428047886636, + "loss": 0.3486, + "step": 140825 + }, + { + "epoch": 34.37, + "learning_rate": 0.0003286122648424139, + "loss": 0.4076, + "step": 140850 + }, + { + "epoch": 34.38, + "learning_rate": 0.0003285817248961642, + "loss": 0.3979, + "step": 140875 + }, + { + "epoch": 34.38, + "learning_rate": 0.0003285511849499145, + "loss": 0.3874, + "step": 140900 + }, + { + "epoch": 34.39, + "learning_rate": 0.0003285206450036648, + "loss": 0.3311, + "step": 140925 + }, + { + "epoch": 34.39, + "learning_rate": 0.0003284901050574151, + "loss": 0.3656, + "step": 140950 + }, + { + "epoch": 34.4, + "learning_rate": 0.0003284595651111654, + "loss": 0.3687, + "step": 140975 + }, + { + "epoch": 34.41, + "learning_rate": 0.00032842902516491576, + "loss": 0.4042, + "step": 141000 + }, + { + "epoch": 34.41, + "eval_cer": 0.09400634477377494, + "eval_loss": 0.4195997714996338, + "eval_runtime": 149.5055, + "eval_samples_per_second": 28.046, + "eval_steps_per_second": 7.016, + "eval_wer": 0.39468189233278955, + "step": 141000 + }, + { + "epoch": 34.41, + "learning_rate": 0.000328398485218666, + "loss": 0.3471, + "step": 141025 + }, + { + "epoch": 34.42, + "learning_rate": 0.0003283679452724163, + "loss": 0.3915, + "step": 141050 + }, + { + "epoch": 34.43, + "learning_rate": 0.0003283374053261666, + "loss": 0.3888, + "step": 141075 + }, + { + "epoch": 34.43, + "learning_rate": 0.0003283068653799169, + "loss": 0.4085, + "step": 141100 + }, + { + "epoch": 34.44, + "learning_rate": 0.0003282763254336673, + "loss": 0.3797, + "step": 141125 + }, + { + "epoch": 34.44, + "learning_rate": 0.0003282457854874176, + "loss": 0.4164, + "step": 141150 + }, + { + "epoch": 34.45, + "learning_rate": 0.00032821524554116783, + "loss": 0.3819, + "step": 141175 + }, + { + "epoch": 34.46, + "learning_rate": 0.00032818470559491813, + "loss": 0.39, + "step": 141200 + }, + { + "epoch": 34.46, + "learning_rate": 0.00032815416564866844, + "loss": 0.3658, + "step": 141225 + }, + { + "epoch": 34.47, + "learning_rate": 0.0003281236257024188, + "loss": 0.3993, + "step": 141250 + }, + { + "epoch": 34.47, + "learning_rate": 0.0003280930857561691, + "loss": 0.3643, + "step": 141275 + }, + { + "epoch": 34.48, + "learning_rate": 0.0003280625458099194, + "loss": 0.3629, + "step": 141300 + }, + { + "epoch": 34.49, + "learning_rate": 0.0003280320058636697, + "loss": 0.3807, + "step": 141325 + }, + { + "epoch": 34.49, + "learning_rate": 0.00032800146591741995, + "loss": 0.4153, + "step": 141350 + }, + { + "epoch": 34.5, + "learning_rate": 0.0003279709259711703, + "loss": 0.4157, + "step": 141375 + }, + { + "epoch": 34.5, + "learning_rate": 0.0003279403860249206, + "loss": 0.343, + "step": 141400 + }, + { + "epoch": 34.51, + "learning_rate": 0.0003279098460786709, + "loss": 0.3603, + "step": 141425 + }, + { + "epoch": 34.52, + "learning_rate": 0.0003278793061324212, + "loss": 0.4158, + "step": 141450 + }, + { + "epoch": 34.52, + "learning_rate": 0.0003278487661861715, + "loss": 0.3832, + "step": 141475 + }, + { + "epoch": 34.53, + "learning_rate": 0.00032781822623992183, + "loss": 0.4119, + "step": 141500 + }, + { + "epoch": 34.54, + "learning_rate": 0.00032778768629367213, + "loss": 0.3631, + "step": 141525 + }, + { + "epoch": 34.54, + "learning_rate": 0.00032775714634742243, + "loss": 0.4149, + "step": 141550 + }, + { + "epoch": 34.55, + "learning_rate": 0.00032772660640117274, + "loss": 0.3623, + "step": 141575 + }, + { + "epoch": 34.55, + "learning_rate": 0.00032769606645492304, + "loss": 0.3814, + "step": 141600 + }, + { + "epoch": 34.56, + "learning_rate": 0.0003276655265086734, + "loss": 0.355, + "step": 141625 + }, + { + "epoch": 34.57, + "learning_rate": 0.00032763498656242365, + "loss": 0.4258, + "step": 141650 + }, + { + "epoch": 34.57, + "learning_rate": 0.00032760444661617395, + "loss": 0.3596, + "step": 141675 + }, + { + "epoch": 34.58, + "learning_rate": 0.00032757390666992425, + "loss": 0.3762, + "step": 141700 + }, + { + "epoch": 34.58, + "learning_rate": 0.00032754336672367456, + "loss": 0.3774, + "step": 141725 + }, + { + "epoch": 34.59, + "learning_rate": 0.0003275128267774249, + "loss": 0.433, + "step": 141750 + }, + { + "epoch": 34.6, + "learning_rate": 0.0003274822868311752, + "loss": 0.3318, + "step": 141775 + }, + { + "epoch": 34.6, + "learning_rate": 0.0003274517468849255, + "loss": 0.3979, + "step": 141800 + }, + { + "epoch": 34.61, + "learning_rate": 0.00032742120693867577, + "loss": 0.3382, + "step": 141825 + }, + { + "epoch": 34.61, + "learning_rate": 0.0003273906669924261, + "loss": 0.3676, + "step": 141850 + }, + { + "epoch": 34.62, + "learning_rate": 0.0003273601270461764, + "loss": 0.368, + "step": 141875 + }, + { + "epoch": 34.63, + "learning_rate": 0.00032732958709992674, + "loss": 0.4084, + "step": 141900 + }, + { + "epoch": 34.63, + "learning_rate": 0.00032729904715367704, + "loss": 0.3796, + "step": 141925 + }, + { + "epoch": 34.64, + "learning_rate": 0.00032726850720742734, + "loss": 0.3774, + "step": 141950 + }, + { + "epoch": 34.64, + "learning_rate": 0.0003272379672611776, + "loss": 0.348, + "step": 141975 + }, + { + "epoch": 34.65, + "learning_rate": 0.0003272074273149279, + "loss": 0.3722, + "step": 142000 + }, + { + "epoch": 34.66, + "learning_rate": 0.00032717688736867825, + "loss": 0.378, + "step": 142025 + }, + { + "epoch": 34.66, + "learning_rate": 0.00032714634742242856, + "loss": 0.3905, + "step": 142050 + }, + { + "epoch": 34.67, + "learning_rate": 0.00032711580747617886, + "loss": 0.3589, + "step": 142075 + }, + { + "epoch": 34.68, + "learning_rate": 0.00032708526752992916, + "loss": 0.3792, + "step": 142100 + }, + { + "epoch": 34.68, + "learning_rate": 0.0003270547275836794, + "loss": 0.3419, + "step": 142125 + }, + { + "epoch": 34.69, + "learning_rate": 0.00032702418763742977, + "loss": 0.3986, + "step": 142150 + }, + { + "epoch": 34.69, + "learning_rate": 0.00032699364769118007, + "loss": 0.3673, + "step": 142175 + }, + { + "epoch": 34.7, + "learning_rate": 0.0003269631077449304, + "loss": 0.3795, + "step": 142200 + }, + { + "epoch": 34.71, + "learning_rate": 0.0003269325677986807, + "loss": 0.3767, + "step": 142225 + }, + { + "epoch": 34.71, + "learning_rate": 0.000326902027852431, + "loss": 0.3885, + "step": 142250 + }, + { + "epoch": 34.72, + "learning_rate": 0.00032687148790618134, + "loss": 0.3423, + "step": 142275 + }, + { + "epoch": 34.72, + "learning_rate": 0.0003268409479599316, + "loss": 0.3885, + "step": 142300 + }, + { + "epoch": 34.73, + "learning_rate": 0.0003268104080136819, + "loss": 0.358, + "step": 142325 + }, + { + "epoch": 34.74, + "learning_rate": 0.0003267798680674322, + "loss": 0.4137, + "step": 142350 + }, + { + "epoch": 34.74, + "learning_rate": 0.0003267493281211825, + "loss": 0.3775, + "step": 142375 + }, + { + "epoch": 34.75, + "learning_rate": 0.00032671878817493286, + "loss": 0.4135, + "step": 142400 + }, + { + "epoch": 34.75, + "learning_rate": 0.00032668824822868316, + "loss": 0.3023, + "step": 142425 + }, + { + "epoch": 34.76, + "learning_rate": 0.0003266577082824334, + "loss": 0.4136, + "step": 142450 + }, + { + "epoch": 34.77, + "learning_rate": 0.0003266271683361837, + "loss": 0.3392, + "step": 142475 + }, + { + "epoch": 34.77, + "learning_rate": 0.000326596628389934, + "loss": 0.3892, + "step": 142500 + }, + { + "epoch": 34.78, + "learning_rate": 0.0003265660884436844, + "loss": 0.3577, + "step": 142525 + }, + { + "epoch": 34.79, + "learning_rate": 0.0003265355484974347, + "loss": 0.3798, + "step": 142550 + }, + { + "epoch": 34.79, + "learning_rate": 0.000326505008551185, + "loss": 0.3573, + "step": 142575 + }, + { + "epoch": 34.8, + "learning_rate": 0.00032647446860493523, + "loss": 0.3979, + "step": 142600 + }, + { + "epoch": 34.8, + "learning_rate": 0.00032644392865868553, + "loss": 0.3441, + "step": 142625 + }, + { + "epoch": 34.81, + "learning_rate": 0.0003264133887124359, + "loss": 0.3925, + "step": 142650 + }, + { + "epoch": 34.82, + "learning_rate": 0.0003263828487661862, + "loss": 0.3467, + "step": 142675 + }, + { + "epoch": 34.82, + "learning_rate": 0.0003263523088199365, + "loss": 0.3999, + "step": 142700 + }, + { + "epoch": 34.83, + "learning_rate": 0.0003263217688736868, + "loss": 0.3628, + "step": 142725 + }, + { + "epoch": 34.83, + "learning_rate": 0.00032629122892743705, + "loss": 0.4295, + "step": 142750 + }, + { + "epoch": 34.84, + "learning_rate": 0.0003262606889811874, + "loss": 0.3707, + "step": 142775 + }, + { + "epoch": 34.85, + "learning_rate": 0.0003262301490349377, + "loss": 0.4188, + "step": 142800 + }, + { + "epoch": 34.85, + "learning_rate": 0.000326199609088688, + "loss": 0.4034, + "step": 142825 + }, + { + "epoch": 34.86, + "learning_rate": 0.0003261690691424383, + "loss": 0.3764, + "step": 142850 + }, + { + "epoch": 34.86, + "learning_rate": 0.0003261385291961886, + "loss": 0.3556, + "step": 142875 + }, + { + "epoch": 34.87, + "learning_rate": 0.000326107989249939, + "loss": 0.3941, + "step": 142900 + }, + { + "epoch": 34.88, + "learning_rate": 0.0003260774493036892, + "loss": 0.3578, + "step": 142925 + }, + { + "epoch": 34.88, + "learning_rate": 0.00032604690935743953, + "loss": 0.3759, + "step": 142950 + }, + { + "epoch": 34.89, + "learning_rate": 0.00032601636941118983, + "loss": 0.3667, + "step": 142975 + }, + { + "epoch": 34.9, + "learning_rate": 0.00032598582946494014, + "loss": 0.3712, + "step": 143000 + }, + { + "epoch": 34.9, + "learning_rate": 0.0003259552895186905, + "loss": 0.3266, + "step": 143025 + }, + { + "epoch": 34.91, + "learning_rate": 0.0003259247495724408, + "loss": 0.4101, + "step": 143050 + }, + { + "epoch": 34.91, + "learning_rate": 0.00032589420962619105, + "loss": 0.3533, + "step": 143075 + }, + { + "epoch": 34.92, + "learning_rate": 0.00032586366967994135, + "loss": 0.4007, + "step": 143100 + }, + { + "epoch": 34.93, + "learning_rate": 0.00032583312973369165, + "loss": 0.3463, + "step": 143125 + }, + { + "epoch": 34.93, + "learning_rate": 0.00032580258978744196, + "loss": 0.4053, + "step": 143150 + }, + { + "epoch": 34.94, + "learning_rate": 0.0003257720498411923, + "loss": 0.3764, + "step": 143175 + }, + { + "epoch": 34.94, + "learning_rate": 0.0003257415098949426, + "loss": 0.3746, + "step": 143200 + }, + { + "epoch": 34.95, + "learning_rate": 0.00032571096994869287, + "loss": 0.3566, + "step": 143225 + }, + { + "epoch": 34.96, + "learning_rate": 0.00032568043000244317, + "loss": 0.3725, + "step": 143250 + }, + { + "epoch": 34.96, + "learning_rate": 0.0003256498900561935, + "loss": 0.3446, + "step": 143275 + }, + { + "epoch": 34.97, + "learning_rate": 0.00032561935010994383, + "loss": 0.395, + "step": 143300 + }, + { + "epoch": 34.97, + "learning_rate": 0.00032558881016369413, + "loss": 0.3806, + "step": 143325 + }, + { + "epoch": 34.98, + "learning_rate": 0.00032555827021744444, + "loss": 0.4025, + "step": 143350 + }, + { + "epoch": 34.99, + "learning_rate": 0.00032552773027119474, + "loss": 0.3337, + "step": 143375 + }, + { + "epoch": 34.99, + "learning_rate": 0.000325497190324945, + "loss": 0.3959, + "step": 143400 + }, + { + "epoch": 35.0, + "learning_rate": 0.00032546665037869535, + "loss": 0.3356, + "step": 143425 + }, + { + "epoch": 35.0, + "learning_rate": 0.00032543611043244565, + "loss": 0.3593, + "step": 143450 + }, + { + "epoch": 35.01, + "learning_rate": 0.00032540557048619595, + "loss": 0.3414, + "step": 143475 + }, + { + "epoch": 35.02, + "learning_rate": 0.00032537503053994626, + "loss": 0.3893, + "step": 143500 + }, + { + "epoch": 35.02, + "learning_rate": 0.00032534449059369656, + "loss": 0.3779, + "step": 143525 + }, + { + "epoch": 35.03, + "learning_rate": 0.00032531395064744686, + "loss": 0.3826, + "step": 143550 + }, + { + "epoch": 35.04, + "learning_rate": 0.00032528341070119717, + "loss": 0.3229, + "step": 143575 + }, + { + "epoch": 35.04, + "learning_rate": 0.00032525287075494747, + "loss": 0.3747, + "step": 143600 + }, + { + "epoch": 35.05, + "learning_rate": 0.0003252223308086978, + "loss": 0.3863, + "step": 143625 + }, + { + "epoch": 35.05, + "learning_rate": 0.0003251917908624481, + "loss": 0.3804, + "step": 143650 + }, + { + "epoch": 35.06, + "learning_rate": 0.00032516125091619844, + "loss": 0.3068, + "step": 143675 + }, + { + "epoch": 35.07, + "learning_rate": 0.0003251307109699487, + "loss": 0.3687, + "step": 143700 + }, + { + "epoch": 35.07, + "learning_rate": 0.000325100171023699, + "loss": 0.3628, + "step": 143725 + }, + { + "epoch": 35.08, + "learning_rate": 0.0003250696310774493, + "loss": 0.3683, + "step": 143750 + }, + { + "epoch": 35.08, + "learning_rate": 0.0003250390911311996, + "loss": 0.3492, + "step": 143775 + }, + { + "epoch": 35.09, + "learning_rate": 0.00032500855118494995, + "loss": 0.3791, + "step": 143800 + }, + { + "epoch": 35.1, + "learning_rate": 0.00032497801123870026, + "loss": 0.3718, + "step": 143825 + }, + { + "epoch": 35.1, + "learning_rate": 0.00032494747129245056, + "loss": 0.4213, + "step": 143850 + }, + { + "epoch": 35.11, + "learning_rate": 0.0003249169313462008, + "loss": 0.3575, + "step": 143875 + }, + { + "epoch": 35.11, + "learning_rate": 0.0003248863913999511, + "loss": 0.3555, + "step": 143900 + }, + { + "epoch": 35.12, + "learning_rate": 0.00032485585145370147, + "loss": 0.3463, + "step": 143925 + }, + { + "epoch": 35.13, + "learning_rate": 0.00032482531150745177, + "loss": 0.3952, + "step": 143950 + }, + { + "epoch": 35.13, + "learning_rate": 0.0003247947715612021, + "loss": 0.3151, + "step": 143975 + }, + { + "epoch": 35.14, + "learning_rate": 0.0003247642316149524, + "loss": 0.4055, + "step": 144000 + }, + { + "epoch": 35.14, + "eval_cer": 0.09494574089093766, + "eval_loss": 0.39560216665267944, + "eval_runtime": 149.4692, + "eval_samples_per_second": 28.053, + "eval_steps_per_second": 7.018, + "eval_wer": 0.38818923327895594, + "step": 144000 + }, + { + "epoch": 35.15, + "learning_rate": 0.00032473369166870263, + "loss": 0.3437, + "step": 144025 + }, + { + "epoch": 35.15, + "learning_rate": 0.000324703151722453, + "loss": 0.3985, + "step": 144050 + }, + { + "epoch": 35.16, + "learning_rate": 0.0003246726117762033, + "loss": 0.338, + "step": 144075 + }, + { + "epoch": 35.16, + "learning_rate": 0.0003246420718299536, + "loss": 0.4219, + "step": 144100 + }, + { + "epoch": 35.17, + "learning_rate": 0.0003246115318837039, + "loss": 0.3662, + "step": 144125 + }, + { + "epoch": 35.18, + "learning_rate": 0.0003245809919374542, + "loss": 0.3914, + "step": 144150 + }, + { + "epoch": 35.18, + "learning_rate": 0.0003245504519912045, + "loss": 0.3389, + "step": 144175 + }, + { + "epoch": 35.19, + "learning_rate": 0.0003245199120449548, + "loss": 0.3745, + "step": 144200 + }, + { + "epoch": 35.19, + "learning_rate": 0.0003244893720987051, + "loss": 0.3361, + "step": 144225 + }, + { + "epoch": 35.2, + "learning_rate": 0.0003244588321524554, + "loss": 0.4224, + "step": 144250 + }, + { + "epoch": 35.21, + "learning_rate": 0.0003244295138040557, + "loss": 0.3588, + "step": 144275 + }, + { + "epoch": 35.21, + "learning_rate": 0.000324398973857806, + "loss": 0.3742, + "step": 144300 + }, + { + "epoch": 35.22, + "learning_rate": 0.0003243684339115563, + "loss": 0.3108, + "step": 144325 + }, + { + "epoch": 35.22, + "learning_rate": 0.00032433789396530663, + "loss": 0.3738, + "step": 144350 + }, + { + "epoch": 35.23, + "learning_rate": 0.00032430735401905693, + "loss": 0.3379, + "step": 144375 + }, + { + "epoch": 35.24, + "learning_rate": 0.00032427681407280724, + "loss": 0.3941, + "step": 144400 + }, + { + "epoch": 35.24, + "learning_rate": 0.00032424627412655754, + "loss": 0.3378, + "step": 144425 + }, + { + "epoch": 35.25, + "learning_rate": 0.00032421573418030784, + "loss": 0.4398, + "step": 144450 + }, + { + "epoch": 35.26, + "learning_rate": 0.0003241851942340582, + "loss": 0.3265, + "step": 144475 + }, + { + "epoch": 35.26, + "learning_rate": 0.00032415465428780845, + "loss": 0.402, + "step": 144500 + }, + { + "epoch": 35.27, + "learning_rate": 0.00032412411434155875, + "loss": 0.3512, + "step": 144525 + }, + { + "epoch": 35.27, + "learning_rate": 0.00032409357439530906, + "loss": 0.434, + "step": 144550 + }, + { + "epoch": 35.28, + "learning_rate": 0.00032406303444905936, + "loss": 0.3559, + "step": 144575 + }, + { + "epoch": 35.29, + "learning_rate": 0.0003240324945028097, + "loss": 0.3925, + "step": 144600 + }, + { + "epoch": 35.29, + "learning_rate": 0.00032400195455656, + "loss": 0.3415, + "step": 144625 + }, + { + "epoch": 35.3, + "learning_rate": 0.00032397141461031027, + "loss": 0.4035, + "step": 144650 + }, + { + "epoch": 35.3, + "learning_rate": 0.00032394087466406057, + "loss": 0.3086, + "step": 144675 + }, + { + "epoch": 35.31, + "learning_rate": 0.0003239103347178109, + "loss": 0.3642, + "step": 144700 + }, + { + "epoch": 35.32, + "learning_rate": 0.00032387979477156123, + "loss": 0.3991, + "step": 144725 + }, + { + "epoch": 35.32, + "learning_rate": 0.00032384925482531154, + "loss": 0.4157, + "step": 144750 + }, + { + "epoch": 35.33, + "learning_rate": 0.00032381871487906184, + "loss": 0.3541, + "step": 144775 + }, + { + "epoch": 35.33, + "learning_rate": 0.00032378817493281214, + "loss": 0.3786, + "step": 144800 + }, + { + "epoch": 35.34, + "learning_rate": 0.0003237576349865624, + "loss": 0.327, + "step": 144825 + }, + { + "epoch": 35.35, + "learning_rate": 0.00032372709504031275, + "loss": 0.3758, + "step": 144850 + }, + { + "epoch": 35.35, + "learning_rate": 0.00032369655509406305, + "loss": 0.3576, + "step": 144875 + }, + { + "epoch": 35.36, + "learning_rate": 0.00032366601514781336, + "loss": 0.3495, + "step": 144900 + }, + { + "epoch": 35.36, + "learning_rate": 0.00032363547520156366, + "loss": 0.3452, + "step": 144925 + }, + { + "epoch": 35.37, + "learning_rate": 0.00032360493525531396, + "loss": 0.3905, + "step": 144950 + }, + { + "epoch": 35.38, + "learning_rate": 0.00032357439530906427, + "loss": 0.3453, + "step": 144975 + }, + { + "epoch": 35.38, + "learning_rate": 0.00032354385536281457, + "loss": 0.3825, + "step": 145000 + }, + { + "epoch": 35.39, + "learning_rate": 0.0003235133154165649, + "loss": 0.3431, + "step": 145025 + }, + { + "epoch": 35.4, + "learning_rate": 0.0003234827754703152, + "loss": 0.3646, + "step": 145050 + }, + { + "epoch": 35.4, + "learning_rate": 0.0003234522355240655, + "loss": 0.3521, + "step": 145075 + }, + { + "epoch": 35.41, + "learning_rate": 0.00032342169557781584, + "loss": 0.3978, + "step": 145100 + }, + { + "epoch": 35.41, + "learning_rate": 0.0003233911556315661, + "loss": 0.3244, + "step": 145125 + }, + { + "epoch": 35.42, + "learning_rate": 0.0003233606156853164, + "loss": 0.3913, + "step": 145150 + }, + { + "epoch": 35.43, + "learning_rate": 0.0003233300757390667, + "loss": 0.3628, + "step": 145175 + }, + { + "epoch": 35.43, + "learning_rate": 0.000323299535792817, + "loss": 0.3918, + "step": 145200 + }, + { + "epoch": 35.44, + "learning_rate": 0.0003232689958465673, + "loss": 0.3509, + "step": 145225 + }, + { + "epoch": 35.44, + "learning_rate": 0.00032323845590031766, + "loss": 0.3958, + "step": 145250 + }, + { + "epoch": 35.45, + "learning_rate": 0.00032320791595406796, + "loss": 0.3478, + "step": 145275 + }, + { + "epoch": 35.46, + "learning_rate": 0.0003231773760078182, + "loss": 0.4068, + "step": 145300 + }, + { + "epoch": 35.46, + "learning_rate": 0.0003231468360615685, + "loss": 0.3665, + "step": 145325 + }, + { + "epoch": 35.47, + "learning_rate": 0.0003231162961153188, + "loss": 0.4198, + "step": 145350 + }, + { + "epoch": 35.47, + "learning_rate": 0.0003230857561690692, + "loss": 0.3439, + "step": 145375 + }, + { + "epoch": 35.48, + "learning_rate": 0.0003230552162228195, + "loss": 0.377, + "step": 145400 + }, + { + "epoch": 35.49, + "learning_rate": 0.0003230246762765698, + "loss": 0.362, + "step": 145425 + }, + { + "epoch": 35.49, + "learning_rate": 0.00032299413633032003, + "loss": 0.415, + "step": 145450 + }, + { + "epoch": 35.5, + "learning_rate": 0.00032296359638407033, + "loss": 0.3535, + "step": 145475 + }, + { + "epoch": 35.51, + "learning_rate": 0.0003229330564378207, + "loss": 0.4043, + "step": 145500 + }, + { + "epoch": 35.51, + "learning_rate": 0.000322902516491571, + "loss": 0.326, + "step": 145525 + }, + { + "epoch": 35.52, + "learning_rate": 0.0003228719765453213, + "loss": 0.385, + "step": 145550 + }, + { + "epoch": 35.52, + "learning_rate": 0.0003228414365990716, + "loss": 0.3811, + "step": 145575 + }, + { + "epoch": 35.53, + "learning_rate": 0.00032281089665282185, + "loss": 0.3609, + "step": 145600 + }, + { + "epoch": 35.54, + "learning_rate": 0.0003227803567065722, + "loss": 0.357, + "step": 145625 + }, + { + "epoch": 35.54, + "learning_rate": 0.0003227498167603225, + "loss": 0.3908, + "step": 145650 + }, + { + "epoch": 35.55, + "learning_rate": 0.0003227192768140728, + "loss": 0.3159, + "step": 145675 + }, + { + "epoch": 35.55, + "learning_rate": 0.0003226887368678231, + "loss": 0.3898, + "step": 145700 + }, + { + "epoch": 35.56, + "learning_rate": 0.0003226581969215734, + "loss": 0.3226, + "step": 145725 + }, + { + "epoch": 35.57, + "learning_rate": 0.0003226276569753238, + "loss": 0.3833, + "step": 145750 + }, + { + "epoch": 35.57, + "learning_rate": 0.00032259711702907403, + "loss": 0.3699, + "step": 145775 + }, + { + "epoch": 35.58, + "learning_rate": 0.00032256657708282433, + "loss": 0.3777, + "step": 145800 + }, + { + "epoch": 35.58, + "learning_rate": 0.00032253603713657463, + "loss": 0.3697, + "step": 145825 + }, + { + "epoch": 35.59, + "learning_rate": 0.00032250549719032494, + "loss": 0.3952, + "step": 145850 + }, + { + "epoch": 35.6, + "learning_rate": 0.0003224749572440753, + "loss": 0.323, + "step": 145875 + }, + { + "epoch": 35.6, + "learning_rate": 0.0003224444172978256, + "loss": 0.3817, + "step": 145900 + }, + { + "epoch": 35.61, + "learning_rate": 0.00032241387735157585, + "loss": 0.3693, + "step": 145925 + }, + { + "epoch": 35.61, + "learning_rate": 0.00032238333740532615, + "loss": 0.3745, + "step": 145950 + }, + { + "epoch": 35.62, + "learning_rate": 0.00032235279745907645, + "loss": 0.3209, + "step": 145975 + }, + { + "epoch": 35.63, + "learning_rate": 0.00032232347911067676, + "loss": 0.3896, + "step": 146000 + }, + { + "epoch": 35.63, + "learning_rate": 0.00032229293916442706, + "loss": 0.3541, + "step": 146025 + }, + { + "epoch": 35.64, + "learning_rate": 0.0003222623992181774, + "loss": 0.3982, + "step": 146050 + }, + { + "epoch": 35.65, + "learning_rate": 0.00032223185927192767, + "loss": 0.3498, + "step": 146075 + }, + { + "epoch": 35.65, + "learning_rate": 0.000322201319325678, + "loss": 0.405, + "step": 146100 + }, + { + "epoch": 35.66, + "learning_rate": 0.0003221707793794283, + "loss": 0.3542, + "step": 146125 + }, + { + "epoch": 35.66, + "learning_rate": 0.0003221402394331786, + "loss": 0.4302, + "step": 146150 + }, + { + "epoch": 35.67, + "learning_rate": 0.00032210969948692894, + "loss": 0.3272, + "step": 146175 + }, + { + "epoch": 35.68, + "learning_rate": 0.00032207915954067924, + "loss": 0.3888, + "step": 146200 + }, + { + "epoch": 35.68, + "learning_rate": 0.00032204861959442955, + "loss": 0.394, + "step": 146225 + }, + { + "epoch": 35.69, + "learning_rate": 0.0003220180796481798, + "loss": 0.3891, + "step": 146250 + }, + { + "epoch": 35.69, + "learning_rate": 0.0003219875397019301, + "loss": 0.3566, + "step": 146275 + }, + { + "epoch": 35.7, + "learning_rate": 0.00032195699975568046, + "loss": 0.3858, + "step": 146300 + }, + { + "epoch": 35.71, + "learning_rate": 0.00032192645980943076, + "loss": 0.3621, + "step": 146325 + }, + { + "epoch": 35.71, + "learning_rate": 0.00032189591986318106, + "loss": 0.4315, + "step": 146350 + }, + { + "epoch": 35.72, + "learning_rate": 0.00032186537991693137, + "loss": 0.3582, + "step": 146375 + }, + { + "epoch": 35.72, + "learning_rate": 0.0003218348399706816, + "loss": 0.4036, + "step": 146400 + }, + { + "epoch": 35.73, + "learning_rate": 0.00032180430002443197, + "loss": 0.3515, + "step": 146425 + }, + { + "epoch": 35.74, + "learning_rate": 0.0003217737600781823, + "loss": 0.4004, + "step": 146450 + }, + { + "epoch": 35.74, + "learning_rate": 0.0003217432201319326, + "loss": 0.3602, + "step": 146475 + }, + { + "epoch": 35.75, + "learning_rate": 0.0003217126801856829, + "loss": 0.3917, + "step": 146500 + }, + { + "epoch": 35.76, + "learning_rate": 0.0003216821402394332, + "loss": 0.3357, + "step": 146525 + }, + { + "epoch": 35.76, + "learning_rate": 0.0003216516002931835, + "loss": 0.4125, + "step": 146550 + }, + { + "epoch": 35.77, + "learning_rate": 0.0003216210603469338, + "loss": 0.3342, + "step": 146575 + }, + { + "epoch": 35.77, + "learning_rate": 0.0003215905204006841, + "loss": 0.367, + "step": 146600 + }, + { + "epoch": 35.78, + "learning_rate": 0.0003215599804544344, + "loss": 0.3721, + "step": 146625 + }, + { + "epoch": 35.79, + "learning_rate": 0.0003215294405081847, + "loss": 0.387, + "step": 146650 + }, + { + "epoch": 35.79, + "learning_rate": 0.00032149890056193506, + "loss": 0.3573, + "step": 146675 + }, + { + "epoch": 35.8, + "learning_rate": 0.0003214683606156853, + "loss": 0.373, + "step": 146700 + }, + { + "epoch": 35.8, + "learning_rate": 0.0003214378206694356, + "loss": 0.3215, + "step": 146725 + }, + { + "epoch": 35.81, + "learning_rate": 0.0003214072807231859, + "loss": 0.3953, + "step": 146750 + }, + { + "epoch": 35.82, + "learning_rate": 0.0003213767407769362, + "loss": 0.3182, + "step": 146775 + }, + { + "epoch": 35.82, + "learning_rate": 0.0003213462008306866, + "loss": 0.4039, + "step": 146800 + }, + { + "epoch": 35.83, + "learning_rate": 0.0003213156608844369, + "loss": 0.3126, + "step": 146825 + }, + { + "epoch": 35.83, + "learning_rate": 0.0003212851209381872, + "loss": 0.3938, + "step": 146850 + }, + { + "epoch": 35.84, + "learning_rate": 0.00032125458099193743, + "loss": 0.3636, + "step": 146875 + }, + { + "epoch": 35.85, + "learning_rate": 0.00032122404104568774, + "loss": 0.3621, + "step": 146900 + }, + { + "epoch": 35.85, + "learning_rate": 0.0003211935010994381, + "loss": 0.3415, + "step": 146925 + }, + { + "epoch": 35.86, + "learning_rate": 0.0003211629611531884, + "loss": 0.4049, + "step": 146950 + }, + { + "epoch": 35.87, + "learning_rate": 0.0003211324212069387, + "loss": 0.2868, + "step": 146975 + }, + { + "epoch": 35.87, + "learning_rate": 0.000321101881260689, + "loss": 0.3831, + "step": 147000 + }, + { + "epoch": 35.87, + "eval_cer": 0.09333901419874131, + "eval_loss": 0.3962480425834656, + "eval_runtime": 148.6843, + "eval_samples_per_second": 28.201, + "eval_steps_per_second": 7.055, + "eval_wer": 0.3842414355628059, + "step": 147000 + }, + { + "epoch": 35.88, + "learning_rate": 0.00032107134131443925, + "loss": 0.3714, + "step": 147025 + }, + { + "epoch": 35.88, + "learning_rate": 0.0003210408013681896, + "loss": 0.4221, + "step": 147050 + }, + { + "epoch": 35.89, + "learning_rate": 0.0003210102614219399, + "loss": 0.3564, + "step": 147075 + }, + { + "epoch": 35.9, + "learning_rate": 0.0003209797214756902, + "loss": 0.398, + "step": 147100 + }, + { + "epoch": 35.9, + "learning_rate": 0.0003209491815294405, + "loss": 0.3744, + "step": 147125 + }, + { + "epoch": 35.91, + "learning_rate": 0.0003209186415831908, + "loss": 0.3761, + "step": 147150 + }, + { + "epoch": 35.91, + "learning_rate": 0.00032088810163694107, + "loss": 0.3845, + "step": 147175 + }, + { + "epoch": 35.92, + "learning_rate": 0.00032085756169069143, + "loss": 0.4164, + "step": 147200 + }, + { + "epoch": 35.93, + "learning_rate": 0.00032082702174444173, + "loss": 0.3672, + "step": 147225 + }, + { + "epoch": 35.93, + "learning_rate": 0.00032079648179819204, + "loss": 0.3552, + "step": 147250 + }, + { + "epoch": 35.94, + "learning_rate": 0.00032076594185194234, + "loss": 0.3435, + "step": 147275 + }, + { + "epoch": 35.94, + "learning_rate": 0.00032073540190569264, + "loss": 0.3759, + "step": 147300 + }, + { + "epoch": 35.95, + "learning_rate": 0.000320704861959443, + "loss": 0.3765, + "step": 147325 + }, + { + "epoch": 35.96, + "learning_rate": 0.00032067432201319325, + "loss": 0.3909, + "step": 147350 + }, + { + "epoch": 35.96, + "learning_rate": 0.00032064378206694355, + "loss": 0.3515, + "step": 147375 + }, + { + "epoch": 35.97, + "learning_rate": 0.00032061324212069386, + "loss": 0.3989, + "step": 147400 + }, + { + "epoch": 35.97, + "learning_rate": 0.00032058270217444416, + "loss": 0.3365, + "step": 147425 + }, + { + "epoch": 35.98, + "learning_rate": 0.0003205521622281945, + "loss": 0.3786, + "step": 147450 + }, + { + "epoch": 35.99, + "learning_rate": 0.0003205216222819448, + "loss": 0.3397, + "step": 147475 + }, + { + "epoch": 35.99, + "learning_rate": 0.00032049108233569507, + "loss": 0.3643, + "step": 147500 + }, + { + "epoch": 36.0, + "learning_rate": 0.0003204605423894454, + "loss": 0.4007, + "step": 147525 + }, + { + "epoch": 36.01, + "learning_rate": 0.0003204300024431957, + "loss": 0.3823, + "step": 147550 + }, + { + "epoch": 36.01, + "learning_rate": 0.00032039946249694603, + "loss": 0.329, + "step": 147575 + }, + { + "epoch": 36.02, + "learning_rate": 0.00032036892255069634, + "loss": 0.383, + "step": 147600 + }, + { + "epoch": 36.02, + "learning_rate": 0.00032033838260444664, + "loss": 0.3285, + "step": 147625 + }, + { + "epoch": 36.03, + "learning_rate": 0.0003203078426581969, + "loss": 0.3687, + "step": 147650 + }, + { + "epoch": 36.04, + "learning_rate": 0.0003202773027119472, + "loss": 0.3371, + "step": 147675 + }, + { + "epoch": 36.04, + "learning_rate": 0.00032024676276569755, + "loss": 0.3651, + "step": 147700 + }, + { + "epoch": 36.05, + "learning_rate": 0.00032021622281944785, + "loss": 0.3373, + "step": 147725 + }, + { + "epoch": 36.05, + "learning_rate": 0.00032018568287319816, + "loss": 0.3969, + "step": 147750 + }, + { + "epoch": 36.06, + "learning_rate": 0.00032015514292694846, + "loss": 0.3296, + "step": 147775 + }, + { + "epoch": 36.07, + "learning_rate": 0.00032012460298069876, + "loss": 0.378, + "step": 147800 + }, + { + "epoch": 36.07, + "learning_rate": 0.00032009406303444907, + "loss": 0.3491, + "step": 147825 + }, + { + "epoch": 36.08, + "learning_rate": 0.00032006352308819937, + "loss": 0.3889, + "step": 147850 + }, + { + "epoch": 36.08, + "learning_rate": 0.0003200329831419497, + "loss": 0.3165, + "step": 147875 + }, + { + "epoch": 36.09, + "learning_rate": 0.0003200024431957, + "loss": 0.3961, + "step": 147900 + }, + { + "epoch": 36.1, + "learning_rate": 0.0003199719032494503, + "loss": 0.3166, + "step": 147925 + }, + { + "epoch": 36.1, + "learning_rate": 0.00031994136330320064, + "loss": 0.3755, + "step": 147950 + }, + { + "epoch": 36.11, + "learning_rate": 0.0003199108233569509, + "loss": 0.3135, + "step": 147975 + }, + { + "epoch": 36.12, + "learning_rate": 0.0003198802834107012, + "loss": 0.3744, + "step": 148000 + }, + { + "epoch": 36.12, + "learning_rate": 0.0003198497434644515, + "loss": 0.3229, + "step": 148025 + }, + { + "epoch": 36.13, + "learning_rate": 0.0003198192035182018, + "loss": 0.3819, + "step": 148050 + }, + { + "epoch": 36.13, + "learning_rate": 0.00031978866357195216, + "loss": 0.3388, + "step": 148075 + }, + { + "epoch": 36.14, + "learning_rate": 0.00031975812362570246, + "loss": 0.3758, + "step": 148100 + }, + { + "epoch": 36.15, + "learning_rate": 0.0003197275836794527, + "loss": 0.3504, + "step": 148125 + }, + { + "epoch": 36.15, + "learning_rate": 0.000319697043733203, + "loss": 0.3758, + "step": 148150 + }, + { + "epoch": 36.16, + "learning_rate": 0.0003196665037869533, + "loss": 0.3839, + "step": 148175 + }, + { + "epoch": 36.16, + "learning_rate": 0.00031963596384070367, + "loss": 0.3664, + "step": 148200 + }, + { + "epoch": 36.17, + "learning_rate": 0.000319605423894454, + "loss": 0.3364, + "step": 148225 + }, + { + "epoch": 36.18, + "learning_rate": 0.0003195748839482043, + "loss": 0.3849, + "step": 148250 + }, + { + "epoch": 36.18, + "learning_rate": 0.0003195443440019546, + "loss": 0.3492, + "step": 148275 + }, + { + "epoch": 36.19, + "learning_rate": 0.00031951380405570483, + "loss": 0.3773, + "step": 148300 + }, + { + "epoch": 36.19, + "learning_rate": 0.0003194832641094552, + "loss": 0.3099, + "step": 148325 + }, + { + "epoch": 36.2, + "learning_rate": 0.0003194527241632055, + "loss": 0.3811, + "step": 148350 + }, + { + "epoch": 36.21, + "learning_rate": 0.0003194221842169558, + "loss": 0.3234, + "step": 148375 + }, + { + "epoch": 36.21, + "learning_rate": 0.0003193916442707061, + "loss": 0.4036, + "step": 148400 + }, + { + "epoch": 36.22, + "learning_rate": 0.0003193611043244564, + "loss": 0.2925, + "step": 148425 + }, + { + "epoch": 36.22, + "learning_rate": 0.00031933056437820665, + "loss": 0.3937, + "step": 148450 + }, + { + "epoch": 36.23, + "learning_rate": 0.000319300024431957, + "loss": 0.3269, + "step": 148475 + }, + { + "epoch": 36.24, + "learning_rate": 0.0003192694844857073, + "loss": 0.3872, + "step": 148500 + }, + { + "epoch": 36.24, + "learning_rate": 0.0003192389445394576, + "loss": 0.3289, + "step": 148525 + }, + { + "epoch": 36.25, + "learning_rate": 0.0003192084045932079, + "loss": 0.3613, + "step": 148550 + }, + { + "epoch": 36.26, + "learning_rate": 0.0003191778646469582, + "loss": 0.3232, + "step": 148575 + }, + { + "epoch": 36.26, + "learning_rate": 0.0003191473247007085, + "loss": 0.3684, + "step": 148600 + }, + { + "epoch": 36.27, + "learning_rate": 0.00031911678475445883, + "loss": 0.3468, + "step": 148625 + }, + { + "epoch": 36.27, + "learning_rate": 0.00031908624480820913, + "loss": 0.385, + "step": 148650 + }, + { + "epoch": 36.28, + "learning_rate": 0.00031905570486195944, + "loss": 0.3279, + "step": 148675 + }, + { + "epoch": 36.29, + "learning_rate": 0.00031902516491570974, + "loss": 0.3795, + "step": 148700 + }, + { + "epoch": 36.29, + "learning_rate": 0.0003189946249694601, + "loss": 0.3429, + "step": 148725 + }, + { + "epoch": 36.3, + "learning_rate": 0.0003189640850232104, + "loss": 0.3697, + "step": 148750 + }, + { + "epoch": 36.3, + "learning_rate": 0.00031893354507696065, + "loss": 0.3696, + "step": 148775 + }, + { + "epoch": 36.31, + "learning_rate": 0.00031890300513071095, + "loss": 0.3479, + "step": 148800 + }, + { + "epoch": 36.32, + "learning_rate": 0.00031887246518446126, + "loss": 0.3308, + "step": 148825 + }, + { + "epoch": 36.32, + "learning_rate": 0.0003188419252382116, + "loss": 0.3699, + "step": 148850 + }, + { + "epoch": 36.33, + "learning_rate": 0.0003188113852919619, + "loss": 0.3258, + "step": 148875 + }, + { + "epoch": 36.33, + "learning_rate": 0.0003187808453457122, + "loss": 0.3816, + "step": 148900 + }, + { + "epoch": 36.34, + "learning_rate": 0.00031875030539946247, + "loss": 0.3045, + "step": 148925 + }, + { + "epoch": 36.35, + "learning_rate": 0.00031871976545321277, + "loss": 0.3856, + "step": 148950 + }, + { + "epoch": 36.35, + "learning_rate": 0.00031868922550696313, + "loss": 0.3719, + "step": 148975 + }, + { + "epoch": 36.36, + "learning_rate": 0.00031865868556071343, + "loss": 0.3844, + "step": 149000 + }, + { + "epoch": 36.37, + "learning_rate": 0.00031862814561446374, + "loss": 0.3496, + "step": 149025 + }, + { + "epoch": 36.37, + "learning_rate": 0.00031859760566821404, + "loss": 0.379, + "step": 149050 + }, + { + "epoch": 36.38, + "learning_rate": 0.0003185670657219643, + "loss": 0.3435, + "step": 149075 + }, + { + "epoch": 36.38, + "learning_rate": 0.00031853652577571465, + "loss": 0.3707, + "step": 149100 + }, + { + "epoch": 36.39, + "learning_rate": 0.00031850598582946495, + "loss": 0.3272, + "step": 149125 + }, + { + "epoch": 36.4, + "learning_rate": 0.00031847544588321525, + "loss": 0.3826, + "step": 149150 + }, + { + "epoch": 36.4, + "learning_rate": 0.00031844490593696556, + "loss": 0.3228, + "step": 149175 + }, + { + "epoch": 36.41, + "learning_rate": 0.00031841436599071586, + "loss": 0.3787, + "step": 149200 + }, + { + "epoch": 36.41, + "learning_rate": 0.0003183838260444662, + "loss": 0.3101, + "step": 149225 + }, + { + "epoch": 36.42, + "learning_rate": 0.00031835328609821647, + "loss": 0.3894, + "step": 149250 + }, + { + "epoch": 36.43, + "learning_rate": 0.00031832274615196677, + "loss": 0.3226, + "step": 149275 + }, + { + "epoch": 36.43, + "learning_rate": 0.0003182922062057171, + "loss": 0.3965, + "step": 149300 + }, + { + "epoch": 36.44, + "learning_rate": 0.0003182616662594674, + "loss": 0.3584, + "step": 149325 + }, + { + "epoch": 36.44, + "learning_rate": 0.00031823112631321773, + "loss": 0.402, + "step": 149350 + }, + { + "epoch": 36.45, + "learning_rate": 0.00031820058636696804, + "loss": 0.3279, + "step": 149375 + }, + { + "epoch": 36.46, + "learning_rate": 0.0003181700464207183, + "loss": 0.3963, + "step": 149400 + }, + { + "epoch": 36.46, + "learning_rate": 0.0003181395064744686, + "loss": 0.3839, + "step": 149425 + }, + { + "epoch": 36.47, + "learning_rate": 0.0003181089665282189, + "loss": 0.3805, + "step": 149450 + }, + { + "epoch": 36.48, + "learning_rate": 0.00031807842658196925, + "loss": 0.3281, + "step": 149475 + }, + { + "epoch": 36.48, + "learning_rate": 0.00031804788663571955, + "loss": 0.4039, + "step": 149500 + }, + { + "epoch": 36.49, + "learning_rate": 0.00031801734668946986, + "loss": 0.3571, + "step": 149525 + }, + { + "epoch": 36.49, + "learning_rate": 0.0003179868067432201, + "loss": 0.3404, + "step": 149550 + }, + { + "epoch": 36.5, + "learning_rate": 0.0003179562667969704, + "loss": 0.3561, + "step": 149575 + }, + { + "epoch": 36.51, + "learning_rate": 0.00031792572685072077, + "loss": 0.3672, + "step": 149600 + }, + { + "epoch": 36.51, + "learning_rate": 0.00031789518690447107, + "loss": 0.3173, + "step": 149625 + }, + { + "epoch": 36.52, + "learning_rate": 0.0003178646469582214, + "loss": 0.4015, + "step": 149650 + }, + { + "epoch": 36.52, + "learning_rate": 0.0003178341070119717, + "loss": 0.3559, + "step": 149675 + }, + { + "epoch": 36.53, + "learning_rate": 0.00031780356706572193, + "loss": 0.3795, + "step": 149700 + }, + { + "epoch": 36.54, + "learning_rate": 0.00031777302711947223, + "loss": 0.3588, + "step": 149725 + }, + { + "epoch": 36.54, + "learning_rate": 0.0003177424871732226, + "loss": 0.4294, + "step": 149750 + }, + { + "epoch": 36.55, + "learning_rate": 0.0003177119472269729, + "loss": 0.3245, + "step": 149775 + }, + { + "epoch": 36.55, + "learning_rate": 0.0003176814072807232, + "loss": 0.3661, + "step": 149800 + }, + { + "epoch": 36.56, + "learning_rate": 0.0003176508673344735, + "loss": 0.3169, + "step": 149825 + }, + { + "epoch": 36.57, + "learning_rate": 0.0003176203273882238, + "loss": 0.3811, + "step": 149850 + }, + { + "epoch": 36.57, + "learning_rate": 0.0003175897874419741, + "loss": 0.377, + "step": 149875 + }, + { + "epoch": 36.58, + "learning_rate": 0.0003175592474957244, + "loss": 0.3724, + "step": 149900 + }, + { + "epoch": 36.58, + "learning_rate": 0.0003175287075494747, + "loss": 0.3341, + "step": 149925 + }, + { + "epoch": 36.59, + "learning_rate": 0.000317498167603225, + "loss": 0.3699, + "step": 149950 + }, + { + "epoch": 36.6, + "learning_rate": 0.0003174676276569753, + "loss": 0.3583, + "step": 149975 + }, + { + "epoch": 36.6, + "learning_rate": 0.0003174370877107257, + "loss": 0.408, + "step": 150000 + }, + { + "epoch": 36.6, + "eval_cer": 0.09135242240998737, + "eval_loss": 0.4018867313861847, + "eval_runtime": 149.0214, + "eval_samples_per_second": 28.137, + "eval_steps_per_second": 7.039, + "eval_wer": 0.3780750407830343, + "step": 150000 + }, + { + "epoch": 36.61, + "learning_rate": 0.0003174065477644759, + "loss": 0.3359, + "step": 150025 + }, + { + "epoch": 36.62, + "learning_rate": 0.00031737600781822623, + "loss": 0.3467, + "step": 150050 + }, + { + "epoch": 36.62, + "learning_rate": 0.00031734546787197653, + "loss": 0.3999, + "step": 150075 + }, + { + "epoch": 36.63, + "learning_rate": 0.00031731492792572684, + "loss": 0.3519, + "step": 150100 + }, + { + "epoch": 36.63, + "learning_rate": 0.0003172843879794772, + "loss": 0.3624, + "step": 150125 + }, + { + "epoch": 36.64, + "learning_rate": 0.0003172538480332275, + "loss": 0.4109, + "step": 150150 + }, + { + "epoch": 36.65, + "learning_rate": 0.00031722330808697775, + "loss": 0.3374, + "step": 150175 + }, + { + "epoch": 36.65, + "learning_rate": 0.00031719398973857805, + "loss": 0.4039, + "step": 150200 + }, + { + "epoch": 36.66, + "learning_rate": 0.00031716344979232835, + "loss": 0.3698, + "step": 150225 + }, + { + "epoch": 36.66, + "learning_rate": 0.00031713290984607866, + "loss": 0.3895, + "step": 150250 + }, + { + "epoch": 36.67, + "learning_rate": 0.000317102369899829, + "loss": 0.3492, + "step": 150275 + }, + { + "epoch": 36.68, + "learning_rate": 0.0003170718299535793, + "loss": 0.3893, + "step": 150300 + }, + { + "epoch": 36.68, + "learning_rate": 0.0003170412900073296, + "loss": 0.3069, + "step": 150325 + }, + { + "epoch": 36.69, + "learning_rate": 0.00031701075006107987, + "loss": 0.3858, + "step": 150350 + }, + { + "epoch": 36.69, + "learning_rate": 0.0003169802101148302, + "loss": 0.3083, + "step": 150375 + }, + { + "epoch": 36.7, + "learning_rate": 0.00031694967016858053, + "loss": 0.3714, + "step": 150400 + }, + { + "epoch": 36.71, + "learning_rate": 0.00031691913022233084, + "loss": 0.3288, + "step": 150425 + }, + { + "epoch": 36.71, + "learning_rate": 0.00031688859027608114, + "loss": 0.4096, + "step": 150450 + }, + { + "epoch": 36.72, + "learning_rate": 0.00031685805032983144, + "loss": 0.3209, + "step": 150475 + }, + { + "epoch": 36.73, + "learning_rate": 0.0003168275103835817, + "loss": 0.3546, + "step": 150500 + }, + { + "epoch": 36.73, + "learning_rate": 0.000316796970437332, + "loss": 0.3455, + "step": 150525 + }, + { + "epoch": 36.74, + "learning_rate": 0.00031676643049108235, + "loss": 0.3994, + "step": 150550 + }, + { + "epoch": 36.74, + "learning_rate": 0.00031673589054483266, + "loss": 0.3656, + "step": 150575 + }, + { + "epoch": 36.75, + "learning_rate": 0.00031670535059858296, + "loss": 0.3779, + "step": 150600 + }, + { + "epoch": 36.76, + "learning_rate": 0.00031667481065233326, + "loss": 0.3492, + "step": 150625 + }, + { + "epoch": 36.76, + "learning_rate": 0.0003166442707060835, + "loss": 0.3824, + "step": 150650 + }, + { + "epoch": 36.77, + "learning_rate": 0.00031661373075983387, + "loss": 0.3349, + "step": 150675 + }, + { + "epoch": 36.77, + "learning_rate": 0.00031658319081358417, + "loss": 0.3545, + "step": 150700 + }, + { + "epoch": 36.78, + "learning_rate": 0.0003165526508673345, + "loss": 0.3335, + "step": 150725 + }, + { + "epoch": 36.79, + "learning_rate": 0.0003165221109210848, + "loss": 0.3794, + "step": 150750 + }, + { + "epoch": 36.79, + "learning_rate": 0.0003164915709748351, + "loss": 0.3286, + "step": 150775 + }, + { + "epoch": 36.8, + "learning_rate": 0.00031646103102858544, + "loss": 0.4115, + "step": 150800 + }, + { + "epoch": 36.8, + "learning_rate": 0.0003164304910823357, + "loss": 0.3495, + "step": 150825 + }, + { + "epoch": 36.81, + "learning_rate": 0.000316399951136086, + "loss": 0.3778, + "step": 150850 + }, + { + "epoch": 36.82, + "learning_rate": 0.0003163694111898363, + "loss": 0.3178, + "step": 150875 + }, + { + "epoch": 36.82, + "learning_rate": 0.0003163388712435866, + "loss": 0.3725, + "step": 150900 + }, + { + "epoch": 36.83, + "learning_rate": 0.00031630833129733696, + "loss": 0.324, + "step": 150925 + }, + { + "epoch": 36.84, + "learning_rate": 0.00031627779135108726, + "loss": 0.3948, + "step": 150950 + }, + { + "epoch": 36.84, + "learning_rate": 0.0003162472514048375, + "loss": 0.3707, + "step": 150975 + }, + { + "epoch": 36.85, + "learning_rate": 0.0003162167114585878, + "loss": 0.3868, + "step": 151000 + }, + { + "epoch": 36.85, + "learning_rate": 0.0003161861715123381, + "loss": 0.3439, + "step": 151025 + }, + { + "epoch": 36.86, + "learning_rate": 0.0003161556315660885, + "loss": 0.3855, + "step": 151050 + }, + { + "epoch": 36.87, + "learning_rate": 0.0003161250916198388, + "loss": 0.3445, + "step": 151075 + }, + { + "epoch": 36.87, + "learning_rate": 0.0003160945516735891, + "loss": 0.3752, + "step": 151100 + }, + { + "epoch": 36.88, + "learning_rate": 0.00031606401172733933, + "loss": 0.3755, + "step": 151125 + }, + { + "epoch": 36.88, + "learning_rate": 0.00031603347178108963, + "loss": 0.4136, + "step": 151150 + }, + { + "epoch": 36.89, + "learning_rate": 0.00031600293183484, + "loss": 0.3776, + "step": 151175 + }, + { + "epoch": 36.9, + "learning_rate": 0.0003159723918885903, + "loss": 0.3947, + "step": 151200 + }, + { + "epoch": 36.9, + "learning_rate": 0.0003159418519423406, + "loss": 0.3663, + "step": 151225 + }, + { + "epoch": 36.91, + "learning_rate": 0.0003159113119960909, + "loss": 0.3671, + "step": 151250 + }, + { + "epoch": 36.91, + "learning_rate": 0.0003158807720498412, + "loss": 0.3609, + "step": 151275 + }, + { + "epoch": 36.92, + "learning_rate": 0.0003158502321035915, + "loss": 0.3713, + "step": 151300 + }, + { + "epoch": 36.93, + "learning_rate": 0.0003158196921573418, + "loss": 0.3369, + "step": 151325 + }, + { + "epoch": 36.93, + "learning_rate": 0.0003157891522110921, + "loss": 0.3894, + "step": 151350 + }, + { + "epoch": 36.94, + "learning_rate": 0.0003157586122648424, + "loss": 0.3614, + "step": 151375 + }, + { + "epoch": 36.94, + "learning_rate": 0.0003157280723185927, + "loss": 0.3813, + "step": 151400 + }, + { + "epoch": 36.95, + "learning_rate": 0.0003156975323723431, + "loss": 0.3522, + "step": 151425 + }, + { + "epoch": 36.96, + "learning_rate": 0.00031566699242609333, + "loss": 0.3855, + "step": 151450 + }, + { + "epoch": 36.96, + "learning_rate": 0.00031563645247984363, + "loss": 0.3148, + "step": 151475 + }, + { + "epoch": 36.97, + "learning_rate": 0.00031560591253359393, + "loss": 0.4214, + "step": 151500 + }, + { + "epoch": 36.98, + "learning_rate": 0.00031557537258734424, + "loss": 0.3241, + "step": 151525 + }, + { + "epoch": 36.98, + "learning_rate": 0.0003155448326410946, + "loss": 0.412, + "step": 151550 + }, + { + "epoch": 36.99, + "learning_rate": 0.0003155142926948449, + "loss": 0.397, + "step": 151575 + }, + { + "epoch": 36.99, + "learning_rate": 0.00031548375274859515, + "loss": 0.3947, + "step": 151600 + }, + { + "epoch": 37.0, + "learning_rate": 0.00031545321280234545, + "loss": 0.295, + "step": 151625 + }, + { + "epoch": 37.01, + "learning_rate": 0.00031542267285609575, + "loss": 0.4214, + "step": 151650 + }, + { + "epoch": 37.01, + "learning_rate": 0.0003153921329098461, + "loss": 0.3445, + "step": 151675 + }, + { + "epoch": 37.02, + "learning_rate": 0.0003153615929635964, + "loss": 0.371, + "step": 151700 + }, + { + "epoch": 37.02, + "learning_rate": 0.0003153310530173467, + "loss": 0.3183, + "step": 151725 + }, + { + "epoch": 37.03, + "learning_rate": 0.000315300513071097, + "loss": 0.3857, + "step": 151750 + }, + { + "epoch": 37.04, + "learning_rate": 0.00031526997312484727, + "loss": 0.3127, + "step": 151775 + }, + { + "epoch": 37.04, + "learning_rate": 0.0003152394331785976, + "loss": 0.3762, + "step": 151800 + }, + { + "epoch": 37.05, + "learning_rate": 0.00031520889323234793, + "loss": 0.3028, + "step": 151825 + }, + { + "epoch": 37.05, + "learning_rate": 0.00031517835328609824, + "loss": 0.3879, + "step": 151850 + }, + { + "epoch": 37.06, + "learning_rate": 0.00031514781333984854, + "loss": 0.3842, + "step": 151875 + }, + { + "epoch": 37.07, + "learning_rate": 0.00031511727339359884, + "loss": 0.3761, + "step": 151900 + }, + { + "epoch": 37.07, + "learning_rate": 0.0003150867334473491, + "loss": 0.346, + "step": 151925 + }, + { + "epoch": 37.08, + "learning_rate": 0.00031505619350109945, + "loss": 0.3817, + "step": 151950 + }, + { + "epoch": 37.09, + "learning_rate": 0.00031502565355484975, + "loss": 0.3488, + "step": 151975 + }, + { + "epoch": 37.09, + "learning_rate": 0.00031499511360860006, + "loss": 0.3675, + "step": 152000 + }, + { + "epoch": 37.1, + "learning_rate": 0.00031496457366235036, + "loss": 0.3434, + "step": 152025 + }, + { + "epoch": 37.1, + "learning_rate": 0.00031493403371610066, + "loss": 0.3962, + "step": 152050 + }, + { + "epoch": 37.11, + "learning_rate": 0.00031490349376985097, + "loss": 0.3325, + "step": 152075 + }, + { + "epoch": 37.12, + "learning_rate": 0.00031487295382360127, + "loss": 0.3673, + "step": 152100 + }, + { + "epoch": 37.12, + "learning_rate": 0.00031484241387735157, + "loss": 0.3133, + "step": 152125 + }, + { + "epoch": 37.13, + "learning_rate": 0.0003148118739311019, + "loss": 0.3723, + "step": 152150 + }, + { + "epoch": 37.13, + "learning_rate": 0.0003147813339848522, + "loss": 0.366, + "step": 152175 + }, + { + "epoch": 37.14, + "learning_rate": 0.00031475079403860254, + "loss": 0.3774, + "step": 152200 + }, + { + "epoch": 37.15, + "learning_rate": 0.00031472025409235284, + "loss": 0.3535, + "step": 152225 + }, + { + "epoch": 37.15, + "learning_rate": 0.0003146897141461031, + "loss": 0.3537, + "step": 152250 + }, + { + "epoch": 37.16, + "learning_rate": 0.0003146603957977034, + "loss": 0.309, + "step": 152275 + }, + { + "epoch": 37.16, + "learning_rate": 0.0003146298558514537, + "loss": 0.3716, + "step": 152300 + }, + { + "epoch": 37.17, + "learning_rate": 0.000314599315905204, + "loss": 0.3139, + "step": 152325 + }, + { + "epoch": 37.18, + "learning_rate": 0.00031456877595895436, + "loss": 0.3545, + "step": 152350 + }, + { + "epoch": 37.18, + "learning_rate": 0.00031453823601270466, + "loss": 0.3189, + "step": 152375 + }, + { + "epoch": 37.19, + "learning_rate": 0.0003145076960664549, + "loss": 0.375, + "step": 152400 + }, + { + "epoch": 37.19, + "learning_rate": 0.0003144771561202052, + "loss": 0.366, + "step": 152425 + }, + { + "epoch": 37.2, + "learning_rate": 0.0003144466161739555, + "loss": 0.3618, + "step": 152450 + }, + { + "epoch": 37.21, + "learning_rate": 0.0003144160762277059, + "loss": 0.3243, + "step": 152475 + }, + { + "epoch": 37.21, + "learning_rate": 0.0003143855362814562, + "loss": 0.3805, + "step": 152500 + }, + { + "epoch": 37.22, + "learning_rate": 0.0003143549963352065, + "loss": 0.3194, + "step": 152525 + }, + { + "epoch": 37.23, + "learning_rate": 0.00031432445638895673, + "loss": 0.3671, + "step": 152550 + }, + { + "epoch": 37.23, + "learning_rate": 0.00031429391644270704, + "loss": 0.3048, + "step": 152575 + }, + { + "epoch": 37.24, + "learning_rate": 0.00031426337649645734, + "loss": 0.3994, + "step": 152600 + }, + { + "epoch": 37.24, + "learning_rate": 0.0003142328365502077, + "loss": 0.3395, + "step": 152625 + }, + { + "epoch": 37.25, + "learning_rate": 0.000314202296603958, + "loss": 0.3874, + "step": 152650 + }, + { + "epoch": 37.26, + "learning_rate": 0.0003141717566577083, + "loss": 0.3063, + "step": 152675 + }, + { + "epoch": 37.26, + "learning_rate": 0.0003141412167114586, + "loss": 0.3598, + "step": 152700 + }, + { + "epoch": 37.27, + "learning_rate": 0.00031411067676520886, + "loss": 0.3066, + "step": 152725 + }, + { + "epoch": 37.27, + "learning_rate": 0.0003140801368189592, + "loss": 0.3716, + "step": 152750 + }, + { + "epoch": 37.28, + "learning_rate": 0.0003140495968727095, + "loss": 0.3447, + "step": 152775 + }, + { + "epoch": 37.29, + "learning_rate": 0.0003140190569264598, + "loss": 0.394, + "step": 152800 + }, + { + "epoch": 37.29, + "learning_rate": 0.0003139885169802101, + "loss": 0.3836, + "step": 152825 + }, + { + "epoch": 37.3, + "learning_rate": 0.0003139579770339604, + "loss": 0.3557, + "step": 152850 + }, + { + "epoch": 37.3, + "learning_rate": 0.00031392743708771073, + "loss": 0.3331, + "step": 152875 + }, + { + "epoch": 37.31, + "learning_rate": 0.00031389689714146103, + "loss": 0.379, + "step": 152900 + }, + { + "epoch": 37.32, + "learning_rate": 0.00031386635719521134, + "loss": 0.3065, + "step": 152925 + }, + { + "epoch": 37.32, + "learning_rate": 0.00031383581724896164, + "loss": 0.3761, + "step": 152950 + }, + { + "epoch": 37.33, + "learning_rate": 0.00031380527730271194, + "loss": 0.3338, + "step": 152975 + }, + { + "epoch": 37.34, + "learning_rate": 0.0003137747373564623, + "loss": 0.3632, + "step": 153000 + }, + { + "epoch": 37.34, + "eval_cer": 0.09168095438538854, + "eval_loss": 0.40829116106033325, + "eval_runtime": 148.4618, + "eval_samples_per_second": 28.243, + "eval_steps_per_second": 7.066, + "eval_wer": 0.38140293637846656, + "step": 153000 + }, + { + "epoch": 37.34, + "learning_rate": 0.00031374419741021255, + "loss": 0.3374, + "step": 153025 + }, + { + "epoch": 37.35, + "learning_rate": 0.00031371365746396285, + "loss": 0.383, + "step": 153050 + }, + { + "epoch": 37.35, + "learning_rate": 0.00031368311751771316, + "loss": 0.3429, + "step": 153075 + }, + { + "epoch": 37.36, + "learning_rate": 0.00031365257757146346, + "loss": 0.3699, + "step": 153100 + }, + { + "epoch": 37.37, + "learning_rate": 0.0003136220376252138, + "loss": 0.3116, + "step": 153125 + }, + { + "epoch": 37.37, + "learning_rate": 0.0003135914976789641, + "loss": 0.3865, + "step": 153150 + }, + { + "epoch": 37.38, + "learning_rate": 0.0003135609577327144, + "loss": 0.3409, + "step": 153175 + }, + { + "epoch": 37.38, + "learning_rate": 0.0003135304177864647, + "loss": 0.372, + "step": 153200 + }, + { + "epoch": 37.39, + "learning_rate": 0.000313499877840215, + "loss": 0.3812, + "step": 153225 + }, + { + "epoch": 37.4, + "learning_rate": 0.00031346933789396533, + "loss": 0.373, + "step": 153250 + }, + { + "epoch": 37.4, + "learning_rate": 0.00031343879794771564, + "loss": 0.3142, + "step": 153275 + }, + { + "epoch": 37.41, + "learning_rate": 0.00031340825800146594, + "loss": 0.3495, + "step": 153300 + }, + { + "epoch": 37.41, + "learning_rate": 0.00031337771805521624, + "loss": 0.3527, + "step": 153325 + }, + { + "epoch": 37.42, + "learning_rate": 0.0003133471781089665, + "loss": 0.3969, + "step": 153350 + }, + { + "epoch": 37.43, + "learning_rate": 0.00031331663816271685, + "loss": 0.3238, + "step": 153375 + }, + { + "epoch": 37.43, + "learning_rate": 0.00031328609821646715, + "loss": 0.3597, + "step": 153400 + }, + { + "epoch": 37.44, + "learning_rate": 0.00031325555827021746, + "loss": 0.3015, + "step": 153425 + }, + { + "epoch": 37.45, + "learning_rate": 0.00031322501832396776, + "loss": 0.3801, + "step": 153450 + }, + { + "epoch": 37.45, + "learning_rate": 0.00031319447837771806, + "loss": 0.3414, + "step": 153475 + }, + { + "epoch": 37.46, + "learning_rate": 0.00031316393843146837, + "loss": 0.3881, + "step": 153500 + }, + { + "epoch": 37.46, + "learning_rate": 0.00031313339848521867, + "loss": 0.3183, + "step": 153525 + }, + { + "epoch": 37.47, + "learning_rate": 0.000313102858538969, + "loss": 0.3875, + "step": 153550 + }, + { + "epoch": 37.48, + "learning_rate": 0.0003130723185927193, + "loss": 0.3188, + "step": 153575 + }, + { + "epoch": 37.48, + "learning_rate": 0.0003130417786464696, + "loss": 0.3813, + "step": 153600 + }, + { + "epoch": 37.49, + "learning_rate": 0.00031301123870021994, + "loss": 0.3453, + "step": 153625 + }, + { + "epoch": 37.49, + "learning_rate": 0.0003129806987539702, + "loss": 0.3438, + "step": 153650 + }, + { + "epoch": 37.5, + "learning_rate": 0.0003129501588077205, + "loss": 0.3138, + "step": 153675 + }, + { + "epoch": 37.51, + "learning_rate": 0.0003129196188614708, + "loss": 0.3745, + "step": 153700 + }, + { + "epoch": 37.51, + "learning_rate": 0.0003128890789152211, + "loss": 0.3121, + "step": 153725 + }, + { + "epoch": 37.52, + "learning_rate": 0.00031285853896897145, + "loss": 0.3774, + "step": 153750 + }, + { + "epoch": 37.52, + "learning_rate": 0.00031282799902272176, + "loss": 0.3335, + "step": 153775 + }, + { + "epoch": 37.53, + "learning_rate": 0.00031279745907647206, + "loss": 0.3647, + "step": 153800 + }, + { + "epoch": 37.54, + "learning_rate": 0.0003127669191302223, + "loss": 0.3647, + "step": 153825 + }, + { + "epoch": 37.54, + "learning_rate": 0.0003127363791839726, + "loss": 0.3418, + "step": 153850 + }, + { + "epoch": 37.55, + "learning_rate": 0.0003127058392377229, + "loss": 0.3247, + "step": 153875 + }, + { + "epoch": 37.55, + "learning_rate": 0.0003126752992914733, + "loss": 0.3909, + "step": 153900 + }, + { + "epoch": 37.56, + "learning_rate": 0.0003126447593452236, + "loss": 0.334, + "step": 153925 + }, + { + "epoch": 37.57, + "learning_rate": 0.0003126142193989739, + "loss": 0.3984, + "step": 153950 + }, + { + "epoch": 37.57, + "learning_rate": 0.00031258367945272413, + "loss": 0.3609, + "step": 153975 + }, + { + "epoch": 37.58, + "learning_rate": 0.00031255313950647443, + "loss": 0.3759, + "step": 154000 + }, + { + "epoch": 37.59, + "learning_rate": 0.0003125225995602248, + "loss": 0.3416, + "step": 154025 + }, + { + "epoch": 37.59, + "learning_rate": 0.0003124920596139751, + "loss": 0.4028, + "step": 154050 + }, + { + "epoch": 37.6, + "learning_rate": 0.0003124615196677254, + "loss": 0.341, + "step": 154075 + }, + { + "epoch": 37.6, + "learning_rate": 0.0003124309797214757, + "loss": 0.3857, + "step": 154100 + }, + { + "epoch": 37.61, + "learning_rate": 0.00031240043977522595, + "loss": 0.3042, + "step": 154125 + }, + { + "epoch": 37.62, + "learning_rate": 0.0003123698998289763, + "loss": 0.3616, + "step": 154150 + }, + { + "epoch": 37.62, + "learning_rate": 0.0003123393598827266, + "loss": 0.3524, + "step": 154175 + }, + { + "epoch": 37.63, + "learning_rate": 0.0003123088199364769, + "loss": 0.3803, + "step": 154200 + }, + { + "epoch": 37.63, + "learning_rate": 0.0003122782799902272, + "loss": 0.2806, + "step": 154225 + }, + { + "epoch": 37.64, + "learning_rate": 0.0003122477400439775, + "loss": 0.3637, + "step": 154250 + }, + { + "epoch": 37.65, + "learning_rate": 0.0003122172000977279, + "loss": 0.337, + "step": 154275 + }, + { + "epoch": 37.65, + "learning_rate": 0.00031218666015147813, + "loss": 0.3736, + "step": 154300 + }, + { + "epoch": 37.66, + "learning_rate": 0.00031215612020522843, + "loss": 0.3206, + "step": 154325 + }, + { + "epoch": 37.66, + "learning_rate": 0.00031212558025897874, + "loss": 0.346, + "step": 154350 + }, + { + "epoch": 37.67, + "learning_rate": 0.00031209504031272904, + "loss": 0.3539, + "step": 154375 + }, + { + "epoch": 37.68, + "learning_rate": 0.0003120645003664794, + "loss": 0.376, + "step": 154400 + }, + { + "epoch": 37.68, + "learning_rate": 0.0003120339604202297, + "loss": 0.3605, + "step": 154425 + }, + { + "epoch": 37.69, + "learning_rate": 0.00031200342047397995, + "loss": 0.3651, + "step": 154450 + }, + { + "epoch": 37.7, + "learning_rate": 0.00031197288052773025, + "loss": 0.3858, + "step": 154475 + }, + { + "epoch": 37.7, + "learning_rate": 0.00031194234058148056, + "loss": 0.3746, + "step": 154500 + }, + { + "epoch": 37.71, + "learning_rate": 0.0003119118006352309, + "loss": 0.3329, + "step": 154525 + }, + { + "epoch": 37.71, + "learning_rate": 0.0003118812606889812, + "loss": 0.3976, + "step": 154550 + }, + { + "epoch": 37.72, + "learning_rate": 0.0003118507207427315, + "loss": 0.3131, + "step": 154575 + }, + { + "epoch": 37.73, + "learning_rate": 0.00031182018079648177, + "loss": 0.3685, + "step": 154600 + }, + { + "epoch": 37.73, + "learning_rate": 0.00031178964085023207, + "loss": 0.3311, + "step": 154625 + }, + { + "epoch": 37.74, + "learning_rate": 0.00031175910090398243, + "loss": 0.3813, + "step": 154650 + }, + { + "epoch": 37.74, + "learning_rate": 0.00031172856095773273, + "loss": 0.3179, + "step": 154675 + }, + { + "epoch": 37.75, + "learning_rate": 0.00031169802101148304, + "loss": 0.38, + "step": 154700 + }, + { + "epoch": 37.76, + "learning_rate": 0.00031166748106523334, + "loss": 0.2989, + "step": 154725 + }, + { + "epoch": 37.76, + "learning_rate": 0.00031163694111898364, + "loss": 0.3676, + "step": 154750 + }, + { + "epoch": 37.77, + "learning_rate": 0.00031160640117273395, + "loss": 0.3427, + "step": 154775 + }, + { + "epoch": 37.77, + "learning_rate": 0.00031157586122648425, + "loss": 0.3874, + "step": 154800 + }, + { + "epoch": 37.78, + "learning_rate": 0.00031154532128023455, + "loss": 0.3477, + "step": 154825 + }, + { + "epoch": 37.79, + "learning_rate": 0.00031151478133398486, + "loss": 0.344, + "step": 154850 + }, + { + "epoch": 37.79, + "learning_rate": 0.00031148424138773516, + "loss": 0.3357, + "step": 154875 + }, + { + "epoch": 37.8, + "learning_rate": 0.0003114537014414855, + "loss": 0.3821, + "step": 154900 + }, + { + "epoch": 37.81, + "learning_rate": 0.00031142316149523577, + "loss": 0.3115, + "step": 154925 + }, + { + "epoch": 37.81, + "learning_rate": 0.00031139262154898607, + "loss": 0.3384, + "step": 154950 + }, + { + "epoch": 37.82, + "learning_rate": 0.0003113620816027364, + "loss": 0.3625, + "step": 154975 + }, + { + "epoch": 37.82, + "learning_rate": 0.0003113315416564867, + "loss": 0.383, + "step": 155000 + }, + { + "epoch": 37.83, + "learning_rate": 0.00031130100171023703, + "loss": 0.3745, + "step": 155025 + }, + { + "epoch": 37.84, + "learning_rate": 0.00031127046176398734, + "loss": 0.3998, + "step": 155050 + }, + { + "epoch": 37.84, + "learning_rate": 0.0003112399218177376, + "loss": 0.3262, + "step": 155075 + }, + { + "epoch": 37.85, + "learning_rate": 0.0003112093818714879, + "loss": 0.3842, + "step": 155100 + }, + { + "epoch": 37.85, + "learning_rate": 0.0003111800635230882, + "loss": 0.3746, + "step": 155125 + }, + { + "epoch": 37.86, + "learning_rate": 0.0003111495235768385, + "loss": 0.37, + "step": 155150 + }, + { + "epoch": 37.87, + "learning_rate": 0.0003111189836305888, + "loss": 0.3215, + "step": 155175 + }, + { + "epoch": 37.87, + "learning_rate": 0.00031108844368433916, + "loss": 0.3761, + "step": 155200 + }, + { + "epoch": 37.88, + "learning_rate": 0.00031105790373808946, + "loss": 0.3683, + "step": 155225 + }, + { + "epoch": 37.88, + "learning_rate": 0.0003110273637918397, + "loss": 0.3582, + "step": 155250 + }, + { + "epoch": 37.89, + "learning_rate": 0.00031099682384559, + "loss": 0.3242, + "step": 155275 + }, + { + "epoch": 37.9, + "learning_rate": 0.0003109662838993403, + "loss": 0.3859, + "step": 155300 + }, + { + "epoch": 37.9, + "learning_rate": 0.0003109357439530907, + "loss": 0.3175, + "step": 155325 + }, + { + "epoch": 37.91, + "learning_rate": 0.000310905204006841, + "loss": 0.3666, + "step": 155350 + }, + { + "epoch": 37.91, + "learning_rate": 0.0003108746640605913, + "loss": 0.3116, + "step": 155375 + }, + { + "epoch": 37.92, + "learning_rate": 0.00031084412411434153, + "loss": 0.3966, + "step": 155400 + }, + { + "epoch": 37.93, + "learning_rate": 0.00031081358416809184, + "loss": 0.3215, + "step": 155425 + }, + { + "epoch": 37.93, + "learning_rate": 0.0003107830442218422, + "loss": 0.3751, + "step": 155450 + }, + { + "epoch": 37.94, + "learning_rate": 0.0003107525042755925, + "loss": 0.3868, + "step": 155475 + }, + { + "epoch": 37.95, + "learning_rate": 0.0003107219643293428, + "loss": 0.3995, + "step": 155500 + }, + { + "epoch": 37.95, + "learning_rate": 0.0003106914243830931, + "loss": 0.3341, + "step": 155525 + }, + { + "epoch": 37.96, + "learning_rate": 0.00031066088443684335, + "loss": 0.3976, + "step": 155550 + }, + { + "epoch": 37.96, + "learning_rate": 0.0003106303444905937, + "loss": 0.3575, + "step": 155575 + }, + { + "epoch": 37.97, + "learning_rate": 0.000310599804544344, + "loss": 0.3953, + "step": 155600 + }, + { + "epoch": 37.98, + "learning_rate": 0.0003105692645980943, + "loss": 0.3328, + "step": 155625 + }, + { + "epoch": 37.98, + "learning_rate": 0.0003105387246518446, + "loss": 0.383, + "step": 155650 + }, + { + "epoch": 37.99, + "learning_rate": 0.0003105081847055949, + "loss": 0.3547, + "step": 155675 + }, + { + "epoch": 37.99, + "learning_rate": 0.0003104776447593453, + "loss": 0.3654, + "step": 155700 + }, + { + "epoch": 38.0, + "learning_rate": 0.00031044710481309553, + "loss": 0.3441, + "step": 155725 + }, + { + "epoch": 38.01, + "learning_rate": 0.00031041656486684583, + "loss": 0.3477, + "step": 155750 + }, + { + "epoch": 38.01, + "learning_rate": 0.00031038602492059614, + "loss": 0.339, + "step": 155775 + }, + { + "epoch": 38.02, + "learning_rate": 0.00031035548497434644, + "loss": 0.4182, + "step": 155800 + }, + { + "epoch": 38.02, + "learning_rate": 0.0003103249450280968, + "loss": 0.3457, + "step": 155825 + }, + { + "epoch": 38.03, + "learning_rate": 0.0003102944050818471, + "loss": 0.3448, + "step": 155850 + }, + { + "epoch": 38.04, + "learning_rate": 0.00031026386513559735, + "loss": 0.3479, + "step": 155875 + }, + { + "epoch": 38.04, + "learning_rate": 0.00031023332518934765, + "loss": 0.3582, + "step": 155900 + }, + { + "epoch": 38.05, + "learning_rate": 0.00031020278524309796, + "loss": 0.338, + "step": 155925 + }, + { + "epoch": 38.06, + "learning_rate": 0.00031017224529684826, + "loss": 0.3746, + "step": 155950 + }, + { + "epoch": 38.06, + "learning_rate": 0.0003101417053505986, + "loss": 0.2483, + "step": 155975 + }, + { + "epoch": 38.07, + "learning_rate": 0.0003101111654043489, + "loss": 0.381, + "step": 156000 + }, + { + "epoch": 38.07, + "eval_cer": 0.09138835559479687, + "eval_loss": 0.4063064157962799, + "eval_runtime": 149.0731, + "eval_samples_per_second": 28.127, + "eval_steps_per_second": 7.037, + "eval_wer": 0.373768352365416, + "step": 156000 + }, + { + "epoch": 38.07, + "learning_rate": 0.00031008062545809917, + "loss": 0.3356, + "step": 156025 + }, + { + "epoch": 38.08, + "learning_rate": 0.0003100500855118495, + "loss": 0.3456, + "step": 156050 + }, + { + "epoch": 38.09, + "learning_rate": 0.0003100195455655998, + "loss": 0.3717, + "step": 156075 + }, + { + "epoch": 38.09, + "learning_rate": 0.00030998900561935014, + "loss": 0.3781, + "step": 156100 + }, + { + "epoch": 38.1, + "learning_rate": 0.00030995846567310044, + "loss": 0.2897, + "step": 156125 + }, + { + "epoch": 38.1, + "learning_rate": 0.00030992792572685074, + "loss": 0.3618, + "step": 156150 + }, + { + "epoch": 38.11, + "learning_rate": 0.00030989738578060105, + "loss": 0.3098, + "step": 156175 + }, + { + "epoch": 38.12, + "learning_rate": 0.0003098668458343513, + "loss": 0.3536, + "step": 156200 + }, + { + "epoch": 38.12, + "learning_rate": 0.00030983630588810165, + "loss": 0.3248, + "step": 156225 + }, + { + "epoch": 38.13, + "learning_rate": 0.00030980576594185196, + "loss": 0.3859, + "step": 156250 + }, + { + "epoch": 38.13, + "learning_rate": 0.00030977522599560226, + "loss": 0.3119, + "step": 156275 + }, + { + "epoch": 38.14, + "learning_rate": 0.00030974468604935256, + "loss": 0.3489, + "step": 156300 + }, + { + "epoch": 38.15, + "learning_rate": 0.00030971414610310287, + "loss": 0.3205, + "step": 156325 + }, + { + "epoch": 38.15, + "learning_rate": 0.00030968360615685317, + "loss": 0.3643, + "step": 156350 + }, + { + "epoch": 38.16, + "learning_rate": 0.00030965306621060347, + "loss": 0.3497, + "step": 156375 + }, + { + "epoch": 38.16, + "learning_rate": 0.0003096225262643538, + "loss": 0.3789, + "step": 156400 + }, + { + "epoch": 38.17, + "learning_rate": 0.0003095919863181041, + "loss": 0.3531, + "step": 156425 + }, + { + "epoch": 38.18, + "learning_rate": 0.0003095614463718544, + "loss": 0.3614, + "step": 156450 + }, + { + "epoch": 38.18, + "learning_rate": 0.00030953090642560474, + "loss": 0.3456, + "step": 156475 + }, + { + "epoch": 38.19, + "learning_rate": 0.000309500366479355, + "loss": 0.3613, + "step": 156500 + }, + { + "epoch": 38.2, + "learning_rate": 0.0003094698265331053, + "loss": 0.2974, + "step": 156525 + }, + { + "epoch": 38.2, + "learning_rate": 0.0003094392865868556, + "loss": 0.3759, + "step": 156550 + }, + { + "epoch": 38.21, + "learning_rate": 0.0003094087466406059, + "loss": 0.3586, + "step": 156575 + }, + { + "epoch": 38.21, + "learning_rate": 0.00030937820669435626, + "loss": 0.3498, + "step": 156600 + }, + { + "epoch": 38.22, + "learning_rate": 0.00030934766674810656, + "loss": 0.3484, + "step": 156625 + }, + { + "epoch": 38.23, + "learning_rate": 0.0003093171268018568, + "loss": 0.3656, + "step": 156650 + }, + { + "epoch": 38.23, + "learning_rate": 0.0003092865868556071, + "loss": 0.3113, + "step": 156675 + }, + { + "epoch": 38.24, + "learning_rate": 0.0003092560469093574, + "loss": 0.3757, + "step": 156700 + }, + { + "epoch": 38.24, + "learning_rate": 0.0003092255069631078, + "loss": 0.3385, + "step": 156725 + }, + { + "epoch": 38.25, + "learning_rate": 0.0003091949670168581, + "loss": 0.3611, + "step": 156750 + }, + { + "epoch": 38.26, + "learning_rate": 0.0003091644270706084, + "loss": 0.3193, + "step": 156775 + }, + { + "epoch": 38.26, + "learning_rate": 0.0003091338871243587, + "loss": 0.3628, + "step": 156800 + }, + { + "epoch": 38.27, + "learning_rate": 0.00030910334717810893, + "loss": 0.3189, + "step": 156825 + }, + { + "epoch": 38.27, + "learning_rate": 0.0003090728072318593, + "loss": 0.3541, + "step": 156850 + }, + { + "epoch": 38.28, + "learning_rate": 0.0003090422672856096, + "loss": 0.2861, + "step": 156875 + }, + { + "epoch": 38.29, + "learning_rate": 0.0003090117273393599, + "loss": 0.366, + "step": 156900 + }, + { + "epoch": 38.29, + "learning_rate": 0.0003089811873931102, + "loss": 0.3202, + "step": 156925 + }, + { + "epoch": 38.3, + "learning_rate": 0.0003089506474468605, + "loss": 0.3439, + "step": 156950 + }, + { + "epoch": 38.31, + "learning_rate": 0.0003089201075006108, + "loss": 0.3096, + "step": 156975 + }, + { + "epoch": 38.31, + "learning_rate": 0.0003088895675543611, + "loss": 0.3748, + "step": 157000 + }, + { + "epoch": 38.32, + "learning_rate": 0.0003088590276081114, + "loss": 0.3443, + "step": 157025 + }, + { + "epoch": 38.32, + "learning_rate": 0.0003088284876618617, + "loss": 0.3491, + "step": 157050 + }, + { + "epoch": 38.33, + "learning_rate": 0.000308797947715612, + "loss": 0.3376, + "step": 157075 + }, + { + "epoch": 38.34, + "learning_rate": 0.0003087674077693624, + "loss": 0.3932, + "step": 157100 + }, + { + "epoch": 38.34, + "learning_rate": 0.0003087368678231126, + "loss": 0.3509, + "step": 157125 + }, + { + "epoch": 38.35, + "learning_rate": 0.00030870754947471293, + "loss": 0.37, + "step": 157150 + }, + { + "epoch": 38.35, + "learning_rate": 0.00030867700952846324, + "loss": 0.3191, + "step": 157175 + }, + { + "epoch": 38.36, + "learning_rate": 0.00030864646958221354, + "loss": 0.3615, + "step": 157200 + }, + { + "epoch": 38.37, + "learning_rate": 0.00030861592963596384, + "loss": 0.3703, + "step": 157225 + }, + { + "epoch": 38.37, + "learning_rate": 0.00030858538968971415, + "loss": 0.3829, + "step": 157250 + }, + { + "epoch": 38.38, + "learning_rate": 0.0003085548497434645, + "loss": 0.3682, + "step": 157275 + }, + { + "epoch": 38.38, + "learning_rate": 0.00030852430979721475, + "loss": 0.3631, + "step": 157300 + }, + { + "epoch": 38.39, + "learning_rate": 0.00030849376985096506, + "loss": 0.3219, + "step": 157325 + }, + { + "epoch": 38.4, + "learning_rate": 0.00030846322990471536, + "loss": 0.3675, + "step": 157350 + }, + { + "epoch": 38.4, + "learning_rate": 0.00030843268995846566, + "loss": 0.3204, + "step": 157375 + }, + { + "epoch": 38.41, + "learning_rate": 0.000308402150012216, + "loss": 0.3539, + "step": 157400 + }, + { + "epoch": 38.42, + "learning_rate": 0.0003083716100659663, + "loss": 0.3556, + "step": 157425 + }, + { + "epoch": 38.42, + "learning_rate": 0.0003083410701197166, + "loss": 0.3787, + "step": 157450 + }, + { + "epoch": 38.43, + "learning_rate": 0.0003083105301734669, + "loss": 0.3152, + "step": 157475 + }, + { + "epoch": 38.43, + "learning_rate": 0.0003082799902272172, + "loss": 0.3738, + "step": 157500 + }, + { + "epoch": 38.44, + "learning_rate": 0.00030824945028096754, + "loss": 0.3171, + "step": 157525 + }, + { + "epoch": 38.45, + "learning_rate": 0.00030821891033471784, + "loss": 0.3718, + "step": 157550 + }, + { + "epoch": 38.45, + "learning_rate": 0.00030818837038846814, + "loss": 0.3166, + "step": 157575 + }, + { + "epoch": 38.46, + "learning_rate": 0.0003081578304422184, + "loss": 0.385, + "step": 157600 + }, + { + "epoch": 38.46, + "learning_rate": 0.0003081272904959687, + "loss": 0.3285, + "step": 157625 + }, + { + "epoch": 38.47, + "learning_rate": 0.00030809675054971905, + "loss": 0.3749, + "step": 157650 + }, + { + "epoch": 38.48, + "learning_rate": 0.00030806621060346936, + "loss": 0.3479, + "step": 157675 + }, + { + "epoch": 38.48, + "learning_rate": 0.00030803567065721966, + "loss": 0.3662, + "step": 157700 + }, + { + "epoch": 38.49, + "learning_rate": 0.00030800513071096996, + "loss": 0.2701, + "step": 157725 + }, + { + "epoch": 38.49, + "learning_rate": 0.00030797459076472027, + "loss": 0.3413, + "step": 157750 + }, + { + "epoch": 38.5, + "learning_rate": 0.00030794405081847057, + "loss": 0.3228, + "step": 157775 + }, + { + "epoch": 38.51, + "learning_rate": 0.0003079135108722209, + "loss": 0.3578, + "step": 157800 + }, + { + "epoch": 38.51, + "learning_rate": 0.0003078829709259712, + "loss": 0.3163, + "step": 157825 + }, + { + "epoch": 38.52, + "learning_rate": 0.0003078524309797215, + "loss": 0.4182, + "step": 157850 + }, + { + "epoch": 38.52, + "learning_rate": 0.0003078218910334718, + "loss": 0.3249, + "step": 157875 + }, + { + "epoch": 38.53, + "learning_rate": 0.00030779135108722214, + "loss": 0.3338, + "step": 157900 + }, + { + "epoch": 38.54, + "learning_rate": 0.0003077608111409724, + "loss": 0.3573, + "step": 157925 + }, + { + "epoch": 38.54, + "learning_rate": 0.0003077302711947227, + "loss": 0.3489, + "step": 157950 + }, + { + "epoch": 38.55, + "learning_rate": 0.000307699731248473, + "loss": 0.3266, + "step": 157975 + }, + { + "epoch": 38.56, + "learning_rate": 0.0003076691913022233, + "loss": 0.3913, + "step": 158000 + }, + { + "epoch": 38.56, + "learning_rate": 0.0003076386513559736, + "loss": 0.3552, + "step": 158025 + }, + { + "epoch": 38.57, + "learning_rate": 0.00030760811140972396, + "loss": 0.3592, + "step": 158050 + }, + { + "epoch": 38.57, + "learning_rate": 0.0003075775714634742, + "loss": 0.3313, + "step": 158075 + }, + { + "epoch": 38.58, + "learning_rate": 0.0003075470315172245, + "loss": 0.3816, + "step": 158100 + }, + { + "epoch": 38.59, + "learning_rate": 0.0003075164915709748, + "loss": 0.2628, + "step": 158125 + }, + { + "epoch": 38.59, + "learning_rate": 0.0003074859516247251, + "loss": 0.3693, + "step": 158150 + }, + { + "epoch": 38.6, + "learning_rate": 0.0003074554116784755, + "loss": 0.3403, + "step": 158175 + }, + { + "epoch": 38.6, + "learning_rate": 0.0003074248717322258, + "loss": 0.3769, + "step": 158200 + }, + { + "epoch": 38.61, + "learning_rate": 0.0003073943317859761, + "loss": 0.3627, + "step": 158225 + }, + { + "epoch": 38.62, + "learning_rate": 0.00030736379183972633, + "loss": 0.3698, + "step": 158250 + }, + { + "epoch": 38.62, + "learning_rate": 0.00030733325189347664, + "loss": 0.3424, + "step": 158275 + }, + { + "epoch": 38.63, + "learning_rate": 0.000307302711947227, + "loss": 0.3883, + "step": 158300 + }, + { + "epoch": 38.63, + "learning_rate": 0.0003072721720009773, + "loss": 0.3199, + "step": 158325 + }, + { + "epoch": 38.64, + "learning_rate": 0.0003072416320547276, + "loss": 0.3781, + "step": 158350 + }, + { + "epoch": 38.65, + "learning_rate": 0.0003072110921084779, + "loss": 0.3001, + "step": 158375 + }, + { + "epoch": 38.65, + "learning_rate": 0.00030718055216222815, + "loss": 0.3562, + "step": 158400 + }, + { + "epoch": 38.66, + "learning_rate": 0.0003071500122159785, + "loss": 0.317, + "step": 158425 + }, + { + "epoch": 38.67, + "learning_rate": 0.0003071194722697288, + "loss": 0.3913, + "step": 158450 + }, + { + "epoch": 38.67, + "learning_rate": 0.0003070889323234791, + "loss": 0.3584, + "step": 158475 + }, + { + "epoch": 38.68, + "learning_rate": 0.0003070583923772294, + "loss": 0.3619, + "step": 158500 + }, + { + "epoch": 38.68, + "learning_rate": 0.0003070278524309797, + "loss": 0.347, + "step": 158525 + }, + { + "epoch": 38.69, + "learning_rate": 0.00030699731248473003, + "loss": 0.3808, + "step": 158550 + }, + { + "epoch": 38.7, + "learning_rate": 0.00030696677253848033, + "loss": 0.3607, + "step": 158575 + }, + { + "epoch": 38.7, + "learning_rate": 0.00030693623259223064, + "loss": 0.3674, + "step": 158600 + }, + { + "epoch": 38.71, + "learning_rate": 0.00030690569264598094, + "loss": 0.3131, + "step": 158625 + }, + { + "epoch": 38.71, + "learning_rate": 0.00030687515269973124, + "loss": 0.3722, + "step": 158650 + }, + { + "epoch": 38.72, + "learning_rate": 0.0003068446127534816, + "loss": 0.346, + "step": 158675 + }, + { + "epoch": 38.73, + "learning_rate": 0.0003068140728072319, + "loss": 0.3828, + "step": 158700 + }, + { + "epoch": 38.73, + "learning_rate": 0.00030678353286098215, + "loss": 0.3791, + "step": 158725 + }, + { + "epoch": 38.74, + "learning_rate": 0.00030675299291473246, + "loss": 0.3738, + "step": 158750 + }, + { + "epoch": 38.74, + "learning_rate": 0.00030672245296848276, + "loss": 0.3576, + "step": 158775 + }, + { + "epoch": 38.75, + "learning_rate": 0.0003066919130222331, + "loss": 0.3791, + "step": 158800 + }, + { + "epoch": 38.76, + "learning_rate": 0.0003066613730759834, + "loss": 0.2818, + "step": 158825 + }, + { + "epoch": 38.76, + "learning_rate": 0.0003066308331297337, + "loss": 0.3524, + "step": 158850 + }, + { + "epoch": 38.77, + "learning_rate": 0.00030660029318348397, + "loss": 0.3395, + "step": 158875 + }, + { + "epoch": 38.78, + "learning_rate": 0.0003065697532372343, + "loss": 0.3586, + "step": 158900 + }, + { + "epoch": 38.78, + "learning_rate": 0.00030653921329098463, + "loss": 0.3633, + "step": 158925 + }, + { + "epoch": 38.79, + "learning_rate": 0.00030650867334473494, + "loss": 0.3851, + "step": 158950 + }, + { + "epoch": 38.79, + "learning_rate": 0.00030647813339848524, + "loss": 0.3311, + "step": 158975 + }, + { + "epoch": 38.8, + "learning_rate": 0.00030644759345223554, + "loss": 0.3891, + "step": 159000 + }, + { + "epoch": 38.8, + "eval_cer": 0.09004342782049835, + "eval_loss": 0.4059583842754364, + "eval_runtime": 152.7166, + "eval_samples_per_second": 27.456, + "eval_steps_per_second": 6.869, + "eval_wer": 0.3733768352365416, + "step": 159000 + }, + { + "epoch": 38.81, + "learning_rate": 0.0003064170535059858, + "loss": 0.3558, + "step": 159025 + }, + { + "epoch": 38.81, + "learning_rate": 0.00030638651355973615, + "loss": 0.3752, + "step": 159050 + }, + { + "epoch": 38.82, + "learning_rate": 0.00030635597361348645, + "loss": 0.2948, + "step": 159075 + }, + { + "epoch": 38.82, + "learning_rate": 0.00030632543366723676, + "loss": 0.3565, + "step": 159100 + }, + { + "epoch": 38.83, + "learning_rate": 0.00030629489372098706, + "loss": 0.3322, + "step": 159125 + }, + { + "epoch": 38.84, + "learning_rate": 0.00030626435377473736, + "loss": 0.3378, + "step": 159150 + }, + { + "epoch": 38.84, + "learning_rate": 0.0003062338138284877, + "loss": 0.3024, + "step": 159175 + }, + { + "epoch": 38.85, + "learning_rate": 0.00030620327388223797, + "loss": 0.3415, + "step": 159200 + }, + { + "epoch": 38.85, + "learning_rate": 0.0003061727339359883, + "loss": 0.303, + "step": 159225 + }, + { + "epoch": 38.86, + "learning_rate": 0.0003061421939897386, + "loss": 0.3643, + "step": 159250 + }, + { + "epoch": 38.87, + "learning_rate": 0.0003061128756413389, + "loss": 0.3538, + "step": 159275 + }, + { + "epoch": 38.87, + "learning_rate": 0.0003060823356950892, + "loss": 0.3531, + "step": 159300 + }, + { + "epoch": 38.88, + "learning_rate": 0.0003060517957488395, + "loss": 0.2936, + "step": 159325 + }, + { + "epoch": 38.88, + "learning_rate": 0.0003060212558025898, + "loss": 0.3812, + "step": 159350 + }, + { + "epoch": 38.89, + "learning_rate": 0.0003059907158563401, + "loss": 0.2826, + "step": 159375 + }, + { + "epoch": 38.9, + "learning_rate": 0.0003059601759100904, + "loss": 0.3285, + "step": 159400 + }, + { + "epoch": 38.9, + "learning_rate": 0.0003059296359638407, + "loss": 0.3135, + "step": 159425 + }, + { + "epoch": 38.91, + "learning_rate": 0.000305899096017591, + "loss": 0.3443, + "step": 159450 + }, + { + "epoch": 38.92, + "learning_rate": 0.00030586855607134136, + "loss": 0.3174, + "step": 159475 + }, + { + "epoch": 38.92, + "learning_rate": 0.0003058380161250916, + "loss": 0.3853, + "step": 159500 + }, + { + "epoch": 38.93, + "learning_rate": 0.0003058074761788419, + "loss": 0.3711, + "step": 159525 + }, + { + "epoch": 38.93, + "learning_rate": 0.0003057769362325922, + "loss": 0.3791, + "step": 159550 + }, + { + "epoch": 38.94, + "learning_rate": 0.0003057463962863425, + "loss": 0.3156, + "step": 159575 + }, + { + "epoch": 38.95, + "learning_rate": 0.0003057158563400929, + "loss": 0.355, + "step": 159600 + }, + { + "epoch": 38.95, + "learning_rate": 0.0003056853163938432, + "loss": 0.3496, + "step": 159625 + }, + { + "epoch": 38.96, + "learning_rate": 0.0003056547764475935, + "loss": 0.3647, + "step": 159650 + }, + { + "epoch": 38.96, + "learning_rate": 0.00030562423650134374, + "loss": 0.3236, + "step": 159675 + }, + { + "epoch": 38.97, + "learning_rate": 0.00030559369655509404, + "loss": 0.3881, + "step": 159700 + }, + { + "epoch": 38.98, + "learning_rate": 0.0003055631566088444, + "loss": 0.3831, + "step": 159725 + }, + { + "epoch": 38.98, + "learning_rate": 0.0003055326166625947, + "loss": 0.3445, + "step": 159750 + }, + { + "epoch": 38.99, + "learning_rate": 0.000305502076716345, + "loss": 0.346, + "step": 159775 + }, + { + "epoch": 38.99, + "learning_rate": 0.0003054715367700953, + "loss": 0.358, + "step": 159800 + }, + { + "epoch": 39.0, + "learning_rate": 0.00030544099682384556, + "loss": 0.3103, + "step": 159825 + }, + { + "epoch": 39.01, + "learning_rate": 0.0003054104568775959, + "loss": 0.3739, + "step": 159850 + }, + { + "epoch": 39.01, + "learning_rate": 0.0003053799169313462, + "loss": 0.2863, + "step": 159875 + }, + { + "epoch": 39.02, + "learning_rate": 0.0003053493769850965, + "loss": 0.3753, + "step": 159900 + }, + { + "epoch": 39.03, + "learning_rate": 0.0003053188370388468, + "loss": 0.3675, + "step": 159925 + }, + { + "epoch": 39.03, + "learning_rate": 0.00030528829709259713, + "loss": 0.3794, + "step": 159950 + }, + { + "epoch": 39.04, + "learning_rate": 0.0003052577571463474, + "loss": 0.358, + "step": 159975 + }, + { + "epoch": 39.04, + "learning_rate": 0.00030522721720009773, + "loss": 0.3563, + "step": 160000 + }, + { + "epoch": 39.05, + "learning_rate": 0.00030519667725384804, + "loss": 0.3202, + "step": 160025 + }, + { + "epoch": 39.06, + "learning_rate": 0.00030516613730759834, + "loss": 0.3827, + "step": 160050 + }, + { + "epoch": 39.06, + "learning_rate": 0.00030513559736134864, + "loss": 0.2992, + "step": 160075 + }, + { + "epoch": 39.07, + "learning_rate": 0.00030510505741509895, + "loss": 0.3799, + "step": 160100 + }, + { + "epoch": 39.07, + "learning_rate": 0.0003050745174688493, + "loss": 0.3517, + "step": 160125 + }, + { + "epoch": 39.08, + "learning_rate": 0.00030504397752259955, + "loss": 0.3921, + "step": 160150 + }, + { + "epoch": 39.09, + "learning_rate": 0.00030501343757634986, + "loss": 0.3031, + "step": 160175 + }, + { + "epoch": 39.09, + "learning_rate": 0.00030498289763010016, + "loss": 0.3653, + "step": 160200 + }, + { + "epoch": 39.1, + "learning_rate": 0.00030495235768385046, + "loss": 0.379, + "step": 160225 + }, + { + "epoch": 39.1, + "learning_rate": 0.0003049218177376008, + "loss": 0.3623, + "step": 160250 + }, + { + "epoch": 39.11, + "learning_rate": 0.0003048912777913511, + "loss": 0.337, + "step": 160275 + }, + { + "epoch": 39.12, + "learning_rate": 0.0003048607378451014, + "loss": 0.345, + "step": 160300 + }, + { + "epoch": 39.12, + "learning_rate": 0.0003048301978988517, + "loss": 0.3205, + "step": 160325 + }, + { + "epoch": 39.13, + "learning_rate": 0.000304799657952602, + "loss": 0.3479, + "step": 160350 + }, + { + "epoch": 39.13, + "learning_rate": 0.00030476911800635234, + "loss": 0.3246, + "step": 160375 + }, + { + "epoch": 39.14, + "learning_rate": 0.00030473857806010264, + "loss": 0.3478, + "step": 160400 + }, + { + "epoch": 39.15, + "learning_rate": 0.00030470803811385295, + "loss": 0.295, + "step": 160425 + }, + { + "epoch": 39.15, + "learning_rate": 0.0003046774981676032, + "loss": 0.3245, + "step": 160450 + }, + { + "epoch": 39.16, + "learning_rate": 0.0003046469582213535, + "loss": 0.3547, + "step": 160475 + }, + { + "epoch": 39.17, + "learning_rate": 0.00030461641827510386, + "loss": 0.3722, + "step": 160500 + }, + { + "epoch": 39.17, + "learning_rate": 0.00030458587832885416, + "loss": 0.3288, + "step": 160525 + }, + { + "epoch": 39.18, + "learning_rate": 0.00030455533838260446, + "loss": 0.4058, + "step": 160550 + }, + { + "epoch": 39.18, + "learning_rate": 0.00030452479843635477, + "loss": 0.2893, + "step": 160575 + }, + { + "epoch": 39.19, + "learning_rate": 0.000304494258490105, + "loss": 0.3485, + "step": 160600 + }, + { + "epoch": 39.2, + "learning_rate": 0.00030446371854385537, + "loss": 0.3285, + "step": 160625 + }, + { + "epoch": 39.2, + "learning_rate": 0.0003044331785976057, + "loss": 0.3315, + "step": 160650 + }, + { + "epoch": 39.21, + "learning_rate": 0.000304402638651356, + "loss": 0.32, + "step": 160675 + }, + { + "epoch": 39.21, + "learning_rate": 0.0003043720987051063, + "loss": 0.3428, + "step": 160700 + }, + { + "epoch": 39.22, + "learning_rate": 0.0003043415587588566, + "loss": 0.297, + "step": 160725 + }, + { + "epoch": 39.23, + "learning_rate": 0.00030431101881260694, + "loss": 0.3625, + "step": 160750 + }, + { + "epoch": 39.23, + "learning_rate": 0.0003042804788663572, + "loss": 0.3106, + "step": 160775 + }, + { + "epoch": 39.24, + "learning_rate": 0.0003042499389201075, + "loss": 0.3413, + "step": 160800 + }, + { + "epoch": 39.24, + "learning_rate": 0.0003042193989738578, + "loss": 0.2959, + "step": 160825 + }, + { + "epoch": 39.25, + "learning_rate": 0.0003041888590276081, + "loss": 0.3455, + "step": 160850 + }, + { + "epoch": 39.26, + "learning_rate": 0.00030415831908135846, + "loss": 0.3409, + "step": 160875 + }, + { + "epoch": 39.26, + "learning_rate": 0.00030412777913510876, + "loss": 0.3663, + "step": 160900 + }, + { + "epoch": 39.27, + "learning_rate": 0.000304097239188859, + "loss": 0.3359, + "step": 160925 + }, + { + "epoch": 39.28, + "learning_rate": 0.0003040666992426093, + "loss": 0.375, + "step": 160950 + }, + { + "epoch": 39.28, + "learning_rate": 0.0003040361592963596, + "loss": 0.3297, + "step": 160975 + }, + { + "epoch": 39.29, + "learning_rate": 0.00030400561935011, + "loss": 0.3621, + "step": 161000 + }, + { + "epoch": 39.29, + "learning_rate": 0.0003039750794038603, + "loss": 0.3113, + "step": 161025 + }, + { + "epoch": 39.3, + "learning_rate": 0.0003039445394576106, + "loss": 0.3815, + "step": 161050 + }, + { + "epoch": 39.31, + "learning_rate": 0.00030391399951136083, + "loss": 0.2934, + "step": 161075 + }, + { + "epoch": 39.31, + "learning_rate": 0.00030388345956511114, + "loss": 0.3274, + "step": 161100 + }, + { + "epoch": 39.32, + "learning_rate": 0.0003038529196188615, + "loss": 0.3138, + "step": 161125 + }, + { + "epoch": 39.32, + "learning_rate": 0.0003038223796726118, + "loss": 0.3716, + "step": 161150 + }, + { + "epoch": 39.33, + "learning_rate": 0.0003037918397263621, + "loss": 0.3124, + "step": 161175 + }, + { + "epoch": 39.34, + "learning_rate": 0.0003037612997801124, + "loss": 0.3633, + "step": 161200 + }, + { + "epoch": 39.34, + "learning_rate": 0.0003037307598338627, + "loss": 0.327, + "step": 161225 + }, + { + "epoch": 39.35, + "learning_rate": 0.000303700219887613, + "loss": 0.3636, + "step": 161250 + }, + { + "epoch": 39.35, + "learning_rate": 0.0003036696799413633, + "loss": 0.3756, + "step": 161275 + }, + { + "epoch": 39.36, + "learning_rate": 0.0003036391399951136, + "loss": 0.3734, + "step": 161300 + }, + { + "epoch": 39.37, + "learning_rate": 0.0003036086000488639, + "loss": 0.3191, + "step": 161325 + }, + { + "epoch": 39.37, + "learning_rate": 0.0003035780601026142, + "loss": 0.3649, + "step": 161350 + }, + { + "epoch": 39.38, + "learning_rate": 0.0003035475201563646, + "loss": 0.3288, + "step": 161375 + }, + { + "epoch": 39.39, + "learning_rate": 0.00030351698021011483, + "loss": 0.3663, + "step": 161400 + }, + { + "epoch": 39.39, + "learning_rate": 0.00030348644026386513, + "loss": 0.3615, + "step": 161425 + }, + { + "epoch": 39.4, + "learning_rate": 0.00030345590031761544, + "loss": 0.3597, + "step": 161450 + }, + { + "epoch": 39.4, + "learning_rate": 0.00030342536037136574, + "loss": 0.3365, + "step": 161475 + }, + { + "epoch": 39.41, + "learning_rate": 0.00030339482042511604, + "loss": 0.3327, + "step": 161500 + }, + { + "epoch": 39.42, + "learning_rate": 0.0003033642804788664, + "loss": 0.3703, + "step": 161525 + }, + { + "epoch": 39.42, + "learning_rate": 0.00030333374053261665, + "loss": 0.3808, + "step": 161550 + }, + { + "epoch": 39.43, + "learning_rate": 0.00030330320058636695, + "loss": 0.3423, + "step": 161575 + }, + { + "epoch": 39.43, + "learning_rate": 0.00030327266064011726, + "loss": 0.3588, + "step": 161600 + }, + { + "epoch": 39.44, + "learning_rate": 0.00030324212069386756, + "loss": 0.3462, + "step": 161625 + }, + { + "epoch": 39.45, + "learning_rate": 0.0003032115807476179, + "loss": 0.3527, + "step": 161650 + }, + { + "epoch": 39.45, + "learning_rate": 0.0003031810408013682, + "loss": 0.341, + "step": 161675 + }, + { + "epoch": 39.46, + "learning_rate": 0.0003031505008551185, + "loss": 0.3785, + "step": 161700 + }, + { + "epoch": 39.46, + "learning_rate": 0.0003031199609088688, + "loss": 0.2958, + "step": 161725 + }, + { + "epoch": 39.47, + "learning_rate": 0.0003030894209626191, + "loss": 0.402, + "step": 161750 + }, + { + "epoch": 39.48, + "learning_rate": 0.00030305888101636943, + "loss": 0.3029, + "step": 161775 + }, + { + "epoch": 39.48, + "learning_rate": 0.00030302834107011974, + "loss": 0.373, + "step": 161800 + }, + { + "epoch": 39.49, + "learning_rate": 0.00030299780112387004, + "loss": 0.3279, + "step": 161825 + }, + { + "epoch": 39.49, + "learning_rate": 0.00030296726117762034, + "loss": 0.3434, + "step": 161850 + }, + { + "epoch": 39.5, + "learning_rate": 0.0003029367212313706, + "loss": 0.3362, + "step": 161875 + }, + { + "epoch": 39.51, + "learning_rate": 0.00030290618128512095, + "loss": 0.3598, + "step": 161900 + }, + { + "epoch": 39.51, + "learning_rate": 0.00030287686293672126, + "loss": 0.3523, + "step": 161925 + }, + { + "epoch": 39.52, + "learning_rate": 0.00030284632299047156, + "loss": 0.354, + "step": 161950 + }, + { + "epoch": 39.53, + "learning_rate": 0.00030281578304422186, + "loss": 0.3426, + "step": 161975 + }, + { + "epoch": 39.53, + "learning_rate": 0.00030278524309797217, + "loss": 0.3668, + "step": 162000 + }, + { + "epoch": 39.53, + "eval_cer": 0.08933503074853957, + "eval_loss": 0.4087386727333069, + "eval_runtime": 152.8656, + "eval_samples_per_second": 27.429, + "eval_steps_per_second": 6.862, + "eval_wer": 0.3700815660685155, + "step": 162000 + }, + { + "epoch": 39.54, + "learning_rate": 0.0003027547031517224, + "loss": 0.3361, + "step": 162025 + }, + { + "epoch": 39.54, + "learning_rate": 0.0003027241632054727, + "loss": 0.3544, + "step": 162050 + }, + { + "epoch": 39.55, + "learning_rate": 0.0003026936232592231, + "loss": 0.3459, + "step": 162075 + }, + { + "epoch": 39.56, + "learning_rate": 0.0003026630833129734, + "loss": 0.3486, + "step": 162100 + }, + { + "epoch": 39.56, + "learning_rate": 0.0003026325433667237, + "loss": 0.3441, + "step": 162125 + }, + { + "epoch": 39.57, + "learning_rate": 0.000302602003420474, + "loss": 0.3544, + "step": 162150 + }, + { + "epoch": 39.57, + "learning_rate": 0.0003025714634742243, + "loss": 0.3274, + "step": 162175 + }, + { + "epoch": 39.58, + "learning_rate": 0.0003025409235279746, + "loss": 0.3809, + "step": 162200 + }, + { + "epoch": 39.59, + "learning_rate": 0.0003025103835817249, + "loss": 0.293, + "step": 162225 + }, + { + "epoch": 39.59, + "learning_rate": 0.0003024798436354752, + "loss": 0.3687, + "step": 162250 + }, + { + "epoch": 39.6, + "learning_rate": 0.0003024493036892255, + "loss": 0.2723, + "step": 162275 + }, + { + "epoch": 39.6, + "learning_rate": 0.0003024187637429758, + "loss": 0.3782, + "step": 162300 + }, + { + "epoch": 39.61, + "learning_rate": 0.00030238822379672617, + "loss": 0.3465, + "step": 162325 + }, + { + "epoch": 39.62, + "learning_rate": 0.0003023576838504764, + "loss": 0.3483, + "step": 162350 + }, + { + "epoch": 39.62, + "learning_rate": 0.0003023271439042267, + "loss": 0.314, + "step": 162375 + }, + { + "epoch": 39.63, + "learning_rate": 0.000302296603957977, + "loss": 0.376, + "step": 162400 + }, + { + "epoch": 39.64, + "learning_rate": 0.0003022660640117273, + "loss": 0.3641, + "step": 162425 + }, + { + "epoch": 39.64, + "learning_rate": 0.0003022355240654777, + "loss": 0.3611, + "step": 162450 + }, + { + "epoch": 39.65, + "learning_rate": 0.000302204984119228, + "loss": 0.2945, + "step": 162475 + }, + { + "epoch": 39.65, + "learning_rate": 0.00030217444417297823, + "loss": 0.3313, + "step": 162500 + }, + { + "epoch": 39.66, + "learning_rate": 0.00030214390422672854, + "loss": 0.3319, + "step": 162525 + }, + { + "epoch": 39.67, + "learning_rate": 0.00030211336428047884, + "loss": 0.3411, + "step": 162550 + }, + { + "epoch": 39.67, + "learning_rate": 0.0003020828243342292, + "loss": 0.2996, + "step": 162575 + }, + { + "epoch": 39.68, + "learning_rate": 0.0003020522843879795, + "loss": 0.3635, + "step": 162600 + }, + { + "epoch": 39.68, + "learning_rate": 0.0003020217444417298, + "loss": 0.3447, + "step": 162625 + }, + { + "epoch": 39.69, + "learning_rate": 0.0003019912044954801, + "loss": 0.3559, + "step": 162650 + }, + { + "epoch": 39.7, + "learning_rate": 0.00030196066454923036, + "loss": 0.3664, + "step": 162675 + }, + { + "epoch": 39.7, + "learning_rate": 0.0003019301246029807, + "loss": 0.3482, + "step": 162700 + }, + { + "epoch": 39.71, + "learning_rate": 0.000301899584656731, + "loss": 0.3171, + "step": 162725 + }, + { + "epoch": 39.71, + "learning_rate": 0.0003018690447104813, + "loss": 0.367, + "step": 162750 + }, + { + "epoch": 39.72, + "learning_rate": 0.0003018385047642316, + "loss": 0.3359, + "step": 162775 + }, + { + "epoch": 39.73, + "learning_rate": 0.00030180796481798193, + "loss": 0.3473, + "step": 162800 + }, + { + "epoch": 39.73, + "learning_rate": 0.00030177742487173223, + "loss": 0.3301, + "step": 162825 + }, + { + "epoch": 39.74, + "learning_rate": 0.00030174688492548254, + "loss": 0.3561, + "step": 162850 + }, + { + "epoch": 39.74, + "learning_rate": 0.00030171634497923284, + "loss": 0.3127, + "step": 162875 + }, + { + "epoch": 39.75, + "learning_rate": 0.00030168580503298314, + "loss": 0.3439, + "step": 162900 + }, + { + "epoch": 39.76, + "learning_rate": 0.00030165526508673345, + "loss": 0.2874, + "step": 162925 + }, + { + "epoch": 39.76, + "learning_rate": 0.0003016247251404838, + "loss": 0.3598, + "step": 162950 + }, + { + "epoch": 39.77, + "learning_rate": 0.00030159418519423405, + "loss": 0.2957, + "step": 162975 + }, + { + "epoch": 39.78, + "learning_rate": 0.00030156364524798436, + "loss": 0.3637, + "step": 163000 + }, + { + "epoch": 39.78, + "learning_rate": 0.00030153310530173466, + "loss": 0.3313, + "step": 163025 + }, + { + "epoch": 39.79, + "learning_rate": 0.00030150256535548496, + "loss": 0.3765, + "step": 163050 + }, + { + "epoch": 39.79, + "learning_rate": 0.0003014720254092353, + "loss": 0.3241, + "step": 163075 + }, + { + "epoch": 39.8, + "learning_rate": 0.0003014414854629856, + "loss": 0.351, + "step": 163100 + }, + { + "epoch": 39.81, + "learning_rate": 0.0003014109455167359, + "loss": 0.3051, + "step": 163125 + }, + { + "epoch": 39.81, + "learning_rate": 0.0003013804055704862, + "loss": 0.3359, + "step": 163150 + }, + { + "epoch": 39.82, + "learning_rate": 0.0003013498656242365, + "loss": 0.3172, + "step": 163175 + }, + { + "epoch": 39.82, + "learning_rate": 0.00030131932567798684, + "loss": 0.3753, + "step": 163200 + }, + { + "epoch": 39.83, + "learning_rate": 0.00030128878573173714, + "loss": 0.3561, + "step": 163225 + }, + { + "epoch": 39.84, + "learning_rate": 0.00030125824578548744, + "loss": 0.3807, + "step": 163250 + }, + { + "epoch": 39.84, + "learning_rate": 0.00030122770583923775, + "loss": 0.2925, + "step": 163275 + }, + { + "epoch": 39.85, + "learning_rate": 0.000301197165892988, + "loss": 0.3456, + "step": 163300 + }, + { + "epoch": 39.85, + "learning_rate": 0.0003011666259467383, + "loss": 0.3528, + "step": 163325 + }, + { + "epoch": 39.86, + "learning_rate": 0.00030113608600048866, + "loss": 0.3625, + "step": 163350 + }, + { + "epoch": 39.87, + "learning_rate": 0.00030110554605423896, + "loss": 0.3056, + "step": 163375 + }, + { + "epoch": 39.87, + "learning_rate": 0.00030107500610798926, + "loss": 0.3511, + "step": 163400 + }, + { + "epoch": 39.88, + "learning_rate": 0.00030104446616173957, + "loss": 0.3334, + "step": 163425 + }, + { + "epoch": 39.89, + "learning_rate": 0.0003010139262154898, + "loss": 0.348, + "step": 163450 + }, + { + "epoch": 39.89, + "learning_rate": 0.0003009833862692402, + "loss": 0.3457, + "step": 163475 + }, + { + "epoch": 39.9, + "learning_rate": 0.0003009528463229905, + "loss": 0.3472, + "step": 163500 + }, + { + "epoch": 39.9, + "learning_rate": 0.0003009223063767408, + "loss": 0.3753, + "step": 163525 + }, + { + "epoch": 39.91, + "learning_rate": 0.0003008917664304911, + "loss": 0.3817, + "step": 163550 + }, + { + "epoch": 39.92, + "learning_rate": 0.0003008612264842414, + "loss": 0.3385, + "step": 163575 + }, + { + "epoch": 39.92, + "learning_rate": 0.00030083068653799174, + "loss": 0.3407, + "step": 163600 + }, + { + "epoch": 39.93, + "learning_rate": 0.000300800146591742, + "loss": 0.274, + "step": 163625 + }, + { + "epoch": 39.93, + "learning_rate": 0.0003007696066454923, + "loss": 0.3358, + "step": 163650 + }, + { + "epoch": 39.94, + "learning_rate": 0.0003007390666992426, + "loss": 0.2925, + "step": 163675 + }, + { + "epoch": 39.95, + "learning_rate": 0.0003007085267529929, + "loss": 0.3619, + "step": 163700 + }, + { + "epoch": 39.95, + "learning_rate": 0.00030067798680674326, + "loss": 0.3223, + "step": 163725 + }, + { + "epoch": 39.96, + "learning_rate": 0.00030064744686049356, + "loss": 0.3764, + "step": 163750 + }, + { + "epoch": 39.96, + "learning_rate": 0.0003006169069142438, + "loss": 0.2987, + "step": 163775 + }, + { + "epoch": 39.97, + "learning_rate": 0.0003005863669679941, + "loss": 0.3724, + "step": 163800 + }, + { + "epoch": 39.98, + "learning_rate": 0.0003005558270217444, + "loss": 0.3446, + "step": 163825 + }, + { + "epoch": 39.98, + "learning_rate": 0.0003005252870754948, + "loss": 0.3664, + "step": 163850 + }, + { + "epoch": 39.99, + "learning_rate": 0.0003004947471292451, + "loss": 0.3606, + "step": 163875 + }, + { + "epoch": 40.0, + "learning_rate": 0.0003004642071829954, + "loss": 0.3275, + "step": 163900 + }, + { + "epoch": 40.0, + "learning_rate": 0.00030043366723674563, + "loss": 0.3197, + "step": 163925 + }, + { + "epoch": 40.01, + "learning_rate": 0.00030040312729049594, + "loss": 0.3236, + "step": 163950 + }, + { + "epoch": 40.01, + "learning_rate": 0.0003003725873442463, + "loss": 0.3119, + "step": 163975 + }, + { + "epoch": 40.02, + "learning_rate": 0.0003003420473979966, + "loss": 0.3327, + "step": 164000 + }, + { + "epoch": 132.6, + "learning_rate": 0.00013210073820669788, + "loss": 0.3925, + "step": 164025 + }, + { + "epoch": 132.62, + "learning_rate": 0.00013204447245228666, + "loss": 0.3782, + "step": 164050 + }, + { + "epoch": 132.64, + "learning_rate": 0.0001319882066978754, + "loss": 0.3837, + "step": 164075 + }, + { + "epoch": 132.66, + "learning_rate": 0.00013193194094346416, + "loss": 0.4232, + "step": 164100 + }, + { + "epoch": 132.68, + "learning_rate": 0.00013187567518905294, + "loss": 0.3438, + "step": 164125 + }, + { + "epoch": 132.7, + "learning_rate": 0.00013181940943464171, + "loss": 0.3733, + "step": 164150 + }, + { + "epoch": 132.72, + "learning_rate": 0.00013176314368023047, + "loss": 0.3464, + "step": 164175 + }, + { + "epoch": 132.74, + "learning_rate": 0.00013170687792581922, + "loss": 0.3868, + "step": 164200 + }, + { + "epoch": 132.76, + "learning_rate": 0.000131650612171408, + "loss": 0.3679, + "step": 164225 + }, + { + "epoch": 132.78, + "learning_rate": 0.00013159434641699677, + "loss": 0.3511, + "step": 164250 + }, + { + "epoch": 132.8, + "learning_rate": 0.00013153808066258552, + "loss": 0.3603, + "step": 164275 + }, + { + "epoch": 132.82, + "learning_rate": 0.0001314818149081743, + "loss": 0.3171, + "step": 164300 + }, + { + "epoch": 132.84, + "learning_rate": 0.00013142554915376305, + "loss": 0.3233, + "step": 164325 + }, + { + "epoch": 132.86, + "learning_rate": 0.0001313692833993518, + "loss": 0.3759, + "step": 164350 + }, + { + "epoch": 132.88, + "learning_rate": 0.00013131301764494058, + "loss": 0.3586, + "step": 164375 + }, + { + "epoch": 132.9, + "learning_rate": 0.00013125675189052936, + "loss": 0.3792, + "step": 164400 + }, + { + "epoch": 132.92, + "learning_rate": 0.00013120048613611811, + "loss": 0.3269, + "step": 164425 + }, + { + "epoch": 132.94, + "learning_rate": 0.00013114422038170686, + "loss": 0.383, + "step": 164450 + }, + { + "epoch": 132.96, + "learning_rate": 0.00013108795462729564, + "loss": 0.3353, + "step": 164475 + }, + { + "epoch": 132.98, + "learning_rate": 0.00013103168887288442, + "loss": 0.3276, + "step": 164500 + }, + { + "epoch": 133.0, + "learning_rate": 0.00013097542311847317, + "loss": 0.3406, + "step": 164525 + }, + { + "epoch": 133.02, + "learning_rate": 0.00013091915736406192, + "loss": 0.3269, + "step": 164550 + }, + { + "epoch": 133.04, + "learning_rate": 0.0001308628916096507, + "loss": 0.3718, + "step": 164575 + }, + { + "epoch": 133.06, + "learning_rate": 0.00013080662585523948, + "loss": 0.3165, + "step": 164600 + }, + { + "epoch": 133.08, + "learning_rate": 0.00013075036010082826, + "loss": 0.341, + "step": 164625 + }, + { + "epoch": 133.1, + "learning_rate": 0.00013069409434641698, + "loss": 0.3919, + "step": 164650 + }, + { + "epoch": 133.12, + "learning_rate": 0.00013063782859200576, + "loss": 0.3463, + "step": 164675 + }, + { + "epoch": 133.14, + "learning_rate": 0.00013058156283759454, + "loss": 0.3437, + "step": 164700 + }, + { + "epoch": 133.16, + "learning_rate": 0.0001305252970831833, + "loss": 0.3789, + "step": 164725 + }, + { + "epoch": 133.19, + "learning_rate": 0.00013046903132877204, + "loss": 0.3604, + "step": 164750 + }, + { + "epoch": 133.21, + "learning_rate": 0.00013041276557436082, + "loss": 0.3047, + "step": 164775 + }, + { + "epoch": 133.23, + "learning_rate": 0.0001303564998199496, + "loss": 0.3157, + "step": 164800 + }, + { + "epoch": 133.25, + "learning_rate": 0.00013030023406553835, + "loss": 0.3391, + "step": 164825 + }, + { + "epoch": 133.27, + "learning_rate": 0.0001302439683111271, + "loss": 0.3064, + "step": 164850 + }, + { + "epoch": 133.29, + "learning_rate": 0.00013018770255671588, + "loss": 0.316, + "step": 164875 + }, + { + "epoch": 133.31, + "learning_rate": 0.00013013143680230466, + "loss": 0.3451, + "step": 164900 + }, + { + "epoch": 133.33, + "learning_rate": 0.0001300751710478934, + "loss": 0.3783, + "step": 164925 + }, + { + "epoch": 133.35, + "learning_rate": 0.0001300189052934822, + "loss": 0.3264, + "step": 164950 + }, + { + "epoch": 133.37, + "learning_rate": 0.00012996263953907094, + "loss": 0.3266, + "step": 164975 + }, + { + "epoch": 133.39, + "learning_rate": 0.00012990637378465972, + "loss": 0.3243, + "step": 165000 + }, + { + "epoch": 133.39, + "eval_cer": 0.082004661047401, + "eval_loss": 0.38078561425209045, + "eval_runtime": 149.725, + "eval_samples_per_second": 28.005, + "eval_steps_per_second": 7.006, + "eval_wer": 0.3460032626427406, + "step": 165000 + }, + { + "epoch": 133.41, + "learning_rate": 0.00012985235866042492, + "loss": 0.3781, + "step": 165025 + }, + { + "epoch": 133.43, + "learning_rate": 0.0001297960929060137, + "loss": 0.3568, + "step": 165050 + }, + { + "epoch": 133.45, + "learning_rate": 0.00012973982715160245, + "loss": 0.3452, + "step": 165075 + }, + { + "epoch": 133.47, + "learning_rate": 0.00012968356139719122, + "loss": 0.3334, + "step": 165100 + }, + { + "epoch": 133.49, + "learning_rate": 0.00012962729564277998, + "loss": 0.3706, + "step": 165125 + }, + { + "epoch": 133.51, + "learning_rate": 0.00012957102988836875, + "loss": 0.3022, + "step": 165150 + }, + { + "epoch": 133.53, + "learning_rate": 0.0001295147641339575, + "loss": 0.3669, + "step": 165175 + }, + { + "epoch": 133.55, + "learning_rate": 0.00012945849837954626, + "loss": 0.3328, + "step": 165200 + }, + { + "epoch": 133.57, + "learning_rate": 0.00012940223262513503, + "loss": 0.3602, + "step": 165225 + }, + { + "epoch": 133.59, + "learning_rate": 0.0001293459668707238, + "loss": 0.3087, + "step": 165250 + }, + { + "epoch": 133.61, + "learning_rate": 0.0001292897011163126, + "loss": 0.3497, + "step": 165275 + }, + { + "epoch": 133.63, + "learning_rate": 0.00012923343536190132, + "loss": 0.3157, + "step": 165300 + }, + { + "epoch": 133.65, + "learning_rate": 0.0001291771696074901, + "loss": 0.3685, + "step": 165325 + }, + { + "epoch": 133.67, + "learning_rate": 0.00012912090385307887, + "loss": 0.3191, + "step": 165350 + }, + { + "epoch": 133.69, + "learning_rate": 0.00012906463809866765, + "loss": 0.3419, + "step": 165375 + }, + { + "epoch": 133.71, + "learning_rate": 0.00012900837234425637, + "loss": 0.3458, + "step": 165400 + }, + { + "epoch": 133.73, + "learning_rate": 0.00012895210658984515, + "loss": 0.3708, + "step": 165425 + }, + { + "epoch": 133.75, + "learning_rate": 0.00012889584083543393, + "loss": 0.3363, + "step": 165450 + }, + { + "epoch": 133.77, + "learning_rate": 0.00012883957508102268, + "loss": 0.3356, + "step": 165475 + }, + { + "epoch": 133.79, + "learning_rate": 0.00012878330932661143, + "loss": 0.3318, + "step": 165500 + }, + { + "epoch": 133.81, + "learning_rate": 0.0001287270435722002, + "loss": 0.3353, + "step": 165525 + }, + { + "epoch": 133.83, + "learning_rate": 0.000128670777817789, + "loss": 0.3232, + "step": 165550 + }, + { + "epoch": 133.85, + "learning_rate": 0.00012861451206337774, + "loss": 0.3464, + "step": 165575 + }, + { + "epoch": 133.87, + "learning_rate": 0.00012855824630896652, + "loss": 0.318, + "step": 165600 + }, + { + "epoch": 133.89, + "learning_rate": 0.00012850198055455527, + "loss": 0.3313, + "step": 165625 + }, + { + "epoch": 133.91, + "learning_rate": 0.00012844571480014405, + "loss": 0.3521, + "step": 165650 + }, + { + "epoch": 133.93, + "learning_rate": 0.0001283894490457328, + "loss": 0.3293, + "step": 165675 + }, + { + "epoch": 133.95, + "learning_rate": 0.00012833318329132158, + "loss": 0.3308, + "step": 165700 + }, + { + "epoch": 133.97, + "learning_rate": 0.00012827691753691033, + "loss": 0.3869, + "step": 165725 + }, + { + "epoch": 133.99, + "learning_rate": 0.0001282206517824991, + "loss": 0.3079, + "step": 165750 + }, + { + "epoch": 134.01, + "learning_rate": 0.00012816438602808786, + "loss": 0.3746, + "step": 165775 + }, + { + "epoch": 134.03, + "learning_rate": 0.00012810812027367664, + "loss": 0.3151, + "step": 165800 + }, + { + "epoch": 134.05, + "learning_rate": 0.00012805185451926542, + "loss": 0.3134, + "step": 165825 + }, + { + "epoch": 134.07, + "learning_rate": 0.00012799558876485414, + "loss": 0.3314, + "step": 165850 + }, + { + "epoch": 134.09, + "learning_rate": 0.00012793932301044292, + "loss": 0.3433, + "step": 165875 + }, + { + "epoch": 134.11, + "learning_rate": 0.0001278830572560317, + "loss": 0.3068, + "step": 165900 + }, + { + "epoch": 134.14, + "learning_rate": 0.00012782679150162048, + "loss": 0.3531, + "step": 165925 + }, + { + "epoch": 134.16, + "learning_rate": 0.0001277705257472092, + "loss": 0.2854, + "step": 165950 + }, + { + "epoch": 134.18, + "learning_rate": 0.00012771425999279798, + "loss": 0.3131, + "step": 165975 + }, + { + "epoch": 134.2, + "learning_rate": 0.00012765799423838676, + "loss": 0.3166, + "step": 166000 + }, + { + "epoch": 134.22, + "learning_rate": 0.00012760172848397554, + "loss": 0.3593, + "step": 166025 + }, + { + "epoch": 134.24, + "learning_rate": 0.00012754546272956426, + "loss": 0.2937, + "step": 166050 + }, + { + "epoch": 134.26, + "learning_rate": 0.00012748919697515304, + "loss": 0.3275, + "step": 166075 + }, + { + "epoch": 134.28, + "learning_rate": 0.00012743293122074182, + "loss": 0.31, + "step": 166100 + }, + { + "epoch": 134.3, + "learning_rate": 0.0001273766654663306, + "loss": 0.3444, + "step": 166125 + }, + { + "epoch": 134.32, + "learning_rate": 0.00012732039971191932, + "loss": 0.3116, + "step": 166150 + }, + { + "epoch": 134.34, + "learning_rate": 0.0001272641339575081, + "loss": 0.3177, + "step": 166175 + }, + { + "epoch": 134.36, + "learning_rate": 0.00012720786820309688, + "loss": 0.3111, + "step": 166200 + }, + { + "epoch": 134.38, + "learning_rate": 0.00012715160244868563, + "loss": 0.3299, + "step": 166225 + }, + { + "epoch": 134.4, + "learning_rate": 0.0001270953366942744, + "loss": 0.3308, + "step": 166250 + }, + { + "epoch": 134.42, + "learning_rate": 0.00012703907093986316, + "loss": 0.3252, + "step": 166275 + }, + { + "epoch": 134.44, + "learning_rate": 0.00012698280518545193, + "loss": 0.3124, + "step": 166300 + }, + { + "epoch": 134.46, + "learning_rate": 0.00012692653943104069, + "loss": 0.332, + "step": 166325 + }, + { + "epoch": 134.48, + "learning_rate": 0.00012687027367662946, + "loss": 0.3465, + "step": 166350 + }, + { + "epoch": 134.5, + "learning_rate": 0.00012681400792221822, + "loss": 0.3512, + "step": 166375 + }, + { + "epoch": 134.52, + "learning_rate": 0.000126757742167807, + "loss": 0.2847, + "step": 166400 + }, + { + "epoch": 134.54, + "learning_rate": 0.00012670147641339575, + "loss": 0.3292, + "step": 166425 + }, + { + "epoch": 134.56, + "learning_rate": 0.00012664521065898452, + "loss": 0.3211, + "step": 166450 + }, + { + "epoch": 134.58, + "learning_rate": 0.0001265889449045733, + "loss": 0.3182, + "step": 166475 + }, + { + "epoch": 134.6, + "learning_rate": 0.00012653267915016205, + "loss": 0.3041, + "step": 166500 + }, + { + "epoch": 134.62, + "learning_rate": 0.0001264764133957508, + "loss": 0.3265, + "step": 166525 + }, + { + "epoch": 134.64, + "learning_rate": 0.00012642014764133958, + "loss": 0.3068, + "step": 166550 + }, + { + "epoch": 134.66, + "learning_rate": 0.00012636388188692836, + "loss": 0.3571, + "step": 166575 + }, + { + "epoch": 134.68, + "learning_rate": 0.00012630761613251709, + "loss": 0.2864, + "step": 166600 + }, + { + "epoch": 134.7, + "learning_rate": 0.00012625135037810586, + "loss": 0.3247, + "step": 166625 + }, + { + "epoch": 134.72, + "learning_rate": 0.00012619508462369464, + "loss": 0.3179, + "step": 166650 + }, + { + "epoch": 134.74, + "learning_rate": 0.00012613881886928342, + "loss": 0.383, + "step": 166675 + }, + { + "epoch": 134.76, + "learning_rate": 0.00012608255311487214, + "loss": 0.3227, + "step": 166700 + }, + { + "epoch": 134.78, + "learning_rate": 0.00012602628736046092, + "loss": 0.3244, + "step": 166725 + }, + { + "epoch": 134.8, + "learning_rate": 0.0001259700216060497, + "loss": 0.3133, + "step": 166750 + }, + { + "epoch": 134.82, + "learning_rate": 0.00012591375585163848, + "loss": 0.3224, + "step": 166775 + }, + { + "epoch": 134.84, + "learning_rate": 0.00012585749009722723, + "loss": 0.3206, + "step": 166800 + }, + { + "epoch": 134.86, + "learning_rate": 0.00012580122434281598, + "loss": 0.368, + "step": 166825 + }, + { + "epoch": 134.88, + "learning_rate": 0.00012574495858840476, + "loss": 0.3022, + "step": 166850 + }, + { + "epoch": 134.9, + "learning_rate": 0.00012568869283399354, + "loss": 0.3127, + "step": 166875 + }, + { + "epoch": 134.92, + "learning_rate": 0.0001256324270795823, + "loss": 0.332, + "step": 166900 + }, + { + "epoch": 134.94, + "learning_rate": 0.00012557616132517104, + "loss": 0.3249, + "step": 166925 + }, + { + "epoch": 134.96, + "learning_rate": 0.00012551989557075982, + "loss": 0.3103, + "step": 166950 + }, + { + "epoch": 134.98, + "learning_rate": 0.00012546362981634857, + "loss": 0.3777, + "step": 166975 + }, + { + "epoch": 135.0, + "learning_rate": 0.00012540736406193735, + "loss": 0.3212, + "step": 167000 + }, + { + "epoch": 135.02, + "learning_rate": 0.0001253510983075261, + "loss": 0.3258, + "step": 167025 + }, + { + "epoch": 135.04, + "learning_rate": 0.00012529483255311488, + "loss": 0.3189, + "step": 167050 + }, + { + "epoch": 135.06, + "learning_rate": 0.00012523856679870363, + "loss": 0.2856, + "step": 167075 + }, + { + "epoch": 135.08, + "learning_rate": 0.0001251823010442924, + "loss": 0.3336, + "step": 167100 + }, + { + "epoch": 135.11, + "learning_rate": 0.0001251260352898812, + "loss": 0.3283, + "step": 167125 + }, + { + "epoch": 135.13, + "learning_rate": 0.00012506976953546994, + "loss": 0.2868, + "step": 167150 + }, + { + "epoch": 135.15, + "learning_rate": 0.0001250135037810587, + "loss": 0.2945, + "step": 167175 + }, + { + "epoch": 135.17, + "learning_rate": 0.00012495723802664747, + "loss": 0.3234, + "step": 167200 + }, + { + "epoch": 135.19, + "learning_rate": 0.00012490097227223625, + "loss": 0.3029, + "step": 167225 + }, + { + "epoch": 135.21, + "learning_rate": 0.000124844706517825, + "loss": 0.3149, + "step": 167250 + }, + { + "epoch": 135.23, + "learning_rate": 0.00012478844076341375, + "loss": 0.3135, + "step": 167275 + }, + { + "epoch": 135.25, + "learning_rate": 0.00012473217500900253, + "loss": 0.3306, + "step": 167300 + }, + { + "epoch": 135.27, + "learning_rate": 0.00012467815988476773, + "loss": 0.3093, + "step": 167325 + }, + { + "epoch": 135.29, + "learning_rate": 0.0001246218941303565, + "loss": 0.3139, + "step": 167350 + }, + { + "epoch": 135.31, + "learning_rate": 0.00012456562837594526, + "loss": 0.3219, + "step": 167375 + }, + { + "epoch": 135.33, + "learning_rate": 0.00012450936262153403, + "loss": 0.3237, + "step": 167400 + }, + { + "epoch": 135.35, + "learning_rate": 0.00012445309686712279, + "loss": 0.3151, + "step": 167425 + }, + { + "epoch": 135.37, + "learning_rate": 0.00012439683111271156, + "loss": 0.3459, + "step": 167450 + }, + { + "epoch": 135.39, + "learning_rate": 0.00012434056535830031, + "loss": 0.3431, + "step": 167475 + }, + { + "epoch": 135.41, + "learning_rate": 0.0001242842996038891, + "loss": 0.3127, + "step": 167500 + }, + { + "epoch": 135.43, + "learning_rate": 0.00012422803384947784, + "loss": 0.313, + "step": 167525 + }, + { + "epoch": 135.45, + "learning_rate": 0.00012417176809506662, + "loss": 0.303, + "step": 167550 + }, + { + "epoch": 135.47, + "learning_rate": 0.00012411550234065537, + "loss": 0.3268, + "step": 167575 + }, + { + "epoch": 135.49, + "learning_rate": 0.00012405923658624415, + "loss": 0.3701, + "step": 167600 + }, + { + "epoch": 135.51, + "learning_rate": 0.0001240029708318329, + "loss": 0.3157, + "step": 167625 + }, + { + "epoch": 135.53, + "learning_rate": 0.00012394670507742168, + "loss": 0.2676, + "step": 167650 + }, + { + "epoch": 135.55, + "learning_rate": 0.00012389043932301043, + "loss": 0.3035, + "step": 167675 + }, + { + "epoch": 135.57, + "learning_rate": 0.0001238341735685992, + "loss": 0.3092, + "step": 167700 + }, + { + "epoch": 135.59, + "learning_rate": 0.00012377790781418796, + "loss": 0.3087, + "step": 167725 + }, + { + "epoch": 135.61, + "learning_rate": 0.00012372164205977674, + "loss": 0.3078, + "step": 167750 + }, + { + "epoch": 135.63, + "learning_rate": 0.00012366537630536552, + "loss": 0.3105, + "step": 167775 + }, + { + "epoch": 135.65, + "learning_rate": 0.00012360911055095427, + "loss": 0.3049, + "step": 167800 + }, + { + "epoch": 135.67, + "learning_rate": 0.00012355284479654305, + "loss": 0.3142, + "step": 167825 + }, + { + "epoch": 135.69, + "learning_rate": 0.0001234965790421318, + "loss": 0.3163, + "step": 167850 + }, + { + "epoch": 135.71, + "learning_rate": 0.00012344031328772058, + "loss": 0.3115, + "step": 167875 + }, + { + "epoch": 135.73, + "learning_rate": 0.00012338404753330933, + "loss": 0.313, + "step": 167900 + }, + { + "epoch": 135.75, + "learning_rate": 0.0001233277817788981, + "loss": 0.3197, + "step": 167925 + }, + { + "epoch": 135.77, + "learning_rate": 0.00012327151602448686, + "loss": 0.3004, + "step": 167950 + }, + { + "epoch": 135.79, + "learning_rate": 0.00012321525027007564, + "loss": 0.3218, + "step": 167975 + }, + { + "epoch": 135.81, + "learning_rate": 0.0001231589845156644, + "loss": 0.2861, + "step": 168000 + }, + { + "epoch": 135.81, + "eval_cer": 0.07884254078416476, + "eval_loss": 0.39860469102859497, + "eval_runtime": 150.7158, + "eval_samples_per_second": 27.821, + "eval_steps_per_second": 6.96, + "eval_wer": 0.33210440456769985, + "step": 168000 + }, + { + "epoch": 135.83, + "learning_rate": 0.00012310271876125317, + "loss": 0.2921, + "step": 168025 + }, + { + "epoch": 135.85, + "learning_rate": 0.00012304645300684192, + "loss": 0.3139, + "step": 168050 + }, + { + "epoch": 135.87, + "learning_rate": 0.00012299018725243067, + "loss": 0.3147, + "step": 168075 + }, + { + "epoch": 135.89, + "learning_rate": 0.00012293392149801945, + "loss": 0.3194, + "step": 168100 + }, + { + "epoch": 135.91, + "learning_rate": 0.0001228776557436082, + "loss": 0.3239, + "step": 168125 + }, + { + "epoch": 135.93, + "learning_rate": 0.00012282138998919698, + "loss": 0.2988, + "step": 168150 + }, + { + "epoch": 135.95, + "learning_rate": 0.00012276512423478573, + "loss": 0.3145, + "step": 168175 + }, + { + "epoch": 135.97, + "learning_rate": 0.0001227088584803745, + "loss": 0.3016, + "step": 168200 + }, + { + "epoch": 135.99, + "learning_rate": 0.00012265259272596326, + "loss": 0.2996, + "step": 168225 + }, + { + "epoch": 136.01, + "learning_rate": 0.00012259632697155204, + "loss": 0.3197, + "step": 168250 + }, + { + "epoch": 136.03, + "learning_rate": 0.0001225400612171408, + "loss": 0.3165, + "step": 168275 + }, + { + "epoch": 136.05, + "learning_rate": 0.00012248379546272957, + "loss": 0.3363, + "step": 168300 + }, + { + "epoch": 136.08, + "learning_rate": 0.00012242752970831832, + "loss": 0.3163, + "step": 168325 + }, + { + "epoch": 136.1, + "learning_rate": 0.0001223712639539071, + "loss": 0.3296, + "step": 168350 + }, + { + "epoch": 136.12, + "learning_rate": 0.00012231499819949587, + "loss": 0.2873, + "step": 168375 + }, + { + "epoch": 136.14, + "learning_rate": 0.00012225873244508463, + "loss": 0.322, + "step": 168400 + }, + { + "epoch": 136.16, + "learning_rate": 0.0001222024666906734, + "loss": 0.2893, + "step": 168425 + }, + { + "epoch": 136.18, + "learning_rate": 0.00012214620093626216, + "loss": 0.3518, + "step": 168450 + }, + { + "epoch": 136.2, + "learning_rate": 0.00012208993518185093, + "loss": 0.301, + "step": 168475 + }, + { + "epoch": 136.22, + "learning_rate": 0.00012203366942743968, + "loss": 0.335, + "step": 168500 + }, + { + "epoch": 136.24, + "learning_rate": 0.00012197740367302845, + "loss": 0.2887, + "step": 168525 + }, + { + "epoch": 136.26, + "learning_rate": 0.00012192113791861721, + "loss": 0.3269, + "step": 168550 + }, + { + "epoch": 136.28, + "learning_rate": 0.00012186487216420598, + "loss": 0.277, + "step": 168575 + }, + { + "epoch": 136.3, + "learning_rate": 0.00012180860640979474, + "loss": 0.3189, + "step": 168600 + }, + { + "epoch": 136.32, + "learning_rate": 0.00012175234065538351, + "loss": 0.2905, + "step": 168625 + }, + { + "epoch": 136.34, + "learning_rate": 0.00012169607490097227, + "loss": 0.3169, + "step": 168650 + }, + { + "epoch": 136.36, + "learning_rate": 0.00012163980914656104, + "loss": 0.3394, + "step": 168675 + }, + { + "epoch": 136.38, + "learning_rate": 0.0001215835433921498, + "loss": 0.3289, + "step": 168700 + }, + { + "epoch": 136.4, + "learning_rate": 0.00012152727763773858, + "loss": 0.3032, + "step": 168725 + }, + { + "epoch": 136.42, + "learning_rate": 0.00012147101188332733, + "loss": 0.3371, + "step": 168750 + }, + { + "epoch": 136.44, + "learning_rate": 0.0001214147461289161, + "loss": 0.3093, + "step": 168775 + }, + { + "epoch": 136.46, + "learning_rate": 0.00012135848037450486, + "loss": 0.3675, + "step": 168800 + }, + { + "epoch": 136.48, + "learning_rate": 0.00012130221462009363, + "loss": 0.2731, + "step": 168825 + }, + { + "epoch": 136.5, + "learning_rate": 0.00012124594886568239, + "loss": 0.3193, + "step": 168850 + }, + { + "epoch": 136.52, + "learning_rate": 0.00012118968311127116, + "loss": 0.2995, + "step": 168875 + }, + { + "epoch": 136.54, + "learning_rate": 0.00012113341735685992, + "loss": 0.3197, + "step": 168900 + }, + { + "epoch": 136.56, + "learning_rate": 0.00012107715160244869, + "loss": 0.286, + "step": 168925 + }, + { + "epoch": 136.58, + "learning_rate": 0.00012102088584803745, + "loss": 0.3061, + "step": 168950 + }, + { + "epoch": 136.6, + "learning_rate": 0.00012096462009362622, + "loss": 0.3494, + "step": 168975 + }, + { + "epoch": 136.62, + "learning_rate": 0.00012090835433921498, + "loss": 0.298, + "step": 169000 + }, + { + "epoch": 136.64, + "learning_rate": 0.00012085208858480375, + "loss": 0.2882, + "step": 169025 + }, + { + "epoch": 136.66, + "learning_rate": 0.00012079582283039252, + "loss": 0.3382, + "step": 169050 + }, + { + "epoch": 136.68, + "learning_rate": 0.00012073955707598128, + "loss": 0.2833, + "step": 169075 + }, + { + "epoch": 136.7, + "learning_rate": 0.00012068329132157005, + "loss": 0.2912, + "step": 169100 + }, + { + "epoch": 136.72, + "learning_rate": 0.0001206270255671588, + "loss": 0.3223, + "step": 169125 + }, + { + "epoch": 136.74, + "learning_rate": 0.00012057075981274757, + "loss": 0.3128, + "step": 169150 + }, + { + "epoch": 136.76, + "learning_rate": 0.00012051449405833633, + "loss": 0.294, + "step": 169175 + }, + { + "epoch": 136.78, + "learning_rate": 0.0001204582283039251, + "loss": 0.2779, + "step": 169200 + }, + { + "epoch": 136.8, + "learning_rate": 0.00012040196254951386, + "loss": 0.3011, + "step": 169225 + }, + { + "epoch": 136.82, + "learning_rate": 0.00012034569679510263, + "loss": 0.3261, + "step": 169250 + }, + { + "epoch": 136.84, + "learning_rate": 0.0001202894310406914, + "loss": 0.2565, + "step": 169275 + }, + { + "epoch": 136.86, + "learning_rate": 0.00012023316528628016, + "loss": 0.3077, + "step": 169300 + }, + { + "epoch": 136.88, + "learning_rate": 0.00012017689953186892, + "loss": 0.3274, + "step": 169325 + }, + { + "epoch": 136.9, + "learning_rate": 0.00012012063377745769, + "loss": 0.3226, + "step": 169350 + }, + { + "epoch": 136.92, + "learning_rate": 0.00012006436802304647, + "loss": 0.3182, + "step": 169375 + }, + { + "epoch": 136.94, + "learning_rate": 0.00012000810226863522, + "loss": 0.3158, + "step": 169400 + }, + { + "epoch": 136.96, + "learning_rate": 0.000119951836514224, + "loss": 0.3394, + "step": 169425 + }, + { + "epoch": 136.98, + "learning_rate": 0.00011989557075981275, + "loss": 0.2783, + "step": 169450 + }, + { + "epoch": 137.0, + "learning_rate": 0.00011983930500540151, + "loss": 0.3017, + "step": 169475 + }, + { + "epoch": 137.03, + "learning_rate": 0.00011978303925099028, + "loss": 0.3023, + "step": 169500 + }, + { + "epoch": 137.05, + "learning_rate": 0.00011972677349657904, + "loss": 0.2827, + "step": 169525 + }, + { + "epoch": 137.07, + "learning_rate": 0.0001196705077421678, + "loss": 0.2734, + "step": 169550 + }, + { + "epoch": 137.09, + "learning_rate": 0.00011961424198775657, + "loss": 0.3511, + "step": 169575 + }, + { + "epoch": 137.11, + "learning_rate": 0.00011955797623334534, + "loss": 0.3267, + "step": 169600 + }, + { + "epoch": 137.13, + "learning_rate": 0.0001195017104789341, + "loss": 0.2964, + "step": 169625 + }, + { + "epoch": 137.15, + "learning_rate": 0.00011944544472452288, + "loss": 0.2819, + "step": 169650 + }, + { + "epoch": 137.17, + "learning_rate": 0.00011938917897011163, + "loss": 0.3149, + "step": 169675 + }, + { + "epoch": 137.19, + "learning_rate": 0.00011933291321570041, + "loss": 0.313, + "step": 169700 + }, + { + "epoch": 137.21, + "learning_rate": 0.00011927664746128916, + "loss": 0.2858, + "step": 169725 + }, + { + "epoch": 137.23, + "learning_rate": 0.00011922038170687794, + "loss": 0.2711, + "step": 169750 + }, + { + "epoch": 137.25, + "learning_rate": 0.00011916411595246669, + "loss": 0.3047, + "step": 169775 + }, + { + "epoch": 137.27, + "learning_rate": 0.00011910785019805547, + "loss": 0.2944, + "step": 169800 + }, + { + "epoch": 137.29, + "learning_rate": 0.00011905158444364422, + "loss": 0.2697, + "step": 169825 + }, + { + "epoch": 137.31, + "learning_rate": 0.00011899531868923298, + "loss": 0.2926, + "step": 169850 + }, + { + "epoch": 137.33, + "learning_rate": 0.00011893905293482175, + "loss": 0.29, + "step": 169875 + }, + { + "epoch": 137.35, + "learning_rate": 0.00011888503781058696, + "loss": 0.2891, + "step": 169900 + }, + { + "epoch": 137.37, + "learning_rate": 0.00011882877205617573, + "loss": 0.3194, + "step": 169925 + }, + { + "epoch": 137.39, + "learning_rate": 0.00011877250630176449, + "loss": 0.3081, + "step": 169950 + }, + { + "epoch": 137.41, + "learning_rate": 0.00011871624054735327, + "loss": 0.2835, + "step": 169975 + }, + { + "epoch": 137.43, + "learning_rate": 0.00011865997479294202, + "loss": 0.2794, + "step": 170000 + }, + { + "epoch": 137.45, + "learning_rate": 0.0001186037090385308, + "loss": 0.2922, + "step": 170025 + }, + { + "epoch": 137.47, + "learning_rate": 0.00011854744328411955, + "loss": 0.3218, + "step": 170050 + }, + { + "epoch": 137.49, + "learning_rate": 0.00011849117752970833, + "loss": 0.2572, + "step": 170075 + }, + { + "epoch": 137.51, + "learning_rate": 0.00011843491177529708, + "loss": 0.306, + "step": 170100 + }, + { + "epoch": 137.53, + "learning_rate": 0.00011837864602088586, + "loss": 0.287, + "step": 170125 + }, + { + "epoch": 137.55, + "learning_rate": 0.00011832238026647461, + "loss": 0.2955, + "step": 170150 + }, + { + "epoch": 137.57, + "learning_rate": 0.00011826611451206339, + "loss": 0.278, + "step": 170175 + }, + { + "epoch": 137.59, + "learning_rate": 0.00011820984875765214, + "loss": 0.2853, + "step": 170200 + }, + { + "epoch": 137.61, + "learning_rate": 0.00011815358300324092, + "loss": 0.3193, + "step": 170225 + }, + { + "epoch": 137.63, + "learning_rate": 0.00011809731724882967, + "loss": 0.2939, + "step": 170250 + }, + { + "epoch": 137.65, + "learning_rate": 0.00011804105149441843, + "loss": 0.2987, + "step": 170275 + }, + { + "epoch": 137.67, + "learning_rate": 0.00011798478574000721, + "loss": 0.3462, + "step": 170300 + }, + { + "epoch": 137.69, + "learning_rate": 0.00011792851998559596, + "loss": 0.3188, + "step": 170325 + }, + { + "epoch": 137.71, + "learning_rate": 0.00011787225423118474, + "loss": 0.2941, + "step": 170350 + }, + { + "epoch": 137.73, + "learning_rate": 0.00011781598847677349, + "loss": 0.3043, + "step": 170375 + }, + { + "epoch": 137.75, + "learning_rate": 0.00011775972272236227, + "loss": 0.3037, + "step": 170400 + }, + { + "epoch": 137.77, + "learning_rate": 0.00011770345696795102, + "loss": 0.3143, + "step": 170425 + }, + { + "epoch": 137.79, + "learning_rate": 0.0001176471912135398, + "loss": 0.3184, + "step": 170450 + }, + { + "epoch": 137.81, + "learning_rate": 0.00011759092545912855, + "loss": 0.3059, + "step": 170475 + }, + { + "epoch": 137.83, + "learning_rate": 0.00011753465970471733, + "loss": 0.2957, + "step": 170500 + }, + { + "epoch": 137.85, + "learning_rate": 0.00011747839395030608, + "loss": 0.2845, + "step": 170525 + }, + { + "epoch": 137.87, + "learning_rate": 0.00011742212819589486, + "loss": 0.2972, + "step": 170550 + }, + { + "epoch": 137.89, + "learning_rate": 0.00011736586244148361, + "loss": 0.28, + "step": 170575 + }, + { + "epoch": 137.91, + "learning_rate": 0.00011731184731724884, + "loss": 0.3189, + "step": 170600 + }, + { + "epoch": 137.93, + "learning_rate": 0.0001172555815628376, + "loss": 0.2701, + "step": 170625 + }, + { + "epoch": 137.95, + "learning_rate": 0.00011719931580842637, + "loss": 0.3023, + "step": 170650 + }, + { + "epoch": 137.97, + "learning_rate": 0.00011714305005401513, + "loss": 0.2986, + "step": 170675 + }, + { + "epoch": 138.0, + "learning_rate": 0.00011708678429960388, + "loss": 0.2969, + "step": 170700 + }, + { + "epoch": 138.02, + "learning_rate": 0.00011703051854519266, + "loss": 0.2963, + "step": 170725 + }, + { + "epoch": 138.04, + "learning_rate": 0.00011697425279078141, + "loss": 0.2854, + "step": 170750 + }, + { + "epoch": 138.06, + "learning_rate": 0.00011691798703637019, + "loss": 0.302, + "step": 170775 + }, + { + "epoch": 138.08, + "learning_rate": 0.00011686172128195894, + "loss": 0.2673, + "step": 170800 + }, + { + "epoch": 138.1, + "learning_rate": 0.00011680545552754772, + "loss": 0.3032, + "step": 170825 + }, + { + "epoch": 138.12, + "learning_rate": 0.00011674918977313647, + "loss": 0.2525, + "step": 170850 + }, + { + "epoch": 138.14, + "learning_rate": 0.00011669292401872525, + "loss": 0.3259, + "step": 170875 + }, + { + "epoch": 138.16, + "learning_rate": 0.000116636658264314, + "loss": 0.278, + "step": 170900 + }, + { + "epoch": 138.18, + "learning_rate": 0.00011658039250990278, + "loss": 0.2929, + "step": 170925 + }, + { + "epoch": 138.2, + "learning_rate": 0.00011652412675549154, + "loss": 0.2807, + "step": 170950 + }, + { + "epoch": 138.22, + "learning_rate": 0.00011646786100108031, + "loss": 0.3071, + "step": 170975 + }, + { + "epoch": 138.24, + "learning_rate": 0.00011641159524666907, + "loss": 0.2684, + "step": 171000 + }, + { + "epoch": 138.24, + "eval_cer": 0.07738468014332207, + "eval_loss": 0.4014652967453003, + "eval_runtime": 148.1695, + "eval_samples_per_second": 28.299, + "eval_steps_per_second": 7.08, + "eval_wer": 0.3298531810766721, + "step": 171000 + }, + { + "epoch": 138.26, + "learning_rate": 0.00011635532949225784, + "loss": 0.3076, + "step": 171025 + }, + { + "epoch": 138.28, + "learning_rate": 0.0001162990637378466, + "loss": 0.2608, + "step": 171050 + }, + { + "epoch": 138.3, + "learning_rate": 0.00011624279798343535, + "loss": 0.263, + "step": 171075 + }, + { + "epoch": 138.32, + "learning_rate": 0.00011618653222902413, + "loss": 0.2851, + "step": 171100 + }, + { + "epoch": 138.34, + "learning_rate": 0.00011613026647461288, + "loss": 0.3014, + "step": 171125 + }, + { + "epoch": 138.36, + "learning_rate": 0.00011607400072020166, + "loss": 0.2999, + "step": 171150 + }, + { + "epoch": 138.38, + "learning_rate": 0.00011601773496579041, + "loss": 0.282, + "step": 171175 + }, + { + "epoch": 138.4, + "learning_rate": 0.00011596146921137919, + "loss": 0.294, + "step": 171200 + }, + { + "epoch": 138.42, + "learning_rate": 0.00011590520345696794, + "loss": 0.2917, + "step": 171225 + }, + { + "epoch": 138.44, + "learning_rate": 0.00011584893770255672, + "loss": 0.2989, + "step": 171250 + }, + { + "epoch": 138.46, + "learning_rate": 0.00011579267194814549, + "loss": 0.2784, + "step": 171275 + }, + { + "epoch": 138.48, + "learning_rate": 0.00011573640619373425, + "loss": 0.2769, + "step": 171300 + }, + { + "epoch": 138.5, + "learning_rate": 0.00011568014043932302, + "loss": 0.3011, + "step": 171325 + }, + { + "epoch": 138.52, + "learning_rate": 0.00011562387468491178, + "loss": 0.2945, + "step": 171350 + }, + { + "epoch": 138.54, + "learning_rate": 0.00011556760893050055, + "loss": 0.2648, + "step": 171375 + }, + { + "epoch": 138.56, + "learning_rate": 0.0001155113431760893, + "loss": 0.2837, + "step": 171400 + }, + { + "epoch": 138.58, + "learning_rate": 0.00011545507742167808, + "loss": 0.29, + "step": 171425 + }, + { + "epoch": 138.6, + "learning_rate": 0.00011539881166726683, + "loss": 0.2791, + "step": 171450 + }, + { + "epoch": 138.62, + "learning_rate": 0.0001153425459128556, + "loss": 0.3383, + "step": 171475 + }, + { + "epoch": 138.64, + "learning_rate": 0.00011528628015844436, + "loss": 0.2563, + "step": 171500 + }, + { + "epoch": 138.66, + "learning_rate": 0.00011523001440403313, + "loss": 0.3518, + "step": 171525 + }, + { + "epoch": 138.68, + "learning_rate": 0.00011517374864962189, + "loss": 0.2703, + "step": 171550 + }, + { + "epoch": 138.7, + "learning_rate": 0.00011511748289521066, + "loss": 0.2963, + "step": 171575 + }, + { + "epoch": 138.72, + "learning_rate": 0.00011506121714079943, + "loss": 0.2854, + "step": 171600 + }, + { + "epoch": 138.74, + "learning_rate": 0.0001150049513863882, + "loss": 0.3061, + "step": 171625 + }, + { + "epoch": 138.76, + "learning_rate": 0.00011494868563197696, + "loss": 0.2825, + "step": 171650 + }, + { + "epoch": 138.78, + "learning_rate": 0.00011489241987756572, + "loss": 0.307, + "step": 171675 + }, + { + "epoch": 138.8, + "learning_rate": 0.00011483615412315449, + "loss": 0.2979, + "step": 171700 + }, + { + "epoch": 138.82, + "learning_rate": 0.00011477988836874325, + "loss": 0.2978, + "step": 171725 + }, + { + "epoch": 138.84, + "learning_rate": 0.00011472362261433202, + "loss": 0.2819, + "step": 171750 + }, + { + "epoch": 138.86, + "learning_rate": 0.00011466735685992077, + "loss": 0.299, + "step": 171775 + }, + { + "epoch": 138.88, + "learning_rate": 0.00011461109110550955, + "loss": 0.2925, + "step": 171800 + }, + { + "epoch": 138.9, + "learning_rate": 0.0001145548253510983, + "loss": 0.2929, + "step": 171825 + }, + { + "epoch": 138.92, + "learning_rate": 0.00011449855959668708, + "loss": 0.2999, + "step": 171850 + }, + { + "epoch": 138.95, + "learning_rate": 0.00011444229384227584, + "loss": 0.2954, + "step": 171875 + }, + { + "epoch": 138.97, + "learning_rate": 0.00011438602808786461, + "loss": 0.3031, + "step": 171900 + }, + { + "epoch": 138.99, + "learning_rate": 0.00011432976233345337, + "loss": 0.2931, + "step": 171925 + }, + { + "epoch": 139.01, + "learning_rate": 0.00011427349657904214, + "loss": 0.2981, + "step": 171950 + }, + { + "epoch": 139.03, + "learning_rate": 0.0001142172308246309, + "loss": 0.2876, + "step": 171975 + }, + { + "epoch": 139.05, + "learning_rate": 0.00011416096507021967, + "loss": 0.2828, + "step": 172000 + }, + { + "epoch": 139.07, + "learning_rate": 0.00011410469931580843, + "loss": 0.2878, + "step": 172025 + }, + { + "epoch": 139.09, + "learning_rate": 0.0001140484335613972, + "loss": 0.312, + "step": 172050 + }, + { + "epoch": 139.11, + "learning_rate": 0.00011399216780698596, + "loss": 0.2955, + "step": 172075 + }, + { + "epoch": 139.13, + "learning_rate": 0.00011393590205257471, + "loss": 0.2678, + "step": 172100 + }, + { + "epoch": 139.15, + "learning_rate": 0.00011387963629816349, + "loss": 0.2801, + "step": 172125 + }, + { + "epoch": 139.17, + "learning_rate": 0.00011382337054375224, + "loss": 0.2742, + "step": 172150 + }, + { + "epoch": 139.19, + "learning_rate": 0.00011376710478934102, + "loss": 0.2767, + "step": 172175 + }, + { + "epoch": 139.21, + "learning_rate": 0.00011371083903492978, + "loss": 0.2836, + "step": 172200 + }, + { + "epoch": 139.23, + "learning_rate": 0.00011365457328051855, + "loss": 0.2982, + "step": 172225 + }, + { + "epoch": 139.25, + "learning_rate": 0.00011359830752610731, + "loss": 0.2699, + "step": 172250 + }, + { + "epoch": 139.27, + "learning_rate": 0.00011354204177169608, + "loss": 0.3034, + "step": 172275 + }, + { + "epoch": 139.29, + "learning_rate": 0.00011348577601728484, + "loss": 0.3068, + "step": 172300 + }, + { + "epoch": 139.31, + "learning_rate": 0.00011342951026287361, + "loss": 0.2779, + "step": 172325 + }, + { + "epoch": 139.33, + "learning_rate": 0.00011337324450846237, + "loss": 0.2628, + "step": 172350 + }, + { + "epoch": 139.35, + "learning_rate": 0.00011331697875405114, + "loss": 0.2489, + "step": 172375 + }, + { + "epoch": 139.37, + "learning_rate": 0.0001132607129996399, + "loss": 0.3067, + "step": 172400 + }, + { + "epoch": 139.39, + "learning_rate": 0.00011320444724522867, + "loss": 0.2742, + "step": 172425 + }, + { + "epoch": 139.41, + "learning_rate": 0.00011314818149081743, + "loss": 0.2872, + "step": 172450 + }, + { + "epoch": 139.43, + "learning_rate": 0.00011309191573640618, + "loss": 0.2746, + "step": 172475 + }, + { + "epoch": 139.45, + "learning_rate": 0.00011303564998199496, + "loss": 0.3101, + "step": 172500 + }, + { + "epoch": 139.47, + "learning_rate": 0.00011297938422758373, + "loss": 0.2742, + "step": 172525 + }, + { + "epoch": 139.49, + "learning_rate": 0.00011292311847317249, + "loss": 0.2837, + "step": 172550 + }, + { + "epoch": 139.51, + "learning_rate": 0.00011286685271876126, + "loss": 0.2966, + "step": 172575 + }, + { + "epoch": 139.53, + "learning_rate": 0.00011281058696435002, + "loss": 0.2651, + "step": 172600 + }, + { + "epoch": 139.55, + "learning_rate": 0.00011275432120993879, + "loss": 0.2917, + "step": 172625 + }, + { + "epoch": 139.57, + "learning_rate": 0.00011269805545552755, + "loss": 0.325, + "step": 172650 + }, + { + "epoch": 139.59, + "learning_rate": 0.00011264178970111632, + "loss": 0.2883, + "step": 172675 + }, + { + "epoch": 139.61, + "learning_rate": 0.00011258552394670508, + "loss": 0.318, + "step": 172700 + }, + { + "epoch": 139.63, + "learning_rate": 0.00011252925819229385, + "loss": 0.2515, + "step": 172725 + }, + { + "epoch": 139.65, + "learning_rate": 0.00011247299243788261, + "loss": 0.302, + "step": 172750 + }, + { + "epoch": 139.67, + "learning_rate": 0.00011241672668347137, + "loss": 0.3091, + "step": 172775 + }, + { + "epoch": 139.69, + "learning_rate": 0.00011236046092906014, + "loss": 0.2583, + "step": 172800 + }, + { + "epoch": 139.71, + "learning_rate": 0.0001123041951746489, + "loss": 0.287, + "step": 172825 + }, + { + "epoch": 139.73, + "learning_rate": 0.00011224792942023767, + "loss": 0.2717, + "step": 172850 + }, + { + "epoch": 139.75, + "learning_rate": 0.00011219166366582643, + "loss": 0.2837, + "step": 172875 + }, + { + "epoch": 139.77, + "learning_rate": 0.0001121353979114152, + "loss": 0.3425, + "step": 172900 + }, + { + "epoch": 139.79, + "learning_rate": 0.00011207913215700396, + "loss": 0.2964, + "step": 172925 + }, + { + "epoch": 139.81, + "learning_rate": 0.00011202286640259273, + "loss": 0.2905, + "step": 172950 + }, + { + "epoch": 139.83, + "learning_rate": 0.00011196660064818149, + "loss": 0.2925, + "step": 172975 + }, + { + "epoch": 139.85, + "learning_rate": 0.00011191033489377026, + "loss": 0.2624, + "step": 173000 + }, + { + "epoch": 139.87, + "learning_rate": 0.00011185406913935902, + "loss": 0.2889, + "step": 173025 + }, + { + "epoch": 139.89, + "learning_rate": 0.00011179780338494779, + "loss": 0.2856, + "step": 173050 + }, + { + "epoch": 139.92, + "learning_rate": 0.00011174153763053655, + "loss": 0.3082, + "step": 173075 + }, + { + "epoch": 139.94, + "learning_rate": 0.00011168527187612532, + "loss": 0.2864, + "step": 173100 + }, + { + "epoch": 139.96, + "learning_rate": 0.00011162900612171408, + "loss": 0.305, + "step": 173125 + }, + { + "epoch": 139.98, + "learning_rate": 0.00011157274036730285, + "loss": 0.2429, + "step": 173150 + }, + { + "epoch": 140.0, + "learning_rate": 0.00011151647461289161, + "loss": 0.2649, + "step": 173175 + }, + { + "epoch": 140.02, + "learning_rate": 0.00011146020885848038, + "loss": 0.2885, + "step": 173200 + }, + { + "epoch": 140.04, + "learning_rate": 0.00011140394310406914, + "loss": 0.268, + "step": 173225 + }, + { + "epoch": 140.06, + "learning_rate": 0.0001113476773496579, + "loss": 0.261, + "step": 173250 + }, + { + "epoch": 140.08, + "learning_rate": 0.00011129141159524667, + "loss": 0.2635, + "step": 173275 + }, + { + "epoch": 140.1, + "learning_rate": 0.00011123514584083544, + "loss": 0.2925, + "step": 173300 + }, + { + "epoch": 140.12, + "learning_rate": 0.0001111788800864242, + "loss": 0.258, + "step": 173325 + }, + { + "epoch": 140.14, + "learning_rate": 0.00011112261433201297, + "loss": 0.2917, + "step": 173350 + }, + { + "epoch": 140.16, + "learning_rate": 0.00011106634857760173, + "loss": 0.2612, + "step": 173375 + }, + { + "epoch": 140.18, + "learning_rate": 0.0001110100828231905, + "loss": 0.2843, + "step": 173400 + }, + { + "epoch": 140.2, + "learning_rate": 0.00011095381706877926, + "loss": 0.2835, + "step": 173425 + }, + { + "epoch": 140.22, + "learning_rate": 0.00011089755131436802, + "loss": 0.2705, + "step": 173450 + }, + { + "epoch": 140.24, + "learning_rate": 0.00011084128555995679, + "loss": 0.2501, + "step": 173475 + }, + { + "epoch": 140.26, + "learning_rate": 0.00011078501980554557, + "loss": 0.2746, + "step": 173500 + }, + { + "epoch": 140.28, + "learning_rate": 0.00011072875405113432, + "loss": 0.3089, + "step": 173525 + }, + { + "epoch": 140.3, + "learning_rate": 0.00011067248829672308, + "loss": 0.2911, + "step": 173550 + }, + { + "epoch": 140.32, + "learning_rate": 0.00011061622254231185, + "loss": 0.2676, + "step": 173575 + }, + { + "epoch": 140.34, + "learning_rate": 0.00011055995678790061, + "loss": 0.3069, + "step": 173600 + }, + { + "epoch": 140.36, + "learning_rate": 0.00011050369103348938, + "loss": 0.2712, + "step": 173625 + }, + { + "epoch": 140.38, + "learning_rate": 0.00011044742527907814, + "loss": 0.3218, + "step": 173650 + }, + { + "epoch": 140.4, + "learning_rate": 0.00011039115952466691, + "loss": 0.2947, + "step": 173675 + }, + { + "epoch": 140.42, + "learning_rate": 0.00011033489377025567, + "loss": 0.2914, + "step": 173700 + }, + { + "epoch": 140.44, + "learning_rate": 0.00011027862801584444, + "loss": 0.2393, + "step": 173725 + }, + { + "epoch": 140.46, + "learning_rate": 0.0001102223622614332, + "loss": 0.2852, + "step": 173750 + }, + { + "epoch": 140.48, + "learning_rate": 0.00011016609650702197, + "loss": 0.2695, + "step": 173775 + }, + { + "epoch": 140.5, + "learning_rate": 0.00011010983075261073, + "loss": 0.2816, + "step": 173800 + }, + { + "epoch": 140.52, + "learning_rate": 0.00011005356499819951, + "loss": 0.3011, + "step": 173825 + }, + { + "epoch": 140.54, + "learning_rate": 0.00010999729924378826, + "loss": 0.273, + "step": 173850 + }, + { + "epoch": 140.56, + "learning_rate": 0.00010994103348937704, + "loss": 0.2642, + "step": 173875 + }, + { + "epoch": 140.58, + "learning_rate": 0.00010988476773496579, + "loss": 0.3017, + "step": 173900 + }, + { + "epoch": 140.6, + "learning_rate": 0.00010982850198055456, + "loss": 0.2992, + "step": 173925 + }, + { + "epoch": 140.62, + "learning_rate": 0.00010977223622614332, + "loss": 0.2861, + "step": 173950 + }, + { + "epoch": 140.64, + "learning_rate": 0.00010971597047173209, + "loss": 0.2856, + "step": 173975 + }, + { + "epoch": 140.66, + "learning_rate": 0.00010965970471732085, + "loss": 0.3027, + "step": 174000 + }, + { + "epoch": 140.66, + "eval_cer": 0.07708181472849912, + "eval_loss": 0.4022682011127472, + "eval_runtime": 148.8918, + "eval_samples_per_second": 28.161, + "eval_steps_per_second": 7.045, + "eval_wer": 0.3271778140293638, + "step": 174000 + }, + { + "epoch": 140.68, + "learning_rate": 0.00010960343896290961, + "loss": 0.2699, + "step": 174025 + }, + { + "epoch": 140.7, + "learning_rate": 0.00010954717320849838, + "loss": 0.3009, + "step": 174050 + }, + { + "epoch": 140.72, + "learning_rate": 0.00010949090745408714, + "loss": 0.2494, + "step": 174075 + }, + { + "epoch": 140.74, + "learning_rate": 0.00010943464169967591, + "loss": 0.2995, + "step": 174100 + }, + { + "epoch": 140.76, + "learning_rate": 0.00010937837594526467, + "loss": 0.2852, + "step": 174125 + }, + { + "epoch": 140.78, + "learning_rate": 0.00010932211019085345, + "loss": 0.2718, + "step": 174150 + }, + { + "epoch": 140.8, + "learning_rate": 0.0001092658444364422, + "loss": 0.2706, + "step": 174175 + }, + { + "epoch": 140.82, + "learning_rate": 0.00010920957868203098, + "loss": 0.2943, + "step": 174200 + }, + { + "epoch": 140.84, + "learning_rate": 0.00010915331292761973, + "loss": 0.2803, + "step": 174225 + }, + { + "epoch": 140.86, + "learning_rate": 0.0001090970471732085, + "loss": 0.3043, + "step": 174250 + }, + { + "epoch": 140.89, + "learning_rate": 0.00010904078141879726, + "loss": 0.2994, + "step": 174275 + }, + { + "epoch": 140.91, + "learning_rate": 0.00010898451566438603, + "loss": 0.2499, + "step": 174300 + }, + { + "epoch": 140.93, + "learning_rate": 0.00010892824990997479, + "loss": 0.255, + "step": 174325 + }, + { + "epoch": 140.95, + "learning_rate": 0.00010887198415556356, + "loss": 0.3099, + "step": 174350 + }, + { + "epoch": 140.97, + "learning_rate": 0.00010881571840115232, + "loss": 0.2674, + "step": 174375 + }, + { + "epoch": 140.99, + "learning_rate": 0.00010875945264674109, + "loss": 0.286, + "step": 174400 + }, + { + "epoch": 141.01, + "learning_rate": 0.00010870318689232987, + "loss": 0.2941, + "step": 174425 + }, + { + "epoch": 141.03, + "learning_rate": 0.00010864692113791862, + "loss": 0.2946, + "step": 174450 + }, + { + "epoch": 141.05, + "learning_rate": 0.0001085906553835074, + "loss": 0.2516, + "step": 174475 + }, + { + "epoch": 141.07, + "learning_rate": 0.00010853438962909615, + "loss": 0.2951, + "step": 174500 + }, + { + "epoch": 141.09, + "learning_rate": 0.00010847812387468492, + "loss": 0.2711, + "step": 174525 + }, + { + "epoch": 141.11, + "learning_rate": 0.00010842185812027368, + "loss": 0.2711, + "step": 174550 + }, + { + "epoch": 141.13, + "learning_rate": 0.00010836559236586245, + "loss": 0.2735, + "step": 174575 + }, + { + "epoch": 141.15, + "learning_rate": 0.0001083093266114512, + "loss": 0.2538, + "step": 174600 + }, + { + "epoch": 141.17, + "learning_rate": 0.00010825306085703997, + "loss": 0.292, + "step": 174625 + }, + { + "epoch": 141.19, + "learning_rate": 0.00010819679510262873, + "loss": 0.2676, + "step": 174650 + }, + { + "epoch": 141.21, + "learning_rate": 0.0001081405293482175, + "loss": 0.3015, + "step": 174675 + }, + { + "epoch": 141.23, + "learning_rate": 0.00010808426359380626, + "loss": 0.2743, + "step": 174700 + }, + { + "epoch": 141.25, + "learning_rate": 0.00010802799783939503, + "loss": 0.3051, + "step": 174725 + }, + { + "epoch": 141.27, + "learning_rate": 0.00010797173208498381, + "loss": 0.2722, + "step": 174750 + }, + { + "epoch": 141.29, + "learning_rate": 0.000107917716960749, + "loss": 0.2842, + "step": 174775 + }, + { + "epoch": 141.31, + "learning_rate": 0.00010786145120633778, + "loss": 0.2956, + "step": 174800 + }, + { + "epoch": 141.33, + "learning_rate": 0.00010780518545192654, + "loss": 0.2599, + "step": 174825 + }, + { + "epoch": 141.35, + "learning_rate": 0.00010774891969751531, + "loss": 0.2926, + "step": 174850 + }, + { + "epoch": 141.37, + "learning_rate": 0.00010769265394310407, + "loss": 0.273, + "step": 174875 + }, + { + "epoch": 141.39, + "learning_rate": 0.00010763638818869284, + "loss": 0.2931, + "step": 174900 + }, + { + "epoch": 141.41, + "learning_rate": 0.0001075801224342816, + "loss": 0.2713, + "step": 174925 + }, + { + "epoch": 141.43, + "learning_rate": 0.00010752385667987037, + "loss": 0.2927, + "step": 174950 + }, + { + "epoch": 141.45, + "learning_rate": 0.00010746759092545912, + "loss": 0.2819, + "step": 174975 + }, + { + "epoch": 141.47, + "learning_rate": 0.0001074113251710479, + "loss": 0.2662, + "step": 175000 + }, + { + "epoch": 141.49, + "learning_rate": 0.00010735505941663665, + "loss": 0.2878, + "step": 175025 + }, + { + "epoch": 141.51, + "learning_rate": 0.00010729879366222542, + "loss": 0.2845, + "step": 175050 + }, + { + "epoch": 141.53, + "learning_rate": 0.0001072425279078142, + "loss": 0.2991, + "step": 175075 + }, + { + "epoch": 141.55, + "learning_rate": 0.00010718626215340295, + "loss": 0.2895, + "step": 175100 + }, + { + "epoch": 141.57, + "learning_rate": 0.00010712999639899173, + "loss": 0.2725, + "step": 175125 + }, + { + "epoch": 141.59, + "learning_rate": 0.00010707373064458048, + "loss": 0.278, + "step": 175150 + }, + { + "epoch": 141.61, + "learning_rate": 0.00010701746489016926, + "loss": 0.3198, + "step": 175175 + }, + { + "epoch": 141.63, + "learning_rate": 0.00010696119913575801, + "loss": 0.2396, + "step": 175200 + }, + { + "epoch": 141.65, + "learning_rate": 0.00010690493338134679, + "loss": 0.2867, + "step": 175225 + }, + { + "epoch": 141.67, + "learning_rate": 0.00010684866762693554, + "loss": 0.261, + "step": 175250 + }, + { + "epoch": 141.69, + "learning_rate": 0.00010679240187252432, + "loss": 0.2841, + "step": 175275 + }, + { + "epoch": 141.71, + "learning_rate": 0.00010673613611811307, + "loss": 0.2834, + "step": 175300 + }, + { + "epoch": 141.73, + "learning_rate": 0.00010667987036370185, + "loss": 0.3053, + "step": 175325 + }, + { + "epoch": 141.75, + "learning_rate": 0.0001066236046092906, + "loss": 0.266, + "step": 175350 + }, + { + "epoch": 141.77, + "learning_rate": 0.00010656733885487936, + "loss": 0.243, + "step": 175375 + }, + { + "epoch": 141.79, + "learning_rate": 0.00010651107310046814, + "loss": 0.2668, + "step": 175400 + }, + { + "epoch": 141.81, + "learning_rate": 0.00010645480734605689, + "loss": 0.2564, + "step": 175425 + }, + { + "epoch": 141.84, + "learning_rate": 0.00010639854159164567, + "loss": 0.28, + "step": 175450 + }, + { + "epoch": 141.86, + "learning_rate": 0.00010634227583723442, + "loss": 0.2736, + "step": 175475 + }, + { + "epoch": 141.88, + "learning_rate": 0.0001062860100828232, + "loss": 0.2765, + "step": 175500 + }, + { + "epoch": 141.9, + "learning_rate": 0.00010622974432841195, + "loss": 0.2498, + "step": 175525 + }, + { + "epoch": 141.92, + "learning_rate": 0.00010617347857400073, + "loss": 0.2621, + "step": 175550 + }, + { + "epoch": 141.94, + "learning_rate": 0.00010611721281958948, + "loss": 0.2964, + "step": 175575 + }, + { + "epoch": 141.96, + "learning_rate": 0.00010606094706517826, + "loss": 0.2681, + "step": 175600 + }, + { + "epoch": 141.98, + "learning_rate": 0.00010600468131076701, + "loss": 0.2661, + "step": 175625 + }, + { + "epoch": 142.0, + "learning_rate": 0.00010594841555635579, + "loss": 0.3061, + "step": 175650 + }, + { + "epoch": 142.02, + "learning_rate": 0.00010589214980194454, + "loss": 0.2647, + "step": 175675 + }, + { + "epoch": 142.04, + "learning_rate": 0.00010583588404753332, + "loss": 0.2527, + "step": 175700 + }, + { + "epoch": 142.06, + "learning_rate": 0.00010577961829312208, + "loss": 0.2711, + "step": 175725 + }, + { + "epoch": 142.08, + "learning_rate": 0.00010572335253871083, + "loss": 0.2901, + "step": 175750 + }, + { + "epoch": 142.1, + "learning_rate": 0.00010566708678429961, + "loss": 0.2703, + "step": 175775 + }, + { + "epoch": 142.12, + "learning_rate": 0.00010561082102988836, + "loss": 0.2531, + "step": 175800 + }, + { + "epoch": 142.14, + "learning_rate": 0.00010555455527547714, + "loss": 0.2782, + "step": 175825 + }, + { + "epoch": 142.16, + "learning_rate": 0.00010549828952106589, + "loss": 0.2693, + "step": 175850 + }, + { + "epoch": 142.18, + "learning_rate": 0.00010544202376665467, + "loss": 0.2651, + "step": 175875 + }, + { + "epoch": 142.2, + "learning_rate": 0.00010538575801224342, + "loss": 0.2791, + "step": 175900 + }, + { + "epoch": 142.22, + "learning_rate": 0.0001053294922578322, + "loss": 0.2897, + "step": 175925 + }, + { + "epoch": 142.24, + "learning_rate": 0.00010527322650342095, + "loss": 0.2439, + "step": 175950 + }, + { + "epoch": 142.26, + "learning_rate": 0.00010521696074900973, + "loss": 0.2884, + "step": 175975 + }, + { + "epoch": 142.28, + "learning_rate": 0.00010516069499459848, + "loss": 0.255, + "step": 176000 + }, + { + "epoch": 142.3, + "learning_rate": 0.00010510442924018726, + "loss": 0.2626, + "step": 176025 + }, + { + "epoch": 142.32, + "learning_rate": 0.00010504816348577602, + "loss": 0.2629, + "step": 176050 + }, + { + "epoch": 142.34, + "learning_rate": 0.00010499189773136479, + "loss": 0.2627, + "step": 176075 + }, + { + "epoch": 142.36, + "learning_rate": 0.00010493563197695355, + "loss": 0.2666, + "step": 176100 + }, + { + "epoch": 142.38, + "learning_rate": 0.0001048793662225423, + "loss": 0.256, + "step": 176125 + }, + { + "epoch": 142.4, + "learning_rate": 0.00010482310046813108, + "loss": 0.2422, + "step": 176150 + }, + { + "epoch": 142.42, + "learning_rate": 0.00010476683471371984, + "loss": 0.2624, + "step": 176175 + }, + { + "epoch": 142.44, + "learning_rate": 0.00010471056895930861, + "loss": 0.2484, + "step": 176200 + }, + { + "epoch": 142.46, + "learning_rate": 0.00010465430320489736, + "loss": 0.2808, + "step": 176225 + }, + { + "epoch": 142.48, + "learning_rate": 0.00010459803745048614, + "loss": 0.2721, + "step": 176250 + }, + { + "epoch": 142.5, + "learning_rate": 0.0001045417716960749, + "loss": 0.2502, + "step": 176275 + }, + { + "epoch": 142.52, + "learning_rate": 0.00010448550594166367, + "loss": 0.2818, + "step": 176300 + }, + { + "epoch": 142.54, + "learning_rate": 0.00010442924018725242, + "loss": 0.2806, + "step": 176325 + }, + { + "epoch": 142.56, + "learning_rate": 0.0001043729744328412, + "loss": 0.2663, + "step": 176350 + }, + { + "epoch": 142.58, + "learning_rate": 0.00010431670867842997, + "loss": 0.2644, + "step": 176375 + }, + { + "epoch": 142.6, + "learning_rate": 0.00010426044292401873, + "loss": 0.2705, + "step": 176400 + }, + { + "epoch": 142.62, + "learning_rate": 0.0001042041771696075, + "loss": 0.2603, + "step": 176425 + }, + { + "epoch": 142.64, + "learning_rate": 0.00010414791141519625, + "loss": 0.2746, + "step": 176450 + }, + { + "epoch": 142.66, + "learning_rate": 0.00010409164566078503, + "loss": 0.3054, + "step": 176475 + }, + { + "epoch": 142.68, + "learning_rate": 0.00010403537990637378, + "loss": 0.2514, + "step": 176500 + }, + { + "epoch": 142.7, + "learning_rate": 0.00010397911415196256, + "loss": 0.2954, + "step": 176525 + }, + { + "epoch": 142.72, + "learning_rate": 0.00010392284839755131, + "loss": 0.2764, + "step": 176550 + }, + { + "epoch": 142.74, + "learning_rate": 0.00010386658264314009, + "loss": 0.3033, + "step": 176575 + }, + { + "epoch": 142.76, + "learning_rate": 0.00010381031688872884, + "loss": 0.2734, + "step": 176600 + }, + { + "epoch": 142.78, + "learning_rate": 0.00010375405113431762, + "loss": 0.2748, + "step": 176625 + }, + { + "epoch": 142.81, + "learning_rate": 0.00010369778537990637, + "loss": 0.291, + "step": 176650 + }, + { + "epoch": 142.83, + "learning_rate": 0.00010364151962549514, + "loss": 0.2815, + "step": 176675 + }, + { + "epoch": 142.85, + "learning_rate": 0.00010358525387108391, + "loss": 0.2591, + "step": 176700 + }, + { + "epoch": 142.87, + "learning_rate": 0.00010352898811667267, + "loss": 0.2985, + "step": 176725 + }, + { + "epoch": 142.89, + "learning_rate": 0.00010347272236226144, + "loss": 0.2495, + "step": 176750 + }, + { + "epoch": 142.91, + "learning_rate": 0.0001034164566078502, + "loss": 0.2591, + "step": 176775 + }, + { + "epoch": 142.93, + "learning_rate": 0.00010336019085343897, + "loss": 0.2359, + "step": 176800 + }, + { + "epoch": 142.95, + "learning_rate": 0.00010330392509902772, + "loss": 0.3169, + "step": 176825 + }, + { + "epoch": 142.97, + "learning_rate": 0.0001032476593446165, + "loss": 0.2446, + "step": 176850 + }, + { + "epoch": 142.99, + "learning_rate": 0.00010319139359020525, + "loss": 0.251, + "step": 176875 + }, + { + "epoch": 143.01, + "learning_rate": 0.00010313512783579403, + "loss": 0.2533, + "step": 176900 + }, + { + "epoch": 143.03, + "learning_rate": 0.00010307886208138278, + "loss": 0.2458, + "step": 176925 + }, + { + "epoch": 143.05, + "learning_rate": 0.00010302259632697156, + "loss": 0.2945, + "step": 176950 + }, + { + "epoch": 143.07, + "learning_rate": 0.00010296633057256031, + "loss": 0.2787, + "step": 176975 + }, + { + "epoch": 143.09, + "learning_rate": 0.00010291006481814909, + "loss": 0.2742, + "step": 177000 + }, + { + "epoch": 143.09, + "eval_cer": 0.07704074823157397, + "eval_loss": 0.4133159816265106, + "eval_runtime": 148.921, + "eval_samples_per_second": 28.156, + "eval_steps_per_second": 7.044, + "eval_wer": 0.3272756933115824, + "step": 177000 + }, + { + "epoch": 143.11, + "learning_rate": 0.00010285379906373785, + "loss": 0.3223, + "step": 177025 + }, + { + "epoch": 143.13, + "learning_rate": 0.00010279753330932662, + "loss": 0.2516, + "step": 177050 + }, + { + "epoch": 143.15, + "learning_rate": 0.00010274126755491538, + "loss": 0.2412, + "step": 177075 + }, + { + "epoch": 143.17, + "learning_rate": 0.00010268500180050415, + "loss": 0.3262, + "step": 177100 + }, + { + "epoch": 143.19, + "learning_rate": 0.00010262873604609291, + "loss": 0.2569, + "step": 177125 + }, + { + "epoch": 143.21, + "learning_rate": 0.00010257247029168168, + "loss": 0.2536, + "step": 177150 + }, + { + "epoch": 143.23, + "learning_rate": 0.00010251620453727044, + "loss": 0.2279, + "step": 177175 + }, + { + "epoch": 143.25, + "learning_rate": 0.00010245993878285919, + "loss": 0.2628, + "step": 177200 + }, + { + "epoch": 143.27, + "learning_rate": 0.00010240367302844797, + "loss": 0.2487, + "step": 177225 + }, + { + "epoch": 143.29, + "learning_rate": 0.00010234740727403672, + "loss": 0.2353, + "step": 177250 + }, + { + "epoch": 143.31, + "learning_rate": 0.0001022911415196255, + "loss": 0.27, + "step": 177275 + }, + { + "epoch": 143.33, + "learning_rate": 0.00010223487576521426, + "loss": 0.2688, + "step": 177300 + }, + { + "epoch": 143.35, + "learning_rate": 0.00010217861001080303, + "loss": 0.2563, + "step": 177325 + }, + { + "epoch": 143.37, + "learning_rate": 0.0001021223442563918, + "loss": 0.2587, + "step": 177350 + }, + { + "epoch": 143.39, + "learning_rate": 0.00010206607850198056, + "loss": 0.2638, + "step": 177375 + }, + { + "epoch": 143.41, + "learning_rate": 0.00010201206337774577, + "loss": 0.2754, + "step": 177400 + }, + { + "epoch": 143.43, + "learning_rate": 0.00010195579762333454, + "loss": 0.296, + "step": 177425 + }, + { + "epoch": 143.45, + "learning_rate": 0.0001018995318689233, + "loss": 0.2548, + "step": 177450 + }, + { + "epoch": 143.47, + "learning_rate": 0.00010184326611451207, + "loss": 0.2865, + "step": 177475 + }, + { + "epoch": 143.49, + "learning_rate": 0.00010178700036010083, + "loss": 0.2461, + "step": 177500 + }, + { + "epoch": 143.51, + "learning_rate": 0.0001017307346056896, + "loss": 0.2623, + "step": 177525 + }, + { + "epoch": 143.53, + "learning_rate": 0.00010167446885127836, + "loss": 0.2453, + "step": 177550 + }, + { + "epoch": 143.55, + "learning_rate": 0.00010161820309686713, + "loss": 0.2594, + "step": 177575 + }, + { + "epoch": 143.57, + "learning_rate": 0.00010156193734245589, + "loss": 0.2596, + "step": 177600 + }, + { + "epoch": 143.59, + "learning_rate": 0.00010150567158804465, + "loss": 0.2489, + "step": 177625 + }, + { + "epoch": 143.61, + "learning_rate": 0.00010144940583363342, + "loss": 0.3084, + "step": 177650 + }, + { + "epoch": 143.63, + "learning_rate": 0.00010139314007922218, + "loss": 0.2514, + "step": 177675 + }, + { + "epoch": 143.65, + "learning_rate": 0.00010133687432481095, + "loss": 0.2738, + "step": 177700 + }, + { + "epoch": 143.67, + "learning_rate": 0.00010128060857039971, + "loss": 0.2646, + "step": 177725 + }, + { + "epoch": 143.69, + "learning_rate": 0.00010122659344616493, + "loss": 0.2791, + "step": 177750 + }, + { + "epoch": 143.71, + "learning_rate": 0.00010117032769175369, + "loss": 0.2591, + "step": 177775 + }, + { + "epoch": 143.73, + "learning_rate": 0.00010111406193734246, + "loss": 0.285, + "step": 177800 + }, + { + "epoch": 143.76, + "learning_rate": 0.00010105779618293122, + "loss": 0.2542, + "step": 177825 + }, + { + "epoch": 143.78, + "learning_rate": 0.00010100153042851999, + "loss": 0.2748, + "step": 177850 + }, + { + "epoch": 143.8, + "learning_rate": 0.00010094526467410875, + "loss": 0.2367, + "step": 177875 + }, + { + "epoch": 143.82, + "learning_rate": 0.00010088899891969752, + "loss": 0.2801, + "step": 177900 + }, + { + "epoch": 143.84, + "learning_rate": 0.00010083273316528628, + "loss": 0.26, + "step": 177925 + }, + { + "epoch": 143.86, + "learning_rate": 0.00010077646741087506, + "loss": 0.2576, + "step": 177950 + }, + { + "epoch": 143.88, + "learning_rate": 0.00010072020165646381, + "loss": 0.2953, + "step": 177975 + }, + { + "epoch": 143.9, + "learning_rate": 0.00010066393590205259, + "loss": 0.2709, + "step": 178000 + }, + { + "epoch": 143.92, + "learning_rate": 0.00010060767014764134, + "loss": 0.2523, + "step": 178025 + }, + { + "epoch": 143.94, + "learning_rate": 0.0001005514043932301, + "loss": 0.2694, + "step": 178050 + }, + { + "epoch": 143.96, + "learning_rate": 0.00010049513863881887, + "loss": 0.2635, + "step": 178075 + }, + { + "epoch": 143.98, + "learning_rate": 0.00010043887288440763, + "loss": 0.2893, + "step": 178100 + }, + { + "epoch": 144.0, + "learning_rate": 0.0001003826071299964, + "loss": 0.2153, + "step": 178125 + }, + { + "epoch": 144.02, + "learning_rate": 0.00010032634137558516, + "loss": 0.2666, + "step": 178150 + }, + { + "epoch": 144.04, + "learning_rate": 0.00010027007562117393, + "loss": 0.2425, + "step": 178175 + }, + { + "epoch": 144.06, + "learning_rate": 0.00010021380986676269, + "loss": 0.3232, + "step": 178200 + }, + { + "epoch": 144.08, + "learning_rate": 0.00010015754411235146, + "loss": 0.2406, + "step": 178225 + }, + { + "epoch": 144.1, + "learning_rate": 0.00010010127835794022, + "loss": 0.2781, + "step": 178250 + }, + { + "epoch": 144.12, + "learning_rate": 0.000100045012603529, + "loss": 0.2836, + "step": 178275 + }, + { + "epoch": 144.14, + "learning_rate": 9.998874684911775e-05, + "loss": 0.2649, + "step": 178300 + }, + { + "epoch": 144.16, + "learning_rate": 9.993248109470653e-05, + "loss": 0.2533, + "step": 178325 + }, + { + "epoch": 144.18, + "learning_rate": 9.987621534029528e-05, + "loss": 0.2742, + "step": 178350 + }, + { + "epoch": 144.2, + "learning_rate": 9.981994958588405e-05, + "loss": 0.2831, + "step": 178375 + }, + { + "epoch": 144.22, + "learning_rate": 9.976368383147281e-05, + "loss": 0.2591, + "step": 178400 + }, + { + "epoch": 144.24, + "learning_rate": 9.970741807706158e-05, + "loss": 0.3329, + "step": 178425 + }, + { + "epoch": 144.26, + "learning_rate": 9.965115232265034e-05, + "loss": 0.2753, + "step": 178450 + }, + { + "epoch": 144.28, + "learning_rate": 9.95948865682391e-05, + "loss": 0.2812, + "step": 178475 + }, + { + "epoch": 144.3, + "learning_rate": 9.953862081382787e-05, + "loss": 0.2858, + "step": 178500 + }, + { + "epoch": 144.32, + "learning_rate": 9.948235505941664e-05, + "loss": 0.2483, + "step": 178525 + }, + { + "epoch": 144.34, + "learning_rate": 9.942608930500541e-05, + "loss": 0.2794, + "step": 178550 + }, + { + "epoch": 144.36, + "learning_rate": 9.936982355059417e-05, + "loss": 0.2633, + "step": 178575 + }, + { + "epoch": 144.38, + "learning_rate": 9.931355779618294e-05, + "loss": 0.2647, + "step": 178600 + }, + { + "epoch": 144.4, + "learning_rate": 9.92572920417717e-05, + "loss": 0.2696, + "step": 178625 + }, + { + "epoch": 144.42, + "learning_rate": 9.920102628736047e-05, + "loss": 0.2561, + "step": 178650 + }, + { + "epoch": 144.44, + "learning_rate": 9.914476053294922e-05, + "loss": 0.2813, + "step": 178675 + }, + { + "epoch": 144.46, + "learning_rate": 9.9088494778538e-05, + "loss": 0.263, + "step": 178700 + }, + { + "epoch": 144.48, + "learning_rate": 9.903222902412675e-05, + "loss": 0.2509, + "step": 178725 + }, + { + "epoch": 144.5, + "learning_rate": 9.897596326971552e-05, + "loss": 0.2884, + "step": 178750 + }, + { + "epoch": 144.52, + "learning_rate": 9.891969751530428e-05, + "loss": 0.234, + "step": 178775 + }, + { + "epoch": 144.54, + "learning_rate": 9.886343176089305e-05, + "loss": 0.269, + "step": 178800 + }, + { + "epoch": 144.56, + "learning_rate": 9.880716600648181e-05, + "loss": 0.2357, + "step": 178825 + }, + { + "epoch": 144.58, + "learning_rate": 9.875090025207058e-05, + "loss": 0.2629, + "step": 178850 + }, + { + "epoch": 144.6, + "learning_rate": 9.869463449765936e-05, + "loss": 0.2591, + "step": 178875 + }, + { + "epoch": 144.62, + "learning_rate": 9.863836874324811e-05, + "loss": 0.2542, + "step": 178900 + }, + { + "epoch": 144.64, + "learning_rate": 9.858210298883689e-05, + "loss": 0.2394, + "step": 178925 + }, + { + "epoch": 144.66, + "learning_rate": 9.852583723442564e-05, + "loss": 0.2625, + "step": 178950 + }, + { + "epoch": 144.68, + "learning_rate": 9.846957148001442e-05, + "loss": 0.2806, + "step": 178975 + }, + { + "epoch": 144.7, + "learning_rate": 9.841330572560317e-05, + "loss": 0.2456, + "step": 179000 + }, + { + "epoch": 144.73, + "learning_rate": 9.835703997119195e-05, + "loss": 0.2521, + "step": 179025 + }, + { + "epoch": 144.75, + "learning_rate": 9.83007742167807e-05, + "loss": 0.2492, + "step": 179050 + }, + { + "epoch": 144.77, + "learning_rate": 9.824450846236947e-05, + "loss": 0.2117, + "step": 179075 + }, + { + "epoch": 144.79, + "learning_rate": 9.818824270795823e-05, + "loss": 0.2542, + "step": 179100 + }, + { + "epoch": 144.81, + "learning_rate": 9.813197695354699e-05, + "loss": 0.2675, + "step": 179125 + }, + { + "epoch": 144.83, + "learning_rate": 9.807571119913576e-05, + "loss": 0.283, + "step": 179150 + }, + { + "epoch": 144.85, + "learning_rate": 9.801944544472452e-05, + "loss": 0.2702, + "step": 179175 + }, + { + "epoch": 144.87, + "learning_rate": 9.79631796903133e-05, + "loss": 0.2926, + "step": 179200 + }, + { + "epoch": 144.89, + "learning_rate": 9.790691393590205e-05, + "loss": 0.2802, + "step": 179225 + }, + { + "epoch": 144.91, + "learning_rate": 9.785064818149083e-05, + "loss": 0.2731, + "step": 179250 + }, + { + "epoch": 144.93, + "learning_rate": 9.779438242707958e-05, + "loss": 0.2636, + "step": 179275 + }, + { + "epoch": 144.95, + "learning_rate": 9.773811667266836e-05, + "loss": 0.2672, + "step": 179300 + }, + { + "epoch": 144.97, + "learning_rate": 9.768185091825711e-05, + "loss": 0.2679, + "step": 179325 + }, + { + "epoch": 144.99, + "learning_rate": 9.762558516384589e-05, + "loss": 0.277, + "step": 179350 + }, + { + "epoch": 145.01, + "learning_rate": 9.756931940943464e-05, + "loss": 0.2467, + "step": 179375 + }, + { + "epoch": 145.03, + "learning_rate": 9.751305365502342e-05, + "loss": 0.2388, + "step": 179400 + }, + { + "epoch": 145.05, + "learning_rate": 9.745678790061217e-05, + "loss": 0.2745, + "step": 179425 + }, + { + "epoch": 145.07, + "learning_rate": 9.740052214620093e-05, + "loss": 0.2472, + "step": 179450 + }, + { + "epoch": 145.09, + "learning_rate": 9.73442563917897e-05, + "loss": 0.2608, + "step": 179475 + }, + { + "epoch": 145.11, + "learning_rate": 9.728799063737846e-05, + "loss": 0.2417, + "step": 179500 + }, + { + "epoch": 145.13, + "learning_rate": 9.723172488296724e-05, + "loss": 0.2602, + "step": 179525 + }, + { + "epoch": 145.15, + "learning_rate": 9.717545912855599e-05, + "loss": 0.265, + "step": 179550 + }, + { + "epoch": 145.17, + "learning_rate": 9.711919337414477e-05, + "loss": 0.2563, + "step": 179575 + }, + { + "epoch": 145.19, + "learning_rate": 9.706292761973352e-05, + "loss": 0.2417, + "step": 179600 + }, + { + "epoch": 145.21, + "learning_rate": 9.70066618653223e-05, + "loss": 0.2727, + "step": 179625 + }, + { + "epoch": 145.23, + "learning_rate": 9.695039611091105e-05, + "loss": 0.2765, + "step": 179650 + }, + { + "epoch": 145.25, + "learning_rate": 9.689413035649983e-05, + "loss": 0.2681, + "step": 179675 + }, + { + "epoch": 145.27, + "learning_rate": 9.683786460208858e-05, + "loss": 0.2429, + "step": 179700 + }, + { + "epoch": 145.29, + "learning_rate": 9.678159884767736e-05, + "loss": 0.2514, + "step": 179725 + }, + { + "epoch": 145.31, + "learning_rate": 9.672533309326611e-05, + "loss": 0.2567, + "step": 179750 + }, + { + "epoch": 145.33, + "learning_rate": 9.666906733885489e-05, + "loss": 0.2719, + "step": 179775 + }, + { + "epoch": 145.35, + "learning_rate": 9.661280158444364e-05, + "loss": 0.2475, + "step": 179800 + }, + { + "epoch": 145.37, + "learning_rate": 9.65565358300324e-05, + "loss": 0.2627, + "step": 179825 + }, + { + "epoch": 145.39, + "learning_rate": 9.650027007562118e-05, + "loss": 0.2742, + "step": 179850 + }, + { + "epoch": 145.41, + "learning_rate": 9.644400432120993e-05, + "loss": 0.2662, + "step": 179875 + }, + { + "epoch": 145.43, + "learning_rate": 9.638773856679871e-05, + "loss": 0.2762, + "step": 179900 + }, + { + "epoch": 145.45, + "learning_rate": 9.633147281238746e-05, + "loss": 0.2654, + "step": 179925 + }, + { + "epoch": 145.47, + "learning_rate": 9.627520705797624e-05, + "loss": 0.267, + "step": 179950 + }, + { + "epoch": 145.49, + "learning_rate": 9.6218941303565e-05, + "loss": 0.272, + "step": 179975 + }, + { + "epoch": 145.51, + "learning_rate": 9.616267554915377e-05, + "loss": 0.2339, + "step": 180000 + }, + { + "epoch": 145.51, + "eval_cer": 0.07711774791330862, + "eval_loss": 0.428690105676651, + "eval_runtime": 149.384, + "eval_samples_per_second": 28.069, + "eval_steps_per_second": 7.022, + "eval_wer": 0.3267536704730832, + "step": 180000 + }, + { + "epoch": 145.53, + "learning_rate": 9.610640979474252e-05, + "loss": 0.2665, + "step": 180025 + }, + { + "epoch": 145.55, + "learning_rate": 9.60501440403313e-05, + "loss": 0.2467, + "step": 180050 + }, + { + "epoch": 145.57, + "learning_rate": 9.599387828592005e-05, + "loss": 0.2536, + "step": 180075 + }, + { + "epoch": 145.59, + "learning_rate": 9.593761253150883e-05, + "loss": 0.2215, + "step": 180100 + }, + { + "epoch": 145.61, + "learning_rate": 9.588134677709758e-05, + "loss": 0.2676, + "step": 180125 + }, + { + "epoch": 145.63, + "learning_rate": 9.582508102268635e-05, + "loss": 0.2845, + "step": 180150 + }, + { + "epoch": 145.65, + "learning_rate": 9.576881526827513e-05, + "loss": 0.2815, + "step": 180175 + }, + { + "epoch": 145.68, + "learning_rate": 9.571254951386388e-05, + "loss": 0.2321, + "step": 180200 + }, + { + "epoch": 145.7, + "learning_rate": 9.565628375945266e-05, + "loss": 0.2314, + "step": 180225 + }, + { + "epoch": 145.72, + "learning_rate": 9.56000180050414e-05, + "loss": 0.2685, + "step": 180250 + }, + { + "epoch": 145.74, + "learning_rate": 9.554375225063019e-05, + "loss": 0.282, + "step": 180275 + }, + { + "epoch": 145.76, + "learning_rate": 9.548748649621894e-05, + "loss": 0.2542, + "step": 180300 + }, + { + "epoch": 145.78, + "learning_rate": 9.543122074180771e-05, + "loss": 0.2701, + "step": 180325 + }, + { + "epoch": 145.8, + "learning_rate": 9.537495498739647e-05, + "loss": 0.2636, + "step": 180350 + }, + { + "epoch": 145.82, + "learning_rate": 9.531868923298524e-05, + "loss": 0.3032, + "step": 180375 + }, + { + "epoch": 145.84, + "learning_rate": 9.5262423478574e-05, + "loss": 0.2669, + "step": 180400 + }, + { + "epoch": 145.86, + "learning_rate": 9.520615772416277e-05, + "loss": 0.287, + "step": 180425 + }, + { + "epoch": 145.88, + "learning_rate": 9.514989196975153e-05, + "loss": 0.2689, + "step": 180450 + }, + { + "epoch": 145.9, + "learning_rate": 9.50936262153403e-05, + "loss": 0.2868, + "step": 180475 + }, + { + "epoch": 145.92, + "learning_rate": 9.503736046092907e-05, + "loss": 0.2729, + "step": 180500 + }, + { + "epoch": 145.94, + "learning_rate": 9.498109470651782e-05, + "loss": 0.266, + "step": 180525 + }, + { + "epoch": 145.96, + "learning_rate": 9.49248289521066e-05, + "loss": 0.2661, + "step": 180550 + }, + { + "epoch": 145.98, + "learning_rate": 9.486856319769535e-05, + "loss": 0.2618, + "step": 180575 + }, + { + "epoch": 146.0, + "learning_rate": 9.481229744328413e-05, + "loss": 0.2463, + "step": 180600 + }, + { + "epoch": 146.02, + "learning_rate": 9.475603168887288e-05, + "loss": 0.2412, + "step": 180625 + }, + { + "epoch": 146.04, + "learning_rate": 9.469976593446166e-05, + "loss": 0.2517, + "step": 180650 + }, + { + "epoch": 146.06, + "learning_rate": 9.464350018005041e-05, + "loss": 0.2745, + "step": 180675 + }, + { + "epoch": 146.08, + "learning_rate": 9.458723442563919e-05, + "loss": 0.2349, + "step": 180700 + }, + { + "epoch": 146.1, + "learning_rate": 9.453096867122794e-05, + "loss": 0.2567, + "step": 180725 + }, + { + "epoch": 146.12, + "learning_rate": 9.447470291681672e-05, + "loss": 0.2081, + "step": 180750 + }, + { + "epoch": 146.14, + "learning_rate": 9.441843716240547e-05, + "loss": 0.2739, + "step": 180775 + }, + { + "epoch": 146.16, + "learning_rate": 9.436217140799425e-05, + "loss": 0.2464, + "step": 180800 + }, + { + "epoch": 146.18, + "learning_rate": 9.430590565358301e-05, + "loss": 0.2567, + "step": 180825 + }, + { + "epoch": 146.2, + "learning_rate": 9.424963989917178e-05, + "loss": 0.2657, + "step": 180850 + }, + { + "epoch": 146.22, + "learning_rate": 9.419337414476054e-05, + "loss": 0.2507, + "step": 180875 + }, + { + "epoch": 146.24, + "learning_rate": 9.413710839034929e-05, + "loss": 0.2496, + "step": 180900 + }, + { + "epoch": 146.26, + "learning_rate": 9.408084263593807e-05, + "loss": 0.2255, + "step": 180925 + }, + { + "epoch": 146.28, + "learning_rate": 9.402457688152682e-05, + "loss": 0.236, + "step": 180950 + }, + { + "epoch": 146.3, + "learning_rate": 9.39683111271156e-05, + "loss": 0.2439, + "step": 180975 + }, + { + "epoch": 146.32, + "learning_rate": 9.391204537270435e-05, + "loss": 0.2623, + "step": 181000 + }, + { + "epoch": 146.34, + "learning_rate": 9.385577961829313e-05, + "loss": 0.278, + "step": 181025 + }, + { + "epoch": 146.36, + "learning_rate": 9.379951386388188e-05, + "loss": 0.2782, + "step": 181050 + }, + { + "epoch": 146.38, + "learning_rate": 9.374324810947066e-05, + "loss": 0.2576, + "step": 181075 + }, + { + "epoch": 146.4, + "learning_rate": 9.368698235505941e-05, + "loss": 0.2764, + "step": 181100 + }, + { + "epoch": 146.42, + "learning_rate": 9.363071660064819e-05, + "loss": 0.276, + "step": 181125 + }, + { + "epoch": 146.44, + "learning_rate": 9.357445084623695e-05, + "loss": 0.2534, + "step": 181150 + }, + { + "epoch": 146.46, + "learning_rate": 9.351818509182572e-05, + "loss": 0.2563, + "step": 181175 + }, + { + "epoch": 146.48, + "learning_rate": 9.346191933741448e-05, + "loss": 0.2341, + "step": 181200 + }, + { + "epoch": 146.5, + "learning_rate": 9.340565358300323e-05, + "loss": 0.2514, + "step": 181225 + }, + { + "epoch": 146.52, + "learning_rate": 9.334938782859201e-05, + "loss": 0.2452, + "step": 181250 + }, + { + "epoch": 146.54, + "learning_rate": 9.329312207418076e-05, + "loss": 0.2607, + "step": 181275 + }, + { + "epoch": 146.56, + "learning_rate": 9.323685631976954e-05, + "loss": 0.2634, + "step": 181300 + }, + { + "epoch": 146.58, + "learning_rate": 9.318059056535829e-05, + "loss": 0.2678, + "step": 181325 + }, + { + "epoch": 146.6, + "learning_rate": 9.312432481094707e-05, + "loss": 0.228, + "step": 181350 + }, + { + "epoch": 146.62, + "learning_rate": 9.306805905653582e-05, + "loss": 0.2766, + "step": 181375 + }, + { + "epoch": 146.65, + "learning_rate": 9.30117933021246e-05, + "loss": 0.2583, + "step": 181400 + }, + { + "epoch": 146.67, + "learning_rate": 9.295552754771335e-05, + "loss": 0.2615, + "step": 181425 + }, + { + "epoch": 146.69, + "learning_rate": 9.289926179330213e-05, + "loss": 0.2496, + "step": 181450 + }, + { + "epoch": 146.71, + "learning_rate": 9.28429960388909e-05, + "loss": 0.2688, + "step": 181475 + }, + { + "epoch": 146.73, + "learning_rate": 9.278673028447966e-05, + "loss": 0.2621, + "step": 181500 + }, + { + "epoch": 146.75, + "learning_rate": 9.273046453006842e-05, + "loss": 0.2605, + "step": 181525 + }, + { + "epoch": 146.77, + "learning_rate": 9.267419877565719e-05, + "loss": 0.2803, + "step": 181550 + }, + { + "epoch": 146.79, + "learning_rate": 9.261793302124595e-05, + "loss": 0.2872, + "step": 181575 + }, + { + "epoch": 146.81, + "learning_rate": 9.25616672668347e-05, + "loss": 0.2439, + "step": 181600 + }, + { + "epoch": 146.83, + "learning_rate": 9.250540151242348e-05, + "loss": 0.2783, + "step": 181625 + }, + { + "epoch": 146.85, + "learning_rate": 9.244913575801224e-05, + "loss": 0.2359, + "step": 181650 + }, + { + "epoch": 146.87, + "learning_rate": 9.239287000360101e-05, + "loss": 0.2689, + "step": 181675 + }, + { + "epoch": 146.89, + "learning_rate": 9.233660424918977e-05, + "loss": 0.2645, + "step": 181700 + }, + { + "epoch": 146.91, + "learning_rate": 9.228033849477854e-05, + "loss": 0.2623, + "step": 181725 + }, + { + "epoch": 146.93, + "learning_rate": 9.22240727403673e-05, + "loss": 0.2612, + "step": 181750 + }, + { + "epoch": 146.95, + "learning_rate": 9.216780698595607e-05, + "loss": 0.2524, + "step": 181775 + }, + { + "epoch": 146.97, + "learning_rate": 9.211154123154484e-05, + "loss": 0.2505, + "step": 181800 + }, + { + "epoch": 146.99, + "learning_rate": 9.20552754771336e-05, + "loss": 0.2467, + "step": 181825 + }, + { + "epoch": 147.01, + "learning_rate": 9.199900972272237e-05, + "loss": 0.2356, + "step": 181850 + }, + { + "epoch": 147.03, + "learning_rate": 9.194274396831113e-05, + "loss": 0.2552, + "step": 181875 + }, + { + "epoch": 147.05, + "learning_rate": 9.18864782138999e-05, + "loss": 0.2573, + "step": 181900 + }, + { + "epoch": 147.07, + "learning_rate": 9.183021245948866e-05, + "loss": 0.2314, + "step": 181925 + }, + { + "epoch": 147.09, + "learning_rate": 9.177394670507743e-05, + "loss": 0.2382, + "step": 181950 + }, + { + "epoch": 147.11, + "learning_rate": 9.171768095066618e-05, + "loss": 0.2383, + "step": 181975 + }, + { + "epoch": 147.13, + "learning_rate": 9.166141519625496e-05, + "loss": 0.2562, + "step": 182000 + }, + { + "epoch": 147.15, + "learning_rate": 9.160514944184371e-05, + "loss": 0.2514, + "step": 182025 + }, + { + "epoch": 147.17, + "learning_rate": 9.154888368743249e-05, + "loss": 0.2235, + "step": 182050 + }, + { + "epoch": 147.19, + "learning_rate": 9.149261793302125e-05, + "loss": 0.2309, + "step": 182075 + }, + { + "epoch": 147.21, + "learning_rate": 9.143635217861002e-05, + "loss": 0.2431, + "step": 182100 + }, + { + "epoch": 147.23, + "learning_rate": 9.138008642419878e-05, + "loss": 0.2409, + "step": 182125 + }, + { + "epoch": 147.25, + "learning_rate": 9.132382066978754e-05, + "loss": 0.2604, + "step": 182150 + }, + { + "epoch": 147.27, + "learning_rate": 9.126755491537631e-05, + "loss": 0.2481, + "step": 182175 + }, + { + "epoch": 147.29, + "learning_rate": 9.121128916096507e-05, + "loss": 0.2883, + "step": 182200 + }, + { + "epoch": 147.31, + "learning_rate": 9.115502340655384e-05, + "loss": 0.2286, + "step": 182225 + }, + { + "epoch": 147.33, + "learning_rate": 9.10987576521426e-05, + "loss": 0.2696, + "step": 182250 + }, + { + "epoch": 147.35, + "learning_rate": 9.104249189773137e-05, + "loss": 0.2482, + "step": 182275 + }, + { + "epoch": 147.37, + "learning_rate": 9.098622614332012e-05, + "loss": 0.2588, + "step": 182300 + }, + { + "epoch": 147.39, + "learning_rate": 9.09299603889089e-05, + "loss": 0.2588, + "step": 182325 + }, + { + "epoch": 147.41, + "learning_rate": 9.087369463449765e-05, + "loss": 0.2528, + "step": 182350 + }, + { + "epoch": 147.43, + "learning_rate": 9.081742888008643e-05, + "loss": 0.2473, + "step": 182375 + }, + { + "epoch": 147.45, + "learning_rate": 9.076116312567519e-05, + "loss": 0.29, + "step": 182400 + }, + { + "epoch": 147.47, + "learning_rate": 9.070489737126396e-05, + "loss": 0.2481, + "step": 182425 + }, + { + "epoch": 147.49, + "learning_rate": 9.064863161685272e-05, + "loss": 0.2873, + "step": 182450 + }, + { + "epoch": 147.51, + "learning_rate": 9.059236586244149e-05, + "loss": 0.2778, + "step": 182475 + }, + { + "epoch": 147.53, + "learning_rate": 9.053610010803025e-05, + "loss": 0.2449, + "step": 182500 + }, + { + "epoch": 147.55, + "learning_rate": 9.047983435361902e-05, + "loss": 0.2394, + "step": 182525 + }, + { + "epoch": 147.57, + "learning_rate": 9.042356859920778e-05, + "loss": 0.2331, + "step": 182550 + }, + { + "epoch": 147.59, + "learning_rate": 9.0369553474973e-05, + "loss": 0.2373, + "step": 182575 + }, + { + "epoch": 147.62, + "learning_rate": 9.031328772056176e-05, + "loss": 0.2741, + "step": 182600 + }, + { + "epoch": 147.64, + "learning_rate": 9.025702196615052e-05, + "loss": 0.2569, + "step": 182625 + }, + { + "epoch": 147.66, + "learning_rate": 9.020075621173929e-05, + "loss": 0.2636, + "step": 182650 + }, + { + "epoch": 147.68, + "learning_rate": 9.014449045732805e-05, + "loss": 0.2395, + "step": 182675 + }, + { + "epoch": 147.7, + "learning_rate": 9.008822470291682e-05, + "loss": 0.2618, + "step": 182700 + }, + { + "epoch": 147.72, + "learning_rate": 9.003195894850558e-05, + "loss": 0.2482, + "step": 182725 + }, + { + "epoch": 147.74, + "learning_rate": 8.997569319409435e-05, + "loss": 0.2572, + "step": 182750 + }, + { + "epoch": 147.76, + "learning_rate": 8.991942743968311e-05, + "loss": 0.2241, + "step": 182775 + }, + { + "epoch": 147.78, + "learning_rate": 8.986316168527188e-05, + "loss": 0.2586, + "step": 182800 + }, + { + "epoch": 147.8, + "learning_rate": 8.980689593086064e-05, + "loss": 0.2482, + "step": 182825 + }, + { + "epoch": 147.82, + "learning_rate": 8.975063017644941e-05, + "loss": 0.2951, + "step": 182850 + }, + { + "epoch": 147.84, + "learning_rate": 8.969436442203817e-05, + "loss": 0.2154, + "step": 182875 + }, + { + "epoch": 147.86, + "learning_rate": 8.963809866762694e-05, + "loss": 0.2295, + "step": 182900 + }, + { + "epoch": 147.88, + "learning_rate": 8.95818329132157e-05, + "loss": 0.2438, + "step": 182925 + }, + { + "epoch": 147.9, + "learning_rate": 8.952556715880447e-05, + "loss": 0.1849, + "step": 182950 + }, + { + "epoch": 147.92, + "learning_rate": 8.946930140439323e-05, + "loss": 0.2155, + "step": 182975 + }, + { + "epoch": 147.94, + "learning_rate": 8.9413035649982e-05, + "loss": 0.2547, + "step": 183000 + }, + { + "epoch": 147.94, + "eval_cer": 0.07676868268944488, + "eval_loss": 0.4395972192287445, + "eval_runtime": 150.3968, + "eval_samples_per_second": 27.88, + "eval_steps_per_second": 6.975, + "eval_wer": 0.3253507340946166, + "step": 183000 + }, + { + "epoch": 147.96, + "learning_rate": 8.935676989557076e-05, + "loss": 0.2438, + "step": 183025 + }, + { + "epoch": 147.98, + "learning_rate": 8.930050414115954e-05, + "loss": 0.2418, + "step": 183050 + }, + { + "epoch": 148.0, + "learning_rate": 8.924423838674829e-05, + "loss": 0.2301, + "step": 183075 + }, + { + "epoch": 148.02, + "learning_rate": 8.919022326251352e-05, + "loss": 0.2259, + "step": 183100 + }, + { + "epoch": 148.04, + "learning_rate": 8.913395750810227e-05, + "loss": 0.2529, + "step": 183125 + }, + { + "epoch": 148.06, + "learning_rate": 8.907769175369103e-05, + "loss": 0.223, + "step": 183150 + }, + { + "epoch": 148.08, + "learning_rate": 8.90214259992798e-05, + "loss": 0.2741, + "step": 183175 + }, + { + "epoch": 148.1, + "learning_rate": 8.896516024486856e-05, + "loss": 0.2585, + "step": 183200 + }, + { + "epoch": 148.12, + "learning_rate": 8.890889449045733e-05, + "loss": 0.241, + "step": 183225 + }, + { + "epoch": 148.14, + "learning_rate": 8.885262873604609e-05, + "loss": 0.2538, + "step": 183250 + }, + { + "epoch": 148.16, + "learning_rate": 8.879636298163486e-05, + "loss": 0.2224, + "step": 183275 + }, + { + "epoch": 148.18, + "learning_rate": 8.874009722722362e-05, + "loss": 0.2388, + "step": 183300 + }, + { + "epoch": 148.2, + "learning_rate": 8.86838314728124e-05, + "loss": 0.2234, + "step": 183325 + }, + { + "epoch": 148.22, + "learning_rate": 8.862756571840115e-05, + "loss": 0.2426, + "step": 183350 + }, + { + "epoch": 148.24, + "learning_rate": 8.857129996398993e-05, + "loss": 0.2038, + "step": 183375 + }, + { + "epoch": 148.26, + "learning_rate": 8.851503420957868e-05, + "loss": 0.2496, + "step": 183400 + }, + { + "epoch": 148.28, + "learning_rate": 8.845876845516746e-05, + "loss": 0.2406, + "step": 183425 + }, + { + "epoch": 148.3, + "learning_rate": 8.840250270075621e-05, + "loss": 0.2573, + "step": 183450 + }, + { + "epoch": 148.32, + "learning_rate": 8.834623694634499e-05, + "loss": 0.23, + "step": 183475 + }, + { + "epoch": 148.34, + "learning_rate": 8.828997119193374e-05, + "loss": 0.2747, + "step": 183500 + }, + { + "epoch": 148.36, + "learning_rate": 8.82337054375225e-05, + "loss": 0.2621, + "step": 183525 + }, + { + "epoch": 148.38, + "learning_rate": 8.817743968311127e-05, + "loss": 0.2474, + "step": 183550 + }, + { + "epoch": 148.4, + "learning_rate": 8.812117392870003e-05, + "loss": 0.2303, + "step": 183575 + }, + { + "epoch": 148.42, + "learning_rate": 8.80649081742888e-05, + "loss": 0.2598, + "step": 183600 + }, + { + "epoch": 148.44, + "learning_rate": 8.800864241987756e-05, + "loss": 0.2554, + "step": 183625 + }, + { + "epoch": 148.46, + "learning_rate": 8.795237666546634e-05, + "loss": 0.2547, + "step": 183650 + }, + { + "epoch": 148.48, + "learning_rate": 8.78961109110551e-05, + "loss": 0.2592, + "step": 183675 + }, + { + "epoch": 148.5, + "learning_rate": 8.783984515664387e-05, + "loss": 0.2723, + "step": 183700 + }, + { + "epoch": 148.52, + "learning_rate": 8.778357940223262e-05, + "loss": 0.2315, + "step": 183725 + }, + { + "epoch": 148.54, + "learning_rate": 8.77273136478214e-05, + "loss": 0.2444, + "step": 183750 + }, + { + "epoch": 148.57, + "learning_rate": 8.767104789341015e-05, + "loss": 0.2418, + "step": 183775 + }, + { + "epoch": 148.59, + "learning_rate": 8.761478213899893e-05, + "loss": 0.2439, + "step": 183800 + }, + { + "epoch": 148.61, + "learning_rate": 8.755851638458768e-05, + "loss": 0.2374, + "step": 183825 + }, + { + "epoch": 148.63, + "learning_rate": 8.750225063017646e-05, + "loss": 0.2548, + "step": 183850 + }, + { + "epoch": 148.65, + "learning_rate": 8.744598487576521e-05, + "loss": 0.2225, + "step": 183875 + }, + { + "epoch": 148.67, + "learning_rate": 8.738971912135398e-05, + "loss": 0.2514, + "step": 183900 + }, + { + "epoch": 148.69, + "learning_rate": 8.733345336694274e-05, + "loss": 0.2674, + "step": 183925 + }, + { + "epoch": 148.71, + "learning_rate": 8.72771876125315e-05, + "loss": 0.2733, + "step": 183950 + }, + { + "epoch": 148.73, + "learning_rate": 8.722092185812028e-05, + "loss": 0.2434, + "step": 183975 + }, + { + "epoch": 148.75, + "learning_rate": 8.716465610370904e-05, + "loss": 0.2764, + "step": 184000 + }, + { + "epoch": 148.77, + "learning_rate": 8.710839034929781e-05, + "loss": 0.2095, + "step": 184025 + }, + { + "epoch": 148.79, + "learning_rate": 8.705212459488657e-05, + "loss": 0.2386, + "step": 184050 + }, + { + "epoch": 148.81, + "learning_rate": 8.699585884047534e-05, + "loss": 0.1872, + "step": 184075 + }, + { + "epoch": 148.83, + "learning_rate": 8.69395930860641e-05, + "loss": 0.253, + "step": 184100 + }, + { + "epoch": 148.85, + "learning_rate": 8.688332733165287e-05, + "loss": 0.2379, + "step": 184125 + }, + { + "epoch": 148.87, + "learning_rate": 8.682706157724162e-05, + "loss": 0.2736, + "step": 184150 + }, + { + "epoch": 148.89, + "learning_rate": 8.67707958228304e-05, + "loss": 0.2587, + "step": 184175 + }, + { + "epoch": 148.91, + "learning_rate": 8.671453006841915e-05, + "loss": 0.2599, + "step": 184200 + }, + { + "epoch": 148.93, + "learning_rate": 8.665826431400792e-05, + "loss": 0.2492, + "step": 184225 + }, + { + "epoch": 148.95, + "learning_rate": 8.660199855959668e-05, + "loss": 0.2701, + "step": 184250 + }, + { + "epoch": 148.97, + "learning_rate": 8.654573280518545e-05, + "loss": 0.2593, + "step": 184275 + }, + { + "epoch": 148.99, + "learning_rate": 8.648946705077423e-05, + "loss": 0.2218, + "step": 184300 + }, + { + "epoch": 149.01, + "learning_rate": 8.643320129636298e-05, + "loss": 0.2569, + "step": 184325 + }, + { + "epoch": 149.03, + "learning_rate": 8.637693554195176e-05, + "loss": 0.213, + "step": 184350 + }, + { + "epoch": 149.05, + "learning_rate": 8.632066978754051e-05, + "loss": 0.2683, + "step": 184375 + }, + { + "epoch": 149.07, + "learning_rate": 8.626440403312929e-05, + "loss": 0.2441, + "step": 184400 + }, + { + "epoch": 149.09, + "learning_rate": 8.620813827871804e-05, + "loss": 0.2504, + "step": 184425 + }, + { + "epoch": 149.11, + "learning_rate": 8.615187252430682e-05, + "loss": 0.2652, + "step": 184450 + }, + { + "epoch": 149.13, + "learning_rate": 8.609560676989557e-05, + "loss": 0.2908, + "step": 184475 + }, + { + "epoch": 149.15, + "learning_rate": 8.603934101548435e-05, + "loss": 0.243, + "step": 184500 + }, + { + "epoch": 149.17, + "learning_rate": 8.59830752610731e-05, + "loss": 0.2683, + "step": 184525 + }, + { + "epoch": 149.19, + "learning_rate": 8.592680950666187e-05, + "loss": 0.2351, + "step": 184550 + }, + { + "epoch": 149.21, + "learning_rate": 8.587054375225063e-05, + "loss": 0.2483, + "step": 184575 + }, + { + "epoch": 149.23, + "learning_rate": 8.581427799783939e-05, + "loss": 0.2449, + "step": 184600 + }, + { + "epoch": 149.25, + "learning_rate": 8.575801224342817e-05, + "loss": 0.2198, + "step": 184625 + }, + { + "epoch": 149.27, + "learning_rate": 8.570174648901692e-05, + "loss": 0.2365, + "step": 184650 + }, + { + "epoch": 149.29, + "learning_rate": 8.56454807346057e-05, + "loss": 0.2766, + "step": 184675 + }, + { + "epoch": 149.31, + "learning_rate": 8.558921498019445e-05, + "loss": 0.2583, + "step": 184700 + }, + { + "epoch": 149.33, + "learning_rate": 8.553294922578323e-05, + "loss": 0.2544, + "step": 184725 + }, + { + "epoch": 149.35, + "learning_rate": 8.547668347137198e-05, + "loss": 0.2424, + "step": 184750 + }, + { + "epoch": 149.37, + "learning_rate": 8.542041771696076e-05, + "loss": 0.2458, + "step": 184775 + }, + { + "epoch": 149.39, + "learning_rate": 8.536415196254951e-05, + "loss": 0.2223, + "step": 184800 + }, + { + "epoch": 149.41, + "learning_rate": 8.530788620813829e-05, + "loss": 0.2389, + "step": 184825 + }, + { + "epoch": 149.43, + "learning_rate": 8.525162045372704e-05, + "loss": 0.2231, + "step": 184850 + }, + { + "epoch": 149.45, + "learning_rate": 8.519535469931582e-05, + "loss": 0.236, + "step": 184875 + }, + { + "epoch": 149.47, + "learning_rate": 8.513908894490457e-05, + "loss": 0.2126, + "step": 184900 + }, + { + "epoch": 149.49, + "learning_rate": 8.508282319049333e-05, + "loss": 0.2418, + "step": 184925 + }, + { + "epoch": 149.51, + "learning_rate": 8.502655743608211e-05, + "loss": 0.2328, + "step": 184950 + }, + { + "epoch": 149.54, + "learning_rate": 8.497029168167086e-05, + "loss": 0.2368, + "step": 184975 + }, + { + "epoch": 149.56, + "learning_rate": 8.491402592725964e-05, + "loss": 0.227, + "step": 185000 + }, + { + "epoch": 149.58, + "learning_rate": 8.485776017284839e-05, + "loss": 0.2445, + "step": 185025 + }, + { + "epoch": 149.6, + "learning_rate": 8.480149441843717e-05, + "loss": 0.2377, + "step": 185050 + }, + { + "epoch": 149.62, + "learning_rate": 8.474522866402592e-05, + "loss": 0.2296, + "step": 185075 + }, + { + "epoch": 149.64, + "learning_rate": 8.46889629096147e-05, + "loss": 0.2326, + "step": 185100 + }, + { + "epoch": 149.66, + "learning_rate": 8.463269715520345e-05, + "loss": 0.241, + "step": 185125 + }, + { + "epoch": 149.68, + "learning_rate": 8.457643140079223e-05, + "loss": 0.2221, + "step": 185150 + }, + { + "epoch": 149.7, + "learning_rate": 8.452016564638098e-05, + "loss": 0.2295, + "step": 185175 + }, + { + "epoch": 149.72, + "learning_rate": 8.446615052214621e-05, + "loss": 0.2696, + "step": 185200 + }, + { + "epoch": 149.74, + "learning_rate": 8.440988476773496e-05, + "loss": 0.2305, + "step": 185225 + }, + { + "epoch": 149.76, + "learning_rate": 8.435361901332374e-05, + "loss": 0.2355, + "step": 185250 + }, + { + "epoch": 149.78, + "learning_rate": 8.42973532589125e-05, + "loss": 0.3044, + "step": 185275 + }, + { + "epoch": 149.8, + "learning_rate": 8.424108750450127e-05, + "loss": 0.2521, + "step": 185300 + }, + { + "epoch": 149.82, + "learning_rate": 8.418482175009003e-05, + "loss": 0.224, + "step": 185325 + }, + { + "epoch": 149.84, + "learning_rate": 8.412855599567878e-05, + "loss": 0.2408, + "step": 185350 + }, + { + "epoch": 149.86, + "learning_rate": 8.407229024126756e-05, + "loss": 0.2726, + "step": 185375 + }, + { + "epoch": 149.88, + "learning_rate": 8.401602448685631e-05, + "loss": 0.2534, + "step": 185400 + }, + { + "epoch": 149.9, + "learning_rate": 8.395975873244509e-05, + "loss": 0.2088, + "step": 185425 + }, + { + "epoch": 149.92, + "learning_rate": 8.390349297803384e-05, + "loss": 0.2246, + "step": 185450 + }, + { + "epoch": 149.94, + "learning_rate": 8.384722722362262e-05, + "loss": 0.2466, + "step": 185475 + }, + { + "epoch": 149.96, + "learning_rate": 8.379096146921137e-05, + "loss": 0.2467, + "step": 185500 + }, + { + "epoch": 149.98, + "learning_rate": 8.373469571480015e-05, + "loss": 0.2591, + "step": 185525 + }, + { + "epoch": 150.0, + "learning_rate": 8.36784299603889e-05, + "loss": 0.2049, + "step": 185550 + }, + { + "epoch": 150.02, + "learning_rate": 8.362216420597768e-05, + "loss": 0.2339, + "step": 185575 + }, + { + "epoch": 150.04, + "learning_rate": 8.356589845156644e-05, + "loss": 0.2122, + "step": 185600 + }, + { + "epoch": 150.06, + "learning_rate": 8.350963269715521e-05, + "loss": 0.2562, + "step": 185625 + }, + { + "epoch": 150.08, + "learning_rate": 8.345336694274397e-05, + "loss": 0.2575, + "step": 185650 + }, + { + "epoch": 150.1, + "learning_rate": 8.339710118833274e-05, + "loss": 0.2611, + "step": 185675 + }, + { + "epoch": 150.12, + "learning_rate": 8.33408354339215e-05, + "loss": 0.2384, + "step": 185700 + }, + { + "epoch": 150.14, + "learning_rate": 8.328456967951025e-05, + "loss": 0.2435, + "step": 185725 + }, + { + "epoch": 150.16, + "learning_rate": 8.322830392509903e-05, + "loss": 0.2407, + "step": 185750 + }, + { + "epoch": 150.18, + "learning_rate": 8.317203817068778e-05, + "loss": 0.2448, + "step": 185775 + }, + { + "epoch": 150.2, + "learning_rate": 8.311577241627656e-05, + "loss": 0.2177, + "step": 185800 + }, + { + "epoch": 150.22, + "learning_rate": 8.305950666186531e-05, + "loss": 0.2452, + "step": 185825 + }, + { + "epoch": 150.24, + "learning_rate": 8.300324090745409e-05, + "loss": 0.2237, + "step": 185850 + }, + { + "epoch": 150.26, + "learning_rate": 8.294697515304284e-05, + "loss": 0.2466, + "step": 185875 + }, + { + "epoch": 150.28, + "learning_rate": 8.289070939863162e-05, + "loss": 0.2356, + "step": 185900 + }, + { + "epoch": 150.3, + "learning_rate": 8.283444364422039e-05, + "loss": 0.2661, + "step": 185925 + }, + { + "epoch": 150.32, + "learning_rate": 8.277817788980915e-05, + "loss": 0.2332, + "step": 185950 + }, + { + "epoch": 150.34, + "learning_rate": 8.272191213539792e-05, + "loss": 0.243, + "step": 185975 + }, + { + "epoch": 150.36, + "learning_rate": 8.266564638098668e-05, + "loss": 0.2072, + "step": 186000 + }, + { + "epoch": 150.36, + "eval_cer": 0.07735388027062821, + "eval_loss": 0.4585643708705902, + "eval_runtime": 148.6768, + "eval_samples_per_second": 28.202, + "eval_steps_per_second": 7.056, + "eval_wer": 0.3288743882544861, + "step": 186000 + }, + { + "epoch": 150.38, + "learning_rate": 8.260938062657545e-05, + "loss": 0.2533, + "step": 186025 + }, + { + "epoch": 150.4, + "learning_rate": 8.255311487216421e-05, + "loss": 0.2254, + "step": 186050 + }, + { + "epoch": 150.42, + "learning_rate": 8.249684911775298e-05, + "loss": 0.2465, + "step": 186075 + }, + { + "epoch": 150.44, + "learning_rate": 8.244058336334173e-05, + "loss": 0.2551, + "step": 186100 + }, + { + "epoch": 150.46, + "learning_rate": 8.23843176089305e-05, + "loss": 0.2728, + "step": 186125 + }, + { + "epoch": 150.49, + "learning_rate": 8.232805185451926e-05, + "loss": 0.2044, + "step": 186150 + }, + { + "epoch": 150.51, + "learning_rate": 8.227178610010803e-05, + "loss": 0.2728, + "step": 186175 + }, + { + "epoch": 150.53, + "learning_rate": 8.22155203456968e-05, + "loss": 0.2426, + "step": 186200 + }, + { + "epoch": 150.55, + "learning_rate": 8.215925459128556e-05, + "loss": 0.2366, + "step": 186225 + }, + { + "epoch": 150.57, + "learning_rate": 8.210298883687433e-05, + "loss": 0.2211, + "step": 186250 + }, + { + "epoch": 150.59, + "learning_rate": 8.20467230824631e-05, + "loss": 0.2591, + "step": 186275 + }, + { + "epoch": 150.61, + "learning_rate": 8.199045732805186e-05, + "loss": 0.2458, + "step": 186300 + }, + { + "epoch": 150.63, + "learning_rate": 8.193419157364062e-05, + "loss": 0.247, + "step": 186325 + }, + { + "epoch": 150.65, + "learning_rate": 8.187792581922939e-05, + "loss": 0.2158, + "step": 186350 + }, + { + "epoch": 150.67, + "learning_rate": 8.182166006481815e-05, + "loss": 0.2425, + "step": 186375 + }, + { + "epoch": 150.69, + "learning_rate": 8.176539431040692e-05, + "loss": 0.2253, + "step": 186400 + }, + { + "epoch": 150.71, + "learning_rate": 8.170912855599567e-05, + "loss": 0.2422, + "step": 186425 + }, + { + "epoch": 150.73, + "learning_rate": 8.165286280158445e-05, + "loss": 0.2539, + "step": 186450 + }, + { + "epoch": 150.75, + "learning_rate": 8.15965970471732e-05, + "loss": 0.2591, + "step": 186475 + }, + { + "epoch": 150.77, + "learning_rate": 8.154033129276198e-05, + "loss": 0.2537, + "step": 186500 + }, + { + "epoch": 150.79, + "learning_rate": 8.148406553835074e-05, + "loss": 0.2706, + "step": 186525 + }, + { + "epoch": 150.81, + "learning_rate": 8.14277997839395e-05, + "loss": 0.2407, + "step": 186550 + }, + { + "epoch": 150.83, + "learning_rate": 8.137153402952827e-05, + "loss": 0.27, + "step": 186575 + }, + { + "epoch": 150.85, + "learning_rate": 8.131526827511704e-05, + "loss": 0.2428, + "step": 186600 + }, + { + "epoch": 150.87, + "learning_rate": 8.12590025207058e-05, + "loss": 0.2493, + "step": 186625 + }, + { + "epoch": 150.89, + "learning_rate": 8.120273676629457e-05, + "loss": 0.2124, + "step": 186650 + }, + { + "epoch": 150.91, + "learning_rate": 8.114647101188333e-05, + "loss": 0.2553, + "step": 186675 + }, + { + "epoch": 150.93, + "learning_rate": 8.10902052574721e-05, + "loss": 0.2606, + "step": 186700 + }, + { + "epoch": 150.95, + "learning_rate": 8.103393950306086e-05, + "loss": 0.2538, + "step": 186725 + }, + { + "epoch": 150.97, + "learning_rate": 8.097767374864962e-05, + "loss": 0.2262, + "step": 186750 + }, + { + "epoch": 150.99, + "learning_rate": 8.092140799423839e-05, + "loss": 0.275, + "step": 186775 + }, + { + "epoch": 151.01, + "learning_rate": 8.086514223982714e-05, + "loss": 0.2215, + "step": 186800 + }, + { + "epoch": 151.03, + "learning_rate": 8.080887648541592e-05, + "loss": 0.2329, + "step": 186825 + }, + { + "epoch": 151.05, + "learning_rate": 8.075261073100468e-05, + "loss": 0.2574, + "step": 186850 + }, + { + "epoch": 151.07, + "learning_rate": 8.069634497659345e-05, + "loss": 0.243, + "step": 186875 + }, + { + "epoch": 151.09, + "learning_rate": 8.064007922218221e-05, + "loss": 0.232, + "step": 186900 + }, + { + "epoch": 151.11, + "learning_rate": 8.058381346777098e-05, + "loss": 0.2434, + "step": 186925 + }, + { + "epoch": 151.13, + "learning_rate": 8.052754771335974e-05, + "loss": 0.242, + "step": 186950 + }, + { + "epoch": 151.15, + "learning_rate": 8.047128195894851e-05, + "loss": 0.1852, + "step": 186975 + }, + { + "epoch": 151.17, + "learning_rate": 8.041501620453727e-05, + "loss": 0.2491, + "step": 187000 + }, + { + "epoch": 151.19, + "learning_rate": 8.035875045012604e-05, + "loss": 0.2206, + "step": 187025 + }, + { + "epoch": 151.21, + "learning_rate": 8.03024846957148e-05, + "loss": 0.2376, + "step": 187050 + }, + { + "epoch": 151.23, + "learning_rate": 8.024621894130357e-05, + "loss": 0.2447, + "step": 187075 + }, + { + "epoch": 151.25, + "learning_rate": 8.018995318689233e-05, + "loss": 0.2547, + "step": 187100 + }, + { + "epoch": 151.27, + "learning_rate": 8.01336874324811e-05, + "loss": 0.2324, + "step": 187125 + }, + { + "epoch": 151.29, + "learning_rate": 8.007742167806986e-05, + "loss": 0.2326, + "step": 187150 + }, + { + "epoch": 151.31, + "learning_rate": 8.002115592365863e-05, + "loss": 0.2488, + "step": 187175 + }, + { + "epoch": 151.33, + "learning_rate": 7.996489016924739e-05, + "loss": 0.2404, + "step": 187200 + }, + { + "epoch": 151.35, + "learning_rate": 7.990862441483616e-05, + "loss": 0.2286, + "step": 187225 + }, + { + "epoch": 151.37, + "learning_rate": 7.985235866042492e-05, + "loss": 0.2559, + "step": 187250 + }, + { + "epoch": 151.39, + "learning_rate": 7.979834353619013e-05, + "loss": 0.2392, + "step": 187275 + }, + { + "epoch": 151.41, + "learning_rate": 7.97420777817789e-05, + "loss": 0.2791, + "step": 187300 + }, + { + "epoch": 151.43, + "learning_rate": 7.968581202736766e-05, + "loss": 0.2096, + "step": 187325 + }, + { + "epoch": 151.46, + "learning_rate": 7.962954627295643e-05, + "loss": 0.2229, + "step": 187350 + }, + { + "epoch": 151.48, + "learning_rate": 7.957328051854519e-05, + "loss": 0.2372, + "step": 187375 + }, + { + "epoch": 151.5, + "learning_rate": 7.951701476413396e-05, + "loss": 0.2234, + "step": 187400 + }, + { + "epoch": 151.52, + "learning_rate": 7.946074900972272e-05, + "loss": 0.1954, + "step": 187425 + }, + { + "epoch": 151.54, + "learning_rate": 7.940448325531149e-05, + "loss": 0.253, + "step": 187450 + }, + { + "epoch": 151.56, + "learning_rate": 7.934821750090025e-05, + "loss": 0.2445, + "step": 187475 + }, + { + "epoch": 151.58, + "learning_rate": 7.929195174648903e-05, + "loss": 0.2517, + "step": 187500 + }, + { + "epoch": 151.6, + "learning_rate": 7.923568599207778e-05, + "loss": 0.232, + "step": 187525 + }, + { + "epoch": 151.62, + "learning_rate": 7.917942023766656e-05, + "loss": 0.2241, + "step": 187550 + }, + { + "epoch": 151.64, + "learning_rate": 7.912315448325531e-05, + "loss": 0.2243, + "step": 187575 + }, + { + "epoch": 151.66, + "learning_rate": 7.906688872884408e-05, + "loss": 0.232, + "step": 187600 + }, + { + "epoch": 151.68, + "learning_rate": 7.901062297443284e-05, + "loss": 0.2587, + "step": 187625 + }, + { + "epoch": 151.7, + "learning_rate": 7.89543572200216e-05, + "loss": 0.244, + "step": 187650 + }, + { + "epoch": 151.72, + "learning_rate": 7.889809146561037e-05, + "loss": 0.2174, + "step": 187675 + }, + { + "epoch": 151.74, + "learning_rate": 7.884182571119914e-05, + "loss": 0.2759, + "step": 187700 + }, + { + "epoch": 151.76, + "learning_rate": 7.87855599567879e-05, + "loss": 0.2542, + "step": 187725 + }, + { + "epoch": 151.78, + "learning_rate": 7.872929420237666e-05, + "loss": 0.2479, + "step": 187750 + }, + { + "epoch": 151.8, + "learning_rate": 7.867302844796543e-05, + "loss": 0.2559, + "step": 187775 + }, + { + "epoch": 151.82, + "learning_rate": 7.86167626935542e-05, + "loss": 0.2481, + "step": 187800 + }, + { + "epoch": 151.84, + "learning_rate": 7.856049693914297e-05, + "loss": 0.2493, + "step": 187825 + }, + { + "epoch": 151.86, + "learning_rate": 7.850423118473172e-05, + "loss": 0.2427, + "step": 187850 + }, + { + "epoch": 151.88, + "learning_rate": 7.84479654303205e-05, + "loss": 0.2342, + "step": 187875 + }, + { + "epoch": 151.9, + "learning_rate": 7.839169967590925e-05, + "loss": 0.2367, + "step": 187900 + }, + { + "epoch": 151.92, + "learning_rate": 7.833543392149802e-05, + "loss": 0.2207, + "step": 187925 + }, + { + "epoch": 151.94, + "learning_rate": 7.827916816708678e-05, + "loss": 0.2621, + "step": 187950 + }, + { + "epoch": 151.96, + "learning_rate": 7.822290241267555e-05, + "loss": 0.2345, + "step": 187975 + }, + { + "epoch": 151.98, + "learning_rate": 7.816663665826431e-05, + "loss": 0.2754, + "step": 188000 + }, + { + "epoch": 152.0, + "learning_rate": 7.811037090385308e-05, + "loss": 0.2283, + "step": 188025 + }, + { + "epoch": 152.02, + "learning_rate": 7.805410514944184e-05, + "loss": 0.2487, + "step": 188050 + }, + { + "epoch": 152.04, + "learning_rate": 7.799783939503061e-05, + "loss": 0.2386, + "step": 188075 + }, + { + "epoch": 152.06, + "learning_rate": 7.794157364061939e-05, + "loss": 0.2449, + "step": 188100 + }, + { + "epoch": 152.08, + "learning_rate": 7.788530788620814e-05, + "loss": 0.2767, + "step": 188125 + }, + { + "epoch": 152.1, + "learning_rate": 7.782904213179692e-05, + "loss": 0.2534, + "step": 188150 + }, + { + "epoch": 152.12, + "learning_rate": 7.777277637738567e-05, + "loss": 0.2175, + "step": 188175 + }, + { + "epoch": 152.14, + "learning_rate": 7.771651062297444e-05, + "loss": 0.2289, + "step": 188200 + }, + { + "epoch": 152.16, + "learning_rate": 7.76602448685632e-05, + "loss": 0.1924, + "step": 188225 + }, + { + "epoch": 152.18, + "learning_rate": 7.760397911415197e-05, + "loss": 0.2595, + "step": 188250 + }, + { + "epoch": 152.2, + "learning_rate": 7.754771335974073e-05, + "loss": 0.2235, + "step": 188275 + }, + { + "epoch": 152.22, + "learning_rate": 7.749144760532949e-05, + "loss": 0.2349, + "step": 188300 + }, + { + "epoch": 152.24, + "learning_rate": 7.743518185091826e-05, + "loss": 0.2049, + "step": 188325 + }, + { + "epoch": 152.26, + "learning_rate": 7.737891609650702e-05, + "loss": 0.2321, + "step": 188350 + }, + { + "epoch": 152.28, + "learning_rate": 7.732265034209578e-05, + "loss": 0.1949, + "step": 188375 + }, + { + "epoch": 152.3, + "learning_rate": 7.726638458768455e-05, + "loss": 0.232, + "step": 188400 + }, + { + "epoch": 152.32, + "learning_rate": 7.721011883327333e-05, + "loss": 0.2478, + "step": 188425 + }, + { + "epoch": 152.34, + "learning_rate": 7.715385307886208e-05, + "loss": 0.2493, + "step": 188450 + }, + { + "epoch": 152.36, + "learning_rate": 7.709758732445086e-05, + "loss": 0.2047, + "step": 188475 + }, + { + "epoch": 152.38, + "learning_rate": 7.704132157003961e-05, + "loss": 0.2377, + "step": 188500 + }, + { + "epoch": 152.41, + "learning_rate": 7.698505581562839e-05, + "loss": 0.2217, + "step": 188525 + }, + { + "epoch": 152.43, + "learning_rate": 7.692879006121714e-05, + "loss": 0.2379, + "step": 188550 + }, + { + "epoch": 152.45, + "learning_rate": 7.687252430680592e-05, + "loss": 0.2238, + "step": 188575 + }, + { + "epoch": 152.47, + "learning_rate": 7.681625855239467e-05, + "loss": 0.2216, + "step": 188600 + }, + { + "epoch": 152.49, + "learning_rate": 7.675999279798343e-05, + "loss": 0.2229, + "step": 188625 + }, + { + "epoch": 152.51, + "learning_rate": 7.67037270435722e-05, + "loss": 0.2629, + "step": 188650 + }, + { + "epoch": 152.53, + "learning_rate": 7.664746128916096e-05, + "loss": 0.2448, + "step": 188675 + }, + { + "epoch": 152.55, + "learning_rate": 7.659119553474973e-05, + "loss": 0.2494, + "step": 188700 + }, + { + "epoch": 152.57, + "learning_rate": 7.653492978033849e-05, + "loss": 0.2113, + "step": 188725 + }, + { + "epoch": 152.59, + "learning_rate": 7.647866402592727e-05, + "loss": 0.2247, + "step": 188750 + }, + { + "epoch": 152.61, + "learning_rate": 7.642239827151602e-05, + "loss": 0.2647, + "step": 188775 + }, + { + "epoch": 152.63, + "learning_rate": 7.63661325171048e-05, + "loss": 0.2634, + "step": 188800 + }, + { + "epoch": 152.65, + "learning_rate": 7.630986676269355e-05, + "loss": 0.2549, + "step": 188825 + }, + { + "epoch": 152.67, + "learning_rate": 7.625360100828233e-05, + "loss": 0.2276, + "step": 188850 + }, + { + "epoch": 152.69, + "learning_rate": 7.619733525387108e-05, + "loss": 0.2175, + "step": 188875 + }, + { + "epoch": 152.71, + "learning_rate": 7.614106949945986e-05, + "loss": 0.2392, + "step": 188900 + }, + { + "epoch": 152.73, + "learning_rate": 7.608480374504861e-05, + "loss": 0.2177, + "step": 188925 + }, + { + "epoch": 152.75, + "learning_rate": 7.602853799063739e-05, + "loss": 0.2344, + "step": 188950 + }, + { + "epoch": 152.77, + "learning_rate": 7.597227223622614e-05, + "loss": 0.2275, + "step": 188975 + }, + { + "epoch": 152.79, + "learning_rate": 7.59160064818149e-05, + "loss": 0.2444, + "step": 189000 + }, + { + "epoch": 152.79, + "eval_cer": 0.07623481822941798, + "eval_loss": 0.45240142941474915, + "eval_runtime": 150.3487, + "eval_samples_per_second": 27.889, + "eval_steps_per_second": 6.977, + "eval_wer": 0.32388254486133766, + "step": 189000 + }, + { + "epoch": 152.81, + "learning_rate": 7.585974072740367e-05, + "loss": 0.2367, + "step": 189025 + }, + { + "epoch": 152.83, + "learning_rate": 7.580347497299243e-05, + "loss": 0.2331, + "step": 189050 + }, + { + "epoch": 152.85, + "learning_rate": 7.574720921858121e-05, + "loss": 0.2564, + "step": 189075 + }, + { + "epoch": 152.87, + "learning_rate": 7.569094346416996e-05, + "loss": 0.2473, + "step": 189100 + }, + { + "epoch": 152.89, + "learning_rate": 7.563467770975874e-05, + "loss": 0.2096, + "step": 189125 + }, + { + "epoch": 152.91, + "learning_rate": 7.55784119553475e-05, + "loss": 0.2707, + "step": 189150 + }, + { + "epoch": 152.93, + "learning_rate": 7.552214620093627e-05, + "loss": 0.2173, + "step": 189175 + }, + { + "epoch": 152.95, + "learning_rate": 7.546588044652502e-05, + "loss": 0.2174, + "step": 189200 + }, + { + "epoch": 152.97, + "learning_rate": 7.54096146921138e-05, + "loss": 0.2082, + "step": 189225 + }, + { + "epoch": 152.99, + "learning_rate": 7.535334893770255e-05, + "loss": 0.2535, + "step": 189250 + }, + { + "epoch": 153.01, + "learning_rate": 7.529708318329133e-05, + "loss": 0.2413, + "step": 189275 + }, + { + "epoch": 153.03, + "learning_rate": 7.524081742888008e-05, + "loss": 0.2138, + "step": 189300 + }, + { + "epoch": 153.05, + "learning_rate": 7.518455167446886e-05, + "loss": 0.2521, + "step": 189325 + }, + { + "epoch": 153.07, + "learning_rate": 7.512828592005761e-05, + "loss": 0.2148, + "step": 189350 + }, + { + "epoch": 153.09, + "learning_rate": 7.507202016564638e-05, + "loss": 0.22, + "step": 189375 + }, + { + "epoch": 153.11, + "learning_rate": 7.501575441123516e-05, + "loss": 0.2497, + "step": 189400 + }, + { + "epoch": 153.13, + "learning_rate": 7.49594886568239e-05, + "loss": 0.2299, + "step": 189425 + }, + { + "epoch": 153.15, + "learning_rate": 7.490322290241268e-05, + "loss": 0.2348, + "step": 189450 + }, + { + "epoch": 153.17, + "learning_rate": 7.484695714800144e-05, + "loss": 0.2554, + "step": 189475 + }, + { + "epoch": 153.19, + "learning_rate": 7.479069139359021e-05, + "loss": 0.1973, + "step": 189500 + }, + { + "epoch": 153.21, + "learning_rate": 7.473442563917897e-05, + "loss": 0.2412, + "step": 189525 + }, + { + "epoch": 153.23, + "learning_rate": 7.467815988476774e-05, + "loss": 0.2277, + "step": 189550 + }, + { + "epoch": 153.25, + "learning_rate": 7.46218941303565e-05, + "loss": 0.2222, + "step": 189575 + }, + { + "epoch": 153.27, + "learning_rate": 7.456562837594527e-05, + "loss": 0.2381, + "step": 189600 + }, + { + "epoch": 153.29, + "learning_rate": 7.450936262153402e-05, + "loss": 0.2318, + "step": 189625 + }, + { + "epoch": 153.31, + "learning_rate": 7.44530968671228e-05, + "loss": 0.2303, + "step": 189650 + }, + { + "epoch": 153.33, + "learning_rate": 7.439683111271155e-05, + "loss": 0.2455, + "step": 189675 + }, + { + "epoch": 153.35, + "learning_rate": 7.434056535830032e-05, + "loss": 0.2171, + "step": 189700 + }, + { + "epoch": 153.38, + "learning_rate": 7.42842996038891e-05, + "loss": 0.2435, + "step": 189725 + }, + { + "epoch": 153.4, + "learning_rate": 7.422803384947785e-05, + "loss": 0.2469, + "step": 189750 + }, + { + "epoch": 153.42, + "learning_rate": 7.417176809506663e-05, + "loss": 0.2263, + "step": 189775 + }, + { + "epoch": 153.44, + "learning_rate": 7.411550234065538e-05, + "loss": 0.2311, + "step": 189800 + }, + { + "epoch": 153.46, + "learning_rate": 7.405923658624416e-05, + "loss": 0.2528, + "step": 189825 + }, + { + "epoch": 153.48, + "learning_rate": 7.400297083183291e-05, + "loss": 0.2196, + "step": 189850 + }, + { + "epoch": 153.5, + "learning_rate": 7.394670507742169e-05, + "loss": 0.2193, + "step": 189875 + }, + { + "epoch": 153.52, + "learning_rate": 7.389043932301044e-05, + "loss": 0.238, + "step": 189900 + }, + { + "epoch": 153.54, + "learning_rate": 7.383417356859922e-05, + "loss": 0.2361, + "step": 189925 + }, + { + "epoch": 153.56, + "learning_rate": 7.377790781418797e-05, + "loss": 0.2492, + "step": 189950 + }, + { + "epoch": 153.58, + "learning_rate": 7.372164205977675e-05, + "loss": 0.2293, + "step": 189975 + }, + { + "epoch": 153.6, + "learning_rate": 7.36653763053655e-05, + "loss": 0.2377, + "step": 190000 + }, + { + "epoch": 153.62, + "learning_rate": 7.360911055095427e-05, + "loss": 0.2156, + "step": 190025 + }, + { + "epoch": 153.64, + "learning_rate": 7.355284479654304e-05, + "loss": 0.2152, + "step": 190050 + }, + { + "epoch": 153.66, + "learning_rate": 7.349657904213179e-05, + "loss": 0.234, + "step": 190075 + }, + { + "epoch": 153.68, + "learning_rate": 7.344031328772057e-05, + "loss": 0.2216, + "step": 190100 + }, + { + "epoch": 153.7, + "learning_rate": 7.338404753330932e-05, + "loss": 0.2155, + "step": 190125 + }, + { + "epoch": 153.72, + "learning_rate": 7.33277817788981e-05, + "loss": 0.2125, + "step": 190150 + }, + { + "epoch": 153.74, + "learning_rate": 7.327151602448685e-05, + "loss": 0.2174, + "step": 190175 + }, + { + "epoch": 153.76, + "learning_rate": 7.321525027007563e-05, + "loss": 0.1994, + "step": 190200 + }, + { + "epoch": 153.78, + "learning_rate": 7.315898451566438e-05, + "loss": 0.2014, + "step": 190225 + }, + { + "epoch": 153.8, + "learning_rate": 7.310271876125316e-05, + "loss": 0.2064, + "step": 190250 + }, + { + "epoch": 153.82, + "learning_rate": 7.304645300684191e-05, + "loss": 0.247, + "step": 190275 + }, + { + "epoch": 153.84, + "learning_rate": 7.299018725243069e-05, + "loss": 0.2307, + "step": 190300 + }, + { + "epoch": 153.86, + "learning_rate": 7.293392149801944e-05, + "loss": 0.2136, + "step": 190325 + }, + { + "epoch": 153.88, + "learning_rate": 7.287765574360822e-05, + "loss": 0.2163, + "step": 190350 + }, + { + "epoch": 153.9, + "learning_rate": 7.282138998919698e-05, + "loss": 0.2388, + "step": 190375 + }, + { + "epoch": 153.92, + "learning_rate": 7.276512423478575e-05, + "loss": 0.2372, + "step": 190400 + }, + { + "epoch": 153.94, + "learning_rate": 7.270885848037451e-05, + "loss": 0.2427, + "step": 190425 + }, + { + "epoch": 153.96, + "learning_rate": 7.265259272596326e-05, + "loss": 0.2014, + "step": 190450 + }, + { + "epoch": 153.98, + "learning_rate": 7.259632697155204e-05, + "loss": 0.2028, + "step": 190475 + }, + { + "epoch": 154.0, + "learning_rate": 7.254006121714079e-05, + "loss": 0.3995, + "step": 190500 + }, + { + "epoch": 154.02, + "learning_rate": 7.248379546272957e-05, + "loss": 0.2444, + "step": 190525 + }, + { + "epoch": 154.04, + "learning_rate": 7.242752970831832e-05, + "loss": 0.2182, + "step": 190550 + }, + { + "epoch": 154.06, + "learning_rate": 7.23712639539071e-05, + "loss": 0.2397, + "step": 190575 + }, + { + "epoch": 154.08, + "learning_rate": 7.231499819949585e-05, + "loss": 0.2091, + "step": 190600 + }, + { + "epoch": 154.1, + "learning_rate": 7.225873244508463e-05, + "loss": 0.2603, + "step": 190625 + }, + { + "epoch": 154.12, + "learning_rate": 7.220246669067338e-05, + "loss": 0.1942, + "step": 190650 + }, + { + "epoch": 154.14, + "learning_rate": 7.214620093626216e-05, + "loss": 0.2209, + "step": 190675 + }, + { + "epoch": 154.16, + "learning_rate": 7.208993518185092e-05, + "loss": 0.2305, + "step": 190700 + }, + { + "epoch": 154.18, + "learning_rate": 7.203366942743969e-05, + "loss": 0.2347, + "step": 190725 + }, + { + "epoch": 154.2, + "learning_rate": 7.197740367302845e-05, + "loss": 0.2093, + "step": 190750 + }, + { + "epoch": 154.22, + "learning_rate": 7.19211379186172e-05, + "loss": 0.2282, + "step": 190775 + }, + { + "epoch": 154.24, + "learning_rate": 7.186487216420598e-05, + "loss": 0.2018, + "step": 190800 + }, + { + "epoch": 154.26, + "learning_rate": 7.180860640979474e-05, + "loss": 0.2247, + "step": 190825 + }, + { + "epoch": 154.28, + "learning_rate": 7.175234065538351e-05, + "loss": 0.2136, + "step": 190850 + }, + { + "epoch": 154.3, + "learning_rate": 7.169607490097226e-05, + "loss": 0.2416, + "step": 190875 + }, + { + "epoch": 154.32, + "learning_rate": 7.163980914656104e-05, + "loss": 0.2178, + "step": 190900 + }, + { + "epoch": 154.35, + "learning_rate": 7.15835433921498e-05, + "loss": 0.2408, + "step": 190925 + }, + { + "epoch": 154.37, + "learning_rate": 7.152727763773857e-05, + "loss": 0.216, + "step": 190950 + }, + { + "epoch": 154.39, + "learning_rate": 7.147101188332732e-05, + "loss": 0.2245, + "step": 190975 + }, + { + "epoch": 154.41, + "learning_rate": 7.14147461289161e-05, + "loss": 0.234, + "step": 191000 + }, + { + "epoch": 154.43, + "learning_rate": 7.135848037450487e-05, + "loss": 0.2355, + "step": 191025 + }, + { + "epoch": 154.45, + "learning_rate": 7.130221462009363e-05, + "loss": 0.2217, + "step": 191050 + }, + { + "epoch": 154.47, + "learning_rate": 7.12459488656824e-05, + "loss": 0.245, + "step": 191075 + }, + { + "epoch": 154.49, + "learning_rate": 7.118968311127116e-05, + "loss": 0.2192, + "step": 191100 + }, + { + "epoch": 154.51, + "learning_rate": 7.113341735685993e-05, + "loss": 0.2443, + "step": 191125 + }, + { + "epoch": 154.53, + "learning_rate": 7.107715160244868e-05, + "loss": 0.2346, + "step": 191150 + }, + { + "epoch": 154.55, + "learning_rate": 7.102088584803746e-05, + "loss": 0.2395, + "step": 191175 + }, + { + "epoch": 154.57, + "learning_rate": 7.096462009362621e-05, + "loss": 0.2436, + "step": 191200 + }, + { + "epoch": 154.59, + "learning_rate": 7.090835433921499e-05, + "loss": 0.2365, + "step": 191225 + }, + { + "epoch": 154.61, + "learning_rate": 7.085208858480374e-05, + "loss": 0.24, + "step": 191250 + }, + { + "epoch": 154.63, + "learning_rate": 7.079582283039251e-05, + "loss": 0.2425, + "step": 191275 + }, + { + "epoch": 154.65, + "learning_rate": 7.073955707598127e-05, + "loss": 0.2055, + "step": 191300 + }, + { + "epoch": 154.67, + "learning_rate": 7.068329132157004e-05, + "loss": 0.2431, + "step": 191325 + }, + { + "epoch": 154.69, + "learning_rate": 7.062702556715881e-05, + "loss": 0.2072, + "step": 191350 + }, + { + "epoch": 154.71, + "learning_rate": 7.057075981274757e-05, + "loss": 0.2459, + "step": 191375 + }, + { + "epoch": 154.73, + "learning_rate": 7.051449405833634e-05, + "loss": 0.2247, + "step": 191400 + }, + { + "epoch": 154.75, + "learning_rate": 7.04582283039251e-05, + "loss": 0.2301, + "step": 191425 + }, + { + "epoch": 154.77, + "learning_rate": 7.040196254951387e-05, + "loss": 0.2022, + "step": 191450 + }, + { + "epoch": 154.79, + "learning_rate": 7.034569679510262e-05, + "loss": 0.2515, + "step": 191475 + }, + { + "epoch": 154.81, + "learning_rate": 7.02894310406914e-05, + "loss": 0.1996, + "step": 191500 + }, + { + "epoch": 154.83, + "learning_rate": 7.023316528628015e-05, + "loss": 0.2401, + "step": 191525 + }, + { + "epoch": 154.85, + "learning_rate": 7.017689953186893e-05, + "loss": 0.2216, + "step": 191550 + }, + { + "epoch": 154.87, + "learning_rate": 7.012063377745768e-05, + "loss": 0.2277, + "step": 191575 + }, + { + "epoch": 154.89, + "learning_rate": 7.006436802304646e-05, + "loss": 0.2025, + "step": 191600 + }, + { + "epoch": 154.91, + "learning_rate": 7.000810226863521e-05, + "loss": 0.2423, + "step": 191625 + }, + { + "epoch": 154.93, + "learning_rate": 6.995408714440043e-05, + "loss": 0.2019, + "step": 191650 + }, + { + "epoch": 154.95, + "learning_rate": 6.990007202016565e-05, + "loss": 0.2271, + "step": 191675 + }, + { + "epoch": 154.97, + "learning_rate": 6.984380626575441e-05, + "loss": 0.2214, + "step": 191700 + }, + { + "epoch": 154.99, + "learning_rate": 6.978754051134318e-05, + "loss": 0.2428, + "step": 191725 + }, + { + "epoch": 155.01, + "learning_rate": 6.973127475693194e-05, + "loss": 0.2019, + "step": 191750 + }, + { + "epoch": 155.03, + "learning_rate": 6.96750090025207e-05, + "loss": 0.23, + "step": 191775 + }, + { + "epoch": 155.05, + "learning_rate": 6.961874324810947e-05, + "loss": 0.2473, + "step": 191800 + }, + { + "epoch": 155.07, + "learning_rate": 6.956247749369824e-05, + "loss": 0.2076, + "step": 191825 + }, + { + "epoch": 155.09, + "learning_rate": 6.9506211739287e-05, + "loss": 0.2534, + "step": 191850 + }, + { + "epoch": 155.11, + "learning_rate": 6.944994598487577e-05, + "loss": 0.2278, + "step": 191875 + }, + { + "epoch": 155.13, + "learning_rate": 6.939368023046453e-05, + "loss": 0.2109, + "step": 191900 + }, + { + "epoch": 155.15, + "learning_rate": 6.93374144760533e-05, + "loss": 0.224, + "step": 191925 + }, + { + "epoch": 155.17, + "learning_rate": 6.928114872164207e-05, + "loss": 0.2067, + "step": 191950 + }, + { + "epoch": 155.19, + "learning_rate": 6.922488296723082e-05, + "loss": 0.1854, + "step": 191975 + }, + { + "epoch": 155.21, + "learning_rate": 6.916861721281959e-05, + "loss": 0.2272, + "step": 192000 + }, + { + "epoch": 155.21, + "eval_cer": 0.0758806196934386, + "eval_loss": 0.46198299527168274, + "eval_runtime": 150.7236, + "eval_samples_per_second": 27.819, + "eval_steps_per_second": 6.96, + "eval_wer": 0.32218597063621535, + "step": 192000 + }, + { + "epoch": 155.23, + "learning_rate": 6.911235145840835e-05, + "loss": 0.1919, + "step": 192025 + }, + { + "epoch": 155.25, + "learning_rate": 6.905608570399712e-05, + "loss": 0.228, + "step": 192050 + }, + { + "epoch": 155.27, + "learning_rate": 6.899981994958588e-05, + "loss": 0.1864, + "step": 192075 + }, + { + "epoch": 155.3, + "learning_rate": 6.894355419517465e-05, + "loss": 0.2503, + "step": 192100 + }, + { + "epoch": 155.32, + "learning_rate": 6.888728844076341e-05, + "loss": 0.2288, + "step": 192125 + }, + { + "epoch": 155.34, + "learning_rate": 6.883102268635218e-05, + "loss": 0.2405, + "step": 192150 + }, + { + "epoch": 155.36, + "learning_rate": 6.877475693194094e-05, + "loss": 0.226, + "step": 192175 + }, + { + "epoch": 155.38, + "learning_rate": 6.871849117752971e-05, + "loss": 0.2376, + "step": 192200 + }, + { + "epoch": 155.4, + "learning_rate": 6.866222542311847e-05, + "loss": 0.2325, + "step": 192225 + }, + { + "epoch": 155.42, + "learning_rate": 6.860595966870724e-05, + "loss": 0.2236, + "step": 192250 + }, + { + "epoch": 155.44, + "learning_rate": 6.854969391429602e-05, + "loss": 0.2091, + "step": 192275 + }, + { + "epoch": 155.46, + "learning_rate": 6.849342815988477e-05, + "loss": 0.2424, + "step": 192300 + }, + { + "epoch": 155.48, + "learning_rate": 6.843716240547355e-05, + "loss": 0.2122, + "step": 192325 + }, + { + "epoch": 155.5, + "learning_rate": 6.83808966510623e-05, + "loss": 0.2159, + "step": 192350 + }, + { + "epoch": 155.52, + "learning_rate": 6.832463089665106e-05, + "loss": 0.2481, + "step": 192375 + }, + { + "epoch": 155.54, + "learning_rate": 6.826836514223983e-05, + "loss": 0.2146, + "step": 192400 + }, + { + "epoch": 155.56, + "learning_rate": 6.821209938782859e-05, + "loss": 0.1996, + "step": 192425 + }, + { + "epoch": 155.58, + "learning_rate": 6.815583363341736e-05, + "loss": 0.2338, + "step": 192450 + }, + { + "epoch": 155.6, + "learning_rate": 6.809956787900612e-05, + "loss": 0.2209, + "step": 192475 + }, + { + "epoch": 155.62, + "learning_rate": 6.804330212459489e-05, + "loss": 0.242, + "step": 192500 + }, + { + "epoch": 155.64, + "learning_rate": 6.798703637018365e-05, + "loss": 0.2416, + "step": 192525 + }, + { + "epoch": 155.66, + "learning_rate": 6.793077061577242e-05, + "loss": 0.2224, + "step": 192550 + }, + { + "epoch": 155.68, + "learning_rate": 6.787450486136118e-05, + "loss": 0.2458, + "step": 192575 + }, + { + "epoch": 155.7, + "learning_rate": 6.781823910694996e-05, + "loss": 0.2218, + "step": 192600 + }, + { + "epoch": 155.72, + "learning_rate": 6.776197335253871e-05, + "loss": 0.2382, + "step": 192625 + }, + { + "epoch": 155.74, + "learning_rate": 6.770570759812749e-05, + "loss": 0.2254, + "step": 192650 + }, + { + "epoch": 155.76, + "learning_rate": 6.764944184371624e-05, + "loss": 0.2037, + "step": 192675 + }, + { + "epoch": 155.78, + "learning_rate": 6.7593176089305e-05, + "loss": 0.221, + "step": 192700 + }, + { + "epoch": 155.8, + "learning_rate": 6.753691033489377e-05, + "loss": 0.229, + "step": 192725 + }, + { + "epoch": 155.82, + "learning_rate": 6.748064458048253e-05, + "loss": 0.2352, + "step": 192750 + }, + { + "epoch": 155.84, + "learning_rate": 6.74243788260713e-05, + "loss": 0.2127, + "step": 192775 + }, + { + "epoch": 155.86, + "learning_rate": 6.736811307166006e-05, + "loss": 0.234, + "step": 192800 + }, + { + "epoch": 155.88, + "learning_rate": 6.731184731724883e-05, + "loss": 0.2289, + "step": 192825 + }, + { + "epoch": 155.9, + "learning_rate": 6.725558156283759e-05, + "loss": 0.2334, + "step": 192850 + }, + { + "epoch": 155.92, + "learning_rate": 6.719931580842637e-05, + "loss": 0.2458, + "step": 192875 + }, + { + "epoch": 155.94, + "learning_rate": 6.714305005401512e-05, + "loss": 0.2094, + "step": 192900 + }, + { + "epoch": 155.96, + "learning_rate": 6.70867842996039e-05, + "loss": 0.2045, + "step": 192925 + }, + { + "epoch": 155.98, + "learning_rate": 6.703051854519265e-05, + "loss": 0.2256, + "step": 192950 + }, + { + "epoch": 156.0, + "learning_rate": 6.697425279078143e-05, + "loss": 0.1937, + "step": 192975 + }, + { + "epoch": 156.02, + "learning_rate": 6.691798703637018e-05, + "loss": 0.2296, + "step": 193000 + }, + { + "epoch": 156.04, + "learning_rate": 6.686172128195896e-05, + "loss": 0.2489, + "step": 193025 + }, + { + "epoch": 156.06, + "learning_rate": 6.680545552754771e-05, + "loss": 0.2634, + "step": 193050 + }, + { + "epoch": 156.08, + "learning_rate": 6.674918977313648e-05, + "loss": 0.2301, + "step": 193075 + }, + { + "epoch": 156.1, + "learning_rate": 6.669292401872524e-05, + "loss": 0.194, + "step": 193100 + }, + { + "epoch": 156.12, + "learning_rate": 6.6636658264314e-05, + "loss": 0.2145, + "step": 193125 + }, + { + "epoch": 156.14, + "learning_rate": 6.658039250990277e-05, + "loss": 0.2503, + "step": 193150 + }, + { + "epoch": 156.16, + "learning_rate": 6.652412675549154e-05, + "loss": 0.2152, + "step": 193175 + }, + { + "epoch": 156.18, + "learning_rate": 6.646786100108031e-05, + "loss": 0.2306, + "step": 193200 + }, + { + "epoch": 156.2, + "learning_rate": 6.641159524666906e-05, + "loss": 0.22, + "step": 193225 + }, + { + "epoch": 156.22, + "learning_rate": 6.635532949225784e-05, + "loss": 0.2105, + "step": 193250 + }, + { + "epoch": 156.24, + "learning_rate": 6.62990637378466e-05, + "loss": 0.2004, + "step": 193275 + }, + { + "epoch": 156.27, + "learning_rate": 6.624279798343537e-05, + "loss": 0.2387, + "step": 193300 + }, + { + "epoch": 156.29, + "learning_rate": 6.618653222902412e-05, + "loss": 0.2132, + "step": 193325 + }, + { + "epoch": 156.31, + "learning_rate": 6.61302664746129e-05, + "loss": 0.2178, + "step": 193350 + }, + { + "epoch": 156.33, + "learning_rate": 6.607400072020165e-05, + "loss": 0.2301, + "step": 193375 + }, + { + "epoch": 156.35, + "learning_rate": 6.601773496579042e-05, + "loss": 0.2328, + "step": 193400 + }, + { + "epoch": 156.37, + "learning_rate": 6.596146921137918e-05, + "loss": 0.182, + "step": 193425 + }, + { + "epoch": 156.39, + "learning_rate": 6.590520345696795e-05, + "loss": 0.2293, + "step": 193450 + }, + { + "epoch": 156.41, + "learning_rate": 6.584893770255671e-05, + "loss": 0.2109, + "step": 193475 + }, + { + "epoch": 156.43, + "learning_rate": 6.579267194814548e-05, + "loss": 0.2151, + "step": 193500 + }, + { + "epoch": 156.45, + "learning_rate": 6.573640619373426e-05, + "loss": 0.2366, + "step": 193525 + }, + { + "epoch": 156.47, + "learning_rate": 6.568014043932301e-05, + "loss": 0.2333, + "step": 193550 + }, + { + "epoch": 156.49, + "learning_rate": 6.562387468491179e-05, + "loss": 0.2129, + "step": 193575 + }, + { + "epoch": 156.51, + "learning_rate": 6.556760893050054e-05, + "loss": 0.2277, + "step": 193600 + }, + { + "epoch": 156.53, + "learning_rate": 6.551134317608932e-05, + "loss": 0.1766, + "step": 193625 + }, + { + "epoch": 156.55, + "learning_rate": 6.545507742167807e-05, + "loss": 0.2129, + "step": 193650 + }, + { + "epoch": 156.57, + "learning_rate": 6.539881166726684e-05, + "loss": 0.2477, + "step": 193675 + }, + { + "epoch": 156.59, + "learning_rate": 6.53425459128556e-05, + "loss": 0.2421, + "step": 193700 + }, + { + "epoch": 156.61, + "learning_rate": 6.528628015844437e-05, + "loss": 0.1967, + "step": 193725 + }, + { + "epoch": 156.63, + "learning_rate": 6.523001440403313e-05, + "loss": 0.2341, + "step": 193750 + }, + { + "epoch": 156.65, + "learning_rate": 6.517374864962189e-05, + "loss": 0.1614, + "step": 193775 + }, + { + "epoch": 156.67, + "learning_rate": 6.511748289521066e-05, + "loss": 0.2197, + "step": 193800 + }, + { + "epoch": 156.69, + "learning_rate": 6.506121714079942e-05, + "loss": 0.2228, + "step": 193825 + }, + { + "epoch": 156.71, + "learning_rate": 6.50049513863882e-05, + "loss": 0.24, + "step": 193850 + }, + { + "epoch": 156.73, + "learning_rate": 6.494868563197695e-05, + "loss": 0.2053, + "step": 193875 + }, + { + "epoch": 156.75, + "learning_rate": 6.489241987756573e-05, + "loss": 0.235, + "step": 193900 + }, + { + "epoch": 156.77, + "learning_rate": 6.483615412315448e-05, + "loss": 0.1891, + "step": 193925 + }, + { + "epoch": 156.79, + "learning_rate": 6.477988836874326e-05, + "loss": 0.2285, + "step": 193950 + }, + { + "epoch": 156.81, + "learning_rate": 6.472362261433201e-05, + "loss": 0.2047, + "step": 193975 + }, + { + "epoch": 156.83, + "learning_rate": 6.466735685992079e-05, + "loss": 0.2422, + "step": 194000 + }, + { + "epoch": 156.85, + "learning_rate": 6.461109110550954e-05, + "loss": 0.2219, + "step": 194025 + }, + { + "epoch": 156.87, + "learning_rate": 6.455482535109832e-05, + "loss": 0.2377, + "step": 194050 + }, + { + "epoch": 156.89, + "learning_rate": 6.449855959668707e-05, + "loss": 0.2314, + "step": 194075 + }, + { + "epoch": 156.91, + "learning_rate": 6.444229384227585e-05, + "loss": 0.2444, + "step": 194100 + }, + { + "epoch": 156.93, + "learning_rate": 6.43860280878646e-05, + "loss": 0.1989, + "step": 194125 + }, + { + "epoch": 156.95, + "learning_rate": 6.432976233345336e-05, + "loss": 0.2266, + "step": 194150 + }, + { + "epoch": 156.97, + "learning_rate": 6.427349657904214e-05, + "loss": 0.2442, + "step": 194175 + }, + { + "epoch": 156.99, + "learning_rate": 6.421723082463089e-05, + "loss": 0.2409, + "step": 194200 + }, + { + "epoch": 157.01, + "learning_rate": 6.416096507021967e-05, + "loss": 0.2476, + "step": 194225 + }, + { + "epoch": 157.03, + "learning_rate": 6.410469931580842e-05, + "loss": 0.1957, + "step": 194250 + }, + { + "epoch": 157.05, + "learning_rate": 6.40484335613972e-05, + "loss": 0.221, + "step": 194275 + }, + { + "epoch": 157.07, + "learning_rate": 6.399216780698595e-05, + "loss": 0.2055, + "step": 194300 + }, + { + "epoch": 157.09, + "learning_rate": 6.393590205257473e-05, + "loss": 0.2165, + "step": 194325 + }, + { + "epoch": 157.11, + "learning_rate": 6.387963629816348e-05, + "loss": 0.1957, + "step": 194350 + }, + { + "epoch": 157.13, + "learning_rate": 6.382337054375226e-05, + "loss": 0.2212, + "step": 194375 + }, + { + "epoch": 157.15, + "learning_rate": 6.376710478934101e-05, + "loss": 0.2048, + "step": 194400 + }, + { + "epoch": 157.17, + "learning_rate": 6.371083903492979e-05, + "loss": 0.249, + "step": 194425 + }, + { + "epoch": 157.19, + "learning_rate": 6.365457328051854e-05, + "loss": 0.2055, + "step": 194450 + }, + { + "epoch": 157.22, + "learning_rate": 6.35983075261073e-05, + "loss": 0.231, + "step": 194475 + }, + { + "epoch": 157.24, + "learning_rate": 6.354204177169608e-05, + "loss": 0.211, + "step": 194500 + }, + { + "epoch": 157.26, + "learning_rate": 6.348577601728483e-05, + "loss": 0.2182, + "step": 194525 + }, + { + "epoch": 157.28, + "learning_rate": 6.342951026287361e-05, + "loss": 0.2143, + "step": 194550 + }, + { + "epoch": 157.3, + "learning_rate": 6.337324450846236e-05, + "loss": 0.212, + "step": 194575 + }, + { + "epoch": 157.32, + "learning_rate": 6.331697875405114e-05, + "loss": 0.2317, + "step": 194600 + }, + { + "epoch": 157.34, + "learning_rate": 6.32607129996399e-05, + "loss": 0.2148, + "step": 194625 + }, + { + "epoch": 157.36, + "learning_rate": 6.320444724522867e-05, + "loss": 0.2185, + "step": 194650 + }, + { + "epoch": 157.38, + "learning_rate": 6.314818149081742e-05, + "loss": 0.2312, + "step": 194675 + }, + { + "epoch": 157.4, + "learning_rate": 6.30919157364062e-05, + "loss": 0.2312, + "step": 194700 + }, + { + "epoch": 157.42, + "learning_rate": 6.303564998199495e-05, + "loss": 0.2471, + "step": 194725 + }, + { + "epoch": 157.44, + "learning_rate": 6.297938422758373e-05, + "loss": 0.2164, + "step": 194750 + }, + { + "epoch": 157.46, + "learning_rate": 6.292311847317248e-05, + "loss": 0.2311, + "step": 194775 + }, + { + "epoch": 157.48, + "learning_rate": 6.286685271876126e-05, + "loss": 0.2, + "step": 194800 + }, + { + "epoch": 157.5, + "learning_rate": 6.281058696435003e-05, + "loss": 0.2278, + "step": 194825 + }, + { + "epoch": 157.52, + "learning_rate": 6.275432120993878e-05, + "loss": 0.2307, + "step": 194850 + }, + { + "epoch": 157.54, + "learning_rate": 6.269805545552756e-05, + "loss": 0.2185, + "step": 194875 + }, + { + "epoch": 157.56, + "learning_rate": 6.26417897011163e-05, + "loss": 0.2261, + "step": 194900 + }, + { + "epoch": 157.58, + "learning_rate": 6.258552394670508e-05, + "loss": 0.2419, + "step": 194925 + }, + { + "epoch": 157.6, + "learning_rate": 6.252925819229384e-05, + "loss": 0.1713, + "step": 194950 + }, + { + "epoch": 157.62, + "learning_rate": 6.247299243788261e-05, + "loss": 0.2293, + "step": 194975 + }, + { + "epoch": 157.64, + "learning_rate": 6.241672668347137e-05, + "loss": 0.2102, + "step": 195000 + }, + { + "epoch": 157.64, + "eval_cer": 0.07536215516975864, + "eval_loss": 0.45333951711654663, + "eval_runtime": 150.7124, + "eval_samples_per_second": 27.821, + "eval_steps_per_second": 6.96, + "eval_wer": 0.32120717781402935, + "step": 195000 + }, + { + "epoch": 157.66, + "learning_rate": 6.236046092906013e-05, + "loss": 0.2039, + "step": 195025 + }, + { + "epoch": 157.68, + "learning_rate": 6.23041951746489e-05, + "loss": 0.1991, + "step": 195050 + }, + { + "epoch": 157.7, + "learning_rate": 6.224792942023766e-05, + "loss": 0.2326, + "step": 195075 + }, + { + "epoch": 157.72, + "learning_rate": 6.219166366582642e-05, + "loss": 0.2278, + "step": 195100 + }, + { + "epoch": 157.74, + "learning_rate": 6.21353979114152e-05, + "loss": 0.2313, + "step": 195125 + }, + { + "epoch": 157.76, + "learning_rate": 6.207913215700397e-05, + "loss": 0.2003, + "step": 195150 + }, + { + "epoch": 157.78, + "learning_rate": 6.202286640259273e-05, + "loss": 0.2438, + "step": 195175 + }, + { + "epoch": 157.8, + "learning_rate": 6.19666006481815e-05, + "loss": 0.203, + "step": 195200 + }, + { + "epoch": 157.82, + "learning_rate": 6.191033489377026e-05, + "loss": 0.2163, + "step": 195225 + }, + { + "epoch": 157.84, + "learning_rate": 6.185406913935903e-05, + "loss": 0.2048, + "step": 195250 + }, + { + "epoch": 157.86, + "learning_rate": 6.179780338494779e-05, + "loss": 0.2448, + "step": 195275 + }, + { + "epoch": 157.88, + "learning_rate": 6.174153763053656e-05, + "loss": 0.2062, + "step": 195300 + }, + { + "epoch": 157.9, + "learning_rate": 6.168527187612532e-05, + "loss": 0.2055, + "step": 195325 + }, + { + "epoch": 157.92, + "learning_rate": 6.162900612171409e-05, + "loss": 0.2309, + "step": 195350 + }, + { + "epoch": 157.94, + "learning_rate": 6.157274036730284e-05, + "loss": 0.2249, + "step": 195375 + }, + { + "epoch": 157.96, + "learning_rate": 6.15164746128916e-05, + "loss": 0.2243, + "step": 195400 + }, + { + "epoch": 157.98, + "learning_rate": 6.146020885848037e-05, + "loss": 0.2109, + "step": 195425 + }, + { + "epoch": 158.0, + "learning_rate": 6.140394310406915e-05, + "loss": 0.1838, + "step": 195450 + }, + { + "epoch": 158.02, + "learning_rate": 6.134767734965791e-05, + "loss": 0.2381, + "step": 195475 + }, + { + "epoch": 158.04, + "learning_rate": 6.129141159524668e-05, + "loss": 0.1997, + "step": 195500 + }, + { + "epoch": 158.06, + "learning_rate": 6.123514584083544e-05, + "loss": 0.2122, + "step": 195525 + }, + { + "epoch": 158.08, + "learning_rate": 6.11788800864242e-05, + "loss": 0.1902, + "step": 195550 + }, + { + "epoch": 158.1, + "learning_rate": 6.112261433201297e-05, + "loss": 0.2381, + "step": 195575 + }, + { + "epoch": 158.12, + "learning_rate": 6.106634857760173e-05, + "loss": 0.2255, + "step": 195600 + }, + { + "epoch": 158.14, + "learning_rate": 6.10100828231905e-05, + "loss": 0.1934, + "step": 195625 + }, + { + "epoch": 158.16, + "learning_rate": 6.0953817068779264e-05, + "loss": 0.212, + "step": 195650 + }, + { + "epoch": 158.19, + "learning_rate": 6.089755131436803e-05, + "loss": 0.2282, + "step": 195675 + }, + { + "epoch": 158.21, + "learning_rate": 6.0841285559956794e-05, + "loss": 0.2013, + "step": 195700 + }, + { + "epoch": 158.23, + "learning_rate": 6.078501980554555e-05, + "loss": 0.2444, + "step": 195725 + }, + { + "epoch": 158.25, + "learning_rate": 6.0728754051134316e-05, + "loss": 0.2717, + "step": 195750 + }, + { + "epoch": 158.27, + "learning_rate": 6.067248829672308e-05, + "loss": 0.2383, + "step": 195775 + }, + { + "epoch": 158.29, + "learning_rate": 6.0616222542311846e-05, + "loss": 0.174, + "step": 195800 + }, + { + "epoch": 158.31, + "learning_rate": 6.055995678790061e-05, + "loss": 0.2235, + "step": 195825 + }, + { + "epoch": 158.33, + "learning_rate": 6.0503691033489376e-05, + "loss": 0.1992, + "step": 195850 + }, + { + "epoch": 158.35, + "learning_rate": 6.044742527907814e-05, + "loss": 0.2396, + "step": 195875 + }, + { + "epoch": 158.37, + "learning_rate": 6.0391159524666905e-05, + "loss": 0.2072, + "step": 195900 + }, + { + "epoch": 158.39, + "learning_rate": 6.033489377025568e-05, + "loss": 0.2484, + "step": 195925 + }, + { + "epoch": 158.41, + "learning_rate": 6.027862801584444e-05, + "loss": 0.2344, + "step": 195950 + }, + { + "epoch": 158.43, + "learning_rate": 6.0222362261433206e-05, + "loss": 0.2205, + "step": 195975 + }, + { + "epoch": 158.45, + "learning_rate": 6.016609650702197e-05, + "loss": 0.2186, + "step": 196000 + }, + { + "epoch": 158.47, + "learning_rate": 6.0109830752610736e-05, + "loss": 0.1948, + "step": 196025 + }, + { + "epoch": 158.49, + "learning_rate": 6.00535649981995e-05, + "loss": 0.24, + "step": 196050 + }, + { + "epoch": 158.51, + "learning_rate": 5.999729924378826e-05, + "loss": 0.2104, + "step": 196075 + }, + { + "epoch": 158.53, + "learning_rate": 5.9941033489377024e-05, + "loss": 0.206, + "step": 196100 + }, + { + "epoch": 158.55, + "learning_rate": 5.988476773496579e-05, + "loss": 0.2317, + "step": 196125 + }, + { + "epoch": 158.57, + "learning_rate": 5.982850198055455e-05, + "loss": 0.2192, + "step": 196150 + }, + { + "epoch": 158.59, + "learning_rate": 5.9774486856319766e-05, + "loss": 0.1975, + "step": 196175 + }, + { + "epoch": 158.61, + "learning_rate": 5.971822110190853e-05, + "loss": 0.2098, + "step": 196200 + }, + { + "epoch": 158.63, + "learning_rate": 5.9661955347497295e-05, + "loss": 0.2464, + "step": 196225 + }, + { + "epoch": 158.65, + "learning_rate": 5.960568959308607e-05, + "loss": 0.2105, + "step": 196250 + }, + { + "epoch": 158.67, + "learning_rate": 5.954942383867483e-05, + "loss": 0.2118, + "step": 196275 + }, + { + "epoch": 158.69, + "learning_rate": 5.9493158084263597e-05, + "loss": 0.2251, + "step": 196300 + }, + { + "epoch": 158.71, + "learning_rate": 5.943689232985236e-05, + "loss": 0.2299, + "step": 196325 + }, + { + "epoch": 158.73, + "learning_rate": 5.9380626575441126e-05, + "loss": 0.2053, + "step": 196350 + }, + { + "epoch": 158.75, + "learning_rate": 5.932436082102989e-05, + "loss": 0.259, + "step": 196375 + }, + { + "epoch": 158.77, + "learning_rate": 5.9268095066618656e-05, + "loss": 0.2073, + "step": 196400 + }, + { + "epoch": 158.79, + "learning_rate": 5.921182931220742e-05, + "loss": 0.1926, + "step": 196425 + }, + { + "epoch": 158.81, + "learning_rate": 5.9155563557796185e-05, + "loss": 0.1656, + "step": 196450 + }, + { + "epoch": 158.83, + "learning_rate": 5.909929780338495e-05, + "loss": 0.2462, + "step": 196475 + }, + { + "epoch": 158.85, + "learning_rate": 5.904303204897371e-05, + "loss": 0.2064, + "step": 196500 + }, + { + "epoch": 158.87, + "learning_rate": 5.898676629456247e-05, + "loss": 0.2116, + "step": 196525 + }, + { + "epoch": 158.89, + "learning_rate": 5.8930500540151245e-05, + "loss": 0.1963, + "step": 196550 + }, + { + "epoch": 158.91, + "learning_rate": 5.887423478574001e-05, + "loss": 0.2498, + "step": 196575 + }, + { + "epoch": 158.93, + "learning_rate": 5.8817969031328774e-05, + "loss": 0.2001, + "step": 196600 + }, + { + "epoch": 158.95, + "learning_rate": 5.876170327691754e-05, + "loss": 0.2215, + "step": 196625 + }, + { + "epoch": 158.97, + "learning_rate": 5.8705437522506304e-05, + "loss": 0.2016, + "step": 196650 + }, + { + "epoch": 158.99, + "learning_rate": 5.864917176809507e-05, + "loss": 0.2508, + "step": 196675 + }, + { + "epoch": 159.01, + "learning_rate": 5.859290601368383e-05, + "loss": 0.2308, + "step": 196700 + }, + { + "epoch": 159.03, + "learning_rate": 5.85366402592726e-05, + "loss": 0.1911, + "step": 196725 + }, + { + "epoch": 159.05, + "learning_rate": 5.848037450486136e-05, + "loss": 0.2246, + "step": 196750 + }, + { + "epoch": 159.07, + "learning_rate": 5.8426359380626575e-05, + "loss": 0.2202, + "step": 196775 + }, + { + "epoch": 159.09, + "learning_rate": 5.837009362621534e-05, + "loss": 0.2251, + "step": 196800 + }, + { + "epoch": 159.11, + "learning_rate": 5.8313827871804105e-05, + "loss": 0.1669, + "step": 196825 + }, + { + "epoch": 159.14, + "learning_rate": 5.825756211739287e-05, + "loss": 0.2453, + "step": 196850 + }, + { + "epoch": 159.16, + "learning_rate": 5.820129636298164e-05, + "loss": 0.195, + "step": 196875 + }, + { + "epoch": 159.18, + "learning_rate": 5.8145030608570406e-05, + "loss": 0.2235, + "step": 196900 + }, + { + "epoch": 159.2, + "learning_rate": 5.8088764854159164e-05, + "loss": 0.2228, + "step": 196925 + }, + { + "epoch": 159.22, + "learning_rate": 5.803249909974793e-05, + "loss": 0.2062, + "step": 196950 + }, + { + "epoch": 159.24, + "learning_rate": 5.7976233345336694e-05, + "loss": 0.2005, + "step": 196975 + }, + { + "epoch": 159.26, + "learning_rate": 5.791996759092546e-05, + "loss": 0.2018, + "step": 197000 + }, + { + "epoch": 159.28, + "learning_rate": 5.7863701836514223e-05, + "loss": 0.2171, + "step": 197025 + }, + { + "epoch": 159.3, + "learning_rate": 5.780743608210299e-05, + "loss": 0.2398, + "step": 197050 + }, + { + "epoch": 159.32, + "learning_rate": 5.775117032769175e-05, + "loss": 0.1838, + "step": 197075 + }, + { + "epoch": 159.34, + "learning_rate": 5.769490457328052e-05, + "loss": 0.2108, + "step": 197100 + }, + { + "epoch": 159.36, + "learning_rate": 5.763863881886928e-05, + "loss": 0.2035, + "step": 197125 + }, + { + "epoch": 159.38, + "learning_rate": 5.758237306445805e-05, + "loss": 0.2166, + "step": 197150 + }, + { + "epoch": 159.4, + "learning_rate": 5.752610731004682e-05, + "loss": 0.2265, + "step": 197175 + }, + { + "epoch": 159.42, + "learning_rate": 5.7469841555635584e-05, + "loss": 0.2085, + "step": 197200 + }, + { + "epoch": 159.44, + "learning_rate": 5.741357580122435e-05, + "loss": 0.2277, + "step": 197225 + }, + { + "epoch": 159.46, + "learning_rate": 5.7357310046813113e-05, + "loss": 0.2095, + "step": 197250 + }, + { + "epoch": 159.48, + "learning_rate": 5.730104429240188e-05, + "loss": 0.2066, + "step": 197275 + }, + { + "epoch": 159.5, + "learning_rate": 5.7244778537990636e-05, + "loss": 0.2441, + "step": 197300 + }, + { + "epoch": 159.52, + "learning_rate": 5.71885127835794e-05, + "loss": 0.1938, + "step": 197325 + }, + { + "epoch": 159.54, + "learning_rate": 5.7132247029168166e-05, + "loss": 0.2241, + "step": 197350 + }, + { + "epoch": 159.56, + "learning_rate": 5.707598127475693e-05, + "loss": 0.2147, + "step": 197375 + }, + { + "epoch": 159.58, + "learning_rate": 5.7019715520345695e-05, + "loss": 0.2061, + "step": 197400 + }, + { + "epoch": 159.6, + "learning_rate": 5.696344976593446e-05, + "loss": 0.2328, + "step": 197425 + }, + { + "epoch": 159.62, + "learning_rate": 5.6907184011523225e-05, + "loss": 0.2262, + "step": 197450 + }, + { + "epoch": 159.64, + "learning_rate": 5.685091825711199e-05, + "loss": 0.2212, + "step": 197475 + }, + { + "epoch": 159.66, + "learning_rate": 5.679465250270076e-05, + "loss": 0.2308, + "step": 197500 + }, + { + "epoch": 159.68, + "learning_rate": 5.6738386748289526e-05, + "loss": 0.2058, + "step": 197525 + }, + { + "epoch": 159.7, + "learning_rate": 5.668212099387829e-05, + "loss": 0.2286, + "step": 197550 + }, + { + "epoch": 159.72, + "learning_rate": 5.6625855239467056e-05, + "loss": 0.2089, + "step": 197575 + }, + { + "epoch": 159.74, + "learning_rate": 5.656958948505582e-05, + "loss": 0.2438, + "step": 197600 + }, + { + "epoch": 159.76, + "learning_rate": 5.6513323730644585e-05, + "loss": 0.2046, + "step": 197625 + }, + { + "epoch": 159.78, + "learning_rate": 5.6457057976233343e-05, + "loss": 0.2079, + "step": 197650 + }, + { + "epoch": 159.8, + "learning_rate": 5.640079222182211e-05, + "loss": 0.1749, + "step": 197675 + }, + { + "epoch": 159.82, + "learning_rate": 5.634452646741087e-05, + "loss": 0.2364, + "step": 197700 + }, + { + "epoch": 159.84, + "learning_rate": 5.628826071299964e-05, + "loss": 0.1952, + "step": 197725 + }, + { + "epoch": 159.86, + "learning_rate": 5.62319949585884e-05, + "loss": 0.2134, + "step": 197750 + }, + { + "epoch": 159.88, + "learning_rate": 5.617572920417717e-05, + "loss": 0.1913, + "step": 197775 + }, + { + "epoch": 159.9, + "learning_rate": 5.611946344976593e-05, + "loss": 0.2211, + "step": 197800 + }, + { + "epoch": 159.92, + "learning_rate": 5.6063197695354704e-05, + "loss": 0.1965, + "step": 197825 + }, + { + "epoch": 159.94, + "learning_rate": 5.600693194094347e-05, + "loss": 0.2465, + "step": 197850 + }, + { + "epoch": 159.96, + "learning_rate": 5.5950666186532233e-05, + "loss": 0.243, + "step": 197875 + }, + { + "epoch": 159.98, + "learning_rate": 5.5894400432121e-05, + "loss": 0.2337, + "step": 197900 + }, + { + "epoch": 160.0, + "learning_rate": 5.583813467770976e-05, + "loss": 0.1881, + "step": 197925 + }, + { + "epoch": 160.02, + "learning_rate": 5.578186892329853e-05, + "loss": 0.2028, + "step": 197950 + }, + { + "epoch": 160.04, + "learning_rate": 5.572560316888729e-05, + "loss": 0.2267, + "step": 197975 + }, + { + "epoch": 160.06, + "learning_rate": 5.566933741447605e-05, + "loss": 0.2231, + "step": 198000 + }, + { + "epoch": 160.06, + "eval_cer": 0.07449462542221492, + "eval_loss": 0.45625007152557373, + "eval_runtime": 150.0374, + "eval_samples_per_second": 27.946, + "eval_steps_per_second": 6.992, + "eval_wer": 0.31830342577487764, + "step": 198000 + }, + { + "epoch": 160.08, + "learning_rate": 5.5613071660064815e-05, + "loss": 0.2143, + "step": 198025 + }, + { + "epoch": 160.11, + "learning_rate": 5.555680590565358e-05, + "loss": 0.2117, + "step": 198050 + }, + { + "epoch": 160.13, + "learning_rate": 5.5500540151242345e-05, + "loss": 0.2071, + "step": 198075 + }, + { + "epoch": 160.15, + "learning_rate": 5.544427439683111e-05, + "loss": 0.219, + "step": 198100 + }, + { + "epoch": 160.17, + "learning_rate": 5.5388008642419875e-05, + "loss": 0.1927, + "step": 198125 + }, + { + "epoch": 160.19, + "learning_rate": 5.5331742888008646e-05, + "loss": 0.2291, + "step": 198150 + }, + { + "epoch": 160.21, + "learning_rate": 5.527547713359741e-05, + "loss": 0.2125, + "step": 198175 + }, + { + "epoch": 160.23, + "learning_rate": 5.5219211379186176e-05, + "loss": 0.2172, + "step": 198200 + }, + { + "epoch": 160.25, + "learning_rate": 5.516294562477494e-05, + "loss": 0.2213, + "step": 198225 + }, + { + "epoch": 160.27, + "learning_rate": 5.5106679870363705e-05, + "loss": 0.2123, + "step": 198250 + }, + { + "epoch": 160.29, + "learning_rate": 5.505041411595247e-05, + "loss": 0.1807, + "step": 198275 + }, + { + "epoch": 160.31, + "learning_rate": 5.4994148361541235e-05, + "loss": 0.2112, + "step": 198300 + }, + { + "epoch": 160.33, + "learning_rate": 5.493788260713e-05, + "loss": 0.2075, + "step": 198325 + }, + { + "epoch": 160.35, + "learning_rate": 5.488161685271876e-05, + "loss": 0.2219, + "step": 198350 + }, + { + "epoch": 160.37, + "learning_rate": 5.482535109830752e-05, + "loss": 0.2084, + "step": 198375 + }, + { + "epoch": 160.39, + "learning_rate": 5.476908534389629e-05, + "loss": 0.2309, + "step": 198400 + }, + { + "epoch": 160.41, + "learning_rate": 5.471281958948505e-05, + "loss": 0.203, + "step": 198425 + }, + { + "epoch": 160.43, + "learning_rate": 5.465655383507382e-05, + "loss": 0.2272, + "step": 198450 + }, + { + "epoch": 160.45, + "learning_rate": 5.460028808066259e-05, + "loss": 0.1892, + "step": 198475 + }, + { + "epoch": 160.47, + "learning_rate": 5.4544022326251353e-05, + "loss": 0.2235, + "step": 198500 + }, + { + "epoch": 160.49, + "learning_rate": 5.448775657184012e-05, + "loss": 0.202, + "step": 198525 + }, + { + "epoch": 160.51, + "learning_rate": 5.443149081742888e-05, + "loss": 0.2377, + "step": 198550 + }, + { + "epoch": 160.53, + "learning_rate": 5.437522506301765e-05, + "loss": 0.1722, + "step": 198575 + }, + { + "epoch": 160.55, + "learning_rate": 5.431895930860641e-05, + "loss": 0.2065, + "step": 198600 + }, + { + "epoch": 160.57, + "learning_rate": 5.426269355419518e-05, + "loss": 0.1852, + "step": 198625 + }, + { + "epoch": 160.59, + "learning_rate": 5.420642779978394e-05, + "loss": 0.2182, + "step": 198650 + }, + { + "epoch": 160.61, + "learning_rate": 5.415016204537271e-05, + "loss": 0.2017, + "step": 198675 + }, + { + "epoch": 160.63, + "learning_rate": 5.409389629096147e-05, + "loss": 0.2293, + "step": 198700 + }, + { + "epoch": 160.65, + "learning_rate": 5.403763053655023e-05, + "loss": 0.2215, + "step": 198725 + }, + { + "epoch": 160.67, + "learning_rate": 5.3981364782138995e-05, + "loss": 0.2229, + "step": 198750 + }, + { + "epoch": 160.69, + "learning_rate": 5.3925099027727766e-05, + "loss": 0.2306, + "step": 198775 + }, + { + "epoch": 160.71, + "learning_rate": 5.386883327331653e-05, + "loss": 0.2306, + "step": 198800 + }, + { + "epoch": 160.73, + "learning_rate": 5.3812567518905296e-05, + "loss": 0.2359, + "step": 198825 + }, + { + "epoch": 160.75, + "learning_rate": 5.375630176449406e-05, + "loss": 0.2417, + "step": 198850 + }, + { + "epoch": 160.77, + "learning_rate": 5.3700036010082825e-05, + "loss": 0.2112, + "step": 198875 + }, + { + "epoch": 160.79, + "learning_rate": 5.364377025567159e-05, + "loss": 0.2106, + "step": 198900 + }, + { + "epoch": 160.81, + "learning_rate": 5.3587504501260355e-05, + "loss": 0.1836, + "step": 198925 + }, + { + "epoch": 160.83, + "learning_rate": 5.353123874684912e-05, + "loss": 0.2248, + "step": 198950 + }, + { + "epoch": 160.85, + "learning_rate": 5.3474972992437885e-05, + "loss": 0.2018, + "step": 198975 + }, + { + "epoch": 160.87, + "learning_rate": 5.341870723802665e-05, + "loss": 0.239, + "step": 199000 + }, + { + "epoch": 160.89, + "learning_rate": 5.3362441483615414e-05, + "loss": 0.2044, + "step": 199025 + }, + { + "epoch": 160.91, + "learning_rate": 5.330617572920418e-05, + "loss": 0.2236, + "step": 199050 + }, + { + "epoch": 160.93, + "learning_rate": 5.324990997479294e-05, + "loss": 0.2218, + "step": 199075 + }, + { + "epoch": 160.95, + "learning_rate": 5.319364422038171e-05, + "loss": 0.2156, + "step": 199100 + }, + { + "epoch": 160.97, + "learning_rate": 5.3137378465970473e-05, + "loss": 0.2013, + "step": 199125 + }, + { + "epoch": 160.99, + "learning_rate": 5.308111271155924e-05, + "loss": 0.2044, + "step": 199150 + }, + { + "epoch": 161.01, + "learning_rate": 5.3024846957148e-05, + "loss": 0.218, + "step": 199175 + }, + { + "epoch": 161.03, + "learning_rate": 5.296858120273677e-05, + "loss": 0.1846, + "step": 199200 + }, + { + "epoch": 161.05, + "learning_rate": 5.291231544832553e-05, + "loss": 0.2346, + "step": 199225 + }, + { + "epoch": 161.08, + "learning_rate": 5.28560496939143e-05, + "loss": 0.2067, + "step": 199250 + }, + { + "epoch": 161.1, + "learning_rate": 5.279978393950306e-05, + "loss": 0.2165, + "step": 199275 + }, + { + "epoch": 161.12, + "learning_rate": 5.274351818509183e-05, + "loss": 0.2015, + "step": 199300 + }, + { + "epoch": 161.14, + "learning_rate": 5.268725243068059e-05, + "loss": 0.2392, + "step": 199325 + }, + { + "epoch": 161.16, + "learning_rate": 5.2630986676269357e-05, + "loss": 0.2152, + "step": 199350 + }, + { + "epoch": 161.18, + "learning_rate": 5.257472092185812e-05, + "loss": 0.2017, + "step": 199375 + }, + { + "epoch": 161.2, + "learning_rate": 5.2518455167446886e-05, + "loss": 0.2026, + "step": 199400 + }, + { + "epoch": 161.22, + "learning_rate": 5.246218941303565e-05, + "loss": 0.2313, + "step": 199425 + }, + { + "epoch": 161.24, + "learning_rate": 5.2405923658624416e-05, + "loss": 0.2153, + "step": 199450 + }, + { + "epoch": 161.26, + "learning_rate": 5.234965790421318e-05, + "loss": 0.1926, + "step": 199475 + }, + { + "epoch": 161.28, + "learning_rate": 5.2293392149801945e-05, + "loss": 0.1938, + "step": 199500 + }, + { + "epoch": 161.3, + "learning_rate": 5.223712639539071e-05, + "loss": 0.1948, + "step": 199525 + }, + { + "epoch": 161.32, + "learning_rate": 5.2180860640979475e-05, + "loss": 0.2009, + "step": 199550 + }, + { + "epoch": 161.34, + "learning_rate": 5.212459488656824e-05, + "loss": 0.2141, + "step": 199575 + }, + { + "epoch": 161.36, + "learning_rate": 5.2068329132157005e-05, + "loss": 0.1755, + "step": 199600 + }, + { + "epoch": 161.38, + "learning_rate": 5.201206337774577e-05, + "loss": 0.2034, + "step": 199625 + }, + { + "epoch": 161.4, + "learning_rate": 5.1955797623334534e-05, + "loss": 0.2053, + "step": 199650 + }, + { + "epoch": 161.42, + "learning_rate": 5.18995318689233e-05, + "loss": 0.2017, + "step": 199675 + }, + { + "epoch": 161.44, + "learning_rate": 5.1843266114512064e-05, + "loss": 0.1859, + "step": 199700 + }, + { + "epoch": 161.46, + "learning_rate": 5.178700036010083e-05, + "loss": 0.195, + "step": 199725 + }, + { + "epoch": 161.48, + "learning_rate": 5.17307346056896e-05, + "loss": 0.1947, + "step": 199750 + }, + { + "epoch": 161.5, + "learning_rate": 5.167446885127836e-05, + "loss": 0.2052, + "step": 199775 + }, + { + "epoch": 161.52, + "learning_rate": 5.161820309686712e-05, + "loss": 0.1932, + "step": 199800 + }, + { + "epoch": 161.54, + "learning_rate": 5.156193734245589e-05, + "loss": 0.2126, + "step": 199825 + }, + { + "epoch": 161.56, + "learning_rate": 5.150567158804465e-05, + "loss": 0.2163, + "step": 199850 + }, + { + "epoch": 161.58, + "learning_rate": 5.144940583363342e-05, + "loss": 0.2018, + "step": 199875 + }, + { + "epoch": 161.6, + "learning_rate": 5.139314007922218e-05, + "loss": 0.2023, + "step": 199900 + }, + { + "epoch": 161.62, + "learning_rate": 5.133687432481095e-05, + "loss": 0.2208, + "step": 199925 + }, + { + "epoch": 161.64, + "learning_rate": 5.128060857039971e-05, + "loss": 0.2094, + "step": 199950 + }, + { + "epoch": 161.66, + "learning_rate": 5.1224342815988477e-05, + "loss": 0.2119, + "step": 199975 + }, + { + "epoch": 161.68, + "learning_rate": 5.116807706157724e-05, + "loss": 0.1994, + "step": 200000 + }, + { + "epoch": 161.7, + "learning_rate": 5.1111811307166006e-05, + "loss": 0.2172, + "step": 200025 + }, + { + "epoch": 161.72, + "learning_rate": 5.105554555275478e-05, + "loss": 0.1885, + "step": 200050 + }, + { + "epoch": 161.74, + "learning_rate": 5.099927979834354e-05, + "loss": 0.2093, + "step": 200075 + }, + { + "epoch": 161.76, + "learning_rate": 5.094301404393231e-05, + "loss": 0.197, + "step": 200100 + }, + { + "epoch": 161.78, + "learning_rate": 5.088674828952107e-05, + "loss": 0.2085, + "step": 200125 + }, + { + "epoch": 161.8, + "learning_rate": 5.083048253510983e-05, + "loss": 0.2121, + "step": 200150 + }, + { + "epoch": 161.82, + "learning_rate": 5.0774216780698595e-05, + "loss": 0.2206, + "step": 200175 + }, + { + "epoch": 161.84, + "learning_rate": 5.071795102628736e-05, + "loss": 0.1871, + "step": 200200 + }, + { + "epoch": 161.86, + "learning_rate": 5.0661685271876125e-05, + "loss": 0.2268, + "step": 200225 + }, + { + "epoch": 161.88, + "learning_rate": 5.060541951746489e-05, + "loss": 0.2047, + "step": 200250 + }, + { + "epoch": 161.9, + "learning_rate": 5.0549153763053654e-05, + "loss": 0.2072, + "step": 200275 + }, + { + "epoch": 161.92, + "learning_rate": 5.049288800864242e-05, + "loss": 0.2092, + "step": 200300 + }, + { + "epoch": 161.94, + "learning_rate": 5.0436622254231184e-05, + "loss": 0.2105, + "step": 200325 + }, + { + "epoch": 161.96, + "learning_rate": 5.038035649981995e-05, + "loss": 0.1982, + "step": 200350 + }, + { + "epoch": 161.98, + "learning_rate": 5.032409074540872e-05, + "loss": 0.2074, + "step": 200375 + }, + { + "epoch": 162.0, + "learning_rate": 5.0267824990997485e-05, + "loss": 0.2017, + "step": 200400 + }, + { + "epoch": 162.03, + "learning_rate": 5.021155923658625e-05, + "loss": 0.2278, + "step": 200425 + }, + { + "epoch": 162.05, + "learning_rate": 5.0155293482175015e-05, + "loss": 0.1947, + "step": 200450 + }, + { + "epoch": 162.07, + "learning_rate": 5.009902772776378e-05, + "loss": 0.2217, + "step": 200475 + }, + { + "epoch": 162.09, + "learning_rate": 5.004276197335254e-05, + "loss": 0.1645, + "step": 200500 + }, + { + "epoch": 162.11, + "learning_rate": 4.99864962189413e-05, + "loss": 0.2206, + "step": 200525 + }, + { + "epoch": 162.13, + "learning_rate": 4.993023046453007e-05, + "loss": 0.1874, + "step": 200550 + }, + { + "epoch": 162.15, + "learning_rate": 4.987396471011883e-05, + "loss": 0.1963, + "step": 200575 + }, + { + "epoch": 162.17, + "learning_rate": 4.9817698955707597e-05, + "loss": 0.1973, + "step": 200600 + }, + { + "epoch": 162.19, + "learning_rate": 4.976143320129636e-05, + "loss": 0.211, + "step": 200625 + }, + { + "epoch": 162.21, + "learning_rate": 4.9705167446885126e-05, + "loss": 0.1913, + "step": 200650 + }, + { + "epoch": 162.23, + "learning_rate": 4.964890169247389e-05, + "loss": 0.1771, + "step": 200675 + }, + { + "epoch": 162.25, + "learning_rate": 4.959263593806266e-05, + "loss": 0.1889, + "step": 200700 + }, + { + "epoch": 162.27, + "learning_rate": 4.953637018365143e-05, + "loss": 0.1948, + "step": 200725 + }, + { + "epoch": 162.29, + "learning_rate": 4.948010442924019e-05, + "loss": 0.1882, + "step": 200750 + }, + { + "epoch": 162.31, + "learning_rate": 4.942383867482896e-05, + "loss": 0.2305, + "step": 200775 + }, + { + "epoch": 162.33, + "learning_rate": 4.936757292041772e-05, + "loss": 0.2434, + "step": 200800 + }, + { + "epoch": 162.35, + "learning_rate": 4.9311307166006487e-05, + "loss": 0.2083, + "step": 200825 + }, + { + "epoch": 162.37, + "learning_rate": 4.9255041411595245e-05, + "loss": 0.2171, + "step": 200850 + }, + { + "epoch": 162.39, + "learning_rate": 4.919877565718401e-05, + "loss": 0.2204, + "step": 200875 + }, + { + "epoch": 162.41, + "learning_rate": 4.914476053294923e-05, + "loss": 0.2159, + "step": 200900 + }, + { + "epoch": 162.43, + "learning_rate": 4.908849477853799e-05, + "loss": 0.2106, + "step": 200925 + }, + { + "epoch": 162.45, + "learning_rate": 4.903222902412675e-05, + "loss": 0.2034, + "step": 200950 + }, + { + "epoch": 162.47, + "learning_rate": 4.8975963269715516e-05, + "loss": 0.2063, + "step": 200975 + }, + { + "epoch": 162.49, + "learning_rate": 4.891969751530428e-05, + "loss": 0.2096, + "step": 201000 + }, + { + "epoch": 162.49, + "eval_cer": 0.07474615771588144, + "eval_loss": 0.46688565611839294, + "eval_runtime": 150.852, + "eval_samples_per_second": 27.795, + "eval_steps_per_second": 6.954, + "eval_wer": 0.31830342577487764, + "step": 201000 + }, + { + "epoch": 162.51, + "learning_rate": 4.886343176089305e-05, + "loss": 0.2181, + "step": 201025 + }, + { + "epoch": 162.53, + "learning_rate": 4.880716600648182e-05, + "loss": 0.222, + "step": 201050 + }, + { + "epoch": 162.55, + "learning_rate": 4.875090025207058e-05, + "loss": 0.2604, + "step": 201075 + }, + { + "epoch": 162.57, + "learning_rate": 4.869463449765935e-05, + "loss": 0.1897, + "step": 201100 + }, + { + "epoch": 162.59, + "learning_rate": 4.863836874324811e-05, + "loss": 0.2158, + "step": 201125 + }, + { + "epoch": 162.61, + "learning_rate": 4.858210298883688e-05, + "loss": 0.1764, + "step": 201150 + }, + { + "epoch": 162.63, + "learning_rate": 4.852583723442564e-05, + "loss": 0.2127, + "step": 201175 + }, + { + "epoch": 162.65, + "learning_rate": 4.8469571480014406e-05, + "loss": 0.2119, + "step": 201200 + }, + { + "epoch": 162.67, + "learning_rate": 4.841330572560317e-05, + "loss": 0.2366, + "step": 201225 + }, + { + "epoch": 162.69, + "learning_rate": 4.8357039971191936e-05, + "loss": 0.1995, + "step": 201250 + }, + { + "epoch": 162.71, + "learning_rate": 4.8300774216780694e-05, + "loss": 0.2321, + "step": 201275 + }, + { + "epoch": 162.73, + "learning_rate": 4.824450846236946e-05, + "loss": 0.2315, + "step": 201300 + }, + { + "epoch": 162.75, + "learning_rate": 4.818824270795823e-05, + "loss": 0.2366, + "step": 201325 + }, + { + "epoch": 162.77, + "learning_rate": 4.8131976953546995e-05, + "loss": 0.1815, + "step": 201350 + }, + { + "epoch": 162.79, + "learning_rate": 4.807571119913576e-05, + "loss": 0.2202, + "step": 201375 + }, + { + "epoch": 162.81, + "learning_rate": 4.8019445444724525e-05, + "loss": 0.1994, + "step": 201400 + }, + { + "epoch": 162.83, + "learning_rate": 4.796317969031329e-05, + "loss": 0.2294, + "step": 201425 + }, + { + "epoch": 162.85, + "learning_rate": 4.7906913935902054e-05, + "loss": 0.2178, + "step": 201450 + }, + { + "epoch": 162.87, + "learning_rate": 4.785064818149082e-05, + "loss": 0.2219, + "step": 201475 + }, + { + "epoch": 162.89, + "learning_rate": 4.7794382427079584e-05, + "loss": 0.2385, + "step": 201500 + }, + { + "epoch": 162.91, + "learning_rate": 4.773811667266835e-05, + "loss": 0.2135, + "step": 201525 + }, + { + "epoch": 162.93, + "learning_rate": 4.7681850918257113e-05, + "loss": 0.1894, + "step": 201550 + }, + { + "epoch": 162.95, + "learning_rate": 4.762558516384588e-05, + "loss": 0.2315, + "step": 201575 + }, + { + "epoch": 162.97, + "learning_rate": 4.756931940943464e-05, + "loss": 0.2276, + "step": 201600 + }, + { + "epoch": 163.0, + "learning_rate": 4.75130536550234e-05, + "loss": 0.2329, + "step": 201625 + }, + { + "epoch": 163.02, + "learning_rate": 4.745678790061217e-05, + "loss": 0.2242, + "step": 201650 + }, + { + "epoch": 163.04, + "learning_rate": 4.740052214620094e-05, + "loss": 0.1868, + "step": 201675 + }, + { + "epoch": 163.06, + "learning_rate": 4.73442563917897e-05, + "loss": 0.2309, + "step": 201700 + }, + { + "epoch": 163.08, + "learning_rate": 4.728799063737847e-05, + "loss": 0.1948, + "step": 201725 + }, + { + "epoch": 163.1, + "learning_rate": 4.723172488296723e-05, + "loss": 0.2059, + "step": 201750 + }, + { + "epoch": 163.12, + "learning_rate": 4.7175459128556e-05, + "loss": 0.1922, + "step": 201775 + }, + { + "epoch": 163.14, + "learning_rate": 4.711919337414476e-05, + "loss": 0.216, + "step": 201800 + }, + { + "epoch": 163.16, + "learning_rate": 4.7062927619733526e-05, + "loss": 0.1945, + "step": 201825 + }, + { + "epoch": 163.18, + "learning_rate": 4.700666186532229e-05, + "loss": 0.2139, + "step": 201850 + }, + { + "epoch": 163.2, + "learning_rate": 4.6950396110911056e-05, + "loss": 0.2057, + "step": 201875 + }, + { + "epoch": 163.22, + "learning_rate": 4.689413035649982e-05, + "loss": 0.2023, + "step": 201900 + }, + { + "epoch": 163.24, + "learning_rate": 4.6837864602088585e-05, + "loss": 0.181, + "step": 201925 + }, + { + "epoch": 163.26, + "learning_rate": 4.678159884767735e-05, + "loss": 0.1965, + "step": 201950 + }, + { + "epoch": 163.28, + "learning_rate": 4.672533309326612e-05, + "loss": 0.1885, + "step": 201975 + }, + { + "epoch": 163.3, + "learning_rate": 4.666906733885488e-05, + "loss": 0.2403, + "step": 202000 + }, + { + "epoch": 163.32, + "learning_rate": 4.6612801584443645e-05, + "loss": 0.2078, + "step": 202025 + }, + { + "epoch": 163.34, + "learning_rate": 4.655653583003241e-05, + "loss": 0.2031, + "step": 202050 + }, + { + "epoch": 163.36, + "learning_rate": 4.6500270075621174e-05, + "loss": 0.21, + "step": 202075 + }, + { + "epoch": 163.38, + "learning_rate": 4.644400432120994e-05, + "loss": 0.2163, + "step": 202100 + }, + { + "epoch": 163.4, + "learning_rate": 4.6387738566798704e-05, + "loss": 0.1928, + "step": 202125 + }, + { + "epoch": 163.42, + "learning_rate": 4.633147281238747e-05, + "loss": 0.2349, + "step": 202150 + }, + { + "epoch": 163.44, + "learning_rate": 4.6275207057976233e-05, + "loss": 0.2285, + "step": 202175 + }, + { + "epoch": 163.46, + "learning_rate": 4.6218941303565e-05, + "loss": 0.2194, + "step": 202200 + }, + { + "epoch": 163.48, + "learning_rate": 4.616267554915376e-05, + "loss": 0.2165, + "step": 202225 + }, + { + "epoch": 163.5, + "learning_rate": 4.610640979474253e-05, + "loss": 0.2098, + "step": 202250 + }, + { + "epoch": 163.52, + "learning_rate": 4.605014404033129e-05, + "loss": 0.1859, + "step": 202275 + }, + { + "epoch": 163.54, + "learning_rate": 4.5993878285920064e-05, + "loss": 0.2116, + "step": 202300 + }, + { + "epoch": 163.56, + "learning_rate": 4.593761253150883e-05, + "loss": 0.2373, + "step": 202325 + }, + { + "epoch": 163.58, + "learning_rate": 4.588134677709759e-05, + "loss": 0.2213, + "step": 202350 + }, + { + "epoch": 163.6, + "learning_rate": 4.582508102268635e-05, + "loss": 0.2096, + "step": 202375 + }, + { + "epoch": 163.62, + "learning_rate": 4.576881526827512e-05, + "loss": 0.2153, + "step": 202400 + }, + { + "epoch": 163.64, + "learning_rate": 4.571254951386388e-05, + "loss": 0.2167, + "step": 202425 + }, + { + "epoch": 163.66, + "learning_rate": 4.5656283759452646e-05, + "loss": 0.2291, + "step": 202450 + }, + { + "epoch": 163.68, + "learning_rate": 4.560226863521786e-05, + "loss": 0.2253, + "step": 202475 + }, + { + "epoch": 163.7, + "learning_rate": 4.5546002880806624e-05, + "loss": 0.2502, + "step": 202500 + }, + { + "epoch": 163.72, + "learning_rate": 4.548973712639539e-05, + "loss": 0.1777, + "step": 202525 + }, + { + "epoch": 163.74, + "learning_rate": 4.543347137198415e-05, + "loss": 0.2006, + "step": 202550 + }, + { + "epoch": 163.76, + "learning_rate": 4.537720561757292e-05, + "loss": 0.2072, + "step": 202575 + }, + { + "epoch": 163.78, + "learning_rate": 4.532093986316169e-05, + "loss": 0.2245, + "step": 202600 + }, + { + "epoch": 163.8, + "learning_rate": 4.5264674108750454e-05, + "loss": 0.1904, + "step": 202625 + }, + { + "epoch": 163.82, + "learning_rate": 4.520840835433922e-05, + "loss": 0.1858, + "step": 202650 + }, + { + "epoch": 163.84, + "learning_rate": 4.5152142599927984e-05, + "loss": 0.2207, + "step": 202675 + }, + { + "epoch": 163.86, + "learning_rate": 4.509587684551675e-05, + "loss": 0.2185, + "step": 202700 + }, + { + "epoch": 163.88, + "learning_rate": 4.5039611091105514e-05, + "loss": 0.1909, + "step": 202725 + }, + { + "epoch": 163.9, + "learning_rate": 4.498334533669428e-05, + "loss": 0.1961, + "step": 202750 + }, + { + "epoch": 163.92, + "learning_rate": 4.4927079582283036e-05, + "loss": 0.2139, + "step": 202775 + }, + { + "epoch": 163.95, + "learning_rate": 4.48708138278718e-05, + "loss": 0.2081, + "step": 202800 + }, + { + "epoch": 163.97, + "learning_rate": 4.4814548073460566e-05, + "loss": 0.1896, + "step": 202825 + }, + { + "epoch": 163.99, + "learning_rate": 4.475828231904933e-05, + "loss": 0.1879, + "step": 202850 + }, + { + "epoch": 164.01, + "learning_rate": 4.4702016564638096e-05, + "loss": 0.1993, + "step": 202875 + }, + { + "epoch": 164.03, + "learning_rate": 4.464575081022686e-05, + "loss": 0.2381, + "step": 202900 + }, + { + "epoch": 164.05, + "learning_rate": 4.458948505581563e-05, + "loss": 0.1972, + "step": 202925 + }, + { + "epoch": 164.07, + "learning_rate": 4.45332193014044e-05, + "loss": 0.2297, + "step": 202950 + }, + { + "epoch": 164.09, + "learning_rate": 4.447695354699316e-05, + "loss": 0.1591, + "step": 202975 + }, + { + "epoch": 164.11, + "learning_rate": 4.4420687792581926e-05, + "loss": 0.1925, + "step": 203000 + }, + { + "epoch": 164.13, + "learning_rate": 4.436442203817069e-05, + "loss": 0.1655, + "step": 203025 + }, + { + "epoch": 164.15, + "learning_rate": 4.4308156283759456e-05, + "loss": 0.223, + "step": 203050 + }, + { + "epoch": 164.17, + "learning_rate": 4.425189052934822e-05, + "loss": 0.2068, + "step": 203075 + }, + { + "epoch": 164.19, + "learning_rate": 4.4195624774936986e-05, + "loss": 0.1982, + "step": 203100 + }, + { + "epoch": 164.21, + "learning_rate": 4.4139359020525744e-05, + "loss": 0.1926, + "step": 203125 + }, + { + "epoch": 164.23, + "learning_rate": 4.408309326611451e-05, + "loss": 0.1827, + "step": 203150 + }, + { + "epoch": 164.25, + "learning_rate": 4.402682751170327e-05, + "loss": 0.2055, + "step": 203175 + }, + { + "epoch": 164.27, + "learning_rate": 4.397056175729204e-05, + "loss": 0.1942, + "step": 203200 + }, + { + "epoch": 164.29, + "learning_rate": 4.39142960028808e-05, + "loss": 0.2065, + "step": 203225 + }, + { + "epoch": 164.31, + "learning_rate": 4.3858030248469574e-05, + "loss": 0.2095, + "step": 203250 + }, + { + "epoch": 164.33, + "learning_rate": 4.380176449405834e-05, + "loss": 0.2005, + "step": 203275 + }, + { + "epoch": 164.35, + "learning_rate": 4.3745498739647104e-05, + "loss": 0.2359, + "step": 203300 + }, + { + "epoch": 164.37, + "learning_rate": 4.368923298523587e-05, + "loss": 0.179, + "step": 203325 + }, + { + "epoch": 164.39, + "learning_rate": 4.3632967230824634e-05, + "loss": 0.2012, + "step": 203350 + }, + { + "epoch": 164.41, + "learning_rate": 4.35767014764134e-05, + "loss": 0.1984, + "step": 203375 + }, + { + "epoch": 164.43, + "learning_rate": 4.352043572200216e-05, + "loss": 0.1977, + "step": 203400 + }, + { + "epoch": 164.45, + "learning_rate": 4.346416996759093e-05, + "loss": 0.1622, + "step": 203425 + }, + { + "epoch": 164.47, + "learning_rate": 4.340790421317969e-05, + "loss": 0.205, + "step": 203450 + }, + { + "epoch": 164.49, + "learning_rate": 4.335163845876846e-05, + "loss": 0.1705, + "step": 203475 + }, + { + "epoch": 164.51, + "learning_rate": 4.3295372704357216e-05, + "loss": 0.1874, + "step": 203500 + }, + { + "epoch": 164.53, + "learning_rate": 4.323910694994598e-05, + "loss": 0.2105, + "step": 203525 + }, + { + "epoch": 164.55, + "learning_rate": 4.318284119553475e-05, + "loss": 0.2178, + "step": 203550 + }, + { + "epoch": 164.57, + "learning_rate": 4.312657544112352e-05, + "loss": 0.2348, + "step": 203575 + }, + { + "epoch": 164.59, + "learning_rate": 4.307030968671228e-05, + "loss": 0.2285, + "step": 203600 + }, + { + "epoch": 164.61, + "learning_rate": 4.3014043932301046e-05, + "loss": 0.2005, + "step": 203625 + }, + { + "epoch": 164.63, + "learning_rate": 4.295777817788981e-05, + "loss": 0.2259, + "step": 203650 + }, + { + "epoch": 164.65, + "learning_rate": 4.2901512423478576e-05, + "loss": 0.1709, + "step": 203675 + }, + { + "epoch": 164.67, + "learning_rate": 4.284524666906734e-05, + "loss": 0.1984, + "step": 203700 + }, + { + "epoch": 164.69, + "learning_rate": 4.2788980914656106e-05, + "loss": 0.1833, + "step": 203725 + }, + { + "epoch": 164.71, + "learning_rate": 4.273271516024487e-05, + "loss": 0.2113, + "step": 203750 + }, + { + "epoch": 164.73, + "learning_rate": 4.2676449405833635e-05, + "loss": 0.2044, + "step": 203775 + }, + { + "epoch": 164.75, + "learning_rate": 4.26201836514224e-05, + "loss": 0.2236, + "step": 203800 + }, + { + "epoch": 164.77, + "learning_rate": 4.2563917897011165e-05, + "loss": 0.2011, + "step": 203825 + }, + { + "epoch": 164.79, + "learning_rate": 4.250765214259992e-05, + "loss": 0.2171, + "step": 203850 + }, + { + "epoch": 164.81, + "learning_rate": 4.2451386388188694e-05, + "loss": 0.1913, + "step": 203875 + }, + { + "epoch": 164.83, + "learning_rate": 4.239512063377746e-05, + "loss": 0.2069, + "step": 203900 + }, + { + "epoch": 164.85, + "learning_rate": 4.2338854879366224e-05, + "loss": 0.1633, + "step": 203925 + }, + { + "epoch": 164.87, + "learning_rate": 4.228258912495499e-05, + "loss": 0.206, + "step": 203950 + }, + { + "epoch": 164.89, + "learning_rate": 4.2226323370543754e-05, + "loss": 0.1939, + "step": 203975 + }, + { + "epoch": 164.92, + "learning_rate": 4.217005761613252e-05, + "loss": 0.2173, + "step": 204000 + }, + { + "epoch": 164.92, + "eval_cer": 0.07462809153722165, + "eval_loss": 0.47042977809906006, + "eval_runtime": 151.4427, + "eval_samples_per_second": 27.687, + "eval_steps_per_second": 6.927, + "eval_wer": 0.3180097879282219, + "step": 204000 + }, + { + "epoch": 164.94, + "learning_rate": 4.211379186172128e-05, + "loss": 0.2402, + "step": 204025 + }, + { + "epoch": 164.96, + "learning_rate": 4.205752610731005e-05, + "loss": 0.2072, + "step": 204050 + }, + { + "epoch": 164.98, + "learning_rate": 4.200126035289881e-05, + "loss": 0.2063, + "step": 204075 + }, + { + "epoch": 165.0, + "learning_rate": 4.194499459848758e-05, + "loss": 0.196, + "step": 204100 + }, + { + "epoch": 165.02, + "learning_rate": 4.188872884407634e-05, + "loss": 0.1877, + "step": 204125 + }, + { + "epoch": 165.04, + "learning_rate": 4.183246308966511e-05, + "loss": 0.1892, + "step": 204150 + }, + { + "epoch": 165.06, + "learning_rate": 4.177619733525387e-05, + "loss": 0.2035, + "step": 204175 + }, + { + "epoch": 165.08, + "learning_rate": 4.171993158084264e-05, + "loss": 0.1885, + "step": 204200 + }, + { + "epoch": 165.1, + "learning_rate": 4.16636658264314e-05, + "loss": 0.2331, + "step": 204225 + }, + { + "epoch": 165.12, + "learning_rate": 4.1607400072020166e-05, + "loss": 0.1998, + "step": 204250 + }, + { + "epoch": 165.14, + "learning_rate": 4.155113431760893e-05, + "loss": 0.199, + "step": 204275 + }, + { + "epoch": 165.16, + "learning_rate": 4.1494868563197696e-05, + "loss": 0.227, + "step": 204300 + }, + { + "epoch": 165.18, + "learning_rate": 4.143860280878646e-05, + "loss": 0.2145, + "step": 204325 + }, + { + "epoch": 165.2, + "learning_rate": 4.1382337054375226e-05, + "loss": 0.1827, + "step": 204350 + }, + { + "epoch": 165.22, + "learning_rate": 4.132607129996399e-05, + "loss": 0.2053, + "step": 204375 + }, + { + "epoch": 165.24, + "learning_rate": 4.1269805545552755e-05, + "loss": 0.2036, + "step": 204400 + }, + { + "epoch": 165.26, + "learning_rate": 4.121353979114152e-05, + "loss": 0.2201, + "step": 204425 + }, + { + "epoch": 165.28, + "learning_rate": 4.1157274036730285e-05, + "loss": 0.1936, + "step": 204450 + }, + { + "epoch": 165.3, + "learning_rate": 4.110100828231905e-05, + "loss": 0.2106, + "step": 204475 + }, + { + "epoch": 165.32, + "learning_rate": 4.1044742527907814e-05, + "loss": 0.1847, + "step": 204500 + }, + { + "epoch": 165.34, + "learning_rate": 4.0988476773496586e-05, + "loss": 0.2236, + "step": 204525 + }, + { + "epoch": 165.36, + "learning_rate": 4.0932211019085344e-05, + "loss": 0.1982, + "step": 204550 + }, + { + "epoch": 165.38, + "learning_rate": 4.087594526467411e-05, + "loss": 0.2164, + "step": 204575 + }, + { + "epoch": 165.4, + "learning_rate": 4.0819679510262874e-05, + "loss": 0.1648, + "step": 204600 + }, + { + "epoch": 165.42, + "learning_rate": 4.076341375585164e-05, + "loss": 0.2193, + "step": 204625 + }, + { + "epoch": 165.44, + "learning_rate": 4.07071480014404e-05, + "loss": 0.2154, + "step": 204650 + }, + { + "epoch": 165.46, + "learning_rate": 4.065088224702917e-05, + "loss": 0.2004, + "step": 204675 + }, + { + "epoch": 165.48, + "learning_rate": 4.059461649261793e-05, + "loss": 0.2009, + "step": 204700 + }, + { + "epoch": 165.5, + "learning_rate": 4.05383507382067e-05, + "loss": 0.1868, + "step": 204725 + }, + { + "epoch": 165.52, + "learning_rate": 4.048208498379546e-05, + "loss": 0.2233, + "step": 204750 + }, + { + "epoch": 165.54, + "learning_rate": 4.042581922938423e-05, + "loss": 0.1929, + "step": 204775 + }, + { + "epoch": 165.56, + "learning_rate": 4.036955347497299e-05, + "loss": 0.2148, + "step": 204800 + }, + { + "epoch": 165.58, + "learning_rate": 4.031328772056176e-05, + "loss": 0.19, + "step": 204825 + }, + { + "epoch": 165.6, + "learning_rate": 4.025702196615053e-05, + "loss": 0.1779, + "step": 204850 + }, + { + "epoch": 165.62, + "learning_rate": 4.020075621173929e-05, + "loss": 0.1936, + "step": 204875 + }, + { + "epoch": 165.64, + "learning_rate": 4.014449045732806e-05, + "loss": 0.2117, + "step": 204900 + }, + { + "epoch": 165.66, + "learning_rate": 4.0088224702916816e-05, + "loss": 0.2124, + "step": 204925 + }, + { + "epoch": 165.68, + "learning_rate": 4.003195894850558e-05, + "loss": 0.2178, + "step": 204950 + }, + { + "epoch": 165.7, + "learning_rate": 3.9975693194094346e-05, + "loss": 0.2006, + "step": 204975 + }, + { + "epoch": 165.72, + "learning_rate": 3.991942743968311e-05, + "loss": 0.1948, + "step": 205000 + }, + { + "epoch": 165.74, + "learning_rate": 3.9863161685271875e-05, + "loss": 0.2193, + "step": 205025 + }, + { + "epoch": 165.76, + "learning_rate": 3.980689593086064e-05, + "loss": 0.1978, + "step": 205050 + }, + { + "epoch": 165.78, + "learning_rate": 3.9750630176449405e-05, + "loss": 0.2219, + "step": 205075 + }, + { + "epoch": 165.8, + "learning_rate": 3.969436442203817e-05, + "loss": 0.1989, + "step": 205100 + }, + { + "epoch": 165.82, + "learning_rate": 3.9638098667626934e-05, + "loss": 0.2189, + "step": 205125 + }, + { + "epoch": 165.84, + "learning_rate": 3.9581832913215706e-05, + "loss": 0.1913, + "step": 205150 + }, + { + "epoch": 165.86, + "learning_rate": 3.952556715880447e-05, + "loss": 0.2138, + "step": 205175 + }, + { + "epoch": 165.89, + "learning_rate": 3.9469301404393236e-05, + "loss": 0.1843, + "step": 205200 + }, + { + "epoch": 165.91, + "learning_rate": 3.9413035649982e-05, + "loss": 0.212, + "step": 205225 + }, + { + "epoch": 165.93, + "learning_rate": 3.9356769895570765e-05, + "loss": 0.1992, + "step": 205250 + }, + { + "epoch": 165.95, + "learning_rate": 3.930050414115952e-05, + "loss": 0.2029, + "step": 205275 + }, + { + "epoch": 165.97, + "learning_rate": 3.924423838674829e-05, + "loss": 0.2163, + "step": 205300 + }, + { + "epoch": 165.99, + "learning_rate": 3.918797263233705e-05, + "loss": 0.2093, + "step": 205325 + }, + { + "epoch": 166.01, + "learning_rate": 3.913170687792582e-05, + "loss": 0.191, + "step": 205350 + }, + { + "epoch": 166.03, + "learning_rate": 3.907544112351458e-05, + "loss": 0.2049, + "step": 205375 + }, + { + "epoch": 166.05, + "learning_rate": 3.901917536910335e-05, + "loss": 0.1871, + "step": 205400 + }, + { + "epoch": 166.07, + "learning_rate": 3.896290961469211e-05, + "loss": 0.1957, + "step": 205425 + }, + { + "epoch": 166.09, + "learning_rate": 3.8908894490457325e-05, + "loss": 0.19, + "step": 205450 + }, + { + "epoch": 166.11, + "learning_rate": 3.8852628736046096e-05, + "loss": 0.2078, + "step": 205475 + }, + { + "epoch": 166.13, + "learning_rate": 3.879636298163486e-05, + "loss": 0.1838, + "step": 205500 + }, + { + "epoch": 166.15, + "learning_rate": 3.8740097227223626e-05, + "loss": 0.2019, + "step": 205525 + }, + { + "epoch": 166.17, + "learning_rate": 3.868383147281239e-05, + "loss": 0.1774, + "step": 205550 + }, + { + "epoch": 166.19, + "learning_rate": 3.8627565718401155e-05, + "loss": 0.2137, + "step": 205575 + }, + { + "epoch": 166.21, + "learning_rate": 3.857129996398992e-05, + "loss": 0.2002, + "step": 205600 + }, + { + "epoch": 166.23, + "learning_rate": 3.8515034209578685e-05, + "loss": 0.1927, + "step": 205625 + }, + { + "epoch": 166.25, + "learning_rate": 3.845876845516745e-05, + "loss": 0.1999, + "step": 205650 + }, + { + "epoch": 166.27, + "learning_rate": 3.8402502700756214e-05, + "loss": 0.2, + "step": 205675 + }, + { + "epoch": 166.29, + "learning_rate": 3.834623694634497e-05, + "loss": 0.1938, + "step": 205700 + }, + { + "epoch": 166.31, + "learning_rate": 3.828997119193374e-05, + "loss": 0.2143, + "step": 205725 + }, + { + "epoch": 166.33, + "learning_rate": 3.82337054375225e-05, + "loss": 0.1971, + "step": 205750 + }, + { + "epoch": 166.35, + "learning_rate": 3.817743968311127e-05, + "loss": 0.2325, + "step": 205775 + }, + { + "epoch": 166.37, + "learning_rate": 3.812117392870004e-05, + "loss": 0.2128, + "step": 205800 + }, + { + "epoch": 166.39, + "learning_rate": 3.80649081742888e-05, + "loss": 0.1917, + "step": 205825 + }, + { + "epoch": 166.41, + "learning_rate": 3.800864241987757e-05, + "loss": 0.179, + "step": 205850 + }, + { + "epoch": 166.43, + "learning_rate": 3.795237666546633e-05, + "loss": 0.195, + "step": 205875 + }, + { + "epoch": 166.45, + "learning_rate": 3.78961109110551e-05, + "loss": 0.2235, + "step": 205900 + }, + { + "epoch": 166.47, + "learning_rate": 3.783984515664386e-05, + "loss": 0.2031, + "step": 205925 + }, + { + "epoch": 166.49, + "learning_rate": 3.778357940223263e-05, + "loss": 0.1853, + "step": 205950 + }, + { + "epoch": 166.51, + "learning_rate": 3.772731364782139e-05, + "loss": 0.2208, + "step": 205975 + }, + { + "epoch": 166.53, + "learning_rate": 3.767104789341016e-05, + "loss": 0.1579, + "step": 206000 + }, + { + "epoch": 166.55, + "learning_rate": 3.761478213899892e-05, + "loss": 0.21, + "step": 206025 + }, + { + "epoch": 166.57, + "learning_rate": 3.755851638458768e-05, + "loss": 0.202, + "step": 206050 + }, + { + "epoch": 166.59, + "learning_rate": 3.7502250630176444e-05, + "loss": 0.2098, + "step": 206075 + }, + { + "epoch": 166.61, + "learning_rate": 3.7445984875765216e-05, + "loss": 0.1852, + "step": 206100 + }, + { + "epoch": 166.63, + "learning_rate": 3.738971912135398e-05, + "loss": 0.2041, + "step": 206125 + }, + { + "epoch": 166.65, + "learning_rate": 3.7333453366942746e-05, + "loss": 0.1956, + "step": 206150 + }, + { + "epoch": 166.67, + "learning_rate": 3.727718761253151e-05, + "loss": 0.2027, + "step": 206175 + }, + { + "epoch": 166.69, + "learning_rate": 3.7220921858120275e-05, + "loss": 0.1736, + "step": 206200 + }, + { + "epoch": 166.71, + "learning_rate": 3.716465610370904e-05, + "loss": 0.217, + "step": 206225 + }, + { + "epoch": 166.73, + "learning_rate": 3.7108390349297805e-05, + "loss": 0.1787, + "step": 206250 + }, + { + "epoch": 166.75, + "learning_rate": 3.705212459488657e-05, + "loss": 0.1932, + "step": 206275 + }, + { + "epoch": 166.77, + "learning_rate": 3.6995858840475334e-05, + "loss": 0.1837, + "step": 206300 + }, + { + "epoch": 166.79, + "learning_rate": 3.69395930860641e-05, + "loss": 0.1666, + "step": 206325 + }, + { + "epoch": 166.81, + "learning_rate": 3.6883327331652864e-05, + "loss": 0.1649, + "step": 206350 + }, + { + "epoch": 166.84, + "learning_rate": 3.682706157724163e-05, + "loss": 0.1981, + "step": 206375 + }, + { + "epoch": 166.86, + "learning_rate": 3.677079582283039e-05, + "loss": 0.2142, + "step": 206400 + }, + { + "epoch": 166.88, + "learning_rate": 3.671453006841916e-05, + "loss": 0.2036, + "step": 206425 + }, + { + "epoch": 166.9, + "learning_rate": 3.665826431400792e-05, + "loss": 0.2075, + "step": 206450 + }, + { + "epoch": 166.92, + "learning_rate": 3.660199855959669e-05, + "loss": 0.2142, + "step": 206475 + }, + { + "epoch": 166.94, + "learning_rate": 3.654573280518545e-05, + "loss": 0.1761, + "step": 206500 + }, + { + "epoch": 166.96, + "learning_rate": 3.648946705077422e-05, + "loss": 0.1917, + "step": 206525 + }, + { + "epoch": 166.98, + "learning_rate": 3.643320129636298e-05, + "loss": 0.2077, + "step": 206550 + }, + { + "epoch": 167.0, + "learning_rate": 3.637693554195175e-05, + "loss": 0.1955, + "step": 206575 + }, + { + "epoch": 167.02, + "learning_rate": 3.632066978754051e-05, + "loss": 0.2168, + "step": 206600 + }, + { + "epoch": 167.04, + "learning_rate": 3.626440403312928e-05, + "loss": 0.2142, + "step": 206625 + }, + { + "epoch": 167.06, + "learning_rate": 3.620813827871804e-05, + "loss": 0.1914, + "step": 206650 + }, + { + "epoch": 167.08, + "learning_rate": 3.6151872524306806e-05, + "loss": 0.215, + "step": 206675 + }, + { + "epoch": 167.1, + "learning_rate": 3.609560676989557e-05, + "loss": 0.2052, + "step": 206700 + }, + { + "epoch": 167.12, + "learning_rate": 3.6039341015484336e-05, + "loss": 0.2032, + "step": 206725 + }, + { + "epoch": 167.14, + "learning_rate": 3.598307526107311e-05, + "loss": 0.1999, + "step": 206750 + }, + { + "epoch": 167.16, + "learning_rate": 3.5926809506661866e-05, + "loss": 0.1718, + "step": 206775 + }, + { + "epoch": 167.18, + "learning_rate": 3.587054375225063e-05, + "loss": 0.187, + "step": 206800 + }, + { + "epoch": 167.2, + "learning_rate": 3.5814277997839395e-05, + "loss": 0.2237, + "step": 206825 + }, + { + "epoch": 167.22, + "learning_rate": 3.575801224342816e-05, + "loss": 0.2192, + "step": 206850 + }, + { + "epoch": 167.24, + "learning_rate": 3.5701746489016925e-05, + "loss": 0.2003, + "step": 206875 + }, + { + "epoch": 167.26, + "learning_rate": 3.564548073460569e-05, + "loss": 0.1946, + "step": 206900 + }, + { + "epoch": 167.28, + "learning_rate": 3.5589214980194454e-05, + "loss": 0.1779, + "step": 206925 + }, + { + "epoch": 167.3, + "learning_rate": 3.553294922578322e-05, + "loss": 0.2129, + "step": 206950 + }, + { + "epoch": 167.32, + "learning_rate": 3.5476683471371984e-05, + "loss": 0.1759, + "step": 206975 + }, + { + "epoch": 167.34, + "learning_rate": 3.542041771696075e-05, + "loss": 0.1797, + "step": 207000 + }, + { + "epoch": 167.34, + "eval_cer": 0.07387349465622209, + "eval_loss": 0.46532440185546875, + "eval_runtime": 150.405, + "eval_samples_per_second": 27.878, + "eval_steps_per_second": 6.975, + "eval_wer": 0.3169004893964111, + "step": 207000 + }, + { + "epoch": 167.36, + "learning_rate": 3.5364151962549514e-05, + "loss": 0.1926, + "step": 207025 + }, + { + "epoch": 167.38, + "learning_rate": 3.530788620813828e-05, + "loss": 0.2108, + "step": 207050 + }, + { + "epoch": 167.4, + "learning_rate": 3.525162045372705e-05, + "loss": 0.2033, + "step": 207075 + }, + { + "epoch": 167.42, + "learning_rate": 3.5195354699315815e-05, + "loss": 0.215, + "step": 207100 + }, + { + "epoch": 167.44, + "learning_rate": 3.513908894490457e-05, + "loss": 0.2169, + "step": 207125 + }, + { + "epoch": 167.46, + "learning_rate": 3.508282319049334e-05, + "loss": 0.1875, + "step": 207150 + }, + { + "epoch": 167.48, + "learning_rate": 3.50265574360821e-05, + "loss": 0.2083, + "step": 207175 + }, + { + "epoch": 167.5, + "learning_rate": 3.497029168167087e-05, + "loss": 0.2057, + "step": 207200 + }, + { + "epoch": 167.52, + "learning_rate": 3.491402592725963e-05, + "loss": 0.2003, + "step": 207225 + }, + { + "epoch": 167.54, + "learning_rate": 3.48577601728484e-05, + "loss": 0.1973, + "step": 207250 + }, + { + "epoch": 167.56, + "learning_rate": 3.480149441843716e-05, + "loss": 0.183, + "step": 207275 + }, + { + "epoch": 167.58, + "learning_rate": 3.4745228664025926e-05, + "loss": 0.2074, + "step": 207300 + }, + { + "epoch": 167.6, + "learning_rate": 3.468896290961469e-05, + "loss": 0.195, + "step": 207325 + }, + { + "epoch": 167.62, + "learning_rate": 3.4632697155203456e-05, + "loss": 0.1961, + "step": 207350 + }, + { + "epoch": 167.64, + "learning_rate": 3.457643140079223e-05, + "loss": 0.2117, + "step": 207375 + }, + { + "epoch": 167.66, + "learning_rate": 3.452016564638099e-05, + "loss": 0.2127, + "step": 207400 + }, + { + "epoch": 167.68, + "learning_rate": 3.446389989196976e-05, + "loss": 0.164, + "step": 207425 + }, + { + "epoch": 167.7, + "learning_rate": 3.440763413755852e-05, + "loss": 0.2018, + "step": 207450 + }, + { + "epoch": 167.72, + "learning_rate": 3.435136838314728e-05, + "loss": 0.1931, + "step": 207475 + }, + { + "epoch": 167.74, + "learning_rate": 3.4295102628736045e-05, + "loss": 0.1934, + "step": 207500 + }, + { + "epoch": 167.76, + "learning_rate": 3.423883687432481e-05, + "loss": 0.1863, + "step": 207525 + }, + { + "epoch": 167.78, + "learning_rate": 3.4182571119913574e-05, + "loss": 0.1935, + "step": 207550 + }, + { + "epoch": 167.81, + "learning_rate": 3.412630536550234e-05, + "loss": 0.1803, + "step": 207575 + }, + { + "epoch": 167.83, + "learning_rate": 3.4070039611091104e-05, + "loss": 0.1956, + "step": 207600 + }, + { + "epoch": 167.85, + "learning_rate": 3.401377385667987e-05, + "loss": 0.1794, + "step": 207625 + }, + { + "epoch": 167.87, + "learning_rate": 3.3957508102268634e-05, + "loss": 0.2416, + "step": 207650 + }, + { + "epoch": 167.89, + "learning_rate": 3.39012423478574e-05, + "loss": 0.1805, + "step": 207675 + }, + { + "epoch": 167.91, + "learning_rate": 3.384497659344617e-05, + "loss": 0.1733, + "step": 207700 + }, + { + "epoch": 167.93, + "learning_rate": 3.3788710839034935e-05, + "loss": 0.1806, + "step": 207725 + }, + { + "epoch": 167.95, + "learning_rate": 3.37324450846237e-05, + "loss": 0.1991, + "step": 207750 + }, + { + "epoch": 167.97, + "learning_rate": 3.3676179330212464e-05, + "loss": 0.1957, + "step": 207775 + }, + { + "epoch": 167.99, + "learning_rate": 3.361991357580123e-05, + "loss": 0.1942, + "step": 207800 + }, + { + "epoch": 168.01, + "learning_rate": 3.356364782138999e-05, + "loss": 0.1886, + "step": 207825 + }, + { + "epoch": 168.03, + "learning_rate": 3.350738206697875e-05, + "loss": 0.1943, + "step": 207850 + }, + { + "epoch": 168.05, + "learning_rate": 3.345111631256752e-05, + "loss": 0.191, + "step": 207875 + }, + { + "epoch": 168.07, + "learning_rate": 3.339485055815628e-05, + "loss": 0.198, + "step": 207900 + }, + { + "epoch": 168.09, + "learning_rate": 3.3338584803745046e-05, + "loss": 0.182, + "step": 207925 + }, + { + "epoch": 168.11, + "learning_rate": 3.328231904933381e-05, + "loss": 0.2229, + "step": 207950 + }, + { + "epoch": 168.13, + "learning_rate": 3.3226053294922576e-05, + "loss": 0.1699, + "step": 207975 + }, + { + "epoch": 168.15, + "learning_rate": 3.316978754051134e-05, + "loss": 0.1911, + "step": 208000 + }, + { + "epoch": 168.17, + "learning_rate": 3.311352178610011e-05, + "loss": 0.2104, + "step": 208025 + }, + { + "epoch": 168.19, + "learning_rate": 3.305725603168888e-05, + "loss": 0.1995, + "step": 208050 + }, + { + "epoch": 168.21, + "learning_rate": 3.300099027727764e-05, + "loss": 0.1987, + "step": 208075 + }, + { + "epoch": 168.23, + "learning_rate": 3.294472452286641e-05, + "loss": 0.2129, + "step": 208100 + }, + { + "epoch": 168.25, + "learning_rate": 3.288845876845517e-05, + "loss": 0.2092, + "step": 208125 + }, + { + "epoch": 168.27, + "learning_rate": 3.2832193014043936e-05, + "loss": 0.2171, + "step": 208150 + }, + { + "epoch": 168.29, + "learning_rate": 3.27759272596327e-05, + "loss": 0.1689, + "step": 208175 + }, + { + "epoch": 168.31, + "learning_rate": 3.271966150522146e-05, + "loss": 0.2163, + "step": 208200 + }, + { + "epoch": 168.33, + "learning_rate": 3.2663395750810224e-05, + "loss": 0.1767, + "step": 208225 + }, + { + "epoch": 168.35, + "learning_rate": 3.260712999639899e-05, + "loss": 0.2149, + "step": 208250 + }, + { + "epoch": 168.37, + "learning_rate": 3.2550864241987754e-05, + "loss": 0.2043, + "step": 208275 + }, + { + "epoch": 168.39, + "learning_rate": 3.249459848757652e-05, + "loss": 0.2012, + "step": 208300 + }, + { + "epoch": 168.41, + "learning_rate": 3.243833273316528e-05, + "loss": 0.2468, + "step": 208325 + }, + { + "epoch": 168.43, + "learning_rate": 3.2382066978754055e-05, + "loss": 0.1984, + "step": 208350 + }, + { + "epoch": 168.45, + "learning_rate": 3.232580122434282e-05, + "loss": 0.2305, + "step": 208375 + }, + { + "epoch": 168.47, + "learning_rate": 3.2269535469931584e-05, + "loss": 0.2011, + "step": 208400 + }, + { + "epoch": 168.49, + "learning_rate": 3.221326971552035e-05, + "loss": 0.1946, + "step": 208425 + }, + { + "epoch": 168.51, + "learning_rate": 3.2157003961109114e-05, + "loss": 0.2048, + "step": 208450 + }, + { + "epoch": 168.53, + "learning_rate": 3.210073820669788e-05, + "loss": 0.187, + "step": 208475 + }, + { + "epoch": 168.55, + "learning_rate": 3.2044472452286644e-05, + "loss": 0.1927, + "step": 208500 + }, + { + "epoch": 168.57, + "learning_rate": 3.198820669787541e-05, + "loss": 0.1787, + "step": 208525 + }, + { + "epoch": 168.59, + "learning_rate": 3.1931940943464166e-05, + "loss": 0.1875, + "step": 208550 + }, + { + "epoch": 168.61, + "learning_rate": 3.187567518905293e-05, + "loss": 0.1975, + "step": 208575 + }, + { + "epoch": 168.63, + "learning_rate": 3.1819409434641696e-05, + "loss": 0.2049, + "step": 208600 + }, + { + "epoch": 168.65, + "learning_rate": 3.176314368023046e-05, + "loss": 0.1778, + "step": 208625 + }, + { + "epoch": 168.67, + "learning_rate": 3.1706877925819226e-05, + "loss": 0.2165, + "step": 208650 + }, + { + "epoch": 168.69, + "learning_rate": 3.1650612171408e-05, + "loss": 0.1997, + "step": 208675 + }, + { + "epoch": 168.71, + "learning_rate": 3.159434641699676e-05, + "loss": 0.1911, + "step": 208700 + }, + { + "epoch": 168.73, + "learning_rate": 3.153808066258553e-05, + "loss": 0.1659, + "step": 208725 + }, + { + "epoch": 168.76, + "learning_rate": 3.148181490817429e-05, + "loss": 0.213, + "step": 208750 + }, + { + "epoch": 168.78, + "learning_rate": 3.1425549153763056e-05, + "loss": 0.2257, + "step": 208775 + }, + { + "epoch": 168.8, + "learning_rate": 3.136928339935182e-05, + "loss": 0.2027, + "step": 208800 + }, + { + "epoch": 168.82, + "learning_rate": 3.1313017644940586e-05, + "loss": 0.2051, + "step": 208825 + }, + { + "epoch": 168.84, + "learning_rate": 3.125675189052935e-05, + "loss": 0.212, + "step": 208850 + }, + { + "epoch": 168.86, + "learning_rate": 3.1200486136118116e-05, + "loss": 0.2062, + "step": 208875 + }, + { + "epoch": 168.88, + "learning_rate": 3.114422038170688e-05, + "loss": 0.1752, + "step": 208900 + }, + { + "epoch": 168.9, + "learning_rate": 3.1087954627295645e-05, + "loss": 0.1771, + "step": 208925 + }, + { + "epoch": 168.92, + "learning_rate": 3.103168887288441e-05, + "loss": 0.1909, + "step": 208950 + }, + { + "epoch": 168.94, + "learning_rate": 3.0975423118473175e-05, + "loss": 0.1723, + "step": 208975 + }, + { + "epoch": 168.96, + "learning_rate": 3.091915736406194e-05, + "loss": 0.2065, + "step": 209000 + }, + { + "epoch": 168.98, + "learning_rate": 3.0862891609650704e-05, + "loss": 0.1911, + "step": 209025 + }, + { + "epoch": 169.0, + "learning_rate": 3.080662585523947e-05, + "loss": 0.1954, + "step": 209050 + }, + { + "epoch": 169.02, + "learning_rate": 3.0750360100828234e-05, + "loss": 0.2045, + "step": 209075 + }, + { + "epoch": 169.04, + "learning_rate": 3.0694094346417e-05, + "loss": 0.1925, + "step": 209100 + }, + { + "epoch": 169.06, + "learning_rate": 3.0637828592005764e-05, + "loss": 0.1893, + "step": 209125 + }, + { + "epoch": 169.08, + "learning_rate": 3.058156283759453e-05, + "loss": 0.1945, + "step": 209150 + }, + { + "epoch": 169.1, + "learning_rate": 3.052529708318329e-05, + "loss": 0.1925, + "step": 209175 + }, + { + "epoch": 169.12, + "learning_rate": 3.0469031328772055e-05, + "loss": 0.1575, + "step": 209200 + }, + { + "epoch": 169.14, + "learning_rate": 3.0412765574360823e-05, + "loss": 0.2029, + "step": 209225 + }, + { + "epoch": 169.16, + "learning_rate": 3.0356499819949588e-05, + "loss": 0.184, + "step": 209250 + }, + { + "epoch": 169.18, + "learning_rate": 3.0300234065538352e-05, + "loss": 0.1891, + "step": 209275 + }, + { + "epoch": 169.2, + "learning_rate": 3.0243968311127117e-05, + "loss": 0.1909, + "step": 209300 + }, + { + "epoch": 169.22, + "learning_rate": 3.0187702556715882e-05, + "loss": 0.2016, + "step": 209325 + }, + { + "epoch": 169.24, + "learning_rate": 3.0131436802304643e-05, + "loss": 0.1868, + "step": 209350 + }, + { + "epoch": 169.26, + "learning_rate": 3.0075171047893408e-05, + "loss": 0.2264, + "step": 209375 + }, + { + "epoch": 169.28, + "learning_rate": 3.0018905293482176e-05, + "loss": 0.1688, + "step": 209400 + }, + { + "epoch": 169.3, + "learning_rate": 2.996263953907094e-05, + "loss": 0.2192, + "step": 209425 + }, + { + "epoch": 169.32, + "learning_rate": 2.9908624414836154e-05, + "loss": 0.1976, + "step": 209450 + }, + { + "epoch": 169.34, + "learning_rate": 2.985235866042492e-05, + "loss": 0.1995, + "step": 209475 + }, + { + "epoch": 169.36, + "learning_rate": 2.9796092906013683e-05, + "loss": 0.2118, + "step": 209500 + }, + { + "epoch": 169.38, + "learning_rate": 2.973982715160245e-05, + "loss": 0.2228, + "step": 209525 + }, + { + "epoch": 169.4, + "learning_rate": 2.9683561397191216e-05, + "loss": 0.1806, + "step": 209550 + }, + { + "epoch": 169.42, + "learning_rate": 2.962729564277998e-05, + "loss": 0.1977, + "step": 209575 + }, + { + "epoch": 169.44, + "learning_rate": 2.9571029888368743e-05, + "loss": 0.1966, + "step": 209600 + }, + { + "epoch": 169.46, + "learning_rate": 2.9514764133957507e-05, + "loss": 0.1841, + "step": 209625 + }, + { + "epoch": 169.48, + "learning_rate": 2.9458498379546272e-05, + "loss": 0.1788, + "step": 209650 + }, + { + "epoch": 169.5, + "learning_rate": 2.9402232625135037e-05, + "loss": 0.189, + "step": 209675 + }, + { + "epoch": 169.52, + "learning_rate": 2.9345966870723805e-05, + "loss": 0.1697, + "step": 209700 + }, + { + "epoch": 169.54, + "learning_rate": 2.928970111631257e-05, + "loss": 0.2083, + "step": 209725 + }, + { + "epoch": 169.56, + "learning_rate": 2.9233435361901335e-05, + "loss": 0.2094, + "step": 209750 + }, + { + "epoch": 169.58, + "learning_rate": 2.9177169607490096e-05, + "loss": 0.2036, + "step": 209775 + }, + { + "epoch": 169.6, + "learning_rate": 2.912090385307886e-05, + "loss": 0.1829, + "step": 209800 + }, + { + "epoch": 169.62, + "learning_rate": 2.9064638098667626e-05, + "loss": 0.195, + "step": 209825 + }, + { + "epoch": 169.64, + "learning_rate": 2.9008372344256394e-05, + "loss": 0.1701, + "step": 209850 + }, + { + "epoch": 169.66, + "learning_rate": 2.895210658984516e-05, + "loss": 0.1991, + "step": 209875 + }, + { + "epoch": 169.68, + "learning_rate": 2.8895840835433924e-05, + "loss": 0.2002, + "step": 209900 + }, + { + "epoch": 169.7, + "learning_rate": 2.883957508102269e-05, + "loss": 0.199, + "step": 209925 + }, + { + "epoch": 169.73, + "learning_rate": 2.878330932661145e-05, + "loss": 0.1758, + "step": 209950 + }, + { + "epoch": 169.75, + "learning_rate": 2.8727043572200215e-05, + "loss": 0.1984, + "step": 209975 + }, + { + "epoch": 169.77, + "learning_rate": 2.867077781778898e-05, + "loss": 0.1841, + "step": 210000 + }, + { + "epoch": 169.77, + "eval_cer": 0.07372462860486843, + "eval_loss": 0.47256383299827576, + "eval_runtime": 150.2166, + "eval_samples_per_second": 27.913, + "eval_steps_per_second": 6.983, + "eval_wer": 0.3164110929853181, + "step": 210000 + }, + { + "epoch": 169.79, + "learning_rate": 2.8614512063377748e-05, + "loss": 0.2131, + "step": 210025 + }, + { + "epoch": 169.81, + "learning_rate": 2.8558246308966512e-05, + "loss": 0.2113, + "step": 210050 + }, + { + "epoch": 169.83, + "learning_rate": 2.8504231184731725e-05, + "loss": 0.2038, + "step": 210075 + }, + { + "epoch": 169.85, + "learning_rate": 2.844796543032049e-05, + "loss": 0.182, + "step": 210100 + }, + { + "epoch": 169.87, + "learning_rate": 2.8391699675909254e-05, + "loss": 0.2077, + "step": 210125 + }, + { + "epoch": 169.89, + "learning_rate": 2.8335433921498023e-05, + "loss": 0.2242, + "step": 210150 + }, + { + "epoch": 169.91, + "learning_rate": 2.8279168167086787e-05, + "loss": 0.2341, + "step": 210175 + }, + { + "epoch": 169.93, + "learning_rate": 2.822290241267555e-05, + "loss": 0.1838, + "step": 210200 + }, + { + "epoch": 169.95, + "learning_rate": 2.8166636658264314e-05, + "loss": 0.2204, + "step": 210225 + }, + { + "epoch": 169.97, + "learning_rate": 2.811037090385308e-05, + "loss": 0.1779, + "step": 210250 + }, + { + "epoch": 169.99, + "learning_rate": 2.8054105149441843e-05, + "loss": 0.224, + "step": 210275 + }, + { + "epoch": 170.01, + "learning_rate": 2.7997839395030608e-05, + "loss": 0.2022, + "step": 210300 + }, + { + "epoch": 170.03, + "learning_rate": 2.7941573640619376e-05, + "loss": 0.179, + "step": 210325 + }, + { + "epoch": 170.05, + "learning_rate": 2.788530788620814e-05, + "loss": 0.1978, + "step": 210350 + }, + { + "epoch": 170.07, + "learning_rate": 2.7829042131796902e-05, + "loss": 0.1825, + "step": 210375 + }, + { + "epoch": 170.09, + "learning_rate": 2.7772776377385667e-05, + "loss": 0.187, + "step": 210400 + }, + { + "epoch": 170.11, + "learning_rate": 2.7716510622974432e-05, + "loss": 0.1917, + "step": 210425 + }, + { + "epoch": 170.13, + "learning_rate": 2.7660244868563197e-05, + "loss": 0.2035, + "step": 210450 + }, + { + "epoch": 170.15, + "learning_rate": 2.7603979114151965e-05, + "loss": 0.1981, + "step": 210475 + }, + { + "epoch": 170.17, + "learning_rate": 2.754771335974073e-05, + "loss": 0.1971, + "step": 210500 + }, + { + "epoch": 170.19, + "learning_rate": 2.7491447605329495e-05, + "loss": 0.1822, + "step": 210525 + }, + { + "epoch": 170.21, + "learning_rate": 2.7435181850918256e-05, + "loss": 0.2026, + "step": 210550 + }, + { + "epoch": 170.23, + "learning_rate": 2.737891609650702e-05, + "loss": 0.2142, + "step": 210575 + }, + { + "epoch": 170.25, + "learning_rate": 2.7322650342095786e-05, + "loss": 0.2011, + "step": 210600 + }, + { + "epoch": 170.27, + "learning_rate": 2.726638458768455e-05, + "loss": 0.1691, + "step": 210625 + }, + { + "epoch": 170.29, + "learning_rate": 2.721011883327332e-05, + "loss": 0.1798, + "step": 210650 + }, + { + "epoch": 170.31, + "learning_rate": 2.7153853078862083e-05, + "loss": 0.1828, + "step": 210675 + }, + { + "epoch": 170.33, + "learning_rate": 2.7097587324450848e-05, + "loss": 0.1837, + "step": 210700 + }, + { + "epoch": 170.35, + "learning_rate": 2.704132157003961e-05, + "loss": 0.1976, + "step": 210725 + }, + { + "epoch": 170.37, + "learning_rate": 2.6985055815628374e-05, + "loss": 0.1898, + "step": 210750 + }, + { + "epoch": 170.39, + "learning_rate": 2.692879006121714e-05, + "loss": 0.1906, + "step": 210775 + }, + { + "epoch": 170.41, + "learning_rate": 2.6872524306805907e-05, + "loss": 0.1866, + "step": 210800 + }, + { + "epoch": 170.43, + "learning_rate": 2.6816258552394672e-05, + "loss": 0.2003, + "step": 210825 + }, + { + "epoch": 170.45, + "learning_rate": 2.6759992797983437e-05, + "loss": 0.1728, + "step": 210850 + }, + { + "epoch": 170.47, + "learning_rate": 2.6703727043572202e-05, + "loss": 0.2115, + "step": 210875 + }, + { + "epoch": 170.49, + "learning_rate": 2.6647461289160967e-05, + "loss": 0.1753, + "step": 210900 + }, + { + "epoch": 170.51, + "learning_rate": 2.6591195534749728e-05, + "loss": 0.1987, + "step": 210925 + }, + { + "epoch": 170.53, + "learning_rate": 2.6534929780338493e-05, + "loss": 0.2055, + "step": 210950 + }, + { + "epoch": 170.55, + "learning_rate": 2.647866402592726e-05, + "loss": 0.2001, + "step": 210975 + }, + { + "epoch": 170.57, + "learning_rate": 2.6422398271516026e-05, + "loss": 0.1894, + "step": 211000 + }, + { + "epoch": 170.59, + "learning_rate": 2.636613251710479e-05, + "loss": 0.2001, + "step": 211025 + }, + { + "epoch": 170.61, + "learning_rate": 2.6309866762693555e-05, + "loss": 0.1836, + "step": 211050 + }, + { + "epoch": 170.63, + "learning_rate": 2.625360100828232e-05, + "loss": 0.2091, + "step": 211075 + }, + { + "epoch": 170.65, + "learning_rate": 2.619733525387108e-05, + "loss": 0.2003, + "step": 211100 + }, + { + "epoch": 170.68, + "learning_rate": 2.614106949945985e-05, + "loss": 0.1955, + "step": 211125 + }, + { + "epoch": 170.7, + "learning_rate": 2.6084803745048615e-05, + "loss": 0.2167, + "step": 211150 + }, + { + "epoch": 170.72, + "learning_rate": 2.602853799063738e-05, + "loss": 0.2527, + "step": 211175 + }, + { + "epoch": 170.74, + "learning_rate": 2.5972272236226144e-05, + "loss": 0.1774, + "step": 211200 + }, + { + "epoch": 170.76, + "learning_rate": 2.591600648181491e-05, + "loss": 0.2093, + "step": 211225 + }, + { + "epoch": 170.78, + "learning_rate": 2.5859740727403674e-05, + "loss": 0.191, + "step": 211250 + }, + { + "epoch": 170.8, + "learning_rate": 2.580347497299244e-05, + "loss": 0.1887, + "step": 211275 + }, + { + "epoch": 170.82, + "learning_rate": 2.5747209218581203e-05, + "loss": 0.2332, + "step": 211300 + }, + { + "epoch": 170.84, + "learning_rate": 2.5690943464169968e-05, + "loss": 0.2154, + "step": 211325 + }, + { + "epoch": 170.86, + "learning_rate": 2.5634677709758733e-05, + "loss": 0.179, + "step": 211350 + }, + { + "epoch": 170.88, + "learning_rate": 2.5578411955347498e-05, + "loss": 0.2106, + "step": 211375 + }, + { + "epoch": 170.9, + "learning_rate": 2.5522146200936263e-05, + "loss": 0.195, + "step": 211400 + }, + { + "epoch": 170.92, + "learning_rate": 2.5465880446525027e-05, + "loss": 0.1931, + "step": 211425 + }, + { + "epoch": 170.94, + "learning_rate": 2.5409614692113792e-05, + "loss": 0.1685, + "step": 211450 + }, + { + "epoch": 170.96, + "learning_rate": 2.5353348937702557e-05, + "loss": 0.1464, + "step": 211475 + }, + { + "epoch": 170.98, + "learning_rate": 2.5297083183291322e-05, + "loss": 0.1778, + "step": 211500 + }, + { + "epoch": 171.0, + "learning_rate": 2.5240817428880087e-05, + "loss": 0.1819, + "step": 211525 + }, + { + "epoch": 171.02, + "learning_rate": 2.518455167446885e-05, + "loss": 0.182, + "step": 211550 + }, + { + "epoch": 171.04, + "learning_rate": 2.5128285920057616e-05, + "loss": 0.1785, + "step": 211575 + }, + { + "epoch": 171.06, + "learning_rate": 2.5072020165646384e-05, + "loss": 0.2206, + "step": 211600 + }, + { + "epoch": 171.08, + "learning_rate": 2.5015754411235146e-05, + "loss": 0.1878, + "step": 211625 + }, + { + "epoch": 171.1, + "learning_rate": 2.495948865682391e-05, + "loss": 0.1952, + "step": 211650 + }, + { + "epoch": 171.12, + "learning_rate": 2.4903222902412675e-05, + "loss": 0.1731, + "step": 211675 + }, + { + "epoch": 171.14, + "learning_rate": 2.484695714800144e-05, + "loss": 0.2236, + "step": 211700 + }, + { + "epoch": 171.16, + "learning_rate": 2.4790691393590205e-05, + "loss": 0.1688, + "step": 211725 + }, + { + "epoch": 171.18, + "learning_rate": 2.4734425639178973e-05, + "loss": 0.1948, + "step": 211750 + }, + { + "epoch": 171.2, + "learning_rate": 2.4678159884767738e-05, + "loss": 0.174, + "step": 211775 + }, + { + "epoch": 171.22, + "learning_rate": 2.46218941303565e-05, + "loss": 0.174, + "step": 211800 + }, + { + "epoch": 171.24, + "learning_rate": 2.4565628375945264e-05, + "loss": 0.1988, + "step": 211825 + }, + { + "epoch": 171.26, + "learning_rate": 2.450936262153403e-05, + "loss": 0.2113, + "step": 211850 + }, + { + "epoch": 171.28, + "learning_rate": 2.4453096867122794e-05, + "loss": 0.1769, + "step": 211875 + }, + { + "epoch": 171.3, + "learning_rate": 2.439683111271156e-05, + "loss": 0.1963, + "step": 211900 + }, + { + "epoch": 171.32, + "learning_rate": 2.4340565358300327e-05, + "loss": 0.161, + "step": 211925 + }, + { + "epoch": 171.34, + "learning_rate": 2.428429960388909e-05, + "loss": 0.1801, + "step": 211950 + }, + { + "epoch": 171.36, + "learning_rate": 2.4228033849477853e-05, + "loss": 0.1774, + "step": 211975 + }, + { + "epoch": 171.38, + "learning_rate": 2.4171768095066618e-05, + "loss": 0.1972, + "step": 212000 + }, + { + "epoch": 171.4, + "learning_rate": 2.4115502340655383e-05, + "loss": 0.208, + "step": 212025 + }, + { + "epoch": 171.42, + "learning_rate": 2.4059236586244147e-05, + "loss": 0.1966, + "step": 212050 + }, + { + "epoch": 171.44, + "learning_rate": 2.4002970831832916e-05, + "loss": 0.165, + "step": 212075 + }, + { + "epoch": 171.46, + "learning_rate": 2.394670507742168e-05, + "loss": 0.2033, + "step": 212100 + }, + { + "epoch": 171.48, + "learning_rate": 2.3890439323010445e-05, + "loss": 0.164, + "step": 212125 + }, + { + "epoch": 171.5, + "learning_rate": 2.3834173568599207e-05, + "loss": 0.2168, + "step": 212150 + }, + { + "epoch": 171.52, + "learning_rate": 2.377790781418797e-05, + "loss": 0.2013, + "step": 212175 + }, + { + "epoch": 171.54, + "learning_rate": 2.3721642059776736e-05, + "loss": 0.1935, + "step": 212200 + }, + { + "epoch": 171.56, + "learning_rate": 2.36653763053655e-05, + "loss": 0.1854, + "step": 212225 + }, + { + "epoch": 171.58, + "learning_rate": 2.360911055095427e-05, + "loss": 0.2133, + "step": 212250 + }, + { + "epoch": 171.6, + "learning_rate": 2.3552844796543034e-05, + "loss": 0.1806, + "step": 212275 + }, + { + "epoch": 171.62, + "learning_rate": 2.34965790421318e-05, + "loss": 0.1823, + "step": 212300 + }, + { + "epoch": 171.65, + "learning_rate": 2.3440313287720564e-05, + "loss": 0.2023, + "step": 212325 + }, + { + "epoch": 171.67, + "learning_rate": 2.3384047533309325e-05, + "loss": 0.1978, + "step": 212350 + }, + { + "epoch": 171.69, + "learning_rate": 2.332778177889809e-05, + "loss": 0.1572, + "step": 212375 + }, + { + "epoch": 171.71, + "learning_rate": 2.3271516024486858e-05, + "loss": 0.2218, + "step": 212400 + }, + { + "epoch": 171.73, + "learning_rate": 2.3215250270075623e-05, + "loss": 0.1984, + "step": 212425 + }, + { + "epoch": 171.75, + "learning_rate": 2.3158984515664388e-05, + "loss": 0.2029, + "step": 212450 + }, + { + "epoch": 171.77, + "learning_rate": 2.3102718761253152e-05, + "loss": 0.1627, + "step": 212475 + }, + { + "epoch": 171.79, + "learning_rate": 2.3046453006841917e-05, + "loss": 0.1642, + "step": 212500 + }, + { + "epoch": 171.81, + "learning_rate": 2.299018725243068e-05, + "loss": 0.1891, + "step": 212525 + }, + { + "epoch": 171.83, + "learning_rate": 2.2933921498019443e-05, + "loss": 0.2037, + "step": 212550 + }, + { + "epoch": 171.85, + "learning_rate": 2.287765574360821e-05, + "loss": 0.1781, + "step": 212575 + }, + { + "epoch": 171.87, + "learning_rate": 2.2821389989196976e-05, + "loss": 0.1949, + "step": 212600 + }, + { + "epoch": 171.89, + "learning_rate": 2.276512423478574e-05, + "loss": 0.1819, + "step": 212625 + }, + { + "epoch": 171.91, + "learning_rate": 2.2708858480374506e-05, + "loss": 0.1855, + "step": 212650 + }, + { + "epoch": 171.93, + "learning_rate": 2.265259272596327e-05, + "loss": 0.1808, + "step": 212675 + }, + { + "epoch": 171.95, + "learning_rate": 2.2596326971552032e-05, + "loss": 0.1994, + "step": 212700 + }, + { + "epoch": 171.97, + "learning_rate": 2.25400612171408e-05, + "loss": 0.1876, + "step": 212725 + }, + { + "epoch": 171.99, + "learning_rate": 2.2483795462729565e-05, + "loss": 0.2074, + "step": 212750 + }, + { + "epoch": 172.01, + "learning_rate": 2.242752970831833e-05, + "loss": 0.1808, + "step": 212775 + }, + { + "epoch": 172.03, + "learning_rate": 2.2371263953907095e-05, + "loss": 0.1895, + "step": 212800 + }, + { + "epoch": 172.05, + "learning_rate": 2.231499819949586e-05, + "loss": 0.1993, + "step": 212825 + }, + { + "epoch": 172.07, + "learning_rate": 2.2258732445084624e-05, + "loss": 0.2055, + "step": 212850 + }, + { + "epoch": 172.09, + "learning_rate": 2.220246669067339e-05, + "loss": 0.2277, + "step": 212875 + }, + { + "epoch": 172.11, + "learning_rate": 2.2146200936262154e-05, + "loss": 0.2017, + "step": 212900 + }, + { + "epoch": 172.13, + "learning_rate": 2.208993518185092e-05, + "loss": 0.1825, + "step": 212925 + }, + { + "epoch": 172.15, + "learning_rate": 2.2033669427439684e-05, + "loss": 0.1839, + "step": 212950 + }, + { + "epoch": 172.17, + "learning_rate": 2.197740367302845e-05, + "loss": 0.1796, + "step": 212975 + }, + { + "epoch": 172.19, + "learning_rate": 2.1921137918617213e-05, + "loss": 0.1774, + "step": 213000 + }, + { + "epoch": 172.19, + "eval_cer": 0.07383756147141259, + "eval_loss": 0.4742075204849243, + "eval_runtime": 150.533, + "eval_samples_per_second": 27.854, + "eval_steps_per_second": 6.969, + "eval_wer": 0.3161500815660685, + "step": 213000 + }, + { + "epoch": 172.21, + "learning_rate": 2.1864872164205978e-05, + "loss": 0.1943, + "step": 213025 + }, + { + "epoch": 172.23, + "learning_rate": 2.1808606409794743e-05, + "loss": 0.1907, + "step": 213050 + }, + { + "epoch": 172.25, + "learning_rate": 2.1752340655383508e-05, + "loss": 0.1743, + "step": 213075 + }, + { + "epoch": 172.27, + "learning_rate": 2.1696074900972272e-05, + "loss": 0.1985, + "step": 213100 + }, + { + "epoch": 172.29, + "learning_rate": 2.1639809146561037e-05, + "loss": 0.2295, + "step": 213125 + }, + { + "epoch": 172.31, + "learning_rate": 2.1583543392149802e-05, + "loss": 0.1958, + "step": 213150 + }, + { + "epoch": 172.33, + "learning_rate": 2.1527277637738567e-05, + "loss": 0.1732, + "step": 213175 + }, + { + "epoch": 172.35, + "learning_rate": 2.1471011883327335e-05, + "loss": 0.2084, + "step": 213200 + }, + { + "epoch": 172.37, + "learning_rate": 2.1414746128916096e-05, + "loss": 0.1851, + "step": 213225 + }, + { + "epoch": 172.39, + "learning_rate": 2.135848037450486e-05, + "loss": 0.1872, + "step": 213250 + }, + { + "epoch": 172.41, + "learning_rate": 2.1302214620093626e-05, + "loss": 0.1918, + "step": 213275 + }, + { + "epoch": 172.43, + "learning_rate": 2.124594886568239e-05, + "loss": 0.1829, + "step": 213300 + }, + { + "epoch": 172.45, + "learning_rate": 2.1189683111271156e-05, + "loss": 0.1753, + "step": 213325 + }, + { + "epoch": 172.47, + "learning_rate": 2.1133417356859924e-05, + "loss": 0.1865, + "step": 213350 + }, + { + "epoch": 172.49, + "learning_rate": 2.107715160244869e-05, + "loss": 0.1732, + "step": 213375 + }, + { + "epoch": 172.51, + "learning_rate": 2.102088584803745e-05, + "loss": 0.1706, + "step": 213400 + }, + { + "epoch": 172.53, + "learning_rate": 2.0964620093626215e-05, + "loss": 0.1697, + "step": 213425 + }, + { + "epoch": 172.55, + "learning_rate": 2.090835433921498e-05, + "loss": 0.1971, + "step": 213450 + }, + { + "epoch": 172.57, + "learning_rate": 2.0852088584803744e-05, + "loss": 0.1733, + "step": 213475 + }, + { + "epoch": 172.59, + "learning_rate": 2.079582283039251e-05, + "loss": 0.1894, + "step": 213500 + }, + { + "epoch": 172.62, + "learning_rate": 2.0739557075981277e-05, + "loss": 0.1866, + "step": 213525 + }, + { + "epoch": 172.64, + "learning_rate": 2.0683291321570042e-05, + "loss": 0.1746, + "step": 213550 + }, + { + "epoch": 172.66, + "learning_rate": 2.0627025567158804e-05, + "loss": 0.1751, + "step": 213575 + }, + { + "epoch": 172.68, + "learning_rate": 2.057075981274757e-05, + "loss": 0.1906, + "step": 213600 + }, + { + "epoch": 172.7, + "learning_rate": 2.0514494058336333e-05, + "loss": 0.1656, + "step": 213625 + }, + { + "epoch": 172.72, + "learning_rate": 2.0458228303925098e-05, + "loss": 0.1831, + "step": 213650 + }, + { + "epoch": 172.74, + "learning_rate": 2.0401962549513866e-05, + "loss": 0.1708, + "step": 213675 + }, + { + "epoch": 172.76, + "learning_rate": 2.034569679510263e-05, + "loss": 0.1831, + "step": 213700 + }, + { + "epoch": 172.78, + "learning_rate": 2.0289431040691396e-05, + "loss": 0.1732, + "step": 213725 + }, + { + "epoch": 172.8, + "learning_rate": 2.023316528628016e-05, + "loss": 0.1691, + "step": 213750 + }, + { + "epoch": 172.82, + "learning_rate": 2.0176899531868922e-05, + "loss": 0.1903, + "step": 213775 + }, + { + "epoch": 172.84, + "learning_rate": 2.0120633777457687e-05, + "loss": 0.1739, + "step": 213800 + }, + { + "epoch": 172.86, + "learning_rate": 2.006436802304645e-05, + "loss": 0.1475, + "step": 213825 + }, + { + "epoch": 172.88, + "learning_rate": 2.000810226863522e-05, + "loss": 0.1844, + "step": 213850 + }, + { + "epoch": 172.9, + "learning_rate": 1.9951836514223985e-05, + "loss": 0.1972, + "step": 213875 + }, + { + "epoch": 172.92, + "learning_rate": 1.989557075981275e-05, + "loss": 0.1912, + "step": 213900 + }, + { + "epoch": 172.94, + "learning_rate": 1.9839305005401514e-05, + "loss": 0.1762, + "step": 213925 + }, + { + "epoch": 172.96, + "learning_rate": 1.9783039250990276e-05, + "loss": 0.2016, + "step": 213950 + }, + { + "epoch": 172.98, + "learning_rate": 1.972677349657904e-05, + "loss": 0.1875, + "step": 213975 + }, + { + "epoch": 173.0, + "learning_rate": 1.967050774216781e-05, + "loss": 0.1957, + "step": 214000 + }, + { + "epoch": 173.02, + "learning_rate": 1.9614241987756573e-05, + "loss": 0.2098, + "step": 214025 + }, + { + "epoch": 173.04, + "learning_rate": 1.9557976233345338e-05, + "loss": 0.2055, + "step": 214050 + }, + { + "epoch": 173.06, + "learning_rate": 1.9501710478934103e-05, + "loss": 0.2312, + "step": 214075 + }, + { + "epoch": 173.08, + "learning_rate": 1.9445444724522868e-05, + "loss": 0.1761, + "step": 214100 + }, + { + "epoch": 173.1, + "learning_rate": 1.938917897011163e-05, + "loss": 0.2061, + "step": 214125 + }, + { + "epoch": 173.12, + "learning_rate": 1.9332913215700394e-05, + "loss": 0.1726, + "step": 214150 + }, + { + "epoch": 173.14, + "learning_rate": 1.9276647461289162e-05, + "loss": 0.1935, + "step": 214175 + }, + { + "epoch": 173.16, + "learning_rate": 1.9222632337054375e-05, + "loss": 0.1552, + "step": 214200 + }, + { + "epoch": 173.18, + "learning_rate": 1.916636658264314e-05, + "loss": 0.2189, + "step": 214225 + }, + { + "epoch": 173.2, + "learning_rate": 1.9110100828231904e-05, + "loss": 0.1777, + "step": 214250 + }, + { + "epoch": 173.22, + "learning_rate": 1.905383507382067e-05, + "loss": 0.1906, + "step": 214275 + }, + { + "epoch": 173.24, + "learning_rate": 1.8997569319409437e-05, + "loss": 0.1802, + "step": 214300 + }, + { + "epoch": 173.26, + "learning_rate": 1.8941303564998202e-05, + "loss": 0.2032, + "step": 214325 + }, + { + "epoch": 173.28, + "learning_rate": 1.8885037810586967e-05, + "loss": 0.1831, + "step": 214350 + }, + { + "epoch": 173.3, + "learning_rate": 1.882877205617573e-05, + "loss": 0.2136, + "step": 214375 + }, + { + "epoch": 173.32, + "learning_rate": 1.8772506301764493e-05, + "loss": 0.1647, + "step": 214400 + }, + { + "epoch": 173.34, + "learning_rate": 1.8716240547353258e-05, + "loss": 0.188, + "step": 214425 + }, + { + "epoch": 173.36, + "learning_rate": 1.8659974792942023e-05, + "loss": 0.1585, + "step": 214450 + }, + { + "epoch": 173.38, + "learning_rate": 1.860370903853079e-05, + "loss": 0.1829, + "step": 214475 + }, + { + "epoch": 173.4, + "learning_rate": 1.8547443284119556e-05, + "loss": 0.1478, + "step": 214500 + }, + { + "epoch": 173.42, + "learning_rate": 1.849117752970832e-05, + "loss": 0.2183, + "step": 214525 + }, + { + "epoch": 173.44, + "learning_rate": 1.8434911775297082e-05, + "loss": 0.1815, + "step": 214550 + }, + { + "epoch": 173.46, + "learning_rate": 1.8378646020885847e-05, + "loss": 0.2044, + "step": 214575 + }, + { + "epoch": 173.48, + "learning_rate": 1.832238026647461e-05, + "loss": 0.1693, + "step": 214600 + }, + { + "epoch": 173.5, + "learning_rate": 1.826611451206338e-05, + "loss": 0.1877, + "step": 214625 + }, + { + "epoch": 173.52, + "learning_rate": 1.8209848757652144e-05, + "loss": 0.1964, + "step": 214650 + }, + { + "epoch": 173.54, + "learning_rate": 1.815358300324091e-05, + "loss": 0.2049, + "step": 214675 + }, + { + "epoch": 173.57, + "learning_rate": 1.8097317248829674e-05, + "loss": 0.179, + "step": 214700 + }, + { + "epoch": 173.59, + "learning_rate": 1.8041051494418436e-05, + "loss": 0.1841, + "step": 214725 + }, + { + "epoch": 173.61, + "learning_rate": 1.79847857400072e-05, + "loss": 0.1635, + "step": 214750 + }, + { + "epoch": 173.63, + "learning_rate": 1.7928519985595965e-05, + "loss": 0.1895, + "step": 214775 + }, + { + "epoch": 173.65, + "learning_rate": 1.7872254231184733e-05, + "loss": 0.1776, + "step": 214800 + }, + { + "epoch": 173.67, + "learning_rate": 1.7815988476773498e-05, + "loss": 0.1817, + "step": 214825 + }, + { + "epoch": 173.69, + "learning_rate": 1.7759722722362263e-05, + "loss": 0.1557, + "step": 214850 + }, + { + "epoch": 173.71, + "learning_rate": 1.7703456967951028e-05, + "loss": 0.207, + "step": 214875 + }, + { + "epoch": 173.73, + "learning_rate": 1.764719121353979e-05, + "loss": 0.1831, + "step": 214900 + }, + { + "epoch": 173.75, + "learning_rate": 1.7590925459128554e-05, + "loss": 0.2335, + "step": 214925 + }, + { + "epoch": 173.77, + "learning_rate": 1.7534659704717322e-05, + "loss": 0.2001, + "step": 214950 + }, + { + "epoch": 173.79, + "learning_rate": 1.7478393950306087e-05, + "loss": 0.2077, + "step": 214975 + }, + { + "epoch": 173.81, + "learning_rate": 1.742212819589485e-05, + "loss": 0.1638, + "step": 215000 + }, + { + "epoch": 173.83, + "learning_rate": 1.7365862441483616e-05, + "loss": 0.2241, + "step": 215025 + }, + { + "epoch": 173.85, + "learning_rate": 1.730959668707238e-05, + "loss": 0.1736, + "step": 215050 + }, + { + "epoch": 173.87, + "learning_rate": 1.7253330932661143e-05, + "loss": 0.2111, + "step": 215075 + }, + { + "epoch": 173.89, + "learning_rate": 1.719706517824991e-05, + "loss": 0.1622, + "step": 215100 + }, + { + "epoch": 173.91, + "learning_rate": 1.7140799423838676e-05, + "loss": 0.1935, + "step": 215125 + }, + { + "epoch": 173.93, + "learning_rate": 1.708453366942744e-05, + "loss": 0.1882, + "step": 215150 + }, + { + "epoch": 173.95, + "learning_rate": 1.7028267915016205e-05, + "loss": 0.2091, + "step": 215175 + }, + { + "epoch": 173.97, + "learning_rate": 1.697200216060497e-05, + "loss": 0.1914, + "step": 215200 + }, + { + "epoch": 173.99, + "learning_rate": 1.6915736406193735e-05, + "loss": 0.1978, + "step": 215225 + }, + { + "epoch": 174.01, + "learning_rate": 1.6859470651782496e-05, + "loss": 0.1971, + "step": 215250 + }, + { + "epoch": 174.03, + "learning_rate": 1.6803204897371264e-05, + "loss": 0.19, + "step": 215275 + }, + { + "epoch": 174.05, + "learning_rate": 1.674693914296003e-05, + "loss": 0.1619, + "step": 215300 + }, + { + "epoch": 174.07, + "learning_rate": 1.6690673388548794e-05, + "loss": 0.1741, + "step": 215325 + }, + { + "epoch": 174.09, + "learning_rate": 1.663440763413756e-05, + "loss": 0.1616, + "step": 215350 + }, + { + "epoch": 174.11, + "learning_rate": 1.6578141879726324e-05, + "loss": 0.2239, + "step": 215375 + }, + { + "epoch": 174.13, + "learning_rate": 1.652187612531509e-05, + "loss": 0.1858, + "step": 215400 + }, + { + "epoch": 174.15, + "learning_rate": 1.6465610370903853e-05, + "loss": 0.1955, + "step": 215425 + }, + { + "epoch": 174.17, + "learning_rate": 1.6409344616492618e-05, + "loss": 0.1749, + "step": 215450 + }, + { + "epoch": 174.19, + "learning_rate": 1.6353078862081383e-05, + "loss": 0.1855, + "step": 215475 + }, + { + "epoch": 174.21, + "learning_rate": 1.6296813107670148e-05, + "loss": 0.1706, + "step": 215500 + }, + { + "epoch": 174.23, + "learning_rate": 1.6240547353258912e-05, + "loss": 0.2086, + "step": 215525 + }, + { + "epoch": 174.25, + "learning_rate": 1.6184281598847677e-05, + "loss": 0.188, + "step": 215550 + }, + { + "epoch": 174.27, + "learning_rate": 1.6128015844436442e-05, + "loss": 0.1997, + "step": 215575 + }, + { + "epoch": 174.29, + "learning_rate": 1.607175009002521e-05, + "loss": 0.1771, + "step": 215600 + }, + { + "epoch": 174.31, + "learning_rate": 1.601548433561397e-05, + "loss": 0.1922, + "step": 215625 + }, + { + "epoch": 174.33, + "learning_rate": 1.5959218581202736e-05, + "loss": 0.1818, + "step": 215650 + }, + { + "epoch": 174.35, + "learning_rate": 1.590520345696795e-05, + "loss": 0.2173, + "step": 215675 + }, + { + "epoch": 174.37, + "learning_rate": 1.5848937702556714e-05, + "loss": 0.1975, + "step": 215700 + }, + { + "epoch": 174.39, + "learning_rate": 1.579267194814548e-05, + "loss": 0.1748, + "step": 215725 + }, + { + "epoch": 174.41, + "learning_rate": 1.5736406193734247e-05, + "loss": 0.1873, + "step": 215750 + }, + { + "epoch": 174.43, + "learning_rate": 1.568014043932301e-05, + "loss": 0.1777, + "step": 215775 + }, + { + "epoch": 174.45, + "learning_rate": 1.5623874684911776e-05, + "loss": 0.2143, + "step": 215800 + }, + { + "epoch": 174.47, + "learning_rate": 1.556760893050054e-05, + "loss": 0.1641, + "step": 215825 + }, + { + "epoch": 174.49, + "learning_rate": 1.5511343176089306e-05, + "loss": 0.1788, + "step": 215850 + }, + { + "epoch": 174.51, + "learning_rate": 1.545507742167807e-05, + "loss": 0.1697, + "step": 215875 + }, + { + "epoch": 174.54, + "learning_rate": 1.5398811667266836e-05, + "loss": 0.1693, + "step": 215900 + }, + { + "epoch": 174.56, + "learning_rate": 1.53425459128556e-05, + "loss": 0.1963, + "step": 215925 + }, + { + "epoch": 174.58, + "learning_rate": 1.5286280158444365e-05, + "loss": 0.2001, + "step": 215950 + }, + { + "epoch": 174.6, + "learning_rate": 1.523001440403313e-05, + "loss": 0.1966, + "step": 215975 + }, + { + "epoch": 174.62, + "learning_rate": 1.5173748649621893e-05, + "loss": 0.1819, + "step": 216000 + }, + { + "epoch": 174.62, + "eval_cer": 0.07368869542005893, + "eval_loss": 0.4719657897949219, + "eval_runtime": 150.9063, + "eval_samples_per_second": 27.785, + "eval_steps_per_second": 6.951, + "eval_wer": 0.31491027732463295, + "step": 216000 + }, + { + "epoch": 174.64, + "learning_rate": 1.511748289521066e-05, + "loss": 0.1881, + "step": 216025 + }, + { + "epoch": 174.66, + "learning_rate": 1.5061217140799424e-05, + "loss": 0.1883, + "step": 216050 + }, + { + "epoch": 174.68, + "learning_rate": 1.500495138638819e-05, + "loss": 0.1639, + "step": 216075 + }, + { + "epoch": 174.7, + "learning_rate": 1.4950936262153404e-05, + "loss": 0.2041, + "step": 216100 + }, + { + "epoch": 174.72, + "learning_rate": 1.4894670507742168e-05, + "loss": 0.1736, + "step": 216125 + }, + { + "epoch": 174.74, + "learning_rate": 1.4838404753330931e-05, + "loss": 0.2013, + "step": 216150 + }, + { + "epoch": 174.76, + "learning_rate": 1.4782138998919698e-05, + "loss": 0.1711, + "step": 216175 + }, + { + "epoch": 174.78, + "learning_rate": 1.4725873244508463e-05, + "loss": 0.1801, + "step": 216200 + }, + { + "epoch": 174.8, + "learning_rate": 1.4669607490097227e-05, + "loss": 0.1786, + "step": 216225 + }, + { + "epoch": 174.82, + "learning_rate": 1.4613341735685992e-05, + "loss": 0.1562, + "step": 216250 + }, + { + "epoch": 174.84, + "learning_rate": 1.4557075981274757e-05, + "loss": 0.1903, + "step": 216275 + }, + { + "epoch": 174.86, + "learning_rate": 1.4500810226863522e-05, + "loss": 0.2086, + "step": 216300 + }, + { + "epoch": 174.88, + "learning_rate": 1.4444544472452288e-05, + "loss": 0.1597, + "step": 216325 + }, + { + "epoch": 174.9, + "learning_rate": 1.4388278718041051e-05, + "loss": 0.1638, + "step": 216350 + }, + { + "epoch": 174.92, + "learning_rate": 1.4332012963629816e-05, + "loss": 0.1867, + "step": 216375 + }, + { + "epoch": 174.94, + "learning_rate": 1.4275747209218583e-05, + "loss": 0.1839, + "step": 216400 + }, + { + "epoch": 174.96, + "learning_rate": 1.4219481454807346e-05, + "loss": 0.2063, + "step": 216425 + }, + { + "epoch": 174.98, + "learning_rate": 1.416321570039611e-05, + "loss": 0.1848, + "step": 216450 + }, + { + "epoch": 175.0, + "learning_rate": 1.4106949945984877e-05, + "loss": 0.2096, + "step": 216475 + }, + { + "epoch": 175.02, + "learning_rate": 1.4050684191573642e-05, + "loss": 0.2003, + "step": 216500 + }, + { + "epoch": 175.04, + "learning_rate": 1.3994418437162405e-05, + "loss": 0.1422, + "step": 216525 + }, + { + "epoch": 175.06, + "learning_rate": 1.393815268275117e-05, + "loss": 0.1863, + "step": 216550 + }, + { + "epoch": 175.08, + "learning_rate": 1.3881886928339936e-05, + "loss": 0.1946, + "step": 216575 + }, + { + "epoch": 175.1, + "learning_rate": 1.38256211739287e-05, + "loss": 0.1949, + "step": 216600 + }, + { + "epoch": 175.12, + "learning_rate": 1.3769355419517464e-05, + "loss": 0.1733, + "step": 216625 + }, + { + "epoch": 175.14, + "learning_rate": 1.371308966510623e-05, + "loss": 0.197, + "step": 216650 + }, + { + "epoch": 175.16, + "learning_rate": 1.3656823910694996e-05, + "loss": 0.1728, + "step": 216675 + }, + { + "epoch": 175.18, + "learning_rate": 1.3600558156283759e-05, + "loss": 0.2056, + "step": 216700 + }, + { + "epoch": 175.2, + "learning_rate": 1.3544292401872525e-05, + "loss": 0.1502, + "step": 216725 + }, + { + "epoch": 175.22, + "learning_rate": 1.348802664746129e-05, + "loss": 0.1941, + "step": 216750 + }, + { + "epoch": 175.24, + "learning_rate": 1.3431760893050053e-05, + "loss": 0.1666, + "step": 216775 + }, + { + "epoch": 175.26, + "learning_rate": 1.337549513863882e-05, + "loss": 0.2049, + "step": 216800 + }, + { + "epoch": 175.28, + "learning_rate": 1.3319229384227584e-05, + "loss": 0.172, + "step": 216825 + }, + { + "epoch": 175.3, + "learning_rate": 1.326296362981635e-05, + "loss": 0.1989, + "step": 216850 + }, + { + "epoch": 175.32, + "learning_rate": 1.3206697875405114e-05, + "loss": 0.1849, + "step": 216875 + }, + { + "epoch": 175.34, + "learning_rate": 1.3150432120993879e-05, + "loss": 0.1806, + "step": 216900 + }, + { + "epoch": 175.36, + "learning_rate": 1.3094166366582644e-05, + "loss": 0.196, + "step": 216925 + }, + { + "epoch": 175.38, + "learning_rate": 1.3037900612171407e-05, + "loss": 0.2048, + "step": 216950 + }, + { + "epoch": 175.4, + "learning_rate": 1.2981634857760173e-05, + "loss": 0.1698, + "step": 216975 + }, + { + "epoch": 175.42, + "learning_rate": 1.2925369103348938e-05, + "loss": 0.203, + "step": 217000 + }, + { + "epoch": 175.44, + "learning_rate": 1.2869103348937703e-05, + "loss": 0.1793, + "step": 217025 + }, + { + "epoch": 175.46, + "learning_rate": 1.2812837594526468e-05, + "loss": 0.1805, + "step": 217050 + }, + { + "epoch": 175.49, + "learning_rate": 1.2756571840115232e-05, + "loss": 0.1815, + "step": 217075 + }, + { + "epoch": 175.51, + "learning_rate": 1.2700306085703997e-05, + "loss": 0.1887, + "step": 217100 + }, + { + "epoch": 175.53, + "learning_rate": 1.2644040331292764e-05, + "loss": 0.1623, + "step": 217125 + }, + { + "epoch": 175.55, + "learning_rate": 1.2587774576881527e-05, + "loss": 0.1942, + "step": 217150 + }, + { + "epoch": 175.57, + "learning_rate": 1.2531508822470292e-05, + "loss": 0.182, + "step": 217175 + }, + { + "epoch": 175.59, + "learning_rate": 1.2475243068059058e-05, + "loss": 0.1871, + "step": 217200 + }, + { + "epoch": 175.61, + "learning_rate": 1.2418977313647821e-05, + "loss": 0.1582, + "step": 217225 + }, + { + "epoch": 175.63, + "learning_rate": 1.2362711559236586e-05, + "loss": 0.2343, + "step": 217250 + }, + { + "epoch": 175.65, + "learning_rate": 1.2306445804825352e-05, + "loss": 0.1563, + "step": 217275 + }, + { + "epoch": 175.67, + "learning_rate": 1.2250180050414117e-05, + "loss": 0.1861, + "step": 217300 + }, + { + "epoch": 175.69, + "learning_rate": 1.219391429600288e-05, + "loss": 0.1569, + "step": 217325 + }, + { + "epoch": 175.71, + "learning_rate": 1.2137648541591645e-05, + "loss": 0.1992, + "step": 217350 + }, + { + "epoch": 175.73, + "learning_rate": 1.2081382787180412e-05, + "loss": 0.1648, + "step": 217375 + }, + { + "epoch": 175.75, + "learning_rate": 1.2025117032769175e-05, + "loss": 0.2176, + "step": 217400 + }, + { + "epoch": 175.77, + "learning_rate": 1.196885127835794e-05, + "loss": 0.1642, + "step": 217425 + }, + { + "epoch": 175.79, + "learning_rate": 1.1912585523946706e-05, + "loss": 0.1833, + "step": 217450 + }, + { + "epoch": 175.81, + "learning_rate": 1.1856319769535471e-05, + "loss": 0.1236, + "step": 217475 + }, + { + "epoch": 175.83, + "learning_rate": 1.1800054015124234e-05, + "loss": 0.2161, + "step": 217500 + }, + { + "epoch": 175.85, + "learning_rate": 1.1743788260713e-05, + "loss": 0.1724, + "step": 217525 + }, + { + "epoch": 175.87, + "learning_rate": 1.1687522506301765e-05, + "loss": 0.2116, + "step": 217550 + }, + { + "epoch": 175.89, + "learning_rate": 1.1631256751890528e-05, + "loss": 0.1617, + "step": 217575 + }, + { + "epoch": 175.91, + "learning_rate": 1.1574990997479295e-05, + "loss": 0.2011, + "step": 217600 + }, + { + "epoch": 175.93, + "learning_rate": 1.151872524306806e-05, + "loss": 0.1779, + "step": 217625 + }, + { + "epoch": 175.95, + "learning_rate": 1.1462459488656824e-05, + "loss": 0.2031, + "step": 217650 + }, + { + "epoch": 175.97, + "learning_rate": 1.140619373424559e-05, + "loss": 0.1873, + "step": 217675 + }, + { + "epoch": 175.99, + "learning_rate": 1.1349927979834354e-05, + "loss": 0.2092, + "step": 217700 + }, + { + "epoch": 176.01, + "learning_rate": 1.1293662225423119e-05, + "loss": 0.1807, + "step": 217725 + }, + { + "epoch": 176.03, + "learning_rate": 1.1237396471011882e-05, + "loss": 0.2006, + "step": 217750 + }, + { + "epoch": 176.05, + "learning_rate": 1.1181130716600648e-05, + "loss": 0.1731, + "step": 217775 + }, + { + "epoch": 176.07, + "learning_rate": 1.1124864962189413e-05, + "loss": 0.181, + "step": 217800 + }, + { + "epoch": 176.09, + "learning_rate": 1.1068599207778178e-05, + "loss": 0.1835, + "step": 217825 + }, + { + "epoch": 176.11, + "learning_rate": 1.1012333453366943e-05, + "loss": 0.1713, + "step": 217850 + }, + { + "epoch": 176.13, + "learning_rate": 1.0956067698955708e-05, + "loss": 0.1701, + "step": 217875 + }, + { + "epoch": 176.15, + "learning_rate": 1.0899801944544472e-05, + "loss": 0.1906, + "step": 217900 + }, + { + "epoch": 176.17, + "learning_rate": 1.0843536190133239e-05, + "loss": 0.1964, + "step": 217925 + }, + { + "epoch": 176.19, + "learning_rate": 1.0787270435722002e-05, + "loss": 0.2402, + "step": 217950 + }, + { + "epoch": 176.21, + "learning_rate": 1.0731004681310767e-05, + "loss": 0.2083, + "step": 217975 + }, + { + "epoch": 176.23, + "learning_rate": 1.0674738926899533e-05, + "loss": 0.188, + "step": 218000 + }, + { + "epoch": 176.25, + "learning_rate": 1.0618473172488296e-05, + "loss": 0.2039, + "step": 218025 + }, + { + "epoch": 176.27, + "learning_rate": 1.0562207418077061e-05, + "loss": 0.1994, + "step": 218050 + }, + { + "epoch": 176.29, + "learning_rate": 1.0505941663665828e-05, + "loss": 0.2071, + "step": 218075 + }, + { + "epoch": 176.31, + "learning_rate": 1.0449675909254593e-05, + "loss": 0.1852, + "step": 218100 + }, + { + "epoch": 176.33, + "learning_rate": 1.0393410154843356e-05, + "loss": 0.1698, + "step": 218125 + }, + { + "epoch": 176.35, + "learning_rate": 1.033714440043212e-05, + "loss": 0.1701, + "step": 218150 + }, + { + "epoch": 176.37, + "learning_rate": 1.0280878646020887e-05, + "loss": 0.1796, + "step": 218175 + }, + { + "epoch": 176.39, + "learning_rate": 1.022461289160965e-05, + "loss": 0.1857, + "step": 218200 + }, + { + "epoch": 176.41, + "learning_rate": 1.0168347137198415e-05, + "loss": 0.1589, + "step": 218225 + }, + { + "epoch": 176.43, + "learning_rate": 1.0112081382787181e-05, + "loss": 0.2114, + "step": 218250 + }, + { + "epoch": 176.46, + "learning_rate": 1.0055815628375946e-05, + "loss": 0.1822, + "step": 218275 + }, + { + "epoch": 176.48, + "learning_rate": 9.99954987396471e-06, + "loss": 0.1705, + "step": 218300 + }, + { + "epoch": 176.5, + "learning_rate": 9.943284119553476e-06, + "loss": 0.1892, + "step": 218325 + }, + { + "epoch": 176.52, + "learning_rate": 9.88701836514224e-06, + "loss": 0.1876, + "step": 218350 + }, + { + "epoch": 176.54, + "learning_rate": 9.830752610731004e-06, + "loss": 0.1808, + "step": 218375 + }, + { + "epoch": 176.56, + "learning_rate": 9.77448685631977e-06, + "loss": 0.1856, + "step": 218400 + }, + { + "epoch": 176.58, + "learning_rate": 9.718221101908535e-06, + "loss": 0.1873, + "step": 218425 + }, + { + "epoch": 176.6, + "learning_rate": 9.6619553474973e-06, + "loss": 0.2164, + "step": 218450 + }, + { + "epoch": 176.62, + "learning_rate": 9.605689593086065e-06, + "loss": 0.1846, + "step": 218475 + }, + { + "epoch": 176.64, + "learning_rate": 9.54942383867483e-06, + "loss": 0.2001, + "step": 218500 + }, + { + "epoch": 176.66, + "learning_rate": 9.493158084263594e-06, + "loss": 0.1865, + "step": 218525 + }, + { + "epoch": 176.68, + "learning_rate": 9.436892329852359e-06, + "loss": 0.1982, + "step": 218550 + }, + { + "epoch": 176.7, + "learning_rate": 9.380626575441124e-06, + "loss": 0.1883, + "step": 218575 + }, + { + "epoch": 176.72, + "learning_rate": 9.324360821029889e-06, + "loss": 0.1713, + "step": 218600 + }, + { + "epoch": 176.74, + "learning_rate": 9.268095066618653e-06, + "loss": 0.187, + "step": 218625 + }, + { + "epoch": 176.76, + "learning_rate": 9.211829312207418e-06, + "loss": 0.2027, + "step": 218650 + }, + { + "epoch": 176.78, + "learning_rate": 9.155563557796183e-06, + "loss": 0.2009, + "step": 218675 + }, + { + "epoch": 176.8, + "learning_rate": 9.099297803384948e-06, + "loss": 0.1972, + "step": 218700 + }, + { + "epoch": 176.82, + "learning_rate": 9.043032048973714e-06, + "loss": 0.2041, + "step": 218725 + }, + { + "epoch": 176.84, + "learning_rate": 8.986766294562477e-06, + "loss": 0.1886, + "step": 218750 + }, + { + "epoch": 176.86, + "learning_rate": 8.930500540151242e-06, + "loss": 0.1983, + "step": 218775 + }, + { + "epoch": 176.88, + "learning_rate": 8.874234785740009e-06, + "loss": 0.1995, + "step": 218800 + }, + { + "epoch": 176.9, + "learning_rate": 8.817969031328772e-06, + "loss": 0.166, + "step": 218825 + }, + { + "epoch": 176.92, + "learning_rate": 8.761703276917537e-06, + "loss": 0.1773, + "step": 218850 + }, + { + "epoch": 176.94, + "learning_rate": 8.705437522506303e-06, + "loss": 0.1902, + "step": 218875 + }, + { + "epoch": 176.96, + "learning_rate": 8.649171768095068e-06, + "loss": 0.1644, + "step": 218900 + }, + { + "epoch": 176.98, + "learning_rate": 8.592906013683831e-06, + "loss": 0.192, + "step": 218925 + }, + { + "epoch": 177.0, + "learning_rate": 8.536640259272596e-06, + "loss": 0.1746, + "step": 218950 + }, + { + "epoch": 177.02, + "learning_rate": 8.480374504861362e-06, + "loss": 0.1917, + "step": 218975 + }, + { + "epoch": 177.04, + "learning_rate": 8.424108750450125e-06, + "loss": 0.1746, + "step": 219000 + }, + { + "epoch": 177.04, + "eval_cer": 0.0737554284775623, + "eval_loss": 0.4736139476299286, + "eval_runtime": 150.3634, + "eval_samples_per_second": 27.886, + "eval_steps_per_second": 6.976, + "eval_wer": 0.3153344208809135, + "step": 219000 + }, + { + "epoch": 177.06, + "learning_rate": 8.36784299603889e-06, + "loss": 0.1999, + "step": 219025 + }, + { + "epoch": 177.08, + "learning_rate": 8.311577241627657e-06, + "loss": 0.1703, + "step": 219050 + }, + { + "epoch": 177.1, + "learning_rate": 8.255311487216421e-06, + "loss": 0.2036, + "step": 219075 + }, + { + "epoch": 177.12, + "learning_rate": 8.199045732805185e-06, + "loss": 0.1426, + "step": 219100 + }, + { + "epoch": 177.14, + "learning_rate": 8.142779978393951e-06, + "loss": 0.1903, + "step": 219125 + }, + { + "epoch": 177.16, + "learning_rate": 8.086514223982716e-06, + "loss": 0.1764, + "step": 219150 + }, + { + "epoch": 177.18, + "learning_rate": 8.030248469571479e-06, + "loss": 0.2088, + "step": 219175 + }, + { + "epoch": 177.2, + "learning_rate": 7.973982715160245e-06, + "loss": 0.1767, + "step": 219200 + }, + { + "epoch": 177.22, + "learning_rate": 7.91771696074901e-06, + "loss": 0.2087, + "step": 219225 + }, + { + "epoch": 177.24, + "learning_rate": 7.861451206337775e-06, + "loss": 0.1539, + "step": 219250 + }, + { + "epoch": 177.26, + "learning_rate": 7.80518545192654e-06, + "loss": 0.2094, + "step": 219275 + }, + { + "epoch": 177.28, + "learning_rate": 7.748919697515305e-06, + "loss": 0.1763, + "step": 219300 + }, + { + "epoch": 177.3, + "learning_rate": 7.69265394310407e-06, + "loss": 0.1884, + "step": 219325 + }, + { + "epoch": 177.32, + "learning_rate": 7.636388188692834e-06, + "loss": 0.1701, + "step": 219350 + }, + { + "epoch": 177.34, + "learning_rate": 7.580122434281599e-06, + "loss": 0.1838, + "step": 219375 + }, + { + "epoch": 177.36, + "learning_rate": 7.523856679870364e-06, + "loss": 0.1782, + "step": 219400 + }, + { + "epoch": 177.38, + "learning_rate": 7.467590925459129e-06, + "loss": 0.2152, + "step": 219425 + }, + { + "epoch": 177.41, + "learning_rate": 7.411325171047893e-06, + "loss": 0.1505, + "step": 219450 + }, + { + "epoch": 177.43, + "learning_rate": 7.355059416636658e-06, + "loss": 0.1944, + "step": 219475 + }, + { + "epoch": 177.45, + "learning_rate": 7.298793662225424e-06, + "loss": 0.1892, + "step": 219500 + }, + { + "epoch": 177.47, + "learning_rate": 7.242527907814188e-06, + "loss": 0.1961, + "step": 219525 + }, + { + "epoch": 177.49, + "learning_rate": 7.1862621534029534e-06, + "loss": 0.168, + "step": 219550 + }, + { + "epoch": 177.51, + "learning_rate": 7.129996398991718e-06, + "loss": 0.1958, + "step": 219575 + }, + { + "epoch": 177.53, + "learning_rate": 7.073730644580482e-06, + "loss": 0.171, + "step": 219600 + }, + { + "epoch": 177.55, + "learning_rate": 7.017464890169248e-06, + "loss": 0.1745, + "step": 219625 + }, + { + "epoch": 177.57, + "learning_rate": 6.961199135758012e-06, + "loss": 0.1488, + "step": 219650 + }, + { + "epoch": 177.59, + "learning_rate": 6.9049333813467774e-06, + "loss": 0.2208, + "step": 219675 + }, + { + "epoch": 177.61, + "learning_rate": 6.848667626935542e-06, + "loss": 0.1821, + "step": 219700 + }, + { + "epoch": 177.63, + "learning_rate": 6.792401872524307e-06, + "loss": 0.2024, + "step": 219725 + }, + { + "epoch": 177.65, + "learning_rate": 6.736136118113072e-06, + "loss": 0.1593, + "step": 219750 + }, + { + "epoch": 177.67, + "learning_rate": 6.679870363701837e-06, + "loss": 0.2056, + "step": 219775 + }, + { + "epoch": 177.69, + "learning_rate": 6.623604609290601e-06, + "loss": 0.2001, + "step": 219800 + }, + { + "epoch": 177.71, + "learning_rate": 6.567338854879366e-06, + "loss": 0.1689, + "step": 219825 + }, + { + "epoch": 177.73, + "learning_rate": 6.511073100468131e-06, + "loss": 0.175, + "step": 219850 }, { - "epoch": 15.52, - "learning_rate": 0.00024952428945777057, - "loss": 0.2007, - "step": 17200 + "epoch": 177.75, + "learning_rate": 6.454807346056896e-06, + "loss": 0.1894, + "step": 219875 }, { - "epoch": 15.52, - "eval_loss": 0.1601659506559372, - "eval_runtime": 202.199, - "eval_samples_per_second": 19.57, - "eval_steps_per_second": 2.448, - "eval_wer": 0.20924055499248592, - "step": 17200 + "epoch": 177.77, + "learning_rate": 6.3985415916456615e-06, + "loss": 0.1865, + "step": 219900 }, { - "epoch": 15.88, - "learning_rate": 0.0002483178794597863, - "loss": 0.2042, - "step": 17600 + "epoch": 177.79, + "learning_rate": 6.342275837234425e-06, + "loss": 0.1763, + "step": 219925 }, { - "epoch": 15.88, - "eval_loss": 0.15520912408828735, - "eval_runtime": 202.5397, - "eval_samples_per_second": 19.537, - "eval_steps_per_second": 2.444, - "eval_wer": 0.1952958445461853, - "step": 17600 + "epoch": 177.81, + "learning_rate": 6.286010082823191e-06, + "loss": 0.1881, + "step": 219950 }, { - "epoch": 16.25, - "learning_rate": 0.0002471084458778472, - "loss": 0.187, - "step": 18000 + "epoch": 177.83, + "learning_rate": 6.229744328411956e-06, + "loss": 0.1949, + "step": 219975 }, { - "epoch": 16.25, - "eval_loss": 0.16360661387443542, - "eval_runtime": 202.7459, - "eval_samples_per_second": 19.517, - "eval_steps_per_second": 2.441, - "eval_wer": 0.19442211582147975, - "step": 18000 + "epoch": 177.85, + "learning_rate": 6.17347857400072e-06, + "loss": 0.1876, + "step": 220000 }, { - "epoch": 16.61, - "learning_rate": 0.00024589901229590805, - "loss": 0.1931, - "step": 18400 + "epoch": 177.87, + "learning_rate": 6.1172128195894855e-06, + "loss": 0.2061, + "step": 220025 }, { - "epoch": 16.61, - "eval_loss": 0.1533084213733673, - "eval_runtime": 203.0495, - "eval_samples_per_second": 19.488, - "eval_steps_per_second": 2.438, - "eval_wer": 0.1916960822003984, - "step": 18400 + "epoch": 177.89, + "learning_rate": 6.060947065178249e-06, + "loss": 0.1828, + "step": 220050 }, { - "epoch": 16.97, - "learning_rate": 0.000244689578713969, - "loss": 0.1891, - "step": 18800 + "epoch": 177.91, + "learning_rate": 6.004681310767015e-06, + "loss": 0.2001, + "step": 220075 }, { - "epoch": 16.97, - "eval_loss": 0.16208086907863617, - "eval_runtime": 202.8946, - "eval_samples_per_second": 19.503, - "eval_steps_per_second": 2.44, - "eval_wer": 0.1907175060287282, - "step": 18800 + "epoch": 177.93, + "learning_rate": 5.94841555635578e-06, + "loss": 0.1594, + "step": 220100 }, { - "epoch": 17.33, - "learning_rate": 0.00024348014513202981, - "loss": 0.1863, - "step": 19200 + "epoch": 177.95, + "learning_rate": 5.892149801944545e-06, + "loss": 0.2194, + "step": 220125 }, { - "epoch": 17.33, - "eval_loss": 0.15993733704090118, - "eval_runtime": 202.8467, - "eval_samples_per_second": 19.507, - "eval_steps_per_second": 2.44, - "eval_wer": 0.1905777094327753, - "step": 19200 + "epoch": 177.97, + "learning_rate": 5.838134677709759e-06, + "loss": 0.195, + "step": 220150 }, { - "epoch": 17.69, - "learning_rate": 0.00024227071155009068, - "loss": 0.1863, - "step": 19600 + "epoch": 177.99, + "learning_rate": 5.781868923298524e-06, + "loss": 0.2, + "step": 220175 }, { - "epoch": 17.69, - "eval_loss": 0.15354220569133759, - "eval_runtime": 202.9873, - "eval_samples_per_second": 19.494, - "eval_steps_per_second": 2.439, - "eval_wer": 0.1911718449655751, - "step": 19600 + "epoch": 178.01, + "learning_rate": 5.7256031688872885e-06, + "loss": 0.1975, + "step": 220200 }, { - "epoch": 18.05, - "learning_rate": 0.00024106127796815155, - "loss": 0.1827, - "step": 20000 + "epoch": 178.03, + "learning_rate": 5.669337414476053e-06, + "loss": 0.1658, + "step": 220225 }, { - "epoch": 18.05, - "eval_loss": 0.1616511195898056, - "eval_runtime": 204.4003, - "eval_samples_per_second": 19.359, - "eval_steps_per_second": 2.422, - "eval_wer": 0.1880264215566351, - "step": 20000 + "epoch": 178.05, + "learning_rate": 5.613071660064818e-06, + "loss": 0.1948, + "step": 220250 }, { - "epoch": 18.41, - "learning_rate": 0.00023985184438621244, - "loss": 0.1822, - "step": 20400 + "epoch": 178.07, + "learning_rate": 5.556805905653583e-06, + "loss": 0.1941, + "step": 220275 }, { - "epoch": 18.41, - "eval_loss": 0.1649104207754135, - "eval_runtime": 206.8059, - "eval_samples_per_second": 19.134, - "eval_steps_per_second": 2.394, - "eval_wer": 0.18806137070562332, - "step": 20400 + "epoch": 178.09, + "learning_rate": 5.500540151242348e-06, + "loss": 0.1834, + "step": 220300 }, { - "epoch": 18.77, - "learning_rate": 0.0002386424108042733, - "loss": 0.1841, - "step": 20800 + "epoch": 178.11, + "learning_rate": 5.444274396831113e-06, + "loss": 0.1895, + "step": 220325 }, { - "epoch": 18.77, - "eval_loss": 0.16039612889289856, - "eval_runtime": 204.0742, - "eval_samples_per_second": 19.39, - "eval_steps_per_second": 2.426, - "eval_wer": 0.18942438751616397, - "step": 20800 + "epoch": 178.13, + "learning_rate": 5.388008642419877e-06, + "loss": 0.1861, + "step": 220350 }, { - "epoch": 19.13, - "learning_rate": 0.00023743297722233418, - "loss": 0.1817, - "step": 21200 + "epoch": 178.15, + "learning_rate": 5.331742888008643e-06, + "loss": 0.1968, + "step": 220375 }, { - "epoch": 19.13, - "eval_loss": 0.157293900847435, - "eval_runtime": 202.3143, - "eval_samples_per_second": 19.559, - "eval_steps_per_second": 2.447, - "eval_wer": 0.1810715409079789, - "step": 21200 + "epoch": 178.17, + "learning_rate": 5.275477133597407e-06, + "loss": 0.2075, + "step": 220400 }, { - "epoch": 19.49, - "learning_rate": 0.00023622959080830475, - "loss": 0.1756, - "step": 21600 + "epoch": 178.19, + "learning_rate": 5.2192113791861726e-06, + "loss": 0.2248, + "step": 220425 }, { - "epoch": 19.49, - "eval_loss": 0.16328036785125732, - "eval_runtime": 204.2348, - "eval_samples_per_second": 19.375, - "eval_steps_per_second": 2.424, - "eval_wer": 0.18809631985461153, - "step": 21600 + "epoch": 178.21, + "learning_rate": 5.162945624774937e-06, + "loss": 0.2085, + "step": 220450 }, { - "epoch": 19.86, - "learning_rate": 0.00023502015722636564, - "loss": 0.1804, - "step": 22000 + "epoch": 178.23, + "learning_rate": 5.106679870363701e-06, + "loss": 0.1733, + "step": 220475 }, { - "epoch": 19.86, - "eval_loss": 0.1585751324892044, - "eval_runtime": 204.9615, - "eval_samples_per_second": 19.306, - "eval_steps_per_second": 2.415, - "eval_wer": 0.18823611645056443, - "step": 22000 + "epoch": 178.25, + "learning_rate": 5.050414115952467e-06, + "loss": 0.1964, + "step": 220500 }, { - "epoch": 20.22, - "learning_rate": 0.0002338107236444265, - "loss": 0.1736, - "step": 22400 + "epoch": 178.27, + "learning_rate": 4.994148361541232e-06, + "loss": 0.1939, + "step": 220525 }, { - "epoch": 20.22, - "eval_loss": 0.15415678918361664, - "eval_runtime": 202.4017, - "eval_samples_per_second": 19.55, - "eval_steps_per_second": 2.446, - "eval_wer": 0.19033306538985775, - "step": 22400 + "epoch": 178.29, + "learning_rate": 4.9378826071299966e-06, + "loss": 0.176, + "step": 220550 }, { - "epoch": 20.58, - "learning_rate": 0.00023260129006248738, - "loss": 0.1704, - "step": 22800 + "epoch": 178.31, + "learning_rate": 4.881616852718761e-06, + "loss": 0.1646, + "step": 220575 }, { - "epoch": 20.58, - "eval_loss": 0.1622617095708847, - "eval_runtime": 206.2682, - "eval_samples_per_second": 19.184, - "eval_steps_per_second": 2.4, - "eval_wer": 0.1983014713591724, - "step": 22800 + "epoch": 178.33, + "learning_rate": 4.825351098307526e-06, + "loss": 0.1918, + "step": 220600 }, { - "epoch": 20.94, - "learning_rate": 0.00023139185648054828, - "loss": 0.1741, - "step": 23200 + "epoch": 178.35, + "learning_rate": 4.769085343896291e-06, + "loss": 0.1864, + "step": 220625 }, { - "epoch": 20.94, - "eval_loss": 0.15422095358371735, - "eval_runtime": 208.5273, - "eval_samples_per_second": 18.976, - "eval_steps_per_second": 2.374, - "eval_wer": 0.19568028518505573, - "step": 23200 + "epoch": 178.38, + "learning_rate": 4.712819589485056e-06, + "loss": 0.1978, + "step": 220650 }, { - "epoch": 21.3, - "learning_rate": 0.00023018242289860912, - "loss": 0.1642, - "step": 23600 + "epoch": 178.4, + "learning_rate": 4.6565538350738206e-06, + "loss": 0.1684, + "step": 220675 }, { - "epoch": 21.3, - "eval_loss": 0.155488982796669, - "eval_runtime": 206.3858, - "eval_samples_per_second": 19.173, - "eval_steps_per_second": 2.398, - "eval_wer": 0.19704330199559641, - "step": 23600 + "epoch": 178.42, + "learning_rate": 4.600288080662585e-06, + "loss": 0.1788, + "step": 220700 }, { - "epoch": 21.66, - "learning_rate": 0.00022897601290062486, - "loss": 0.1707, - "step": 24000 + "epoch": 178.44, + "learning_rate": 4.544022326251351e-06, + "loss": 0.199, + "step": 220725 }, { - "epoch": 21.66, - "eval_loss": 0.15275663137435913, - "eval_runtime": 206.6413, - "eval_samples_per_second": 19.149, - "eval_steps_per_second": 2.395, - "eval_wer": 0.18442665921084822, - "step": 24000 + "epoch": 178.46, + "learning_rate": 4.487756571840115e-06, + "loss": 0.1756, + "step": 220750 }, { - "epoch": 22.02, - "learning_rate": 0.00022776657931868573, - "loss": 0.1673, - "step": 24400 + "epoch": 178.48, + "learning_rate": 4.431490817428881e-06, + "loss": 0.1798, + "step": 220775 }, { - "epoch": 22.02, - "eval_loss": 0.15888585150241852, - "eval_runtime": 208.9307, - "eval_samples_per_second": 18.939, - "eval_steps_per_second": 2.369, - "eval_wer": 0.1858246251703771, - "step": 24400 + "epoch": 178.5, + "learning_rate": 4.3752250630176446e-06, + "loss": 0.2132, + "step": 220800 }, { - "epoch": 22.38, - "learning_rate": 0.0002265571457367466, - "loss": 0.1593, - "step": 24800 + "epoch": 178.52, + "learning_rate": 4.31895930860641e-06, + "loss": 0.222, + "step": 220825 }, { - "epoch": 22.38, - "eval_loss": 0.15319041907787323, - "eval_runtime": 206.6808, - "eval_samples_per_second": 19.145, - "eval_steps_per_second": 2.395, - "eval_wer": 0.17750672771118023, - "step": 24800 + "epoch": 178.54, + "learning_rate": 4.262693554195175e-06, + "loss": 0.1828, + "step": 220850 }, { - "epoch": 22.74, - "learning_rate": 0.0002253477121548075, - "loss": 0.1595, - "step": 25200 + "epoch": 178.56, + "learning_rate": 4.206427799783939e-06, + "loss": 0.1487, + "step": 220875 }, { - "epoch": 22.74, - "eval_loss": 0.15495522320270538, - "eval_runtime": 211.5152, - "eval_samples_per_second": 18.708, - "eval_steps_per_second": 2.34, - "eval_wer": 0.1755495753678398, - "step": 25200 + "epoch": 178.58, + "learning_rate": 4.150162045372705e-06, + "loss": 0.189, + "step": 220900 }, { - "epoch": 23.1, - "learning_rate": 0.00022413827857286836, - "loss": 0.1598, - "step": 25600 + "epoch": 178.6, + "learning_rate": 4.093896290961469e-06, + "loss": 0.181, + "step": 220925 }, { - "epoch": 23.1, - "eval_loss": 0.16047397255897522, - "eval_runtime": 213.237, - "eval_samples_per_second": 18.557, - "eval_steps_per_second": 2.321, - "eval_wer": 0.18624401495823575, - "step": 25600 + "epoch": 178.62, + "learning_rate": 4.037630536550234e-06, + "loss": 0.2038, + "step": 220950 }, { - "epoch": 23.47, - "learning_rate": 0.00022293186857488405, - "loss": 0.1573, - "step": 26000 + "epoch": 178.64, + "learning_rate": 3.981364782138999e-06, + "loss": 0.1737, + "step": 220975 }, { - "epoch": 23.47, - "eval_loss": 0.15952068567276, - "eval_runtime": 205.0554, - "eval_samples_per_second": 19.297, - "eval_steps_per_second": 2.414, - "eval_wer": 0.17796106664802713, - "step": 26000 + "epoch": 178.66, + "learning_rate": 3.925099027727764e-06, + "loss": 0.1809, + "step": 221000 }, { - "epoch": 23.83, - "learning_rate": 0.00022172243499294495, - "loss": 0.1596, - "step": 26400 + "epoch": 178.68, + "learning_rate": 3.868833273316529e-06, + "loss": 0.1816, + "step": 221025 }, { - "epoch": 23.83, - "eval_loss": 0.15038904547691345, - "eval_runtime": 203.7621, - "eval_samples_per_second": 19.42, - "eval_steps_per_second": 2.429, - "eval_wer": 0.17879984622374445, - "step": 26400 + "epoch": 178.7, + "learning_rate": 3.8125675189052934e-06, + "loss": 0.1417, + "step": 221050 }, { - "epoch": 24.19, - "learning_rate": 0.00022051300141100584, - "loss": 0.1589, - "step": 26800 + "epoch": 178.72, + "learning_rate": 3.7563017644940586e-06, + "loss": 0.189, + "step": 221075 }, { - "epoch": 24.19, - "eval_loss": 0.15989159047603607, - "eval_runtime": 202.8293, - "eval_samples_per_second": 19.509, - "eval_steps_per_second": 2.44, - "eval_wer": 0.17677279558242756, - "step": 26800 + "epoch": 178.74, + "learning_rate": 3.7000360100828234e-06, + "loss": 0.1741, + "step": 221100 }, { - "epoch": 24.55, - "learning_rate": 0.00021930356782906668, - "loss": 0.1551, - "step": 27200 + "epoch": 178.76, + "learning_rate": 3.6437702556715882e-06, + "loss": 0.1994, + "step": 221125 }, { - "epoch": 24.55, - "eval_loss": 0.15309767425060272, - "eval_runtime": 203.5071, - "eval_samples_per_second": 19.444, - "eval_steps_per_second": 2.432, - "eval_wer": 0.1685946947191836, - "step": 27200 + "epoch": 178.78, + "learning_rate": 3.5875045012603526e-06, + "loss": 0.1655, + "step": 221150 }, { - "epoch": 24.91, - "learning_rate": 0.00021809413424712758, - "loss": 0.1593, - "step": 27600 + "epoch": 178.8, + "learning_rate": 3.531238746849118e-06, + "loss": 0.1752, + "step": 221175 }, { - "epoch": 24.91, - "eval_loss": 0.1611892282962799, - "eval_runtime": 203.404, - "eval_samples_per_second": 19.454, - "eval_steps_per_second": 2.434, - "eval_wer": 0.181560828993814, - "step": 27600 + "epoch": 178.82, + "learning_rate": 3.4749729924378826e-06, + "loss": 0.2023, + "step": 221200 }, { - "epoch": 25.27, - "learning_rate": 0.00021688470066518845, - "loss": 0.1519, - "step": 28000 + "epoch": 178.84, + "learning_rate": 3.4187072380266474e-06, + "loss": 0.2079, + "step": 221225 }, { - "epoch": 25.27, - "eval_loss": 0.16373491287231445, - "eval_runtime": 203.251, - "eval_samples_per_second": 19.469, - "eval_steps_per_second": 2.435, - "eval_wer": 0.17638835494355712, - "step": 28000 + "epoch": 178.86, + "learning_rate": 3.3624414836154122e-06, + "loss": 0.1955, + "step": 221250 }, { - "epoch": 25.63, - "learning_rate": 0.0002156752670832493, - "loss": 0.1509, - "step": 28400 + "epoch": 178.88, + "learning_rate": 3.3061757292041774e-06, + "loss": 0.1915, + "step": 221275 }, { - "epoch": 25.63, - "eval_loss": 0.15399527549743652, - "eval_runtime": 203.0998, - "eval_samples_per_second": 19.483, - "eval_steps_per_second": 2.437, - "eval_wer": 0.17093628770139446, - "step": 28400 + "epoch": 178.9, + "learning_rate": 3.2499099747929422e-06, + "loss": 0.1881, + "step": 221300 }, { - "epoch": 25.99, - "learning_rate": 0.0002144658335013102, - "loss": 0.1524, - "step": 28800 + "epoch": 178.92, + "learning_rate": 3.193644220381707e-06, + "loss": 0.1544, + "step": 221325 }, { - "epoch": 25.99, - "eval_loss": 0.1519121676683426, - "eval_runtime": 203.5041, - "eval_samples_per_second": 19.444, - "eval_steps_per_second": 2.432, - "eval_wer": 0.18072204941809666, - "step": 28800 + "epoch": 178.94, + "learning_rate": 3.1373784659704714e-06, + "loss": 0.1657, + "step": 221350 }, { - "epoch": 26.35, - "learning_rate": 0.00021325639991937108, - "loss": 0.1452, - "step": 29200 + "epoch": 178.96, + "learning_rate": 3.0811127115592366e-06, + "loss": 0.1753, + "step": 221375 }, { - "epoch": 26.35, - "eval_loss": 0.15314562618732452, - "eval_runtime": 203.4098, - "eval_samples_per_second": 19.453, - "eval_steps_per_second": 2.434, - "eval_wer": 0.17310313493866425, - "step": 29200 + "epoch": 178.98, + "learning_rate": 3.0248469571480014e-06, + "loss": 0.1749, + "step": 221400 }, { - "epoch": 26.71, - "learning_rate": 0.0002120499899213868, - "loss": 0.1485, - "step": 29600 + "epoch": 179.0, + "learning_rate": 2.9685812027367662e-06, + "loss": 0.1666, + "step": 221425 }, { - "epoch": 26.71, - "eval_loss": 0.14827923476696014, - "eval_runtime": 203.2718, - "eval_samples_per_second": 19.467, - "eval_steps_per_second": 2.435, - "eval_wer": 0.16136022087862162, - "step": 29600 + "epoch": 179.02, + "learning_rate": 2.912315448325531e-06, + "loss": 0.1932, + "step": 221450 }, { - "epoch": 27.08, - "learning_rate": 0.0002108405563394477, - "loss": 0.1513, - "step": 30000 + "epoch": 179.04, + "learning_rate": 2.8560496939142963e-06, + "loss": 0.1363, + "step": 221475 }, { - "epoch": 27.08, - "eval_loss": 0.15502476692199707, - "eval_runtime": 203.5744, - "eval_samples_per_second": 19.438, - "eval_steps_per_second": 2.432, - "eval_wer": 0.16579876280012582, - "step": 30000 + "epoch": 179.06, + "learning_rate": 2.799783939503061e-06, + "loss": 0.2135, + "step": 221500 }, { - "epoch": 27.44, - "learning_rate": 0.00020963112275750853, - "loss": 0.1437, - "step": 30400 + "epoch": 179.08, + "learning_rate": 2.743518185091826e-06, + "loss": 0.1944, + "step": 221525 }, { - "epoch": 27.44, - "eval_loss": 0.15631796419620514, - "eval_runtime": 204.0627, - "eval_samples_per_second": 19.391, - "eval_steps_per_second": 2.426, - "eval_wer": 0.16614825429000804, - "step": 30400 + "epoch": 179.1, + "learning_rate": 2.6872524306805902e-06, + "loss": 0.1993, + "step": 221550 }, { - "epoch": 27.8, - "learning_rate": 0.00020842168917556943, - "loss": 0.1445, - "step": 30800 + "epoch": 179.12, + "learning_rate": 2.6309866762693555e-06, + "loss": 0.1866, + "step": 221575 }, { - "epoch": 27.8, - "eval_loss": 0.15840862691402435, - "eval_runtime": 204.5713, - "eval_samples_per_second": 19.343, - "eval_steps_per_second": 2.42, - "eval_wer": 0.17086638940341803, - "step": 30800 + "epoch": 179.14, + "learning_rate": 2.5747209218581203e-06, + "loss": 0.2085, + "step": 221600 }, { - "epoch": 28.16, - "learning_rate": 0.0002072122555936303, - "loss": 0.1438, - "step": 31200 + "epoch": 179.16, + "learning_rate": 2.518455167446885e-06, + "loss": 0.1564, + "step": 221625 }, { - "epoch": 28.16, - "eval_loss": 0.15680429339408875, - "eval_runtime": 204.0022, - "eval_samples_per_second": 19.397, - "eval_steps_per_second": 2.426, - "eval_wer": 0.1630727291790445, - "step": 31200 + "epoch": 179.18, + "learning_rate": 2.46218941303565e-06, + "loss": 0.2133, + "step": 221650 }, { - "epoch": 28.52, - "learning_rate": 0.00020600282201169116, - "loss": 0.1423, - "step": 31600 + "epoch": 179.2, + "learning_rate": 2.405923658624415e-06, + "loss": 0.1709, + "step": 221675 }, { - "epoch": 28.52, - "eval_loss": 0.15523846447467804, - "eval_runtime": 203.5692, - "eval_samples_per_second": 19.438, - "eval_steps_per_second": 2.432, - "eval_wer": 0.16090588194177471, - "step": 31600 + "epoch": 179.22, + "learning_rate": 2.34965790421318e-06, + "loss": 0.2061, + "step": 221700 }, { - "epoch": 28.88, - "learning_rate": 0.00020479338842975206, - "loss": 0.1451, - "step": 32000 + "epoch": 179.24, + "learning_rate": 2.2933921498019447e-06, + "loss": 0.1763, + "step": 221725 }, { - "epoch": 28.88, - "eval_loss": 0.1542510688304901, - "eval_runtime": 203.7413, - "eval_samples_per_second": 19.422, - "eval_steps_per_second": 2.43, - "eval_wer": 0.16314262747702094, - "step": 32000 + "epoch": 179.26, + "learning_rate": 2.237126395390709e-06, + "loss": 0.1902, + "step": 221750 }, { - "epoch": 29.24, - "learning_rate": 0.00020358395484781292, - "loss": 0.1396, - "step": 32400 + "epoch": 179.28, + "learning_rate": 2.1808606409794743e-06, + "loss": 0.1433, + "step": 221775 }, { - "epoch": 29.24, - "eval_loss": 0.15091465413570404, - "eval_runtime": 203.6781, - "eval_samples_per_second": 19.428, - "eval_steps_per_second": 2.43, - "eval_wer": 0.16317757662600915, - "step": 32400 + "epoch": 179.3, + "learning_rate": 2.124594886568239e-06, + "loss": 0.2202, + "step": 221800 }, { - "epoch": 29.6, - "learning_rate": 0.0002023745212658738, - "loss": 0.142, - "step": 32800 + "epoch": 179.32, + "learning_rate": 2.068329132157004e-06, + "loss": 0.1739, + "step": 221825 }, { - "epoch": 29.6, - "eval_loss": 0.15581683814525604, - "eval_runtime": 203.4725, - "eval_samples_per_second": 19.447, - "eval_steps_per_second": 2.433, - "eval_wer": 0.1635620172648796, - "step": 32800 + "epoch": 179.35, + "learning_rate": 2.0120633777457687e-06, + "loss": 0.1809, + "step": 221850 }, { - "epoch": 29.96, - "learning_rate": 0.0002011650876839347, - "loss": 0.1385, - "step": 33200 + "epoch": 179.37, + "learning_rate": 1.955797623334534e-06, + "loss": 0.1522, + "step": 221875 }, { - "epoch": 29.96, - "eval_loss": 0.145892933011055, - "eval_runtime": 203.8769, - "eval_samples_per_second": 19.409, - "eval_steps_per_second": 2.428, - "eval_wer": 0.17338272813057, - "step": 33200 + "epoch": 179.39, + "learning_rate": 1.8995318689232985e-06, + "loss": 0.204, + "step": 221900 }, { - "epoch": 30.32, - "learning_rate": 0.00019995565410199556, - "loss": 0.1376, - "step": 33600 + "epoch": 179.41, + "learning_rate": 1.8432661145120633e-06, + "loss": 0.1432, + "step": 221925 }, { - "epoch": 30.32, - "eval_loss": 0.15049244463443756, - "eval_runtime": 203.9232, - "eval_samples_per_second": 19.404, - "eval_steps_per_second": 2.427, - "eval_wer": 0.17236920280991158, - "step": 33600 + "epoch": 179.43, + "learning_rate": 1.7870003601008283e-06, + "loss": 0.1777, + "step": 221950 }, { - "epoch": 30.69, - "learning_rate": 0.00019874924410401127, - "loss": 0.1399, - "step": 34000 + "epoch": 179.45, + "learning_rate": 1.730734605689593e-06, + "loss": 0.1546, + "step": 221975 }, { - "epoch": 30.69, - "eval_loss": 0.14067970216274261, - "eval_runtime": 203.8686, - "eval_samples_per_second": 19.41, - "eval_steps_per_second": 2.428, - "eval_wer": 0.1610107293887394, - "step": 34000 + "epoch": 179.47, + "learning_rate": 1.674468851278358e-06, + "loss": 0.2101, + "step": 222000 }, { - "epoch": 31.05, - "learning_rate": 0.00019753981052207217, - "loss": 0.1377, - "step": 34400 + "epoch": 179.47, + "eval_cer": 0.07384269478352823, + "eval_loss": 0.4755805432796478, + "eval_runtime": 153.5849, + "eval_samples_per_second": 27.301, + "eval_steps_per_second": 6.83, + "eval_wer": 0.3161174551386623, + "step": 222000 }, { - "epoch": 31.05, - "eval_loss": 0.1523168534040451, - "eval_runtime": 203.6263, - "eval_samples_per_second": 19.433, - "eval_steps_per_second": 2.431, - "eval_wer": 0.17292838919372314, - "step": 34400 + "epoch": 179.49, + "learning_rate": 1.6182030968671227e-06, + "loss": 0.1692, + "step": 222025 }, { - "epoch": 31.41, - "learning_rate": 0.000196330376940133, - "loss": 0.1331, - "step": 34800 + "epoch": 179.51, + "learning_rate": 1.5619373424558877e-06, + "loss": 0.1836, + "step": 222050 }, { - "epoch": 31.41, - "eval_loss": 0.14309507608413696, - "eval_runtime": 204.8423, - "eval_samples_per_second": 19.317, - "eval_steps_per_second": 2.416, - "eval_wer": 0.1706566945094887, - "step": 34800 + "epoch": 179.53, + "learning_rate": 1.5056715880446525e-06, + "loss": 0.207, + "step": 222075 }, { - "epoch": 31.77, - "learning_rate": 0.0001951209433581939, - "loss": 0.1356, - "step": 35200 + "epoch": 179.55, + "learning_rate": 1.4494058336334173e-06, + "loss": 0.1892, + "step": 222100 }, { - "epoch": 31.77, - "eval_loss": 0.1558520793914795, - "eval_runtime": 204.495, - "eval_samples_per_second": 19.35, - "eval_steps_per_second": 2.421, - "eval_wer": 0.16391150875476182, - "step": 35200 + "epoch": 179.57, + "learning_rate": 1.393140079222182e-06, + "loss": 0.192, + "step": 222125 }, { - "epoch": 32.13, - "learning_rate": 0.00019391150977625477, - "loss": 0.1381, - "step": 35600 + "epoch": 179.59, + "learning_rate": 1.3368743248109471e-06, + "loss": 0.2154, + "step": 222150 }, { - "epoch": 32.13, - "eval_loss": 0.14920052886009216, - "eval_runtime": 204.3124, - "eval_samples_per_second": 19.367, - "eval_steps_per_second": 2.423, - "eval_wer": 0.1660783559920316, - "step": 35600 + "epoch": 179.61, + "learning_rate": 1.280608570399712e-06, + "loss": 0.1862, + "step": 222175 }, { - "epoch": 32.49, - "learning_rate": 0.00019270207619431564, - "loss": 0.1332, - "step": 36000 + "epoch": 179.63, + "learning_rate": 1.2243428159884767e-06, + "loss": 0.2028, + "step": 222200 }, { - "epoch": 32.49, - "eval_loss": 0.15177668631076813, - "eval_runtime": 204.8291, - "eval_samples_per_second": 19.319, - "eval_steps_per_second": 2.417, - "eval_wer": 0.16139517002760984, - "step": 36000 + "epoch": 179.65, + "learning_rate": 1.1680770615772415e-06, + "loss": 0.1858, + "step": 222225 }, { - "epoch": 32.85, - "learning_rate": 0.00019149264261237654, - "loss": 0.1345, - "step": 36400 + "epoch": 179.67, + "learning_rate": 1.1118113071660065e-06, + "loss": 0.1751, + "step": 222250 }, { - "epoch": 32.85, - "eval_loss": 0.14764094352722168, - "eval_runtime": 204.5031, - "eval_samples_per_second": 19.349, - "eval_steps_per_second": 2.421, - "eval_wer": 0.1562925942753294, - "step": 36400 + "epoch": 179.69, + "learning_rate": 1.0555455527547713e-06, + "loss": 0.1573, + "step": 222275 }, { - "epoch": 33.21, - "learning_rate": 0.00019028320903043738, - "loss": 0.1307, - "step": 36800 + "epoch": 179.71, + "learning_rate": 9.992797983435363e-07, + "loss": 0.2087, + "step": 222300 }, { - "epoch": 33.21, - "eval_loss": 0.1433647871017456, - "eval_runtime": 205.0597, - "eval_samples_per_second": 19.297, - "eval_steps_per_second": 2.414, - "eval_wer": 0.15922832279034005, - "step": 36800 + "epoch": 179.73, + "learning_rate": 9.430140439323011e-07, + "loss": 0.163, + "step": 222325 }, { - "epoch": 33.57, - "learning_rate": 0.00018907679903245312, - "loss": 0.1309, - "step": 37200 + "epoch": 179.75, + "learning_rate": 8.867482895210659e-07, + "loss": 0.1921, + "step": 222350 }, { - "epoch": 33.57, - "eval_loss": 0.1497233361005783, - "eval_runtime": 204.4523, - "eval_samples_per_second": 19.354, - "eval_steps_per_second": 2.421, - "eval_wer": 0.17090133855240625, - "step": 37200 + "epoch": 179.77, + "learning_rate": 8.304825351098308e-07, + "loss": 0.1446, + "step": 222375 }, { - "epoch": 33.93, - "learning_rate": 0.00018786736545051402, - "loss": 0.1319, - "step": 37600 + "epoch": 179.79, + "learning_rate": 7.742167806985956e-07, + "loss": 0.2213, + "step": 222400 }, { - "epoch": 33.93, - "eval_loss": 0.15207722783088684, - "eval_runtime": 204.6556, - "eval_samples_per_second": 19.335, - "eval_steps_per_second": 2.419, - "eval_wer": 0.1708314402544298, - "step": 37600 + "epoch": 179.81, + "learning_rate": 7.179510262873605e-07, + "loss": 0.1778, + "step": 222425 }, { - "epoch": 34.3, - "learning_rate": 0.00018665793186857486, - "loss": 0.1279, - "step": 38000 + "epoch": 179.83, + "learning_rate": 6.616852718761253e-07, + "loss": 0.1908, + "step": 222450 }, { - "epoch": 34.3, - "eval_loss": 0.14533580839633942, - "eval_runtime": 205.2587, - "eval_samples_per_second": 19.278, - "eval_steps_per_second": 2.412, - "eval_wer": 0.1569566281061056, - "step": 38000 + "epoch": 179.85, + "learning_rate": 6.054195174648902e-07, + "loss": 0.142, + "step": 222475 }, { - "epoch": 34.66, - "learning_rate": 0.00018544849828663575, - "loss": 0.1268, - "step": 38400 + "epoch": 179.87, + "learning_rate": 5.49153763053655e-07, + "loss": 0.1851, + "step": 222500 }, { - "epoch": 34.66, - "eval_loss": 0.14409175515174866, - "eval_runtime": 204.8962, - "eval_samples_per_second": 19.312, - "eval_steps_per_second": 2.416, - "eval_wer": 0.1608709327927865, - "step": 38400 + "epoch": 179.89, + "learning_rate": 4.9288800864242e-07, + "loss": 0.1485, + "step": 222525 }, { - "epoch": 35.02, - "learning_rate": 0.0001842390647046966, - "loss": 0.1301, - "step": 38800 + "epoch": 179.91, + "learning_rate": 4.3662225423118475e-07, + "loss": 0.1964, + "step": 222550 }, { - "epoch": 35.02, - "eval_loss": 0.1421143114566803, - "eval_runtime": 205.2147, - "eval_samples_per_second": 19.282, - "eval_steps_per_second": 2.412, - "eval_wer": 0.1567818823611645, - "step": 38800 + "epoch": 179.93, + "learning_rate": 3.803564998199496e-07, + "loss": 0.1942, + "step": 222575 }, { - "epoch": 35.38, - "learning_rate": 0.0001830296311227575, - "loss": 0.1248, - "step": 39200 + "epoch": 179.95, + "learning_rate": 3.2409074540871446e-07, + "loss": 0.1905, + "step": 222600 }, { - "epoch": 35.38, - "eval_loss": 0.14348700642585754, - "eval_runtime": 209.2746, - "eval_samples_per_second": 18.908, - "eval_steps_per_second": 2.365, - "eval_wer": 0.15727117044699962, - "step": 39200 + "epoch": 179.97, + "learning_rate": 2.678249909974793e-07, + "loss": 0.1591, + "step": 222625 }, { - "epoch": 35.74, - "learning_rate": 0.00018182322112477323, - "loss": 0.1256, - "step": 39600 + "epoch": 179.99, + "learning_rate": 2.1155923658624413e-07, + "loss": 0.1748, + "step": 222650 }, { - "epoch": 35.74, - "eval_loss": 0.14100748300552368, - "eval_runtime": 214.9156, - "eval_samples_per_second": 18.412, - "eval_steps_per_second": 2.303, - "eval_wer": 0.1528326285254954, - "step": 39600 + "epoch": 180.0, + "step": 222660, + "total_flos": 2.3788341158199368e+20, + "train_loss": 0.061750437557927515, + "train_runtime": 29496.4676, + "train_samples_per_second": 60.347, + "train_steps_per_second": 7.549 } ], - "max_steps": 99720, - "num_train_epochs": 90, - "total_flos": 1.728945548938538e+20, + "max_steps": 222660, + "num_train_epochs": 180, + "total_flos": 2.3788341158199368e+20, "trial_name": null, "trial_params": null }