diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,54751 +1,864 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 180.0, - "global_step": 222660, + "epoch": 493.02296211251434, + "global_step": 21200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { - "epoch": 0.01, - "learning_rate": 2.3e-05, - "loss": 12.7521, - "step": 25 - }, - { - "epoch": 0.01, - "learning_rate": 4.7000000000000004e-05, - "loss": 8.8854, - "step": 50 - }, - { - "epoch": 0.02, - "learning_rate": 7.2e-05, - "loss": 4.0895, - "step": 75 - }, - { - "epoch": 0.02, - "learning_rate": 9.7e-05, - "loss": 3.5682, - "step": 100 - }, - { - "epoch": 0.03, - "learning_rate": 0.000122, - "loss": 3.2477, - "step": 125 - }, - { - "epoch": 0.04, - "learning_rate": 0.000147, - "loss": 3.2236, - "step": 150 - }, - { - "epoch": 0.04, - "learning_rate": 0.00017199999999999998, - "loss": 3.1948, - "step": 175 - }, - { - "epoch": 0.05, - "learning_rate": 0.00019700000000000002, - "loss": 3.115, - "step": 200 - }, - { - "epoch": 0.05, - "learning_rate": 0.000222, - "loss": 3.1549, - "step": 225 - }, - { - "epoch": 0.06, - "learning_rate": 0.000247, - "loss": 3.1232, - "step": 250 - }, - { - "epoch": 0.07, - "learning_rate": 0.00027200000000000005, - "loss": 3.1312, - "step": 275 - }, - { - "epoch": 0.07, - "learning_rate": 0.000297, - "loss": 3.0763, - "step": 300 - }, - { - "epoch": 0.08, - "learning_rate": 0.000322, - "loss": 3.1158, - "step": 325 - }, - { - "epoch": 0.09, - "learning_rate": 0.000347, - "loss": 3.0469, - "step": 350 - }, - { - "epoch": 0.09, - "learning_rate": 0.000372, - "loss": 3.0859, - "step": 375 - }, - { - "epoch": 0.1, - "learning_rate": 0.00039700000000000005, - "loss": 3.0238, + "epoch": 9.3, + "learning_rate": 0.00023999999999999998, + "loss": 4.3982, "step": 400 }, { - "epoch": 0.1, - "learning_rate": 0.000422, - "loss": 3.1055, - "step": 425 - }, - { - "epoch": 0.11, - "learning_rate": 0.000447, - "loss": 3.0302, - "step": 450 - }, - { - "epoch": 0.12, - "learning_rate": 0.000472, - "loss": 3.0974, - "step": 475 - }, - { - "epoch": 0.12, - "learning_rate": 0.000497, - "loss": 3.0162, - "step": 500 - }, - { - "epoch": 0.12, - "eval_cer": 1.0, - "eval_loss": 3.1486001014709473, - "eval_runtime": 147.8787, - "eval_samples_per_second": 28.354, - "eval_steps_per_second": 7.094, - "eval_wer": 1.0, - "step": 500 - }, - { - "epoch": 0.13, - "learning_rate": 0.0004999731248473003, - "loss": 3.0909, - "step": 525 - }, - { - "epoch": 0.13, - "learning_rate": 0.0004999425849010506, - "loss": 2.9905, - "step": 550 - }, - { - "epoch": 0.14, - "learning_rate": 0.0004999120449548009, - "loss": 3.0408, - "step": 575 - }, - { - "epoch": 0.15, - "learning_rate": 0.0004998815050085511, - "loss": 2.9567, - "step": 600 - }, - { - "epoch": 0.15, - "learning_rate": 0.0004998509650623015, - "loss": 2.9644, - "step": 625 - }, - { - "epoch": 0.16, - "learning_rate": 0.0004998204251160518, - "loss": 2.7935, - "step": 650 - }, - { - "epoch": 0.16, - "learning_rate": 0.0004997898851698021, - "loss": 2.6574, - "step": 675 - }, - { - "epoch": 0.17, - "learning_rate": 0.0004997593452235524, - "loss": 2.4471, - "step": 700 - }, - { - "epoch": 0.18, - "learning_rate": 0.0004997288052773027, - "loss": 2.2672, - "step": 725 - }, - { - "epoch": 0.18, - "learning_rate": 0.000499698265331053, - "loss": 2.1358, - "step": 750 - }, - { - "epoch": 0.19, - "learning_rate": 0.0004996677253848033, - "loss": 2.0581, - "step": 775 + "epoch": 9.3, + "eval_cer": 0.14366206687135194, + "eval_loss": 0.5217852592468262, + "eval_runtime": 117.8175, + "eval_samples_per_second": 26.414, + "eval_steps_per_second": 3.302, + "eval_wer": 0.6506676906011348, + "step": 400 }, { - "epoch": 0.2, - "learning_rate": 0.0004996371854385537, - "loss": 1.9562, + "epoch": 18.6, + "learning_rate": 0.00029461077844311373, + "loss": 0.229, "step": 800 }, { - "epoch": 0.2, - "learning_rate": 0.0004996066454923039, - "loss": 1.9131, - "step": 825 - }, - { - "epoch": 0.21, - "learning_rate": 0.0004995761055460543, - "loss": 1.8268, - "step": 850 - }, - { - "epoch": 0.21, - "learning_rate": 0.0004995455655998046, - "loss": 1.8359, - "step": 875 - }, - { - "epoch": 0.22, - "learning_rate": 0.0004995150256535549, - "loss": 1.721, - "step": 900 - }, - { - "epoch": 0.23, - "learning_rate": 0.0004994844857073051, - "loss": 1.7865, - "step": 925 - }, - { - "epoch": 0.23, - "learning_rate": 0.0004994539457610555, - "loss": 1.6867, - "step": 950 - }, - { - "epoch": 0.24, - "learning_rate": 0.0004994234058148057, - "loss": 1.6645, - "step": 975 - }, - { - "epoch": 0.24, - "learning_rate": 0.0004993928658685561, - "loss": 1.6532, - "step": 1000 - }, - { - "epoch": 0.24, - "eval_cer": 0.4583123723088611, - "eval_loss": 1.3737213611602783, - "eval_runtime": 148.5107, - "eval_samples_per_second": 28.234, - "eval_steps_per_second": 7.063, - "eval_wer": 0.9951386623164763, - "step": 1000 - }, - { - "epoch": 0.25, - "learning_rate": 0.0004993623259223064, - "loss": 1.6458, - "step": 1025 - }, - { - "epoch": 0.26, - "learning_rate": 0.0004993317859760567, - "loss": 1.6264, - "step": 1050 - }, - { - "epoch": 0.26, - "learning_rate": 0.0004993012460298069, - "loss": 1.6296, - "step": 1075 - }, - { - "epoch": 0.27, - "learning_rate": 0.0004992707060835573, - "loss": 1.5512, - "step": 1100 - }, - { - "epoch": 0.27, - "learning_rate": 0.0004992401661373077, - "loss": 1.5247, - "step": 1125 - }, - { - "epoch": 0.28, - "learning_rate": 0.0004992096261910579, - "loss": 1.5277, - "step": 1150 - }, - { - "epoch": 0.29, - "learning_rate": 0.0004991790862448083, - "loss": 1.5062, - "step": 1175 + "epoch": 18.6, + "eval_cer": 0.08482742332737273, + "eval_loss": 0.36793914437294006, + "eval_runtime": 118.0263, + "eval_samples_per_second": 26.367, + "eval_steps_per_second": 3.296, + "eval_wer": 0.40479542642604205, + "step": 800 }, { - "epoch": 0.29, - "learning_rate": 0.0004991485462985585, - "loss": 1.4983, + "epoch": 27.9, + "learning_rate": 0.00028742514970059877, + "loss": 0.1054, "step": 1200 }, { - "epoch": 0.3, - "learning_rate": 0.0004991180063523088, - "loss": 1.5167, - "step": 1225 - }, - { - "epoch": 0.31, - "learning_rate": 0.0004990874664060591, - "loss": 1.4639, - "step": 1250 - }, - { - "epoch": 0.31, - "learning_rate": 0.0004990569264598095, - "loss": 1.4723, - "step": 1275 - }, - { - "epoch": 0.32, - "learning_rate": 0.0004990263865135597, - "loss": 1.4641, - "step": 1300 - }, - { - "epoch": 0.32, - "learning_rate": 0.0004989958465673101, - "loss": 1.4708, - "step": 1325 - }, - { - "epoch": 0.33, - "learning_rate": 0.0004989653066210603, - "loss": 1.4587, - "step": 1350 - }, - { - "epoch": 0.34, - "learning_rate": 0.0004989347666748106, - "loss": 1.3988, - "step": 1375 - }, - { - "epoch": 0.34, - "learning_rate": 0.0004989042267285609, - "loss": 1.4353, - "step": 1400 - }, - { - "epoch": 0.35, - "learning_rate": 0.0004988736867823113, - "loss": 1.4303, - "step": 1425 - }, - { - "epoch": 0.35, - "learning_rate": 0.0004988431468360615, - "loss": 1.4705, - "step": 1450 - }, - { - "epoch": 0.36, - "learning_rate": 0.0004988126068898119, - "loss": 1.3941, - "step": 1475 - }, - { - "epoch": 0.37, - "learning_rate": 0.0004987820669435622, - "loss": 1.3941, - "step": 1500 - }, - { - "epoch": 0.37, - "eval_cer": 0.37091260022791905, - "eval_loss": 1.1033180952072144, - "eval_runtime": 148.9205, - "eval_samples_per_second": 28.156, - "eval_steps_per_second": 7.044, - "eval_wer": 0.9866231647634583, - "step": 1500 - }, - { - "epoch": 0.37, - "learning_rate": 0.0004987515269973125, - "loss": 1.401, - "step": 1525 - }, - { - "epoch": 0.38, - "learning_rate": 0.0004987209870510628, - "loss": 1.3726, - "step": 1550 - }, - { - "epoch": 0.38, - "learning_rate": 0.0004986904471048131, - "loss": 1.3804, - "step": 1575 + "epoch": 27.9, + "eval_cer": 0.07780964270049597, + "eval_loss": 0.38127270340919495, + "eval_runtime": 116.0512, + "eval_samples_per_second": 26.816, + "eval_steps_per_second": 3.352, + "eval_wer": 0.367037842911387, + "step": 1200 }, { - "epoch": 0.39, - "learning_rate": 0.0004986599071585634, - "loss": 1.4081, + "epoch": 37.21, + "learning_rate": 0.0002802395209580838, + "loss": 0.0784, "step": 1600 }, { - "epoch": 0.4, - "learning_rate": 0.0004986293672123137, - "loss": 1.392, - "step": 1625 - }, - { - "epoch": 0.4, - "learning_rate": 0.0004985988272660641, - "loss": 1.3433, - "step": 1650 - }, - { - "epoch": 0.41, - "learning_rate": 0.0004985682873198143, - "loss": 1.3965, - "step": 1675 - }, - { - "epoch": 0.41, - "learning_rate": 0.0004985377473735646, - "loss": 1.3149, - "step": 1700 - }, - { - "epoch": 0.42, - "learning_rate": 0.0004985072074273149, - "loss": 1.3295, - "step": 1725 + "epoch": 37.21, + "eval_cer": 0.07465164141840143, + "eval_loss": 0.3839242458343506, + "eval_runtime": 116.2982, + "eval_samples_per_second": 26.759, + "eval_steps_per_second": 3.345, + "eval_wer": 0.35496394897393235, + "step": 1600 }, { - "epoch": 0.43, - "learning_rate": 0.0004984766674810652, - "loss": 1.3181, - "step": 1750 + "epoch": 46.51, + "learning_rate": 0.00027305389221556883, + "loss": 0.066, + "step": 2000 }, { - "epoch": 0.43, - "learning_rate": 0.0004984461275348155, - "loss": 1.3353, - "step": 1775 + "epoch": 46.51, + "eval_cer": 0.07363946152029421, + "eval_loss": 0.3969549238681793, + "eval_runtime": 118.9877, + "eval_samples_per_second": 26.154, + "eval_steps_per_second": 3.269, + "eval_wer": 0.3443406288664192, + "step": 2000 }, { - "epoch": 0.44, - "learning_rate": 0.0004984155875885659, - "loss": 1.3267, - "step": 1800 + "epoch": 55.8, + "learning_rate": 0.00026586826347305386, + "loss": 0.0603, + "step": 2400 }, { - "epoch": 0.45, - "learning_rate": 0.0004983850476423162, - "loss": 1.3335, - "step": 1825 + "epoch": 55.8, + "eval_cer": 0.07218192246701981, + "eval_loss": 0.3702129125595093, + "eval_runtime": 118.9492, + "eval_samples_per_second": 26.162, + "eval_steps_per_second": 3.27, + "eval_wer": 0.3393489483339733, + "step": 2400 }, { - "epoch": 0.45, - "learning_rate": 0.0004983545076960664, - "loss": 1.3258, - "step": 1850 + "epoch": 65.11, + "learning_rate": 0.0002586826347305389, + "loss": 0.0539, + "step": 2800 }, { - "epoch": 0.46, - "learning_rate": 0.0004983239677498168, - "loss": 1.3543, - "step": 1875 + "epoch": 65.11, + "eval_cer": 0.07241809777657816, + "eval_loss": 0.3762107491493225, + "eval_runtime": 117.3723, + "eval_samples_per_second": 26.514, + "eval_steps_per_second": 3.314, + "eval_wer": 0.33875165322752676, + "step": 2800 }, { - "epoch": 0.46, - "learning_rate": 0.0004982934278035671, - "loss": 1.3208, - "step": 1900 + "epoch": 74.41, + "learning_rate": 0.00025149700598802393, + "loss": 0.0497, + "step": 3200 }, { - "epoch": 0.47, - "learning_rate": 0.0004982628878573174, - "loss": 1.3046, - "step": 1925 + "epoch": 74.41, + "eval_cer": 0.07128445629069807, + "eval_loss": 0.36228740215301514, + "eval_runtime": 116.3914, + "eval_samples_per_second": 26.737, + "eval_steps_per_second": 3.342, + "eval_wer": 0.3413541533341866, + "step": 3200 }, { - "epoch": 0.48, - "learning_rate": 0.0004982323479110677, - "loss": 1.3268, - "step": 1950 + "epoch": 83.71, + "learning_rate": 0.00024431137724550896, + "loss": 0.0432, + "step": 3600 }, { - "epoch": 0.48, - "learning_rate": 0.000498201807964818, - "loss": 1.3152, - "step": 1975 + "epoch": 83.71, + "eval_cer": 0.07248557643645197, + "eval_loss": 0.3847475051879883, + "eval_runtime": 116.3314, + "eval_samples_per_second": 26.751, + "eval_steps_per_second": 3.344, + "eval_wer": 0.3346132514185759, + "step": 3600 }, { - "epoch": 0.49, - "learning_rate": 0.0004981712680185683, - "loss": 1.3275, - "step": 2000 + "epoch": 93.02, + "learning_rate": 0.000237125748502994, + "loss": 0.0438, + "step": 4000 }, { - "epoch": 0.49, - "eval_cer": 0.348711025327762, - "eval_loss": 1.093718409538269, - "eval_runtime": 154.6705, - "eval_samples_per_second": 27.109, - "eval_steps_per_second": 6.782, - "eval_wer": 0.9539641109298532, - "step": 2000 + "epoch": 93.02, + "eval_cer": 0.07503626977968217, + "eval_loss": 0.4057835340499878, + "eval_runtime": 116.616, + "eval_samples_per_second": 26.686, + "eval_steps_per_second": 3.336, + "eval_wer": 0.3393489483339733, + "step": 4000 }, { - "epoch": 0.49, - "learning_rate": 0.0004981407280723186, - "loss": 1.3006, - "step": 2025 + "epoch": 102.32, + "learning_rate": 0.00022994011976047902, + "loss": 0.0413, + "step": 4400 }, { - "epoch": 0.5, - "learning_rate": 0.0004981101881260689, - "loss": 1.2848, - "step": 2050 + "epoch": 102.32, + "eval_cer": 0.07270825601403556, + "eval_loss": 0.3957100510597229, + "eval_runtime": 116.9156, + "eval_samples_per_second": 26.617, + "eval_steps_per_second": 3.327, + "eval_wer": 0.3362771449293912, + "step": 4400 }, { - "epoch": 0.51, - "learning_rate": 0.0004980796481798192, - "loss": 1.2935, - "step": 2075 + "epoch": 111.62, + "learning_rate": 0.00022275449101796406, + "loss": 0.039, + "step": 4800 }, { - "epoch": 0.51, - "learning_rate": 0.0004980491082335695, - "loss": 1.3263, - "step": 2100 + "epoch": 111.62, + "eval_cer": 0.07179729410573905, + "eval_loss": 0.386459618806839, + "eval_runtime": 119.0004, + "eval_samples_per_second": 26.151, + "eval_steps_per_second": 3.269, + "eval_wer": 0.3330346857801101, + "step": 4800 }, { - "epoch": 0.52, - "learning_rate": 0.0004980185682873198, - "loss": 1.3252, - "step": 2125 + "epoch": 120.92, + "learning_rate": 0.0002155688622754491, + "loss": 0.0356, + "step": 5200 }, { - "epoch": 0.52, - "learning_rate": 0.0004979880283410701, - "loss": 1.3055, - "step": 2150 + "epoch": 120.92, + "eval_cer": 0.07110226390903876, + "eval_loss": 0.38599926233291626, + "eval_runtime": 118.9882, + "eval_samples_per_second": 26.154, + "eval_steps_per_second": 3.269, + "eval_wer": 0.33192542343956655, + "step": 5200 }, { - "epoch": 0.53, - "learning_rate": 0.0004979574883948204, - "loss": 1.2801, - "step": 2175 + "epoch": 130.23, + "learning_rate": 0.00020838323353293412, + "loss": 0.0336, + "step": 5600 }, { - "epoch": 0.54, - "learning_rate": 0.0004979269484485708, - "loss": 1.2867, - "step": 2200 + "epoch": 130.23, + "eval_cer": 0.07001585748507035, + "eval_loss": 0.3902195692062378, + "eval_runtime": 116.3404, + "eval_samples_per_second": 26.749, + "eval_steps_per_second": 3.344, + "eval_wer": 0.3241605870557618, + "step": 5600 }, { - "epoch": 0.54, - "learning_rate": 0.000497896408502321, - "loss": 1.3295, - "step": 2225 + "epoch": 139.53, + "learning_rate": 0.00020119760479041913, + "loss": 0.034, + "step": 6000 }, { - "epoch": 0.55, - "learning_rate": 0.0004978658685560714, - "loss": 1.3141, - "step": 2250 + "epoch": 139.53, + "eval_cer": 0.07322109382907656, + "eval_loss": 0.39304569363594055, + "eval_runtime": 116.7151, + "eval_samples_per_second": 26.663, + "eval_steps_per_second": 3.333, + "eval_wer": 0.3337173087589061, + "step": 6000 }, { - "epoch": 0.56, - "learning_rate": 0.0004978353286098217, - "loss": 1.2956, - "step": 2275 + "epoch": 148.83, + "learning_rate": 0.00019402994011976046, + "loss": 0.0273, + "step": 6400 }, { - "epoch": 0.56, - "learning_rate": 0.000497804788663572, - "loss": 1.2728, - "step": 2300 + "epoch": 148.83, + "eval_cer": 0.07479334660413645, + "eval_loss": 0.39119070768356323, + "eval_runtime": 116.4756, + "eval_samples_per_second": 26.718, + "eval_steps_per_second": 3.34, + "eval_wer": 0.33747173514228423, + "step": 6400 }, { - "epoch": 0.57, - "learning_rate": 0.0004977742487173222, - "loss": 1.2823, - "step": 2325 + "epoch": 158.14, + "learning_rate": 0.0001868443113772455, + "loss": 0.027, + "step": 6800 }, { - "epoch": 0.57, - "learning_rate": 0.0004977437087710726, - "loss": 1.3055, - "step": 2350 + "epoch": 158.14, + "eval_cer": 0.07523870575930362, + "eval_loss": 0.42656052112579346, + "eval_runtime": 116.5029, + "eval_samples_per_second": 26.712, + "eval_steps_per_second": 3.339, + "eval_wer": 0.34344468620674945, + "step": 6800 }, { - "epoch": 0.58, - "learning_rate": 0.0004977131688248228, - "loss": 1.2819, - "step": 2375 + "epoch": 167.44, + "learning_rate": 0.0001796586826347305, + "loss": 0.028, + "step": 7200 }, { - "epoch": 0.59, - "learning_rate": 0.0004976826288785732, - "loss": 1.2821, - "step": 2400 + "epoch": 167.44, + "eval_cer": 0.0707648706096697, + "eval_loss": 0.38949263095855713, + "eval_runtime": 116.3646, + "eval_samples_per_second": 26.744, + "eval_steps_per_second": 3.343, + "eval_wer": 0.32266734928964547, + "step": 7200 }, { - "epoch": 0.59, - "learning_rate": 0.0004976520889323235, - "loss": 1.2981, - "step": 2425 + "epoch": 176.73, + "learning_rate": 0.00017247305389221556, + "loss": 0.0241, + "step": 7600 }, { - "epoch": 0.6, - "learning_rate": 0.0004976215489860738, - "loss": 1.2734, - "step": 2450 + "epoch": 176.73, + "eval_cer": 0.07274874320995985, + "eval_loss": 0.3967472016811371, + "eval_runtime": 116.4729, + "eval_samples_per_second": 26.719, + "eval_steps_per_second": 3.34, + "eval_wer": 0.32936558726908144, + "step": 7600 }, { - "epoch": 0.6, - "learning_rate": 0.0004975910090398241, - "loss": 1.2244, - "step": 2475 + "epoch": 186.05, + "learning_rate": 0.00016530538922155687, + "loss": 0.0241, + "step": 8000 }, { - "epoch": 0.61, - "learning_rate": 0.0004975604690935744, - "loss": 1.2648, - "step": 2500 + "epoch": 186.05, + "eval_cer": 0.07122372549681164, + "eval_loss": 0.4058191776275635, + "eval_runtime": 116.3498, + "eval_samples_per_second": 26.747, + "eval_steps_per_second": 3.343, + "eval_wer": 0.32548316907717906, + "step": 8000 }, { - "epoch": 0.61, - "eval_cer": 0.3137429031960001, - "eval_loss": 0.9402545690536499, - "eval_runtime": 149.7438, - "eval_samples_per_second": 28.001, - "eval_steps_per_second": 7.005, - "eval_wer": 0.9449918433931485, - "step": 2500 + "epoch": 195.34, + "learning_rate": 0.0001581197604790419, + "loss": 0.0209, + "step": 8400 }, { - "epoch": 0.62, - "learning_rate": 0.0004975299291473248, - "loss": 1.2673, - "step": 2525 + "epoch": 195.34, + "eval_cer": 0.07019804986672964, + "eval_loss": 0.4101807177066803, + "eval_runtime": 116.6051, + "eval_samples_per_second": 26.688, + "eval_steps_per_second": 3.336, + "eval_wer": 0.3233499722684415, + "step": 8400 }, { - "epoch": 0.62, - "learning_rate": 0.000497499389201075, - "loss": 1.2347, - "step": 2550 + "epoch": 204.64, + "learning_rate": 0.00015093413173652694, + "loss": 0.0206, + "step": 8800 }, { - "epoch": 0.63, - "learning_rate": 0.0004974688492548254, - "loss": 1.2291, - "step": 2575 + "epoch": 204.64, + "eval_cer": 0.06987415229933533, + "eval_loss": 0.40751102566719055, + "eval_runtime": 117.508, + "eval_samples_per_second": 26.483, + "eval_steps_per_second": 3.31, + "eval_wer": 0.3193822262041896, + "step": 8800 }, { - "epoch": 0.63, - "learning_rate": 0.0004974383093085756, - "loss": 1.2904, - "step": 2600 + "epoch": 213.94, + "learning_rate": 0.00014376646706586825, + "loss": 0.0172, + "step": 9200 }, { - "epoch": 0.64, - "learning_rate": 0.000497407769362326, - "loss": 1.1844, - "step": 2625 + "epoch": 213.94, + "eval_cer": 0.06948952393805459, + "eval_loss": 0.42218008637428284, + "eval_runtime": 116.7394, + "eval_samples_per_second": 26.658, + "eval_steps_per_second": 3.332, + "eval_wer": 0.31912624258714106, + "step": 9200 }, { - "epoch": 0.65, - "learning_rate": 0.0004973772294160762, - "loss": 1.2243, - "step": 2650 + "epoch": 223.25, + "learning_rate": 0.00013658083832335328, + "loss": 0.0166, + "step": 9600 }, { - "epoch": 0.65, - "learning_rate": 0.0004973466894698266, - "loss": 1.265, - "step": 2675 + "epoch": 223.25, + "eval_cer": 0.06777556597725969, + "eval_loss": 0.38604938983917236, + "eval_runtime": 116.6232, + "eval_samples_per_second": 26.684, + "eval_steps_per_second": 3.336, + "eval_wer": 0.31345193907589913, + "step": 9600 }, { - "epoch": 0.66, - "learning_rate": 0.0004973161495235768, - "loss": 1.2719, - "step": 2700 + "epoch": 232.55, + "learning_rate": 0.0001293952095808383, + "loss": 0.0156, + "step": 10000 }, { - "epoch": 0.66, - "learning_rate": 0.0004972856095773272, - "loss": 1.2109, - "step": 2725 + "epoch": 232.55, + "eval_cer": 0.0677013394513985, + "eval_loss": 0.40345117449760437, + "eval_runtime": 117.639, + "eval_samples_per_second": 26.454, + "eval_steps_per_second": 3.307, + "eval_wer": 0.31170271769273433, + "step": 10000 }, { - "epoch": 0.67, - "learning_rate": 0.0004972550696310774, - "loss": 1.2428, - "step": 2750 + "epoch": 241.85, + "learning_rate": 0.00012220958083832334, + "loss": 0.0149, + "step": 10400 }, { - "epoch": 0.68, - "learning_rate": 0.0004972245296848278, - "loss": 1.2307, - "step": 2775 + "epoch": 241.85, + "eval_cer": 0.0677013394513985, + "eval_loss": 0.39512303471565247, + "eval_runtime": 120.4059, + "eval_samples_per_second": 25.846, + "eval_steps_per_second": 3.231, + "eval_wer": 0.30867357822432695, + "step": 10400 }, { - "epoch": 0.68, - "learning_rate": 0.000497193989738578, - "loss": 1.2242, - "step": 2800 + "epoch": 251.16, + "learning_rate": 0.00011502395209580837, + "loss": 0.0142, + "step": 10800 }, { - "epoch": 0.69, - "learning_rate": 0.0004971634497923284, - "loss": 1.2375, - "step": 2825 + "epoch": 251.16, + "eval_cer": 0.06735045042005466, + "eval_loss": 0.3971852958202362, + "eval_runtime": 118.3102, + "eval_samples_per_second": 26.304, + "eval_steps_per_second": 3.288, + "eval_wer": 0.309697512692521, + "step": 10800 }, { - "epoch": 0.7, - "learning_rate": 0.0004971329098460786, - "loss": 1.2087, - "step": 2850 + "epoch": 260.46, + "learning_rate": 0.0001078383233532934, + "loss": 0.0134, + "step": 11200 }, { - "epoch": 0.7, - "learning_rate": 0.000497102369899829, - "loss": 1.2111, - "step": 2875 + "epoch": 260.46, + "eval_cer": 0.06749215560578967, + "eval_loss": 0.40693503618240356, + "eval_runtime": 120.6637, + "eval_samples_per_second": 25.791, + "eval_steps_per_second": 3.224, + "eval_wer": 0.31114808652246256, + "step": 11200 }, { - "epoch": 0.71, - "learning_rate": 0.0004970718299535792, - "loss": 1.2721, - "step": 2900 + "epoch": 269.76, + "learning_rate": 0.00010065269461077844, + "loss": 0.0116, + "step": 11600 }, { - "epoch": 0.71, - "learning_rate": 0.0004970412900073296, - "loss": 1.2132, - "step": 2925 + "epoch": 269.76, + "eval_cer": 0.06968521205168865, + "eval_loss": 0.41885173320770264, + "eval_runtime": 118.3717, + "eval_samples_per_second": 26.29, + "eval_steps_per_second": 3.286, + "eval_wer": 0.31609710311873374, + "step": 11600 }, { - "epoch": 0.72, - "learning_rate": 0.00049701075006108, - "loss": 1.1936, - "step": 2950 + "epoch": 279.07, + "learning_rate": 9.346706586826346e-05, + "loss": 0.0119, + "step": 12000 }, { - "epoch": 0.73, - "learning_rate": 0.0004969802101148302, - "loss": 1.2966, - "step": 2975 + "epoch": 279.07, + "eval_cer": 0.0648200006747866, + "eval_loss": 0.3901657462120056, + "eval_runtime": 119.8759, + "eval_samples_per_second": 25.96, + "eval_steps_per_second": 3.245, + "eval_wer": 0.3008234139681727, + "step": 12000 }, { - "epoch": 0.73, - "learning_rate": 0.0004969496701685805, - "loss": 1.3085, - "step": 3000 + "epoch": 288.37, + "learning_rate": 8.62814371257485e-05, + "loss": 0.0098, + "step": 12400 }, { - "epoch": 0.73, - "eval_cer": 0.30896378961633625, - "eval_loss": 0.9274962544441223, - "eval_runtime": 149.1917, - "eval_samples_per_second": 28.105, - "eval_steps_per_second": 7.031, - "eval_wer": 0.9287765089722675, - "step": 3000 + "epoch": 288.37, + "eval_cer": 0.06515064610816829, + "eval_loss": 0.40946489572525024, + "eval_runtime": 120.8583, + "eval_samples_per_second": 25.749, + "eval_steps_per_second": 3.219, + "eval_wer": 0.30018345492555143, + "step": 12400 }, { - "epoch": 0.74, - "learning_rate": 0.0004969191302223308, - "loss": 1.2099, - "step": 3025 + "epoch": 297.67, + "learning_rate": 7.909580838323352e-05, + "loss": 0.0091, + "step": 12800 }, { - "epoch": 0.74, - "learning_rate": 0.0004968885902760812, - "loss": 1.2075, - "step": 3050 + "epoch": 297.67, + "eval_cer": 0.06441512871554371, + "eval_loss": 0.3892023265361786, + "eval_runtime": 118.1231, + "eval_samples_per_second": 26.345, + "eval_steps_per_second": 3.293, + "eval_wer": 0.2989888647126584, + "step": 12800 }, { - "epoch": 0.75, - "learning_rate": 0.0004968580503298314, - "loss": 1.2174, - "step": 3075 + "epoch": 306.96, + "learning_rate": 7.191017964071855e-05, + "loss": 0.0094, + "step": 13200 }, { - "epoch": 0.76, - "learning_rate": 0.0004968275103835818, - "loss": 1.2464, - "step": 3100 + "epoch": 306.96, + "eval_cer": 0.06469853908701373, + "eval_loss": 0.40261197090148926, + "eval_runtime": 118.2919, + "eval_samples_per_second": 26.308, + "eval_steps_per_second": 3.288, + "eval_wer": 0.29834890567003713, + "step": 13200 }, { - "epoch": 0.76, - "learning_rate": 0.000496796970437332, - "loss": 1.262, - "step": 3125 + "epoch": 316.28, + "learning_rate": 6.474251497005988e-05, + "loss": 0.0081, + "step": 13600 }, { - "epoch": 0.77, - "learning_rate": 0.0004967664304910823, - "loss": 1.2058, - "step": 3150 + "epoch": 316.28, + "eval_cer": 0.06462431256115253, + "eval_loss": 0.4302999675273895, + "eval_runtime": 118.0293, + "eval_samples_per_second": 26.366, + "eval_steps_per_second": 3.296, + "eval_wer": 0.29779427449976537, + "step": 13600 }, { - "epoch": 0.77, - "learning_rate": 0.0004967358905448326, - "loss": 1.2482, - "step": 3175 + "epoch": 325.57, + "learning_rate": 5.7556886227544904e-05, + "loss": 0.0079, + "step": 14000 }, { - "epoch": 0.78, - "learning_rate": 0.000496705350598583, - "loss": 1.2172, - "step": 3200 + "epoch": 325.57, + "eval_cer": 0.06431391072573299, + "eval_loss": 0.40440893173217773, + "eval_runtime": 118.2184, + "eval_samples_per_second": 26.324, + "eval_steps_per_second": 3.291, + "eval_wer": 0.29796493024446435, + "step": 14000 }, { - "epoch": 0.79, - "learning_rate": 0.0004966748106523332, - "loss": 1.2177, - "step": 3225 + "epoch": 334.87, + "learning_rate": 5.038922155688622e-05, + "loss": 0.0072, + "step": 14400 }, { - "epoch": 0.79, - "learning_rate": 0.0004966442707060836, - "loss": 1.2189, - "step": 3250 + "epoch": 334.87, + "eval_cer": 0.06546779580957522, + "eval_loss": 0.382755845785141, + "eval_runtime": 118.6873, + "eval_samples_per_second": 26.22, + "eval_steps_per_second": 3.278, + "eval_wer": 0.29992747130850295, + "step": 14400 }, { - "epoch": 0.8, - "learning_rate": 0.0004966137307598339, - "loss": 1.196, - "step": 3275 + "epoch": 344.18, + "learning_rate": 9.578571428571428e-05, + "loss": 0.0081, + "step": 14800 }, { - "epoch": 0.81, - "learning_rate": 0.0004965831908135842, - "loss": 1.1916, - "step": 3300 + "epoch": 344.18, + "eval_cer": 0.06676338607915247, + "eval_loss": 0.4108315706253052, + "eval_runtime": 114.661, + "eval_samples_per_second": 27.141, + "eval_steps_per_second": 3.393, + "eval_wer": 0.30457784035155083, + "step": 14800 }, { - "epoch": 0.81, - "learning_rate": 0.0004965526508673345, - "loss": 1.1967, - "step": 3325 + "epoch": 353.48, + "learning_rate": 9.007142857142856e-05, + "loss": 0.0088, + "step": 15200 }, { - "epoch": 0.82, - "learning_rate": 0.0004965221109210848, - "loss": 1.2152, - "step": 3350 + "epoch": 353.48, + "eval_cer": 0.06539356928371402, + "eval_loss": 0.40191251039505005, + "eval_runtime": 117.0774, + "eval_samples_per_second": 26.581, + "eval_steps_per_second": 3.323, + "eval_wer": 0.2993301762020564, + "step": 15200 }, { - "epoch": 0.82, - "learning_rate": 0.0004964915709748351, - "loss": 1.2419, - "step": 3375 + "epoch": 362.78, + "learning_rate": 8.435714285714286e-05, + "loss": 0.0088, + "step": 15600 }, { - "epoch": 0.83, - "learning_rate": 0.0004964610310285854, - "loss": 1.1729, - "step": 3400 + "epoch": 362.78, + "eval_cer": 0.06814669860656568, + "eval_loss": 0.4072999954223633, + "eval_runtime": 114.628, + "eval_samples_per_second": 27.149, + "eval_steps_per_second": 3.394, + "eval_wer": 0.3091002175860745, + "step": 15600 }, { - "epoch": 0.84, - "learning_rate": 0.0004964304910823357, - "loss": 1.1925, - "step": 3425 + "epoch": 372.09, + "learning_rate": 7.864285714285714e-05, + "loss": 0.0079, + "step": 16000 }, { - "epoch": 0.84, - "learning_rate": 0.000496399951136086, - "loss": 1.2207, - "step": 3450 + "epoch": 372.09, + "eval_cer": 0.0667161510172408, + "eval_loss": 0.42044562101364136, + "eval_runtime": 115.1974, + "eval_samples_per_second": 27.014, + "eval_steps_per_second": 3.377, + "eval_wer": 0.30547378301122063, + "step": 16000 }, { - "epoch": 0.85, - "learning_rate": 0.0004963694111898363, - "loss": 1.1863, - "step": 3475 + "epoch": 381.39, + "learning_rate": 7.292857142857142e-05, + "loss": 0.0072, + "step": 16400 }, { - "epoch": 0.85, - "learning_rate": 0.0004963388712435866, - "loss": 1.1934, - "step": 3500 + "epoch": 381.39, + "eval_cer": 0.06564998819123452, + "eval_loss": 0.40300747752189636, + "eval_runtime": 114.5196, + "eval_samples_per_second": 27.174, + "eval_steps_per_second": 3.397, + "eval_wer": 0.3027859550322113, + "step": 16400 }, { - "epoch": 0.85, - "eval_cer": 0.2815519029188013, - "eval_loss": 0.8737192153930664, - "eval_runtime": 147.4134, - "eval_samples_per_second": 28.444, - "eval_steps_per_second": 7.116, - "eval_wer": 0.8882218597063621, - "step": 3500 + "epoch": 390.69, + "learning_rate": 6.721428571428571e-05, + "loss": 0.0073, + "step": 16800 }, { - "epoch": 0.86, - "learning_rate": 0.0004963083312973369, - "loss": 1.1506, - "step": 3525 + "epoch": 390.69, + "eval_cer": 0.0677350787813354, + "eval_loss": 0.4031626284122467, + "eval_runtime": 114.7831, + "eval_samples_per_second": 27.112, + "eval_steps_per_second": 3.389, + "eval_wer": 0.30807628311788043, + "step": 16800 }, { - "epoch": 0.87, - "learning_rate": 0.0004962777913510872, - "loss": 1.1723, - "step": 3550 + "epoch": 399.99, + "learning_rate": 6.151428571428571e-05, + "loss": 0.0069, + "step": 17200 }, { - "epoch": 0.87, - "learning_rate": 0.0004962472514048376, - "loss": 1.1829, - "step": 3575 + "epoch": 399.99, + "eval_cer": 0.06693208272883701, + "eval_loss": 0.41302183270454407, + "eval_runtime": 114.8457, + "eval_samples_per_second": 27.097, + "eval_steps_per_second": 3.387, + "eval_wer": 0.30214599598959, + "step": 17200 }, { - "epoch": 0.88, - "learning_rate": 0.0004962167114585879, - "loss": 1.2188, - "step": 3600 + "epoch": 409.3, + "learning_rate": 5.5799999999999994e-05, + "loss": 0.0063, + "step": 17600 }, { - "epoch": 0.88, - "learning_rate": 0.0004961861715123381, - "loss": 1.179, - "step": 3625 + "epoch": 409.3, + "eval_cer": 0.06513715037619353, + "eval_loss": 0.4071926772594452, + "eval_runtime": 114.6356, + "eval_samples_per_second": 27.147, + "eval_steps_per_second": 3.393, + "eval_wer": 0.2979222663082896, + "step": 17600 }, { - "epoch": 0.89, - "learning_rate": 0.0004961556315660885, - "loss": 1.1642, - "step": 3650 + "epoch": 418.6, + "learning_rate": 5.008571428571428e-05, + "loss": 0.0059, + "step": 18000 }, { - "epoch": 0.9, - "learning_rate": 0.0004961250916198388, - "loss": 1.1982, - "step": 3675 + "epoch": 418.6, + "eval_cer": 0.06403724822025035, + "eval_loss": 0.41102761030197144, + "eval_runtime": 116.5576, + "eval_samples_per_second": 26.699, + "eval_steps_per_second": 3.337, + "eval_wer": 0.2969409957762703, + "step": 18000 }, { - "epoch": 0.9, - "learning_rate": 0.0004960945516735891, - "loss": 1.2169, - "step": 3700 + "epoch": 427.9, + "learning_rate": 4.437142857142857e-05, + "loss": 0.0056, + "step": 18400 }, { - "epoch": 0.91, - "learning_rate": 0.0004960640117273394, - "loss": 1.1939, - "step": 3725 + "epoch": 427.9, + "eval_cer": 0.06465805189108945, + "eval_loss": 0.4228787422180176, + "eval_runtime": 114.7096, + "eval_samples_per_second": 27.129, + "eval_steps_per_second": 3.391, + "eval_wer": 0.29945816801058067, + "step": 18400 }, { - "epoch": 0.92, - "learning_rate": 0.0004960334717810897, - "loss": 1.2329, - "step": 3750 + "epoch": 437.21, + "learning_rate": 3.8657142857142856e-05, + "loss": 0.005, + "step": 18800 }, { - "epoch": 0.92, - "learning_rate": 0.0004960029318348399, - "loss": 1.2036, - "step": 3775 + "epoch": 437.21, + "eval_cer": 0.062370525321367117, + "eval_loss": 0.41175001859664917, + "eval_runtime": 115.5821, + "eval_samples_per_second": 26.925, + "eval_steps_per_second": 3.366, + "eval_wer": 0.2884508724774948, + "step": 18800 }, { - "epoch": 0.93, - "learning_rate": 0.0004959723918885903, - "loss": 1.1609, - "step": 3800 + "epoch": 446.51, + "learning_rate": 3.294285714285714e-05, + "loss": 0.0046, + "step": 19200 }, { - "epoch": 0.93, - "learning_rate": 0.0004959418519423406, - "loss": 1.1622, - "step": 3825 + "epoch": 446.51, + "eval_cer": 0.06147305914504538, + "eval_loss": 0.41112595796585083, + "eval_runtime": 115.5282, + "eval_samples_per_second": 26.937, + "eval_steps_per_second": 3.367, + "eval_wer": 0.28409915098767013, + "step": 19200 }, { - "epoch": 0.94, - "learning_rate": 0.0004959113119960909, - "loss": 1.1903, - "step": 3850 + "epoch": 455.8, + "learning_rate": 2.7228571428571427e-05, + "loss": 0.0043, + "step": 19600 }, { - "epoch": 0.95, - "learning_rate": 0.0004958807720498412, - "loss": 1.1552, - "step": 3875 + "epoch": 455.8, + "eval_cer": 0.06160126859880563, + "eval_loss": 0.40707847476005554, + "eval_runtime": 117.681, + "eval_samples_per_second": 26.444, + "eval_steps_per_second": 3.306, + "eval_wer": 0.28495242971116513, + "step": 19600 }, { - "epoch": 0.95, - "learning_rate": 0.0004958502321035915, - "loss": 1.1445, - "step": 3900 + "epoch": 465.11, + "learning_rate": 2.1514285714285714e-05, + "loss": 0.0038, + "step": 20000 }, { - "epoch": 0.96, - "learning_rate": 0.0004958196921573418, - "loss": 1.1968, - "step": 3925 + "epoch": 465.11, + "eval_cer": 0.062363777455379736, + "eval_loss": 0.4267757534980774, + "eval_runtime": 115.119, + "eval_samples_per_second": 27.033, + "eval_steps_per_second": 3.379, + "eval_wer": 0.28670165109433, + "step": 20000 }, { - "epoch": 0.96, - "learning_rate": 0.0004957891522110921, - "loss": 1.1482, - "step": 3950 + "epoch": 474.41, + "learning_rate": 1.5799999999999998e-05, + "loss": 0.0035, + "step": 20400 }, { - "epoch": 0.97, - "learning_rate": 0.0004957586122648425, - "loss": 1.1879, - "step": 3975 + "epoch": 474.41, + "eval_cer": 0.06053510577279935, + "eval_loss": 0.4116959869861603, + "eval_runtime": 115.3416, + "eval_samples_per_second": 26.981, + "eval_steps_per_second": 3.373, + "eval_wer": 0.2820086181151073, + "step": 20400 }, { - "epoch": 0.98, - "learning_rate": 0.0004957280723185927, - "loss": 1.1909, - "step": 4000 + "epoch": 483.71, + "learning_rate": 1.0085714285714285e-05, + "loss": 0.0035, + "step": 20800 }, { - "epoch": 0.98, - "eval_cer": 0.27801505087112305, - "eval_loss": 0.8657284379005432, - "eval_runtime": 148.1841, - "eval_samples_per_second": 28.296, - "eval_steps_per_second": 7.079, - "eval_wer": 0.8697879282218597, - "step": 4000 + "epoch": 483.71, + "eval_cer": 0.060238199669354564, + "eval_loss": 0.4154604375362396, + "eval_runtime": 115.2471, + "eval_samples_per_second": 27.003, + "eval_steps_per_second": 3.375, + "eval_wer": 0.2819232902427578, + "step": 20800 }, { - "epoch": 0.98, - "learning_rate": 0.0004956975323723431, - "loss": 1.1837, - "step": 4025 + "epoch": 493.02, + "learning_rate": 4.371428571428571e-06, + "loss": 0.0034, + "step": 21200 }, { - "epoch": 0.99, - "learning_rate": 0.0004956669924260934, - "loss": 1.1907, - "step": 4050 - }, - { - "epoch": 0.99, - "learning_rate": 0.0004956364524798437, - "loss": 1.181, - "step": 4075 - }, - { - "epoch": 1.0, - "learning_rate": 0.0004956059125335939, - "loss": 1.1887, - "step": 4100 - }, - { - "epoch": 1.01, - "learning_rate": 0.0004955753725873443, - "loss": 1.1424, - "step": 4125 - }, - { - "epoch": 1.01, - "learning_rate": 0.0004955448326410945, - "loss": 1.2208, - "step": 4150 - }, - { - "epoch": 1.02, - "learning_rate": 0.0004955142926948449, - "loss": 1.0992, - "step": 4175 - }, - { - "epoch": 1.02, - "learning_rate": 0.0004954837527485952, - "loss": 1.1928, - "step": 4200 - }, - { - "epoch": 1.03, - "learning_rate": 0.0004954532128023455, - "loss": 1.1475, - "step": 4225 - }, - { - "epoch": 1.04, - "learning_rate": 0.0004954226728560957, - "loss": 1.1454, - "step": 4250 - }, - { - "epoch": 1.04, - "learning_rate": 0.0004953921329098461, - "loss": 1.1318, - "step": 4275 - }, - { - "epoch": 1.05, - "learning_rate": 0.0004953615929635963, - "loss": 1.0943, - "step": 4300 - }, - { - "epoch": 1.06, - "learning_rate": 0.0004953310530173467, - "loss": 1.1443, - "step": 4325 - }, - { - "epoch": 1.06, - "learning_rate": 0.0004953005130710971, - "loss": 1.14, - "step": 4350 - }, - { - "epoch": 1.07, - "learning_rate": 0.0004952699731248473, - "loss": 1.1257, - "step": 4375 - }, - { - "epoch": 1.07, - "learning_rate": 0.0004952394331785976, - "loss": 1.1535, - "step": 4400 - }, - { - "epoch": 1.08, - "learning_rate": 0.0004952088932323479, - "loss": 1.1164, - "step": 4425 - }, - { - "epoch": 1.09, - "learning_rate": 0.0004951783532860983, - "loss": 1.1142, - "step": 4450 - }, - { - "epoch": 1.09, - "learning_rate": 0.0004951478133398485, - "loss": 1.1491, - "step": 4475 - }, - { - "epoch": 1.1, - "learning_rate": 0.0004951172733935989, - "loss": 1.0647, - "step": 4500 - }, - { - "epoch": 1.1, - "eval_cer": 0.2660236337689804, - "eval_loss": 0.8246370553970337, - "eval_runtime": 149.8516, - "eval_samples_per_second": 27.981, - "eval_steps_per_second": 7.0, - "eval_wer": 0.8816639477977162, - "step": 4500 - }, - { - "epoch": 1.1, - "learning_rate": 0.0004950867334473491, - "loss": 1.1131, - "step": 4525 - }, - { - "epoch": 1.11, - "learning_rate": 0.0004950561935010994, - "loss": 1.1171, - "step": 4550 - }, - { - "epoch": 1.12, - "learning_rate": 0.0004950256535548497, - "loss": 1.14, - "step": 4575 - }, - { - "epoch": 1.12, - "learning_rate": 0.0004949951136086001, - "loss": 1.1237, - "step": 4600 - }, - { - "epoch": 1.13, - "learning_rate": 0.0004949645736623503, - "loss": 1.1444, - "step": 4625 - }, - { - "epoch": 1.13, - "learning_rate": 0.0004949340337161007, - "loss": 1.1466, - "step": 4650 - }, - { - "epoch": 1.14, - "learning_rate": 0.000494903493769851, - "loss": 1.0618, - "step": 4675 - }, - { - "epoch": 1.15, - "learning_rate": 0.0004948729538236013, - "loss": 1.128, - "step": 4700 - }, - { - "epoch": 1.15, - "learning_rate": 0.0004948424138773516, - "loss": 1.1266, - "step": 4725 - }, - { - "epoch": 1.16, - "learning_rate": 0.0004948130955289519, - "loss": 1.1306, - "step": 4750 - }, - { - "epoch": 1.17, - "learning_rate": 0.0004947825555827022, - "loss": 1.0861, - "step": 4775 - }, - { - "epoch": 1.17, - "learning_rate": 0.0004947520156364525, - "loss": 1.1126, - "step": 4800 - }, - { - "epoch": 1.18, - "learning_rate": 0.0004947214756902028, - "loss": 1.1643, - "step": 4825 - }, - { - "epoch": 1.18, - "learning_rate": 0.000494690935743953, - "loss": 1.1249, - "step": 4850 - }, - { - "epoch": 1.19, - "learning_rate": 0.0004946603957977034, - "loss": 1.0927, - "step": 4875 - }, - { - "epoch": 1.2, - "learning_rate": 0.0004946298558514537, - "loss": 1.0774, - "step": 4900 - }, - { - "epoch": 1.2, - "learning_rate": 0.000494599315905204, - "loss": 1.0776, - "step": 4925 - }, - { - "epoch": 1.21, - "learning_rate": 0.0004945687759589543, - "loss": 1.0937, - "step": 4950 - }, - { - "epoch": 1.21, - "learning_rate": 0.0004945382360127046, - "loss": 1.1052, - "step": 4975 - }, - { - "epoch": 1.22, - "learning_rate": 0.000494507696066455, - "loss": 1.1362, - "step": 5000 - }, - { - "epoch": 1.22, - "eval_cer": 0.27113127932404546, - "eval_loss": 0.8031673431396484, - "eval_runtime": 150.0559, - "eval_samples_per_second": 27.943, - "eval_steps_per_second": 6.991, - "eval_wer": 0.9086460032626428, - "step": 5000 - }, - { - "epoch": 1.23, - "learning_rate": 0.0004944771561202052, - "loss": 1.0782, - "step": 5025 - }, - { - "epoch": 1.23, - "learning_rate": 0.0004944466161739556, - "loss": 1.0927, - "step": 5050 - }, - { - "epoch": 1.24, - "learning_rate": 0.0004944160762277058, - "loss": 1.1011, - "step": 5075 - }, - { - "epoch": 1.24, - "learning_rate": 0.0004943855362814562, - "loss": 1.0837, - "step": 5100 - }, - { - "epoch": 1.25, - "learning_rate": 0.0004943549963352065, - "loss": 1.0993, - "step": 5125 - }, - { - "epoch": 1.26, - "learning_rate": 0.0004943244563889568, - "loss": 1.1002, - "step": 5150 - }, - { - "epoch": 1.26, - "learning_rate": 0.000494293916442707, - "loss": 1.0856, - "step": 5175 - }, - { - "epoch": 1.27, - "learning_rate": 0.0004942633764964574, - "loss": 1.1047, - "step": 5200 - }, - { - "epoch": 1.28, - "learning_rate": 0.0004942328365502076, - "loss": 1.1072, - "step": 5225 - }, - { - "epoch": 1.28, - "learning_rate": 0.000494202296603958, - "loss": 1.0748, - "step": 5250 - }, - { - "epoch": 1.29, - "learning_rate": 0.0004941717566577083, - "loss": 1.0535, - "step": 5275 - }, - { - "epoch": 1.29, - "learning_rate": 0.0004941412167114586, - "loss": 1.1443, - "step": 5300 - }, - { - "epoch": 1.3, - "learning_rate": 0.0004941106767652088, - "loss": 1.0943, - "step": 5325 - }, - { - "epoch": 1.31, - "learning_rate": 0.0004940801368189592, - "loss": 1.0904, - "step": 5350 - }, - { - "epoch": 1.31, - "learning_rate": 0.0004940495968727096, - "loss": 1.097, - "step": 5375 - }, - { - "epoch": 1.32, - "learning_rate": 0.0004940190569264598, - "loss": 1.1234, - "step": 5400 - }, - { - "epoch": 1.32, - "learning_rate": 0.0004939885169802102, - "loss": 1.1049, - "step": 5425 - }, - { - "epoch": 1.33, - "learning_rate": 0.0004939579770339604, - "loss": 1.0737, - "step": 5450 - }, - { - "epoch": 1.34, - "learning_rate": 0.0004939274370877108, - "loss": 1.0872, - "step": 5475 - }, - { - "epoch": 1.34, - "learning_rate": 0.000493896897141461, - "loss": 1.0994, - "step": 5500 - }, - { - "epoch": 1.34, - "eval_cer": 0.24623471556317567, - "eval_loss": 0.7718956470489502, - "eval_runtime": 150.4418, - "eval_samples_per_second": 27.871, - "eval_steps_per_second": 6.973, - "eval_wer": 0.8305709624796085, - "step": 5500 - }, - { - "epoch": 1.35, - "learning_rate": 0.0004938663571952114, - "loss": 1.0869, - "step": 5525 - }, - { - "epoch": 1.35, - "learning_rate": 0.0004938358172489616, - "loss": 1.0742, - "step": 5550 - }, - { - "epoch": 1.36, - "learning_rate": 0.000493805277302712, - "loss": 1.0867, - "step": 5575 - }, - { - "epoch": 1.37, - "learning_rate": 0.0004937747373564622, - "loss": 1.0516, - "step": 5600 - }, - { - "epoch": 1.37, - "learning_rate": 0.0004937441974102126, - "loss": 1.0562, - "step": 5625 - }, - { - "epoch": 1.38, - "learning_rate": 0.0004937136574639628, - "loss": 1.072, - "step": 5650 - }, - { - "epoch": 1.38, - "learning_rate": 0.0004936831175177132, - "loss": 1.0712, - "step": 5675 - }, - { - "epoch": 1.39, - "learning_rate": 0.0004936525775714634, - "loss": 1.0735, - "step": 5700 - }, - { - "epoch": 1.4, - "learning_rate": 0.0004936220376252138, - "loss": 1.0757, - "step": 5725 - }, - { - "epoch": 1.4, - "learning_rate": 0.0004935914976789642, - "loss": 1.0374, - "step": 5750 - }, - { - "epoch": 1.41, - "learning_rate": 0.0004935609577327144, - "loss": 1.0556, - "step": 5775 - }, - { - "epoch": 1.42, - "learning_rate": 0.0004935304177864647, - "loss": 1.0696, - "step": 5800 - }, - { - "epoch": 1.42, - "learning_rate": 0.000493499877840215, - "loss": 1.0751, - "step": 5825 - }, - { - "epoch": 1.43, - "learning_rate": 0.0004934693378939653, - "loss": 1.0841, - "step": 5850 - }, - { - "epoch": 1.43, - "learning_rate": 0.0004934387979477156, - "loss": 1.0686, - "step": 5875 - }, - { - "epoch": 1.44, - "learning_rate": 0.000493408258001466, - "loss": 1.062, - "step": 5900 - }, - { - "epoch": 1.45, - "learning_rate": 0.0004933777180552162, - "loss": 1.0416, - "step": 5925 - }, - { - "epoch": 1.45, - "learning_rate": 0.0004933471781089666, - "loss": 1.0138, - "step": 5950 - }, - { - "epoch": 1.46, - "learning_rate": 0.0004933166381627168, - "loss": 1.0089, - "step": 5975 - }, - { - "epoch": 1.46, - "learning_rate": 0.0004932860982164672, - "loss": 1.1, - "step": 6000 - }, - { - "epoch": 1.46, - "eval_cer": 0.25613174132213584, - "eval_loss": 0.7853134870529175, - "eval_runtime": 146.4034, - "eval_samples_per_second": 28.64, - "eval_steps_per_second": 7.165, - "eval_wer": 0.8400652528548124, - "step": 6000 - }, - { - "epoch": 1.47, - "learning_rate": 0.0004932555582702174, - "loss": 1.0436, - "step": 6025 - }, - { - "epoch": 1.48, - "learning_rate": 0.0004932250183239678, - "loss": 1.1361, - "step": 6050 - }, - { - "epoch": 1.48, - "learning_rate": 0.000493194478377718, - "loss": 1.0567, - "step": 6075 - }, - { - "epoch": 1.49, - "learning_rate": 0.0004931639384314684, - "loss": 1.1106, - "step": 6100 - }, - { - "epoch": 1.49, - "learning_rate": 0.0004931333984852187, - "loss": 1.0431, - "step": 6125 - }, - { - "epoch": 1.5, - "learning_rate": 0.000493102858538969, - "loss": 1.095, - "step": 6150 - }, - { - "epoch": 1.51, - "learning_rate": 0.0004930723185927193, - "loss": 1.0448, - "step": 6175 - }, - { - "epoch": 1.51, - "learning_rate": 0.0004930417786464696, - "loss": 1.0329, - "step": 6200 - }, - { - "epoch": 1.52, - "learning_rate": 0.0004930112387002199, - "loss": 1.0757, - "step": 6225 - }, - { - "epoch": 1.53, - "learning_rate": 0.0004929806987539702, - "loss": 1.0936, - "step": 6250 - }, - { - "epoch": 1.53, - "learning_rate": 0.0004929501588077205, - "loss": 1.0361, - "step": 6275 - }, - { - "epoch": 1.54, - "learning_rate": 0.0004929196188614708, - "loss": 1.0478, - "step": 6300 - }, - { - "epoch": 1.54, - "learning_rate": 0.0004928890789152211, - "loss": 1.0408, - "step": 6325 - }, - { - "epoch": 1.55, - "learning_rate": 0.0004928585389689714, - "loss": 1.0468, - "step": 6350 - }, - { - "epoch": 1.56, - "learning_rate": 0.0004928279990227217, - "loss": 1.0571, - "step": 6375 - }, - { - "epoch": 1.56, - "learning_rate": 0.000492797459076472, - "loss": 1.0958, - "step": 6400 - }, - { - "epoch": 1.57, - "learning_rate": 0.0004927669191302224, - "loss": 1.0402, - "step": 6425 - }, - { - "epoch": 1.57, - "learning_rate": 0.0004927363791839727, - "loss": 1.0423, - "step": 6450 - }, - { - "epoch": 1.58, - "learning_rate": 0.0004927058392377229, - "loss": 1.0132, - "step": 6475 - }, - { - "epoch": 1.59, - "learning_rate": 0.0004926752992914733, - "loss": 1.0629, - "step": 6500 - }, - { - "epoch": 1.59, - "eval_cer": 0.24587538371508064, - "eval_loss": 0.7808747887611389, - "eval_runtime": 150.3232, - "eval_samples_per_second": 27.893, - "eval_steps_per_second": 6.978, - "eval_wer": 0.8244698205546492, - "step": 6500 - }, - { - "epoch": 1.59, - "learning_rate": 0.0004926447593452236, - "loss": 1.0696, - "step": 6525 - }, - { - "epoch": 1.6, - "learning_rate": 0.0004926142193989739, - "loss": 1.0916, - "step": 6550 - }, - { - "epoch": 1.6, - "learning_rate": 0.0004925836794527242, - "loss": 1.0583, - "step": 6575 - }, - { - "epoch": 1.61, - "learning_rate": 0.0004925531395064745, - "loss": 1.0745, - "step": 6600 - }, - { - "epoch": 1.62, - "learning_rate": 0.0004925225995602247, - "loss": 1.0613, - "step": 6625 - }, - { - "epoch": 1.62, - "learning_rate": 0.0004924920596139751, - "loss": 1.0993, - "step": 6650 - }, - { - "epoch": 1.63, - "learning_rate": 0.0004924615196677254, - "loss": 1.0287, - "step": 6675 - }, - { - "epoch": 1.63, - "learning_rate": 0.0004924309797214757, - "loss": 1.0697, - "step": 6700 - }, - { - "epoch": 1.64, - "learning_rate": 0.000492400439775226, - "loss": 1.0078, - "step": 6725 - }, - { - "epoch": 1.65, - "learning_rate": 0.0004923698998289763, - "loss": 1.0758, - "step": 6750 - }, - { - "epoch": 1.65, - "learning_rate": 0.0004923393598827267, - "loss": 1.049, - "step": 6775 - }, - { - "epoch": 1.66, - "learning_rate": 0.0004923088199364769, - "loss": 1.0401, - "step": 6800 - }, - { - "epoch": 1.67, - "learning_rate": 0.0004922782799902273, - "loss": 1.0468, - "step": 6825 - }, - { - "epoch": 1.67, - "learning_rate": 0.0004922477400439775, - "loss": 1.0586, - "step": 6850 - }, - { - "epoch": 1.68, - "learning_rate": 0.0004922172000977279, - "loss": 1.0428, - "step": 6875 - }, - { - "epoch": 1.68, - "learning_rate": 0.0004921866601514781, - "loss": 1.0465, - "step": 6900 - }, - { - "epoch": 1.69, - "learning_rate": 0.0004921561202052285, - "loss": 1.015, - "step": 6925 - }, - { - "epoch": 1.7, - "learning_rate": 0.0004921255802589787, - "loss": 1.0893, - "step": 6950 - }, - { - "epoch": 1.7, - "learning_rate": 0.0004920950403127291, - "loss": 1.071, - "step": 6975 - }, - { - "epoch": 1.71, - "learning_rate": 0.0004920645003664793, - "loss": 1.1032, - "step": 7000 - }, - { - "epoch": 1.71, - "eval_cer": 0.24269786351549746, - "eval_loss": 0.7637730836868286, - "eval_runtime": 150.2038, - "eval_samples_per_second": 27.915, - "eval_steps_per_second": 6.984, - "eval_wer": 0.8227406199021207, - "step": 7000 - }, - { - "epoch": 1.71, - "learning_rate": 0.0004920339604202297, - "loss": 1.0387, - "step": 7025 - }, - { - "epoch": 1.72, - "learning_rate": 0.00049200342047398, - "loss": 1.0642, - "step": 7050 - }, - { - "epoch": 1.73, - "learning_rate": 0.0004919728805277303, - "loss": 1.0831, - "step": 7075 - }, - { - "epoch": 1.73, - "learning_rate": 0.0004919423405814805, - "loss": 1.0667, - "step": 7100 - }, - { - "epoch": 1.74, - "learning_rate": 0.0004919118006352309, - "loss": 1.042, - "step": 7125 - }, - { - "epoch": 1.74, - "learning_rate": 0.0004918812606889813, - "loss": 1.0001, - "step": 7150 - }, - { - "epoch": 1.75, - "learning_rate": 0.0004918507207427315, - "loss": 1.0786, - "step": 7175 - }, - { - "epoch": 1.76, - "learning_rate": 0.0004918201807964819, - "loss": 1.0567, - "step": 7200 - }, - { - "epoch": 1.76, - "learning_rate": 0.0004917896408502321, - "loss": 1.0255, - "step": 7225 - }, - { - "epoch": 1.77, - "learning_rate": 0.0004917591009039824, - "loss": 1.0694, - "step": 7250 - }, - { - "epoch": 1.78, - "learning_rate": 0.0004917285609577327, - "loss": 1.0622, - "step": 7275 - }, - { - "epoch": 1.78, - "learning_rate": 0.0004916980210114831, - "loss": 1.0316, - "step": 7300 - }, - { - "epoch": 1.79, - "learning_rate": 0.0004916674810652333, - "loss": 1.0995, - "step": 7325 - }, - { - "epoch": 1.79, - "learning_rate": 0.0004916369411189837, - "loss": 1.0378, - "step": 7350 - }, - { - "epoch": 1.8, - "learning_rate": 0.0004916064011727339, - "loss": 1.0338, - "step": 7375 - }, - { - "epoch": 1.81, - "learning_rate": 0.0004915758612264842, - "loss": 1.0584, - "step": 7400 - }, - { - "epoch": 1.81, - "learning_rate": 0.0004915453212802345, - "loss": 1.0315, - "step": 7425 - }, - { - "epoch": 1.82, - "learning_rate": 0.0004915147813339849, - "loss": 1.0323, - "step": 7450 - }, - { - "epoch": 1.82, - "learning_rate": 0.0004914842413877351, - "loss": 0.9843, - "step": 7475 - }, - { - "epoch": 1.83, - "learning_rate": 0.0004914537014414855, - "loss": 1.0171, - "step": 7500 - }, - { - "epoch": 1.83, - "eval_cer": 0.23322690266213567, - "eval_loss": 0.74111008644104, - "eval_runtime": 150.5438, - "eval_samples_per_second": 27.852, - "eval_steps_per_second": 6.968, - "eval_wer": 0.8087112561174551, - "step": 7500 - }, - { - "epoch": 1.84, - "learning_rate": 0.0004914231614952358, - "loss": 1.0284, - "step": 7525 - }, - { - "epoch": 1.84, - "learning_rate": 0.0004913926215489861, - "loss": 1.0462, - "step": 7550 - }, - { - "epoch": 1.85, - "learning_rate": 0.0004913620816027364, - "loss": 1.0062, - "step": 7575 - }, - { - "epoch": 1.85, - "learning_rate": 0.0004913315416564867, - "loss": 1.0715, - "step": 7600 - }, - { - "epoch": 1.86, - "learning_rate": 0.000491301001710237, - "loss": 1.0672, - "step": 7625 - }, - { - "epoch": 1.87, - "learning_rate": 0.0004912704617639873, - "loss": 1.0077, - "step": 7650 - }, - { - "epoch": 1.87, - "learning_rate": 0.0004912399218177377, - "loss": 1.0668, - "step": 7675 - }, - { - "epoch": 1.88, - "learning_rate": 0.0004912093818714879, - "loss": 1.0582, - "step": 7700 - }, - { - "epoch": 1.89, - "learning_rate": 0.0004911788419252382, - "loss": 1.0758, - "step": 7725 - }, - { - "epoch": 1.89, - "learning_rate": 0.0004911483019789885, - "loss": 1.0678, - "step": 7750 - }, - { - "epoch": 1.9, - "learning_rate": 0.0004911177620327388, - "loss": 1.041, - "step": 7775 - }, - { - "epoch": 1.9, - "learning_rate": 0.0004910872220864891, - "loss": 1.0245, - "step": 7800 - }, - { - "epoch": 1.91, - "learning_rate": 0.0004910566821402395, - "loss": 1.0517, - "step": 7825 - }, - { - "epoch": 1.92, - "learning_rate": 0.0004910261421939897, - "loss": 1.0589, - "step": 7850 - }, - { - "epoch": 1.92, - "learning_rate": 0.00049099560224774, - "loss": 1.0315, - "step": 7875 - }, - { - "epoch": 1.93, - "learning_rate": 0.0004909650623014904, - "loss": 1.0659, - "step": 7900 - }, - { - "epoch": 1.93, - "learning_rate": 0.0004909345223552407, - "loss": 1.0559, - "step": 7925 - }, - { - "epoch": 1.94, - "learning_rate": 0.000490903982408991, - "loss": 1.0801, - "step": 7950 - }, - { - "epoch": 1.95, - "learning_rate": 0.0004908734424627413, - "loss": 1.0445, - "step": 7975 - }, - { - "epoch": 1.95, - "learning_rate": 0.0004908429025164916, - "loss": 1.0591, - "step": 8000 - }, - { - "epoch": 1.95, - "eval_cer": 0.23618882375286182, - "eval_loss": 0.7331734895706177, - "eval_runtime": 150.163, - "eval_samples_per_second": 27.923, - "eval_steps_per_second": 6.986, - "eval_wer": 0.8274061990212072, - "step": 8000 - }, - { - "epoch": 1.96, - "learning_rate": 0.0004908123625702418, - "loss": 1.0552, - "step": 8025 - }, - { - "epoch": 1.96, - "learning_rate": 0.0004907818226239922, - "loss": 1.0331, - "step": 8050 - }, - { - "epoch": 1.97, - "learning_rate": 0.0004907512826777425, - "loss": 1.0102, - "step": 8075 - }, - { - "epoch": 1.98, - "learning_rate": 0.0004907219643293428, - "loss": 0.9944, - "step": 8100 - }, - { - "epoch": 1.98, - "learning_rate": 0.0004906914243830931, - "loss": 0.9907, - "step": 8125 - }, - { - "epoch": 1.99, - "learning_rate": 0.0004906608844368434, - "loss": 1.0408, - "step": 8150 - }, - { - "epoch": 1.99, - "learning_rate": 0.0004906303444905936, - "loss": 1.0145, - "step": 8175 - }, - { - "epoch": 2.0, - "learning_rate": 0.000490599804544344, - "loss": 1.033, - "step": 8200 - }, - { - "epoch": 2.01, - "learning_rate": 0.0004905692645980944, - "loss": 0.9967, - "step": 8225 - }, - { - "epoch": 2.01, - "learning_rate": 0.0004905387246518446, - "loss": 1.0126, - "step": 8250 - }, - { - "epoch": 2.02, - "learning_rate": 0.000490508184705595, - "loss": 0.9957, - "step": 8275 - }, - { - "epoch": 2.03, - "learning_rate": 0.0004904776447593452, - "loss": 1.0066, - "step": 8300 - }, - { - "epoch": 2.03, - "learning_rate": 0.0004904471048130955, - "loss": 0.9957, - "step": 8325 - }, - { - "epoch": 2.04, - "learning_rate": 0.0004904165648668458, - "loss": 1.0412, - "step": 8350 - }, - { - "epoch": 2.04, - "learning_rate": 0.0004903860249205962, - "loss": 1.0109, - "step": 8375 - }, - { - "epoch": 2.05, - "learning_rate": 0.0004903554849743464, - "loss": 0.9944, - "step": 8400 - }, - { - "epoch": 2.06, - "learning_rate": 0.0004903249450280968, - "loss": 0.9917, - "step": 8425 - }, - { - "epoch": 2.06, - "learning_rate": 0.000490294405081847, - "loss": 1.0134, - "step": 8450 - }, - { - "epoch": 2.07, - "learning_rate": 0.0004902638651355974, - "loss": 0.9979, - "step": 8475 - }, - { - "epoch": 2.07, - "learning_rate": 0.0004902333251893476, - "loss": 0.9725, - "step": 8500 - }, - { - "epoch": 2.07, - "eval_cer": 0.22165641715347575, - "eval_loss": 0.7190037369728088, - "eval_runtime": 154.2309, - "eval_samples_per_second": 27.187, - "eval_steps_per_second": 6.801, - "eval_wer": 0.7847308319738988, - "step": 8500 - }, - { - "epoch": 2.08, - "learning_rate": 0.000490202785243098, - "loss": 0.9934, - "step": 8525 - }, - { - "epoch": 2.09, - "learning_rate": 0.0004901722452968482, - "loss": 0.9609, - "step": 8550 - }, - { - "epoch": 2.09, - "learning_rate": 0.0004901417053505986, - "loss": 0.9797, - "step": 8575 - }, - { - "epoch": 2.1, - "learning_rate": 0.000490111165404349, - "loss": 0.9612, - "step": 8600 - }, - { - "epoch": 2.1, - "learning_rate": 0.0004900806254580992, - "loss": 0.9582, - "step": 8625 - }, - { - "epoch": 2.11, - "learning_rate": 0.0004900500855118495, - "loss": 1.0047, - "step": 8650 - }, - { - "epoch": 2.12, - "learning_rate": 0.0004900195455655998, - "loss": 0.9842, - "step": 8675 - }, - { - "epoch": 2.12, - "learning_rate": 0.0004899890056193501, - "loss": 0.9559, - "step": 8700 - }, - { - "epoch": 2.13, - "learning_rate": 0.0004899584656731004, - "loss": 0.9806, - "step": 8725 - }, - { - "epoch": 2.14, - "learning_rate": 0.0004899279257268508, - "loss": 0.988, - "step": 8750 - }, - { - "epoch": 2.14, - "learning_rate": 0.000489897385780601, - "loss": 0.9616, - "step": 8775 - }, - { - "epoch": 2.15, - "learning_rate": 0.0004898668458343513, - "loss": 0.9586, - "step": 8800 - }, - { - "epoch": 2.15, - "learning_rate": 0.0004898363058881016, - "loss": 0.9778, - "step": 8825 - }, - { - "epoch": 2.16, - "learning_rate": 0.000489805765941852, - "loss": 1.0124, - "step": 8850 - }, - { - "epoch": 2.17, - "learning_rate": 0.0004897752259956022, - "loss": 1.0, - "step": 8875 - }, - { - "epoch": 2.17, - "learning_rate": 0.0004897446860493526, - "loss": 0.9949, - "step": 8900 - }, - { - "epoch": 2.18, - "learning_rate": 0.0004897141461031028, - "loss": 0.9904, - "step": 8925 - }, - { - "epoch": 2.18, - "learning_rate": 0.0004896836061568532, - "loss": 1.0132, - "step": 8950 - }, - { - "epoch": 2.19, - "learning_rate": 0.0004896530662106035, - "loss": 0.971, - "step": 8975 - }, - { - "epoch": 2.2, - "learning_rate": 0.0004896225262643538, - "loss": 1.03, - "step": 9000 - }, - { - "epoch": 2.2, - "eval_cer": 0.23557795961110028, - "eval_loss": 0.7176295518875122, - "eval_runtime": 149.5931, - "eval_samples_per_second": 28.029, - "eval_steps_per_second": 7.012, - "eval_wer": 0.8255138662316477, - "step": 9000 - }, - { - "epoch": 2.2, - "learning_rate": 0.0004895919863181041, - "loss": 0.9694, - "step": 9025 - }, - { - "epoch": 2.21, - "learning_rate": 0.0004895614463718544, - "loss": 0.9855, - "step": 9050 - }, - { - "epoch": 2.21, - "learning_rate": 0.0004895309064256047, - "loss": 0.986, - "step": 9075 - }, - { - "epoch": 2.22, - "learning_rate": 0.000489500366479355, - "loss": 1.0111, - "step": 9100 - }, - { - "epoch": 2.23, - "learning_rate": 0.0004894698265331053, - "loss": 0.9636, - "step": 9125 - }, - { - "epoch": 2.23, - "learning_rate": 0.0004894392865868556, - "loss": 0.9908, - "step": 9150 - }, - { - "epoch": 2.24, - "learning_rate": 0.0004894087466406059, - "loss": 0.9693, - "step": 9175 - }, - { - "epoch": 2.24, - "learning_rate": 0.0004893782066943562, - "loss": 1.0015, - "step": 9200 - }, - { - "epoch": 2.25, - "learning_rate": 0.0004893476667481066, - "loss": 0.9758, - "step": 9225 - }, - { - "epoch": 2.26, - "learning_rate": 0.0004893171268018568, - "loss": 1.0329, - "step": 9250 - }, - { - "epoch": 2.26, - "learning_rate": 0.0004892865868556071, - "loss": 0.9654, - "step": 9275 - }, - { - "epoch": 2.27, - "learning_rate": 0.0004892560469093575, - "loss": 0.9999, - "step": 9300 - }, - { - "epoch": 2.28, - "learning_rate": 0.0004892255069631077, - "loss": 0.9878, - "step": 9325 - }, - { - "epoch": 2.28, - "learning_rate": 0.0004891949670168581, - "loss": 0.9785, - "step": 9350 - }, - { - "epoch": 2.29, - "learning_rate": 0.0004891644270706084, - "loss": 0.9796, - "step": 9375 - }, - { - "epoch": 2.29, - "learning_rate": 0.0004891338871243587, - "loss": 1.0357, - "step": 9400 - }, - { - "epoch": 2.3, - "learning_rate": 0.000489103347178109, - "loss": 0.9666, - "step": 9425 - }, - { - "epoch": 2.31, - "learning_rate": 0.0004890728072318593, - "loss": 1.0062, - "step": 9450 - }, - { - "epoch": 2.31, - "learning_rate": 0.0004890422672856095, - "loss": 0.9699, - "step": 9475 - }, - { - "epoch": 2.32, - "learning_rate": 0.0004890117273393599, - "loss": 0.9939, - "step": 9500 - }, - { - "epoch": 2.32, - "eval_cer": 0.2471176452470663, - "eval_loss": 0.7189167141914368, - "eval_runtime": 153.4415, - "eval_samples_per_second": 27.326, - "eval_steps_per_second": 6.836, - "eval_wer": 0.8653181076672104, - "step": 9500 - }, - { - "epoch": 2.32, - "learning_rate": 0.0004889811873931102, - "loss": 0.9811, - "step": 9525 - }, - { - "epoch": 2.33, - "learning_rate": 0.0004889506474468605, - "loss": 1.0085, - "step": 9550 - }, - { - "epoch": 2.34, - "learning_rate": 0.0004889201075006108, - "loss": 0.9753, - "step": 9575 - }, - { - "epoch": 2.34, - "learning_rate": 0.0004888895675543611, - "loss": 0.9409, - "step": 9600 - }, - { - "epoch": 2.35, - "learning_rate": 0.0004888590276081115, - "loss": 0.9792, - "step": 9625 - }, - { - "epoch": 2.35, - "learning_rate": 0.0004888284876618617, - "loss": 1.0009, - "step": 9650 - }, - { - "epoch": 2.36, - "learning_rate": 0.0004887979477156121, - "loss": 0.9875, - "step": 9675 - }, - { - "epoch": 2.37, - "learning_rate": 0.0004887674077693623, - "loss": 1.0286, - "step": 9700 - }, - { - "epoch": 2.37, - "learning_rate": 0.0004887368678231127, - "loss": 0.96, - "step": 9725 - }, - { - "epoch": 2.38, - "learning_rate": 0.0004887063278768629, - "loss": 0.9712, - "step": 9750 - }, - { - "epoch": 2.39, - "learning_rate": 0.0004886757879306133, - "loss": 0.9919, - "step": 9775 - }, - { - "epoch": 2.39, - "learning_rate": 0.0004886452479843635, - "loss": 1.0148, - "step": 9800 - }, - { - "epoch": 2.4, - "learning_rate": 0.0004886147080381139, - "loss": 0.9762, - "step": 9825 - }, - { - "epoch": 2.4, - "learning_rate": 0.0004885841680918641, - "loss": 0.9539, - "step": 9850 - }, - { - "epoch": 2.41, - "learning_rate": 0.0004885536281456145, - "loss": 0.9814, - "step": 9875 - }, - { - "epoch": 2.42, - "learning_rate": 0.0004885230881993648, - "loss": 0.9418, - "step": 9900 - }, - { - "epoch": 2.42, - "learning_rate": 0.0004884925482531151, - "loss": 0.9613, - "step": 9925 - }, - { - "epoch": 2.43, - "learning_rate": 0.0004884620083068653, - "loss": 1.0212, - "step": 9950 - }, - { - "epoch": 2.43, - "learning_rate": 0.0004884314683606157, - "loss": 0.9608, - "step": 9975 - }, - { - "epoch": 2.44, - "learning_rate": 0.0004884009284143661, - "loss": 0.9564, - "step": 10000 - }, - { - "epoch": 2.44, - "eval_cer": 0.22702586162643862, - "eval_loss": 0.7050137519836426, - "eval_runtime": 153.9631, - "eval_samples_per_second": 27.234, - "eval_steps_per_second": 6.813, - "eval_wer": 0.7984339314845025, - "step": 10000 - }, - { - "epoch": 2.45, - "learning_rate": 0.0004883703884681163, - "loss": 0.977, - "step": 10025 - }, - { - "epoch": 2.45, - "learning_rate": 0.0004883398485218667, - "loss": 1.0024, - "step": 10050 - }, - { - "epoch": 2.46, - "learning_rate": 0.0004883093085756169, - "loss": 0.9681, - "step": 10075 - }, - { - "epoch": 2.46, - "learning_rate": 0.0004882787686293672, - "loss": 0.9711, - "step": 10100 - }, - { - "epoch": 2.47, - "learning_rate": 0.0004882482286831175, - "loss": 0.9421, - "step": 10125 - }, - { - "epoch": 2.48, - "learning_rate": 0.0004882176887368678, - "loss": 0.9543, - "step": 10150 - }, - { - "epoch": 2.48, - "learning_rate": 0.0004881871487906181, - "loss": 0.9585, - "step": 10175 - }, - { - "epoch": 2.49, - "learning_rate": 0.0004881566088443685, - "loss": 1.012, - "step": 10200 - }, - { - "epoch": 2.5, - "learning_rate": 0.00048812606889811873, - "loss": 0.9411, - "step": 10225 - }, - { - "epoch": 2.5, - "learning_rate": 0.00048809552895186904, - "loss": 0.9809, - "step": 10250 - }, - { - "epoch": 2.51, - "learning_rate": 0.00048806498900561934, - "loss": 0.9897, - "step": 10275 - }, - { - "epoch": 2.51, - "learning_rate": 0.00048803444905936964, - "loss": 0.9325, - "step": 10300 - }, - { - "epoch": 2.52, - "learning_rate": 0.00048800390911312, - "loss": 0.9752, - "step": 10325 - }, - { - "epoch": 2.53, - "learning_rate": 0.0004879733691668703, - "loss": 0.9296, - "step": 10350 - }, - { - "epoch": 2.53, - "learning_rate": 0.00048794282922062055, - "loss": 1.0148, - "step": 10375 - }, - { - "epoch": 2.54, - "learning_rate": 0.00048791228927437086, - "loss": 1.0025, - "step": 10400 - }, - { - "epoch": 2.54, - "learning_rate": 0.00048788174932812116, - "loss": 0.9625, - "step": 10425 - }, - { - "epoch": 2.55, - "learning_rate": 0.0004878512093818715, - "loss": 0.9829, - "step": 10450 - }, - { - "epoch": 2.56, - "learning_rate": 0.0004878206694356218, - "loss": 0.9655, - "step": 10475 - }, - { - "epoch": 2.56, - "learning_rate": 0.0004877901294893721, - "loss": 0.966, - "step": 10500 - }, - { - "epoch": 2.56, - "eval_cer": 0.22002915721281685, - "eval_loss": 0.698431134223938, - "eval_runtime": 151.9452, - "eval_samples_per_second": 27.595, - "eval_steps_per_second": 6.904, - "eval_wer": 0.7738009787928222, - "step": 10500 - }, - { - "epoch": 2.57, - "learning_rate": 0.0004877595895431224, - "loss": 0.946, - "step": 10525 - }, - { - "epoch": 2.57, - "learning_rate": 0.0004877290495968727, - "loss": 0.9189, - "step": 10550 - }, - { - "epoch": 2.58, - "learning_rate": 0.00048769850965062303, - "loss": 0.9545, - "step": 10575 - }, - { - "epoch": 2.59, - "learning_rate": 0.00048766796970437334, - "loss": 0.9564, - "step": 10600 - }, - { - "epoch": 2.59, - "learning_rate": 0.00048763742975812364, - "loss": 0.994, - "step": 10625 - }, - { - "epoch": 2.6, - "learning_rate": 0.00048760688981187394, - "loss": 1.0165, - "step": 10650 - }, - { - "epoch": 2.6, - "learning_rate": 0.00048757634986562425, - "loss": 0.9581, - "step": 10675 - }, - { - "epoch": 2.61, - "learning_rate": 0.00048754580991937455, - "loss": 0.9181, - "step": 10700 - }, - { - "epoch": 2.62, - "learning_rate": 0.00048751526997312485, - "loss": 0.9664, - "step": 10725 - }, - { - "epoch": 2.62, - "learning_rate": 0.00048748473002687516, - "loss": 0.995, - "step": 10750 - }, - { - "epoch": 2.63, - "learning_rate": 0.00048745419008062546, - "loss": 0.9565, - "step": 10775 - }, - { - "epoch": 2.64, - "learning_rate": 0.00048742365013437576, - "loss": 0.9906, - "step": 10800 - }, - { - "epoch": 2.64, - "learning_rate": 0.0004873931101881261, - "loss": 0.9804, - "step": 10825 - }, - { - "epoch": 2.65, - "learning_rate": 0.00048736257024187637, - "loss": 0.9643, - "step": 10850 - }, - { - "epoch": 2.65, - "learning_rate": 0.0004873320302956267, - "loss": 0.9544, - "step": 10875 - }, - { - "epoch": 2.66, - "learning_rate": 0.000487301490349377, - "loss": 1.0451, - "step": 10900 - }, - { - "epoch": 2.67, - "learning_rate": 0.0004872709504031273, - "loss": 0.9919, - "step": 10925 - }, - { - "epoch": 2.67, - "learning_rate": 0.00048724041045687764, - "loss": 1.007, - "step": 10950 - }, - { - "epoch": 2.68, - "learning_rate": 0.00048720987051062794, - "loss": 0.9678, - "step": 10975 - }, - { - "epoch": 2.68, - "learning_rate": 0.00048717933056437824, - "loss": 0.9858, - "step": 11000 - }, - { - "epoch": 2.68, - "eval_cer": 0.22549613461597692, - "eval_loss": 0.6884613633155823, - "eval_runtime": 147.9789, - "eval_samples_per_second": 28.335, - "eval_steps_per_second": 7.089, - "eval_wer": 0.8049592169657422, - "step": 11000 - }, - { - "epoch": 2.69, - "learning_rate": 0.0004871487906181285, - "loss": 0.9764, - "step": 11025 - }, - { - "epoch": 2.7, - "learning_rate": 0.0004871182506718788, - "loss": 0.9899, - "step": 11050 - }, - { - "epoch": 2.7, - "learning_rate": 0.00048708771072562915, - "loss": 0.9894, - "step": 11075 - }, - { - "epoch": 2.71, - "learning_rate": 0.00048705717077937946, - "loss": 0.9927, - "step": 11100 - }, - { - "epoch": 2.71, - "learning_rate": 0.00048702663083312976, - "loss": 0.9676, - "step": 11125 - }, - { - "epoch": 2.72, - "learning_rate": 0.00048699609088688006, - "loss": 1.0058, - "step": 11150 - }, - { - "epoch": 2.73, - "learning_rate": 0.0004869655509406303, - "loss": 0.9584, - "step": 11175 - }, - { - "epoch": 2.73, - "learning_rate": 0.00048693501099438067, - "loss": 0.9052, - "step": 11200 - }, - { - "epoch": 2.74, - "learning_rate": 0.000486904471048131, - "loss": 0.9558, - "step": 11225 - }, - { - "epoch": 2.75, - "learning_rate": 0.0004868739311018813, - "loss": 0.9989, - "step": 11250 - }, - { - "epoch": 2.75, - "learning_rate": 0.0004868433911556316, - "loss": 0.9705, - "step": 11275 - }, - { - "epoch": 2.76, - "learning_rate": 0.0004868128512093819, - "loss": 0.96, - "step": 11300 - }, - { - "epoch": 2.76, - "learning_rate": 0.00048678231126313213, - "loss": 0.9782, - "step": 11325 - }, - { - "epoch": 2.77, - "learning_rate": 0.0004867517713168825, - "loss": 0.9906, - "step": 11350 - }, - { - "epoch": 2.78, - "learning_rate": 0.0004867212313706328, - "loss": 0.9869, - "step": 11375 - }, - { - "epoch": 2.78, - "learning_rate": 0.0004866906914243831, - "loss": 0.9431, - "step": 11400 - }, - { - "epoch": 2.79, - "learning_rate": 0.0004866601514781334, - "loss": 0.9565, - "step": 11425 - }, - { - "epoch": 2.79, - "learning_rate": 0.0004866296115318837, - "loss": 0.9876, - "step": 11450 - }, - { - "epoch": 2.8, - "learning_rate": 0.00048659907158563406, - "loss": 0.9448, - "step": 11475 - }, - { - "epoch": 2.81, - "learning_rate": 0.0004865685316393843, - "loss": 0.9484, - "step": 11500 - }, - { - "epoch": 2.81, - "eval_cer": 0.21829923102984508, - "eval_loss": 0.6878862977027893, - "eval_runtime": 149.5721, - "eval_samples_per_second": 28.033, - "eval_steps_per_second": 7.013, - "eval_wer": 0.7645676998368679, - "step": 11500 - }, - { - "epoch": 2.81, - "learning_rate": 0.0004865379916931346, - "loss": 0.9508, - "step": 11525 - }, - { - "epoch": 2.82, - "learning_rate": 0.0004865074517468849, - "loss": 0.996, - "step": 11550 - }, - { - "epoch": 2.82, - "learning_rate": 0.0004864769118006352, - "loss": 0.9525, - "step": 11575 - }, - { - "epoch": 2.83, - "learning_rate": 0.0004864463718543856, - "loss": 1.0059, - "step": 11600 - }, - { - "epoch": 2.84, - "learning_rate": 0.0004864158319081359, - "loss": 0.9635, - "step": 11625 - }, - { - "epoch": 2.84, - "learning_rate": 0.00048638529196188613, - "loss": 0.96, - "step": 11650 - }, - { - "epoch": 2.85, - "learning_rate": 0.00048635475201563643, - "loss": 0.968, - "step": 11675 - }, - { - "epoch": 2.86, - "learning_rate": 0.00048632421206938674, - "loss": 0.9205, - "step": 11700 - }, - { - "epoch": 2.86, - "learning_rate": 0.0004862936721231371, - "loss": 0.9185, - "step": 11725 - }, - { - "epoch": 2.87, - "learning_rate": 0.0004862631321768874, - "loss": 0.9517, - "step": 11750 - }, - { - "epoch": 2.87, - "learning_rate": 0.0004862325922306377, - "loss": 1.0051, - "step": 11775 - }, - { - "epoch": 2.88, - "learning_rate": 0.00048620205228438795, - "loss": 0.9333, - "step": 11800 - }, - { - "epoch": 2.89, - "learning_rate": 0.00048617151233813825, - "loss": 0.9508, - "step": 11825 - }, - { - "epoch": 2.89, - "learning_rate": 0.0004861409723918886, - "loss": 0.9726, - "step": 11850 - }, - { - "epoch": 2.9, - "learning_rate": 0.0004861104324456389, - "loss": 0.9376, - "step": 11875 - }, - { - "epoch": 2.9, - "learning_rate": 0.0004860798924993892, - "loss": 0.9773, - "step": 11900 - }, - { - "epoch": 2.91, - "learning_rate": 0.0004860493525531395, - "loss": 0.9483, - "step": 11925 - }, - { - "epoch": 2.92, - "learning_rate": 0.0004860188126068898, - "loss": 0.9744, - "step": 11950 - }, - { - "epoch": 2.92, - "learning_rate": 0.00048598827266064013, - "loss": 0.9449, - "step": 11975 - }, - { - "epoch": 2.93, - "learning_rate": 0.00048595773271439043, - "loss": 0.9244, - "step": 12000 - }, - { - "epoch": 2.93, - "eval_cer": 0.21655390491052637, - "eval_loss": 0.6589547991752625, - "eval_runtime": 149.4696, - "eval_samples_per_second": 28.053, - "eval_steps_per_second": 7.018, - "eval_wer": 0.7743882544861338, - "step": 12000 - }, - { - "epoch": 2.93, - "learning_rate": 0.00048592719276814074, - "loss": 0.9488, - "step": 12025 - }, - { - "epoch": 2.94, - "learning_rate": 0.00048589665282189104, - "loss": 0.9111, - "step": 12050 - }, - { - "epoch": 2.95, - "learning_rate": 0.00048586611287564134, - "loss": 0.9263, - "step": 12075 - }, - { - "epoch": 2.95, - "learning_rate": 0.0004858355729293917, - "loss": 0.8932, - "step": 12100 - }, - { - "epoch": 2.96, - "learning_rate": 0.00048580503298314195, - "loss": 0.9376, - "step": 12125 - }, - { - "epoch": 2.96, - "learning_rate": 0.00048577449303689225, - "loss": 0.9569, - "step": 12150 - }, - { - "epoch": 2.97, - "learning_rate": 0.00048574395309064256, - "loss": 0.9335, - "step": 12175 - }, - { - "epoch": 2.98, - "learning_rate": 0.00048571341314439286, - "loss": 0.9099, - "step": 12200 - }, - { - "epoch": 2.98, - "learning_rate": 0.0004856828731981432, - "loss": 0.9444, - "step": 12225 - }, - { - "epoch": 2.99, - "learning_rate": 0.0004856523332518935, - "loss": 0.9528, - "step": 12250 - }, - { - "epoch": 3.0, - "learning_rate": 0.00048562179330564377, - "loss": 0.9481, - "step": 12275 - }, - { - "epoch": 3.0, - "learning_rate": 0.00048559125335939407, - "loss": 0.9301, - "step": 12300 - }, - { - "epoch": 3.01, - "learning_rate": 0.0004855607134131444, - "loss": 0.8993, - "step": 12325 - }, - { - "epoch": 3.01, - "learning_rate": 0.00048553017346689473, - "loss": 0.905, - "step": 12350 - }, - { - "epoch": 3.02, - "learning_rate": 0.00048549963352064504, - "loss": 0.9204, - "step": 12375 - }, - { - "epoch": 3.03, - "learning_rate": 0.00048546909357439534, - "loss": 0.9196, - "step": 12400 - }, - { - "epoch": 3.03, - "learning_rate": 0.00048543855362814564, - "loss": 0.9102, - "step": 12425 - }, - { - "epoch": 3.04, - "learning_rate": 0.0004854080136818959, - "loss": 0.9034, - "step": 12450 - }, - { - "epoch": 3.04, - "learning_rate": 0.00048537747373564625, - "loss": 0.8883, - "step": 12475 - }, - { - "epoch": 3.05, - "learning_rate": 0.00048534693378939655, - "loss": 0.9224, - "step": 12500 - }, - { - "epoch": 3.05, - "eval_cer": 0.2035255587610238, - "eval_loss": 0.6522818207740784, - "eval_runtime": 150.425, - "eval_samples_per_second": 27.874, - "eval_steps_per_second": 6.974, - "eval_wer": 0.7476672104404568, - "step": 12500 - }, - { - "epoch": 3.06, - "learning_rate": 0.00048531639384314686, - "loss": 0.9002, - "step": 12525 - }, - { - "epoch": 3.06, - "learning_rate": 0.00048528585389689716, - "loss": 0.9254, - "step": 12550 - }, - { - "epoch": 3.07, - "learning_rate": 0.00048525531395064746, - "loss": 0.9498, - "step": 12575 - }, - { - "epoch": 3.07, - "learning_rate": 0.00048522477400439777, - "loss": 0.9027, - "step": 12600 - }, - { - "epoch": 3.08, - "learning_rate": 0.00048519423405814807, - "loss": 0.9143, - "step": 12625 - }, - { - "epoch": 3.09, - "learning_rate": 0.0004851636941118984, - "loss": 0.9581, - "step": 12650 - }, - { - "epoch": 3.09, - "learning_rate": 0.0004851331541656487, - "loss": 0.9042, - "step": 12675 - }, - { - "epoch": 3.1, - "learning_rate": 0.000485102614219399, - "loss": 0.927, - "step": 12700 - }, - { - "epoch": 3.11, - "learning_rate": 0.00048507207427314934, - "loss": 0.9333, - "step": 12725 - }, - { - "epoch": 3.11, - "learning_rate": 0.0004850415343268996, - "loss": 0.8864, - "step": 12750 - }, - { - "epoch": 3.12, - "learning_rate": 0.0004850109943806499, - "loss": 0.9396, - "step": 12775 - }, - { - "epoch": 3.12, - "learning_rate": 0.0004849804544344002, - "loss": 0.9603, - "step": 12800 - }, - { - "epoch": 3.13, - "learning_rate": 0.0004849499144881505, - "loss": 0.9117, - "step": 12825 - }, - { - "epoch": 3.14, - "learning_rate": 0.0004849193745419008, - "loss": 0.9961, - "step": 12850 - }, - { - "epoch": 3.14, - "learning_rate": 0.00048488883459565116, - "loss": 0.9035, - "step": 12875 - }, - { - "epoch": 3.15, - "learning_rate": 0.00048485829464940146, - "loss": 0.8586, - "step": 12900 - }, - { - "epoch": 3.15, - "learning_rate": 0.0004848277547031517, - "loss": 0.9017, - "step": 12925 - }, - { - "epoch": 3.16, - "learning_rate": 0.000484797214756902, - "loss": 0.8265, - "step": 12950 - }, - { - "epoch": 3.17, - "learning_rate": 0.0004847666748106523, - "loss": 0.926, - "step": 12975 - }, - { - "epoch": 3.17, - "learning_rate": 0.0004847361348644027, - "loss": 0.9148, - "step": 13000 - }, - { - "epoch": 3.17, - "eval_cer": 0.20544028418015872, - "eval_loss": 0.6521516442298889, - "eval_runtime": 148.4584, - "eval_samples_per_second": 28.244, - "eval_steps_per_second": 7.066, - "eval_wer": 0.7506688417618271, - "step": 13000 - }, - { - "epoch": 3.18, - "learning_rate": 0.000484705594918153, - "loss": 0.885, - "step": 13025 - }, - { - "epoch": 3.18, - "learning_rate": 0.0004846750549719033, - "loss": 0.9175, - "step": 13050 - }, - { - "epoch": 3.19, - "learning_rate": 0.00048464451502565353, - "loss": 0.8873, - "step": 13075 - }, - { - "epoch": 3.2, - "learning_rate": 0.00048461397507940383, - "loss": 0.9484, - "step": 13100 - }, - { - "epoch": 3.2, - "learning_rate": 0.0004845834351331542, - "loss": 0.8753, - "step": 13125 - }, - { - "epoch": 3.21, - "learning_rate": 0.0004845528951869045, - "loss": 0.9427, - "step": 13150 - }, - { - "epoch": 3.21, - "learning_rate": 0.0004845223552406548, - "loss": 0.9135, - "step": 13175 - }, - { - "epoch": 3.22, - "learning_rate": 0.0004844918152944051, - "loss": 0.9313, - "step": 13200 - }, - { - "epoch": 3.23, - "learning_rate": 0.00048446127534815535, - "loss": 0.9239, - "step": 13225 - }, - { - "epoch": 3.23, - "learning_rate": 0.0004844307354019057, - "loss": 0.9113, - "step": 13250 - }, - { - "epoch": 3.24, - "learning_rate": 0.000484400195455656, - "loss": 0.8907, - "step": 13275 - }, - { - "epoch": 3.25, - "learning_rate": 0.0004843696555094063, - "loss": 0.9199, - "step": 13300 - }, - { - "epoch": 3.25, - "learning_rate": 0.0004843391155631566, - "loss": 0.9231, - "step": 13325 - }, - { - "epoch": 3.26, - "learning_rate": 0.0004843085756169069, - "loss": 0.9079, - "step": 13350 - }, - { - "epoch": 3.26, - "learning_rate": 0.0004842780356706572, - "loss": 0.8949, - "step": 13375 - }, - { - "epoch": 3.27, - "learning_rate": 0.00048424749572440753, - "loss": 0.9139, - "step": 13400 - }, - { - "epoch": 3.28, - "learning_rate": 0.00048421695577815783, - "loss": 0.9003, - "step": 13425 - }, - { - "epoch": 3.28, - "learning_rate": 0.00048418641583190813, - "loss": 0.9042, - "step": 13450 - }, - { - "epoch": 3.29, - "learning_rate": 0.00048415587588565844, - "loss": 0.9246, - "step": 13475 - }, - { - "epoch": 3.29, - "learning_rate": 0.0004841253359394088, - "loss": 0.9227, - "step": 13500 - }, - { - "epoch": 3.29, - "eval_cer": 0.20374629118199644, - "eval_loss": 0.6420453190803528, - "eval_runtime": 148.4286, - "eval_samples_per_second": 28.249, - "eval_steps_per_second": 7.067, - "eval_wer": 0.754094616639478, - "step": 13500 - }, - { - "epoch": 3.3, - "learning_rate": 0.0004840947959931591, - "loss": 0.9074, - "step": 13525 - }, - { - "epoch": 3.31, - "learning_rate": 0.00048406425604690935, - "loss": 0.8885, - "step": 13550 - }, - { - "epoch": 3.31, - "learning_rate": 0.00048403371610065965, - "loss": 0.9374, - "step": 13575 - }, - { - "epoch": 3.32, - "learning_rate": 0.00048400317615440995, - "loss": 0.9339, - "step": 13600 - }, - { - "epoch": 3.32, - "learning_rate": 0.0004839726362081603, - "loss": 0.8923, - "step": 13625 - }, - { - "epoch": 3.33, - "learning_rate": 0.0004839420962619106, - "loss": 0.9201, - "step": 13650 - }, - { - "epoch": 3.34, - "learning_rate": 0.0004839115563156609, - "loss": 0.9358, - "step": 13675 - }, - { - "epoch": 3.34, - "learning_rate": 0.00048388101636941117, - "loss": 0.9606, - "step": 13700 - }, - { - "epoch": 3.35, - "learning_rate": 0.0004838516980210115, - "loss": 0.894, - "step": 13725 - }, - { - "epoch": 3.36, - "learning_rate": 0.0004838211580747618, - "loss": 0.9257, - "step": 13750 - }, - { - "epoch": 3.36, - "learning_rate": 0.0004837906181285121, - "loss": 0.8742, - "step": 13775 - }, - { - "epoch": 3.37, - "learning_rate": 0.00048376007818226244, - "loss": 0.8619, - "step": 13800 - }, - { - "epoch": 3.37, - "learning_rate": 0.00048372953823601274, - "loss": 0.8761, - "step": 13825 - }, - { - "epoch": 3.38, - "learning_rate": 0.000483698998289763, - "loss": 0.9257, - "step": 13850 - }, - { - "epoch": 3.39, - "learning_rate": 0.0004836684583435133, - "loss": 0.9392, - "step": 13875 - }, - { - "epoch": 3.39, - "learning_rate": 0.0004836379183972636, - "loss": 0.9186, - "step": 13900 - }, - { - "epoch": 3.4, - "learning_rate": 0.00048360737845101396, - "loss": 0.9031, - "step": 13925 - }, - { - "epoch": 3.4, - "learning_rate": 0.00048357683850476426, - "loss": 0.8896, - "step": 13950 - }, - { - "epoch": 3.41, - "learning_rate": 0.00048354629855851456, - "loss": 0.9033, - "step": 13975 - }, - { - "epoch": 3.42, - "learning_rate": 0.00048351575861226487, - "loss": 0.8935, - "step": 14000 - }, - { - "epoch": 3.42, - "eval_cer": 0.2014260341057257, - "eval_loss": 0.6442487835884094, - "eval_runtime": 150.0535, - "eval_samples_per_second": 27.943, - "eval_steps_per_second": 6.991, - "eval_wer": 0.7415986949429038, - "step": 14000 - }, - { - "epoch": 3.42, - "learning_rate": 0.0004834852186660151, - "loss": 0.8764, - "step": 14025 - }, - { - "epoch": 3.43, - "learning_rate": 0.00048345467871976547, - "loss": 0.9076, - "step": 14050 - }, - { - "epoch": 3.43, - "learning_rate": 0.0004834241387735158, - "loss": 0.9242, - "step": 14075 - }, - { - "epoch": 3.44, - "learning_rate": 0.0004833935988272661, - "loss": 0.855, - "step": 14100 - }, - { - "epoch": 3.45, - "learning_rate": 0.0004833630588810164, - "loss": 0.9283, - "step": 14125 - }, - { - "epoch": 3.45, - "learning_rate": 0.0004833325189347667, - "loss": 0.9128, - "step": 14150 - }, - { - "epoch": 3.46, - "learning_rate": 0.000483301978988517, - "loss": 0.9126, - "step": 14175 - }, - { - "epoch": 3.47, - "learning_rate": 0.0004832714390422673, - "loss": 0.8883, - "step": 14200 - }, - { - "epoch": 3.47, - "learning_rate": 0.0004832408990960176, - "loss": 0.8974, - "step": 14225 - }, - { - "epoch": 3.48, - "learning_rate": 0.0004832103591497679, - "loss": 0.9776, - "step": 14250 - }, - { - "epoch": 3.48, - "learning_rate": 0.0004831798192035182, - "loss": 0.9265, - "step": 14275 - }, - { - "epoch": 3.49, - "learning_rate": 0.00048314927925726856, - "loss": 0.9559, - "step": 14300 - }, - { - "epoch": 3.5, - "learning_rate": 0.0004831187393110188, - "loss": 0.9448, - "step": 14325 - }, - { - "epoch": 3.5, - "learning_rate": 0.0004830881993647691, - "loss": 0.9357, - "step": 14350 - }, - { - "epoch": 3.51, - "learning_rate": 0.0004830576594185194, - "loss": 0.9283, - "step": 14375 - }, - { - "epoch": 3.51, - "learning_rate": 0.0004830271194722697, - "loss": 0.9365, - "step": 14400 - }, - { - "epoch": 3.52, - "learning_rate": 0.0004829965795260201, - "loss": 0.9369, - "step": 14425 - }, - { - "epoch": 3.53, - "learning_rate": 0.0004829660395797704, - "loss": 0.9185, - "step": 14450 - }, - { - "epoch": 3.53, - "learning_rate": 0.0004829354996335207, - "loss": 0.923, - "step": 14475 - }, - { - "epoch": 3.54, - "learning_rate": 0.00048290495968727093, - "loss": 0.9257, - "step": 14500 - }, - { - "epoch": 3.54, - "eval_cer": 0.1986027124421219, - "eval_loss": 0.6285128593444824, - "eval_runtime": 148.5155, - "eval_samples_per_second": 28.233, - "eval_steps_per_second": 7.063, - "eval_wer": 0.7263295269168026, - "step": 14500 - }, - { - "epoch": 3.54, - "learning_rate": 0.00048287441974102124, - "loss": 0.9144, - "step": 14525 - }, - { - "epoch": 3.55, - "learning_rate": 0.0004828438797947716, - "loss": 0.9176, - "step": 14550 - }, - { - "epoch": 3.56, - "learning_rate": 0.0004828133398485219, - "loss": 0.8861, - "step": 14575 - }, - { - "epoch": 3.56, - "learning_rate": 0.0004827827999022722, - "loss": 0.9533, - "step": 14600 - }, - { - "epoch": 3.57, - "learning_rate": 0.0004827522599560225, - "loss": 0.8651, - "step": 14625 - }, - { - "epoch": 3.57, - "learning_rate": 0.00048272172000977275, - "loss": 0.9017, - "step": 14650 - }, - { - "epoch": 3.58, - "learning_rate": 0.0004826911800635231, - "loss": 0.8858, - "step": 14675 - }, - { - "epoch": 3.59, - "learning_rate": 0.0004826606401172734, - "loss": 0.9246, - "step": 14700 - }, - { - "epoch": 3.59, - "learning_rate": 0.0004826301001710237, - "loss": 0.844, - "step": 14725 - }, - { - "epoch": 3.6, - "learning_rate": 0.000482599560224774, - "loss": 0.8826, - "step": 14750 - }, - { - "epoch": 3.61, - "learning_rate": 0.0004825690202785243, - "loss": 0.8788, - "step": 14775 - }, - { - "epoch": 3.61, - "learning_rate": 0.00048253848033227457, - "loss": 0.907, - "step": 14800 - }, - { - "epoch": 3.62, - "learning_rate": 0.00048250794038602493, - "loss": 0.9251, - "step": 14825 - }, - { - "epoch": 3.62, - "learning_rate": 0.00048247740043977523, - "loss": 0.8712, - "step": 14850 - }, - { - "epoch": 3.63, - "learning_rate": 0.00048244686049352554, - "loss": 0.9175, - "step": 14875 - }, - { - "epoch": 3.64, - "learning_rate": 0.00048241632054727584, - "loss": 0.9437, - "step": 14900 - }, - { - "epoch": 3.64, - "learning_rate": 0.00048238578060102614, - "loss": 0.9023, - "step": 14925 - }, - { - "epoch": 3.65, - "learning_rate": 0.0004823552406547765, - "loss": 0.9112, - "step": 14950 - }, - { - "epoch": 3.65, - "learning_rate": 0.00048232470070852675, - "loss": 0.8988, - "step": 14975 - }, - { - "epoch": 3.66, - "learning_rate": 0.00048229538236012706, - "loss": 0.9194, - "step": 15000 - }, - { - "epoch": 3.66, - "eval_cer": 0.19383386548668932, - "eval_loss": 0.6116518378257751, - "eval_runtime": 157.9954, - "eval_samples_per_second": 26.539, - "eval_steps_per_second": 6.639, - "eval_wer": 0.72, - "step": 15000 - }, - { - "epoch": 3.67, - "learning_rate": 0.00048226484241387736, - "loss": 0.8694, - "step": 15025 - }, - { - "epoch": 3.67, - "learning_rate": 0.00048223430246762766, - "loss": 0.9755, - "step": 15050 - }, - { - "epoch": 3.68, - "learning_rate": 0.00048220376252137797, - "loss": 0.9342, - "step": 15075 - }, - { - "epoch": 3.68, - "learning_rate": 0.0004821732225751283, - "loss": 0.9129, - "step": 15100 - }, - { - "epoch": 3.69, - "learning_rate": 0.0004821426826288786, - "loss": 0.9193, - "step": 15125 - }, - { - "epoch": 3.7, - "learning_rate": 0.0004821121426826289, - "loss": 0.9264, - "step": 15150 - }, - { - "epoch": 3.7, - "learning_rate": 0.0004820816027363792, - "loss": 0.916, - "step": 15175 - }, - { - "epoch": 3.71, - "learning_rate": 0.0004820510627901295, - "loss": 0.968, - "step": 15200 - }, - { - "epoch": 3.72, - "learning_rate": 0.00048202052284387984, - "loss": 0.919, - "step": 15225 - }, - { - "epoch": 3.72, - "learning_rate": 0.00048198998289763014, - "loss": 0.8958, - "step": 15250 - }, - { - "epoch": 3.73, - "learning_rate": 0.0004819594429513804, - "loss": 0.881, - "step": 15275 - }, - { - "epoch": 3.73, - "learning_rate": 0.0004819289030051307, - "loss": 0.8499, - "step": 15300 - }, - { - "epoch": 3.74, - "learning_rate": 0.000481898363058881, - "loss": 0.8722, - "step": 15325 - }, - { - "epoch": 3.75, - "learning_rate": 0.00048186782311263136, - "loss": 0.9201, - "step": 15350 - }, - { - "epoch": 3.75, - "learning_rate": 0.00048183728316638166, - "loss": 0.9017, - "step": 15375 - }, - { - "epoch": 3.76, - "learning_rate": 0.00048180674322013196, - "loss": 0.8766, - "step": 15400 - }, - { - "epoch": 3.76, - "learning_rate": 0.00048177620327388227, - "loss": 0.8692, - "step": 15425 - }, - { - "epoch": 3.77, - "learning_rate": 0.0004817456633276325, - "loss": 0.8803, - "step": 15450 - }, - { - "epoch": 3.78, - "learning_rate": 0.0004817151233813828, - "loss": 0.8915, - "step": 15475 - }, - { - "epoch": 3.78, - "learning_rate": 0.0004816845834351332, - "loss": 0.9158, - "step": 15500 - }, - { - "epoch": 3.78, - "eval_cer": 0.19416753077420612, - "eval_loss": 0.6197028160095215, - "eval_runtime": 156.8998, - "eval_samples_per_second": 26.724, - "eval_steps_per_second": 6.686, - "eval_wer": 0.7233605220228385, - "step": 15500 - }, - { - "epoch": 3.79, - "learning_rate": 0.0004816540434888835, - "loss": 0.8998, - "step": 15525 - }, - { - "epoch": 3.79, - "learning_rate": 0.0004816235035426338, - "loss": 0.8904, - "step": 15550 - }, - { - "epoch": 3.8, - "learning_rate": 0.0004815929635963841, - "loss": 0.8888, - "step": 15575 - }, - { - "epoch": 3.81, - "learning_rate": 0.00048156242365013434, - "loss": 0.9235, - "step": 15600 - }, - { - "epoch": 3.81, - "learning_rate": 0.0004815318837038847, - "loss": 0.9225, - "step": 15625 - }, - { - "epoch": 3.82, - "learning_rate": 0.000481501343757635, - "loss": 0.955, - "step": 15650 - }, - { - "epoch": 3.83, - "learning_rate": 0.0004814708038113853, - "loss": 0.9162, - "step": 15675 - }, - { - "epoch": 3.83, - "learning_rate": 0.0004814402638651356, - "loss": 0.9626, - "step": 15700 - }, - { - "epoch": 3.84, - "learning_rate": 0.0004814097239188859, - "loss": 0.9149, - "step": 15725 - }, - { - "epoch": 3.84, - "learning_rate": 0.0004813791839726362, - "loss": 0.9075, - "step": 15750 - }, - { - "epoch": 3.85, - "learning_rate": 0.0004813486440263865, - "loss": 0.9157, - "step": 15775 - }, - { - "epoch": 3.86, - "learning_rate": 0.0004813181040801368, - "loss": 0.9607, - "step": 15800 - }, - { - "epoch": 3.86, - "learning_rate": 0.0004812875641338871, - "loss": 0.9188, - "step": 15825 - }, - { - "epoch": 3.87, - "learning_rate": 0.0004812570241876374, - "loss": 0.9023, - "step": 15850 - }, - { - "epoch": 3.87, - "learning_rate": 0.0004812264842413878, - "loss": 0.8976, - "step": 15875 - }, - { - "epoch": 3.88, - "learning_rate": 0.0004811959442951381, - "loss": 0.9066, - "step": 15900 - }, - { - "epoch": 3.89, - "learning_rate": 0.00048116540434888833, - "loss": 0.869, - "step": 15925 - }, - { - "epoch": 3.89, - "learning_rate": 0.00048113486440263864, - "loss": 0.8878, - "step": 15950 - }, - { - "epoch": 3.9, - "learning_rate": 0.00048110432445638894, - "loss": 0.887, - "step": 15975 - }, - { - "epoch": 3.9, - "learning_rate": 0.0004810737845101393, - "loss": 0.9079, - "step": 16000 - }, - { - "epoch": 3.9, - "eval_cer": 0.19389546523207704, - "eval_loss": 0.6110395789146423, - "eval_runtime": 159.6702, - "eval_samples_per_second": 26.26, - "eval_steps_per_second": 6.57, - "eval_wer": 0.7186623164763458, - "step": 16000 - }, - { - "epoch": 3.91, - "learning_rate": 0.0004810432445638896, - "loss": 0.8978, - "step": 16025 - }, - { - "epoch": 3.92, - "learning_rate": 0.0004810127046176399, - "loss": 0.9334, - "step": 16050 - }, - { - "epoch": 3.92, - "learning_rate": 0.00048098216467139015, - "loss": 0.9075, - "step": 16075 - }, - { - "epoch": 3.93, - "learning_rate": 0.00048095162472514046, - "loss": 0.9095, - "step": 16100 - }, - { - "epoch": 3.93, - "learning_rate": 0.0004809210847788908, - "loss": 0.8562, - "step": 16125 - }, - { - "epoch": 3.94, - "learning_rate": 0.0004808905448326411, - "loss": 0.8754, - "step": 16150 - }, - { - "epoch": 3.95, - "learning_rate": 0.0004808600048863914, - "loss": 0.8995, - "step": 16175 - }, - { - "epoch": 3.95, - "learning_rate": 0.0004808294649401417, - "loss": 0.888, - "step": 16200 - }, - { - "epoch": 3.96, - "learning_rate": 0.000480798924993892, - "loss": 0.9029, - "step": 16225 - }, - { - "epoch": 3.97, - "learning_rate": 0.00048076838504764233, - "loss": 0.8989, - "step": 16250 - }, - { - "epoch": 3.97, - "learning_rate": 0.00048073784510139264, - "loss": 0.8953, - "step": 16275 - }, - { - "epoch": 3.98, - "learning_rate": 0.00048070730515514294, - "loss": 0.8848, - "step": 16300 - }, - { - "epoch": 3.98, - "learning_rate": 0.00048067676520889324, - "loss": 0.8959, - "step": 16325 - }, - { - "epoch": 3.99, - "learning_rate": 0.00048064622526264355, - "loss": 0.9037, - "step": 16350 - }, - { - "epoch": 4.0, - "learning_rate": 0.0004806156853163939, - "loss": 0.8861, - "step": 16375 - }, - { - "epoch": 4.0, - "learning_rate": 0.00048058514537014415, - "loss": 0.8714, - "step": 16400 - }, - { - "epoch": 4.01, - "learning_rate": 0.00048055460542389446, - "loss": 0.8466, - "step": 16425 - }, - { - "epoch": 4.01, - "learning_rate": 0.00048052406547764476, - "loss": 0.8683, - "step": 16450 - }, - { - "epoch": 4.02, - "learning_rate": 0.00048049352553139506, - "loss": 0.8804, - "step": 16475 - }, - { - "epoch": 4.03, - "learning_rate": 0.0004804629855851454, - "loss": 0.8748, - "step": 16500 - }, - { - "epoch": 4.03, - "eval_cer": 0.19239140478219358, - "eval_loss": 0.6182339191436768, - "eval_runtime": 155.8113, - "eval_samples_per_second": 26.911, - "eval_steps_per_second": 6.733, - "eval_wer": 0.7095595432300164, - "step": 16500 - }, - { - "epoch": 4.03, - "learning_rate": 0.0004804324456388957, - "loss": 0.8761, - "step": 16525 - }, - { - "epoch": 4.04, - "learning_rate": 0.00048040190569264597, - "loss": 0.8836, - "step": 16550 - }, - { - "epoch": 4.04, - "learning_rate": 0.0004803713657463963, - "loss": 0.8432, - "step": 16575 - }, - { - "epoch": 4.05, - "learning_rate": 0.0004803408258001466, - "loss": 0.8815, - "step": 16600 - }, - { - "epoch": 4.06, - "learning_rate": 0.00048031028585389694, - "loss": 0.8588, - "step": 16625 - }, - { - "epoch": 4.06, - "learning_rate": 0.00048027974590764724, - "loss": 0.8693, - "step": 16650 - }, - { - "epoch": 4.07, - "learning_rate": 0.00048024920596139754, - "loss": 0.8591, - "step": 16675 - }, - { - "epoch": 4.08, - "learning_rate": 0.0004802186660151478, - "loss": 0.826, - "step": 16700 - }, - { - "epoch": 4.08, - "learning_rate": 0.0004801881260688981, - "loss": 0.8454, - "step": 16725 - }, - { - "epoch": 4.09, - "learning_rate": 0.00048015758612264845, - "loss": 0.8355, - "step": 16750 - }, - { - "epoch": 4.09, - "learning_rate": 0.00048012704617639876, - "loss": 0.8605, - "step": 16775 - }, - { - "epoch": 4.1, - "learning_rate": 0.00048009650623014906, - "loss": 0.8632, - "step": 16800 - }, - { - "epoch": 4.11, - "learning_rate": 0.00048006596628389936, - "loss": 0.8736, - "step": 16825 - }, - { - "epoch": 4.11, - "learning_rate": 0.00048003542633764967, - "loss": 0.8854, - "step": 16850 - }, - { - "epoch": 4.12, - "learning_rate": 0.0004800048863913999, - "loss": 0.8112, - "step": 16875 - }, - { - "epoch": 4.12, - "learning_rate": 0.0004799743464451503, - "loss": 0.9039, - "step": 16900 - }, - { - "epoch": 4.13, - "learning_rate": 0.0004799438064989006, - "loss": 0.8413, - "step": 16925 - }, - { - "epoch": 4.14, - "learning_rate": 0.0004799132665526509, - "loss": 0.893, - "step": 16950 - }, - { - "epoch": 4.14, - "learning_rate": 0.0004798827266064012, - "loss": 0.8393, - "step": 16975 - }, - { - "epoch": 4.15, - "learning_rate": 0.0004798521866601515, - "loss": 0.8646, - "step": 17000 - }, - { - "epoch": 4.15, - "eval_cer": 0.1894038171308892, - "eval_loss": 0.610537588596344, - "eval_runtime": 151.6007, - "eval_samples_per_second": 27.658, - "eval_steps_per_second": 6.919, - "eval_wer": 0.7057096247960848, - "step": 17000 - }, - { - "epoch": 4.15, - "learning_rate": 0.0004798216467139018, - "loss": 0.8306, - "step": 17025 - }, - { - "epoch": 4.16, - "learning_rate": 0.0004797911067676521, - "loss": 0.8423, - "step": 17050 - }, - { - "epoch": 4.17, - "learning_rate": 0.0004797605668214024, - "loss": 0.8677, - "step": 17075 - }, - { - "epoch": 4.17, - "learning_rate": 0.0004797300268751527, - "loss": 0.881, - "step": 17100 - }, - { - "epoch": 4.18, - "learning_rate": 0.000479699486928903, - "loss": 0.8678, - "step": 17125 - }, - { - "epoch": 4.18, - "learning_rate": 0.00047966894698265336, - "loss": 0.8482, - "step": 17150 - }, - { - "epoch": 4.19, - "learning_rate": 0.0004796384070364036, - "loss": 0.8506, - "step": 17175 - }, - { - "epoch": 4.2, - "learning_rate": 0.0004796078670901539, - "loss": 0.865, - "step": 17200 - }, - { - "epoch": 4.2, - "learning_rate": 0.0004795773271439042, - "loss": 0.8473, - "step": 17225 - }, - { - "epoch": 4.21, - "learning_rate": 0.0004795467871976545, - "loss": 0.8935, - "step": 17250 - }, - { - "epoch": 4.22, - "learning_rate": 0.0004795162472514049, - "loss": 0.8363, - "step": 17275 - }, - { - "epoch": 4.22, - "learning_rate": 0.0004794857073051552, - "loss": 0.8998, - "step": 17300 - }, - { - "epoch": 4.23, - "learning_rate": 0.00047945516735890543, - "loss": 0.8064, - "step": 17325 - }, - { - "epoch": 4.23, - "learning_rate": 0.00047942462741265573, - "loss": 0.8821, - "step": 17350 - }, - { - "epoch": 4.24, - "learning_rate": 0.00047939408746640604, - "loss": 0.8698, - "step": 17375 - }, - { - "epoch": 4.25, - "learning_rate": 0.0004793635475201564, - "loss": 0.8981, - "step": 17400 - }, - { - "epoch": 4.25, - "learning_rate": 0.0004793330075739067, - "loss": 0.89, - "step": 17425 - }, - { - "epoch": 4.26, - "learning_rate": 0.000479302467627657, - "loss": 0.9013, - "step": 17450 - }, - { - "epoch": 4.26, - "learning_rate": 0.0004792719276814073, - "loss": 0.8582, - "step": 17475 - }, - { - "epoch": 4.27, - "learning_rate": 0.00047924138773515755, - "loss": 0.8455, - "step": 17500 - }, - { - "epoch": 4.27, - "eval_cer": 0.19123640955617383, - "eval_loss": 0.6235982775688171, - "eval_runtime": 151.4202, - "eval_samples_per_second": 27.691, - "eval_steps_per_second": 6.928, - "eval_wer": 0.7036215334420881, - "step": 17500 - }, - { - "epoch": 4.28, - "learning_rate": 0.0004792108477889079, - "loss": 0.8973, - "step": 17525 - }, - { - "epoch": 4.28, - "learning_rate": 0.0004791803078426582, - "loss": 0.9159, - "step": 17550 - }, - { - "epoch": 4.29, - "learning_rate": 0.0004791497678964085, - "loss": 0.891, - "step": 17575 - }, - { - "epoch": 4.29, - "learning_rate": 0.0004791192279501588, - "loss": 0.8436, - "step": 17600 - }, - { - "epoch": 4.3, - "learning_rate": 0.0004790886880039091, - "loss": 0.8194, - "step": 17625 - }, - { - "epoch": 4.31, - "learning_rate": 0.00047905814805765943, - "loss": 0.9107, - "step": 17650 - }, - { - "epoch": 4.31, - "learning_rate": 0.00047902760811140973, - "loss": 0.8197, - "step": 17675 - }, - { - "epoch": 4.32, - "learning_rate": 0.00047899706816516003, - "loss": 0.8804, - "step": 17700 - }, - { - "epoch": 4.33, - "learning_rate": 0.00047896652821891034, - "loss": 0.8347, - "step": 17725 - }, - { - "epoch": 4.33, - "learning_rate": 0.00047893598827266064, - "loss": 0.8829, - "step": 17750 - }, - { - "epoch": 4.34, - "learning_rate": 0.000478905448326411, - "loss": 0.8283, - "step": 17775 - }, - { - "epoch": 4.34, - "learning_rate": 0.00047887490838016125, - "loss": 0.9252, - "step": 17800 - }, - { - "epoch": 4.35, - "learning_rate": 0.00047884436843391155, - "loss": 0.8479, - "step": 17825 - }, - { - "epoch": 4.36, - "learning_rate": 0.00047881382848766185, - "loss": 0.8377, - "step": 17850 - }, - { - "epoch": 4.36, - "learning_rate": 0.00047878328854141216, - "loss": 0.839, - "step": 17875 - }, - { - "epoch": 4.37, - "learning_rate": 0.0004787527485951625, - "loss": 0.8441, - "step": 17900 - }, - { - "epoch": 4.37, - "learning_rate": 0.0004787222086489128, - "loss": 0.8075, - "step": 17925 - }, - { - "epoch": 4.38, - "learning_rate": 0.0004786916687026631, - "loss": 0.8223, - "step": 17950 - }, - { - "epoch": 4.39, - "learning_rate": 0.00047866112875641337, - "loss": 0.8505, - "step": 17975 - }, - { - "epoch": 4.39, - "learning_rate": 0.0004786305888101637, - "loss": 0.8922, - "step": 18000 - }, - { - "epoch": 4.39, - "eval_cer": 0.1920988059916019, - "eval_loss": 0.5946230888366699, - "eval_runtime": 153.06, - "eval_samples_per_second": 27.394, - "eval_steps_per_second": 6.854, - "eval_wer": 0.7341272430668841, - "step": 18000 - }, - { - "epoch": 4.4, - "learning_rate": 0.00047860004886391403, - "loss": 0.8649, - "step": 18025 - }, - { - "epoch": 4.4, - "learning_rate": 0.00047856950891766434, - "loss": 0.8993, - "step": 18050 - }, - { - "epoch": 4.41, - "learning_rate": 0.00047853896897141464, - "loss": 0.8717, - "step": 18075 - }, - { - "epoch": 4.42, - "learning_rate": 0.00047850842902516494, - "loss": 0.8664, - "step": 18100 - }, - { - "epoch": 4.42, - "learning_rate": 0.0004784778890789152, - "loss": 0.8581, - "step": 18125 - }, - { - "epoch": 4.43, - "learning_rate": 0.0004784473491326655, - "loss": 0.88, - "step": 18150 - }, - { - "epoch": 4.44, - "learning_rate": 0.00047841680918641585, - "loss": 0.882, - "step": 18175 - }, - { - "epoch": 4.44, - "learning_rate": 0.00047838626924016616, - "loss": 0.8509, - "step": 18200 - }, - { - "epoch": 4.45, - "learning_rate": 0.00047835572929391646, - "loss": 0.8531, - "step": 18225 - }, - { - "epoch": 4.45, - "learning_rate": 0.00047832518934766676, - "loss": 0.8309, - "step": 18250 - }, - { - "epoch": 4.46, - "learning_rate": 0.000478294649401417, - "loss": 0.8175, - "step": 18275 - }, - { - "epoch": 4.47, - "learning_rate": 0.00047826410945516737, - "loss": 0.8153, - "step": 18300 - }, - { - "epoch": 4.47, - "learning_rate": 0.00047823356950891767, - "loss": 0.8628, - "step": 18325 - }, - { - "epoch": 4.48, - "learning_rate": 0.000478203029562668, - "loss": 0.8184, - "step": 18350 - }, - { - "epoch": 4.48, - "learning_rate": 0.0004781724896164183, - "loss": 0.8636, - "step": 18375 - }, - { - "epoch": 4.49, - "learning_rate": 0.0004781419496701686, - "loss": 0.9017, - "step": 18400 - }, - { - "epoch": 4.5, - "learning_rate": 0.00047811140972391894, - "loss": 0.8521, - "step": 18425 - }, - { - "epoch": 4.5, - "learning_rate": 0.0004780808697776692, - "loss": 0.8823, - "step": 18450 - }, - { - "epoch": 4.51, - "learning_rate": 0.0004780503298314195, - "loss": 0.8743, - "step": 18475 - }, - { - "epoch": 4.51, - "learning_rate": 0.0004780197898851698, - "loss": 0.892, - "step": 18500 - }, - { - "epoch": 4.51, - "eval_cer": 0.1869244273790335, - "eval_loss": 0.5911566615104675, - "eval_runtime": 154.1004, - "eval_samples_per_second": 27.21, - "eval_steps_per_second": 6.807, - "eval_wer": 0.7141924959216965, - "step": 18500 - }, - { - "epoch": 4.52, - "learning_rate": 0.0004779892499389201, - "loss": 0.819, - "step": 18525 - }, - { - "epoch": 4.53, - "learning_rate": 0.00047795870999267046, - "loss": 0.8848, - "step": 18550 - }, - { - "epoch": 4.53, - "learning_rate": 0.00047792817004642076, - "loss": 0.866, - "step": 18575 - }, - { - "epoch": 4.54, - "learning_rate": 0.000477897630100171, - "loss": 0.8542, - "step": 18600 - }, - { - "epoch": 4.54, - "learning_rate": 0.0004778670901539213, - "loss": 0.8467, - "step": 18625 - }, - { - "epoch": 4.55, - "learning_rate": 0.0004778365502076716, - "loss": 0.8299, - "step": 18650 - }, - { - "epoch": 4.56, - "learning_rate": 0.000477806010261422, - "loss": 0.8438, - "step": 18675 - }, - { - "epoch": 4.56, - "learning_rate": 0.0004777754703151723, - "loss": 0.9114, - "step": 18700 - }, - { - "epoch": 4.57, - "learning_rate": 0.0004777449303689226, - "loss": 0.8342, - "step": 18725 - }, - { - "epoch": 4.58, - "learning_rate": 0.00047771561202052283, - "loss": 0.8113, - "step": 18750 - }, - { - "epoch": 4.58, - "learning_rate": 0.00047768507207427314, - "loss": 0.8987, - "step": 18775 - }, - { - "epoch": 4.59, - "learning_rate": 0.00047765453212802344, - "loss": 0.9497, - "step": 18800 - }, - { - "epoch": 4.59, - "learning_rate": 0.0004776239921817738, - "loss": 0.8582, - "step": 18825 - }, - { - "epoch": 4.6, - "learning_rate": 0.0004775934522355241, - "loss": 0.8603, - "step": 18850 - }, - { - "epoch": 4.61, - "learning_rate": 0.0004775629122892744, - "loss": 0.8849, - "step": 18875 - }, - { - "epoch": 4.61, - "learning_rate": 0.0004775323723430247, - "loss": 0.7985, - "step": 18900 - }, - { - "epoch": 4.62, - "learning_rate": 0.00047750183239677496, - "loss": 0.8452, - "step": 18925 - }, - { - "epoch": 4.62, - "learning_rate": 0.00047747129245052526, - "loss": 0.8839, - "step": 18950 - }, - { - "epoch": 4.63, - "learning_rate": 0.0004774407525042756, - "loss": 0.875, - "step": 18975 - }, - { - "epoch": 4.64, - "learning_rate": 0.0004774102125580259, - "loss": 0.8652, - "step": 19000 - }, - { - "epoch": 4.64, - "eval_cer": 0.18706816011827151, - "eval_loss": 0.6004529595375061, - "eval_runtime": 153.7951, - "eval_samples_per_second": 27.264, - "eval_steps_per_second": 6.821, - "eval_wer": 0.6966068515497553, - "step": 19000 - }, - { - "epoch": 4.64, - "learning_rate": 0.0004773796726117762, - "loss": 0.8351, - "step": 19025 - }, - { - "epoch": 4.65, - "learning_rate": 0.0004773491326655265, - "loss": 0.8282, - "step": 19050 - }, - { - "epoch": 4.65, - "learning_rate": 0.0004773185927192768, - "loss": 0.8422, - "step": 19075 - }, - { - "epoch": 4.66, - "learning_rate": 0.00047728805277302713, - "loss": 0.8612, - "step": 19100 - }, - { - "epoch": 4.67, - "learning_rate": 0.00047725751282677744, - "loss": 0.843, - "step": 19125 - }, - { - "epoch": 4.67, - "learning_rate": 0.00047722697288052774, - "loss": 0.8185, - "step": 19150 - }, - { - "epoch": 4.68, - "learning_rate": 0.00047719643293427804, - "loss": 0.8069, - "step": 19175 - }, - { - "epoch": 4.69, - "learning_rate": 0.00047716589298802835, - "loss": 0.8473, - "step": 19200 - }, - { - "epoch": 4.69, - "learning_rate": 0.00047713535304177865, - "loss": 0.8486, - "step": 19225 - }, - { - "epoch": 4.7, - "learning_rate": 0.00047710481309552895, - "loss": 0.8625, - "step": 19250 - }, - { - "epoch": 4.7, - "learning_rate": 0.00047707427314927926, - "loss": 0.8526, - "step": 19275 - }, - { - "epoch": 4.71, - "learning_rate": 0.00047704373320302956, - "loss": 0.8784, - "step": 19300 - }, - { - "epoch": 4.72, - "learning_rate": 0.00047701319325677986, - "loss": 0.8541, - "step": 19325 - }, - { - "epoch": 4.72, - "learning_rate": 0.0004769826533105302, - "loss": 0.8885, - "step": 19350 - }, - { - "epoch": 4.73, - "learning_rate": 0.0004769521133642805, - "loss": 0.8381, - "step": 19375 - }, - { - "epoch": 4.73, - "learning_rate": 0.0004769215734180308, - "loss": 0.8414, - "step": 19400 - }, - { - "epoch": 4.74, - "learning_rate": 0.0004768910334717811, - "loss": 0.8571, - "step": 19425 - }, - { - "epoch": 4.75, - "learning_rate": 0.0004768604935255314, - "loss": 0.8505, - "step": 19450 - }, - { - "epoch": 4.75, - "learning_rate": 0.00047682995357928174, - "loss": 0.8485, - "step": 19475 - }, - { - "epoch": 4.76, - "learning_rate": 0.00047679941363303204, - "loss": 0.899, - "step": 19500 - }, - { - "epoch": 4.76, - "eval_cer": 0.18276131125324682, - "eval_loss": 0.5773286819458008, - "eval_runtime": 154.5433, - "eval_samples_per_second": 27.132, - "eval_steps_per_second": 6.788, - "eval_wer": 0.6981402936378467, - "step": 19500 - }, - { - "epoch": 4.76, - "learning_rate": 0.00047676887368678234, - "loss": 0.8769, - "step": 19525 - }, - { - "epoch": 4.77, - "learning_rate": 0.0004767383337405326, - "loss": 0.9001, - "step": 19550 - }, - { - "epoch": 4.78, - "learning_rate": 0.0004767077937942829, - "loss": 0.8733, - "step": 19575 - }, - { - "epoch": 4.78, - "learning_rate": 0.00047667725384803325, - "loss": 0.8425, - "step": 19600 - }, - { - "epoch": 4.79, - "learning_rate": 0.00047664671390178356, - "loss": 0.8404, - "step": 19625 - }, - { - "epoch": 4.8, - "learning_rate": 0.00047661617395553386, - "loss": 0.8385, - "step": 19650 - }, - { - "epoch": 4.8, - "learning_rate": 0.00047658563400928416, - "loss": 0.8495, - "step": 19675 - }, - { - "epoch": 4.81, - "learning_rate": 0.0004765550940630344, - "loss": 0.8986, - "step": 19700 - }, - { - "epoch": 4.81, - "learning_rate": 0.00047652455411678477, - "loss": 0.847, - "step": 19725 - }, - { - "epoch": 4.82, - "learning_rate": 0.0004764940141705351, - "loss": 0.8786, - "step": 19750 - }, - { - "epoch": 4.83, - "learning_rate": 0.0004764634742242854, - "loss": 0.857, - "step": 19775 - }, - { - "epoch": 4.83, - "learning_rate": 0.0004764329342780357, - "loss": 0.8316, - "step": 19800 - }, - { - "epoch": 4.84, - "learning_rate": 0.000476402394331786, - "loss": 0.8361, - "step": 19825 - }, - { - "epoch": 4.84, - "learning_rate": 0.00047637185438553634, - "loss": 0.8672, - "step": 19850 - }, - { - "epoch": 4.85, - "learning_rate": 0.0004763413144392866, - "loss": 0.82, - "step": 19875 - }, - { - "epoch": 4.86, - "learning_rate": 0.0004763107744930369, - "loss": 0.9363, - "step": 19900 - }, - { - "epoch": 4.86, - "learning_rate": 0.0004762802345467872, - "loss": 0.8214, - "step": 19925 - }, - { - "epoch": 4.87, - "learning_rate": 0.0004762496946005375, - "loss": 0.8463, - "step": 19950 - }, - { - "epoch": 4.87, - "learning_rate": 0.00047621915465428786, - "loss": 0.8159, - "step": 19975 - }, - { - "epoch": 4.88, - "learning_rate": 0.00047618861470803816, - "loss": 0.8552, - "step": 20000 - }, - { - "epoch": 4.88, - "eval_cer": 0.18054372041928893, - "eval_loss": 0.5839799642562866, - "eval_runtime": 155.5746, - "eval_samples_per_second": 26.952, - "eval_steps_per_second": 6.743, - "eval_wer": 0.687536704730832, - "step": 20000 - }, - { - "epoch": 4.89, - "learning_rate": 0.0004761580747617884, - "loss": 0.8316, - "step": 20025 - }, - { - "epoch": 4.89, - "learning_rate": 0.0004761275348155387, - "loss": 0.8426, - "step": 20050 - }, - { - "epoch": 4.9, - "learning_rate": 0.000476096994869289, - "loss": 0.8167, - "step": 20075 - }, - { - "epoch": 4.9, - "learning_rate": 0.0004760664549230394, - "loss": 0.8331, - "step": 20100 - }, - { - "epoch": 4.91, - "learning_rate": 0.0004760359149767897, - "loss": 0.8494, - "step": 20125 - }, - { - "epoch": 4.92, - "learning_rate": 0.00047600537503054, - "loss": 0.8332, - "step": 20150 - }, - { - "epoch": 4.92, - "learning_rate": 0.00047597483508429023, - "loss": 0.8497, - "step": 20175 - }, - { - "epoch": 4.93, - "learning_rate": 0.00047594429513804054, - "loss": 0.8528, - "step": 20200 - }, - { - "epoch": 4.94, - "learning_rate": 0.00047591375519179084, - "loss": 0.8209, - "step": 20225 - }, - { - "epoch": 4.94, - "learning_rate": 0.0004758832152455412, - "loss": 0.8663, - "step": 20250 - }, - { - "epoch": 4.95, - "learning_rate": 0.0004758526752992915, - "loss": 0.8484, - "step": 20275 - }, - { - "epoch": 4.95, - "learning_rate": 0.0004758221353530418, - "loss": 0.9051, - "step": 20300 - }, - { - "epoch": 4.96, - "learning_rate": 0.0004757915954067921, - "loss": 0.8601, - "step": 20325 - }, - { - "epoch": 4.97, - "learning_rate": 0.00047576105546054236, - "loss": 0.8726, - "step": 20350 - }, - { - "epoch": 4.97, - "learning_rate": 0.0004757305155142927, - "loss": 0.8709, - "step": 20375 - }, - { - "epoch": 4.98, - "learning_rate": 0.000475699975568043, - "loss": 0.8691, - "step": 20400 - }, - { - "epoch": 4.98, - "learning_rate": 0.0004756694356217933, - "loss": 0.8425, - "step": 20425 - }, - { - "epoch": 4.99, - "learning_rate": 0.0004756388956755436, - "loss": 0.9021, - "step": 20450 - }, - { - "epoch": 5.0, - "learning_rate": 0.0004756083557292939, - "loss": 0.8877, - "step": 20475 - }, - { - "epoch": 5.0, - "learning_rate": 0.00047557781578304423, - "loss": 0.8581, - "step": 20500 - }, - { - "epoch": 5.0, - "eval_cer": 0.18998901471207252, - "eval_loss": 0.5940809845924377, - "eval_runtime": 154.3505, - "eval_samples_per_second": 27.165, - "eval_steps_per_second": 6.796, - "eval_wer": 0.7326916802610114, - "step": 20500 - }, - { - "epoch": 5.01, - "learning_rate": 0.00047554727583679453, - "loss": 0.8584, - "step": 20525 - }, - { - "epoch": 5.01, - "learning_rate": 0.00047551673589054484, - "loss": 0.8564, - "step": 20550 - }, - { - "epoch": 5.02, - "learning_rate": 0.00047548619594429514, - "loss": 0.7907, - "step": 20575 - }, - { - "epoch": 5.03, - "learning_rate": 0.00047545565599804544, - "loss": 0.7891, - "step": 20600 - }, - { - "epoch": 5.03, - "learning_rate": 0.0004754251160517958, - "loss": 0.7914, - "step": 20625 - }, - { - "epoch": 5.04, - "learning_rate": 0.00047539457610554605, - "loss": 0.8744, - "step": 20650 - }, - { - "epoch": 5.05, - "learning_rate": 0.00047536403615929635, - "loss": 0.813, - "step": 20675 - }, - { - "epoch": 5.05, - "learning_rate": 0.00047533349621304666, - "loss": 0.8361, - "step": 20700 - }, - { - "epoch": 5.06, - "learning_rate": 0.00047530295626679696, - "loss": 0.7998, - "step": 20725 - }, - { - "epoch": 5.06, - "learning_rate": 0.0004752724163205473, - "loss": 0.7892, - "step": 20750 - }, - { - "epoch": 5.07, - "learning_rate": 0.0004752418763742976, - "loss": 0.7928, - "step": 20775 - }, - { - "epoch": 5.08, - "learning_rate": 0.00047521133642804787, - "loss": 0.826, - "step": 20800 - }, - { - "epoch": 5.08, - "learning_rate": 0.00047518079648179817, - "loss": 0.8311, - "step": 20825 - }, - { - "epoch": 5.09, - "learning_rate": 0.0004751502565355485, - "loss": 0.8117, - "step": 20850 - }, - { - "epoch": 5.09, - "learning_rate": 0.00047511971658929883, - "loss": 0.8047, - "step": 20875 - }, - { - "epoch": 5.1, - "learning_rate": 0.00047508917664304914, - "loss": 0.7799, - "step": 20900 - }, - { - "epoch": 5.11, - "learning_rate": 0.00047505863669679944, - "loss": 0.8633, - "step": 20925 - }, - { - "epoch": 5.11, - "learning_rate": 0.00047502809675054974, - "loss": 0.817, - "step": 20950 - }, - { - "epoch": 5.12, - "learning_rate": 0.0004749975568043, - "loss": 0.782, - "step": 20975 - }, - { - "epoch": 5.12, - "learning_rate": 0.00047496701685805035, - "loss": 0.8571, - "step": 21000 - }, - { - "epoch": 5.12, - "eval_cer": 0.18460417030276274, - "eval_loss": 0.591896116733551, - "eval_runtime": 154.5066, - "eval_samples_per_second": 27.138, - "eval_steps_per_second": 6.789, - "eval_wer": 0.7048939641109299, - "step": 21000 - }, - { - "epoch": 5.13, - "learning_rate": 0.00047493647691180065, - "loss": 0.842, - "step": 21025 - }, - { - "epoch": 5.14, - "learning_rate": 0.00047490593696555096, - "loss": 0.8247, - "step": 21050 - }, - { - "epoch": 5.14, - "learning_rate": 0.00047487539701930126, - "loss": 0.7865, - "step": 21075 - }, - { - "epoch": 5.15, - "learning_rate": 0.00047484485707305156, - "loss": 0.8372, - "step": 21100 - }, - { - "epoch": 5.15, - "learning_rate": 0.00047481431712680187, - "loss": 0.8344, - "step": 21125 - }, - { - "epoch": 5.16, - "learning_rate": 0.00047478377718055217, - "loss": 0.8012, - "step": 21150 - }, - { - "epoch": 5.17, - "learning_rate": 0.0004747532372343025, - "loss": 0.8137, - "step": 21175 - }, - { - "epoch": 5.17, - "learning_rate": 0.0004747226972880528, - "loss": 0.8604, - "step": 21200 - }, - { - "epoch": 5.18, - "learning_rate": 0.0004746921573418031, - "loss": 0.8123, - "step": 21225 - }, - { - "epoch": 5.19, - "learning_rate": 0.00047466161739555344, - "loss": 0.7806, - "step": 21250 - }, - { - "epoch": 5.19, - "learning_rate": 0.0004746310774493037, - "loss": 0.8092, - "step": 21275 - }, - { - "epoch": 5.2, - "learning_rate": 0.000474600537503054, - "loss": 0.8068, - "step": 21300 - }, - { - "epoch": 5.2, - "learning_rate": 0.0004745699975568043, - "loss": 0.792, - "step": 21325 - }, - { - "epoch": 5.21, - "learning_rate": 0.0004745394576105546, - "loss": 0.7547, - "step": 21350 - }, - { - "epoch": 5.22, - "learning_rate": 0.00047450891766430495, - "loss": 0.8371, - "step": 21375 - }, - { - "epoch": 5.22, - "learning_rate": 0.00047447837771805526, - "loss": 0.819, - "step": 21400 - }, - { - "epoch": 5.23, - "learning_rate": 0.00047444783777180556, - "loss": 0.7873, - "step": 21425 - }, - { - "epoch": 5.23, - "learning_rate": 0.0004744172978255558, - "loss": 0.8598, - "step": 21450 - }, - { - "epoch": 5.24, - "learning_rate": 0.0004743867578793061, - "loss": 0.8331, - "step": 21475 - }, - { - "epoch": 5.25, - "learning_rate": 0.0004743562179330564, - "loss": 0.7979, - "step": 21500 - }, - { - "epoch": 5.25, - "eval_cer": 0.1748200774103467, - "eval_loss": 0.5703975558280945, - "eval_runtime": 154.9079, - "eval_samples_per_second": 27.068, - "eval_steps_per_second": 6.772, - "eval_wer": 0.6698205546492659, - "step": 21500 - }, - { - "epoch": 5.25, - "learning_rate": 0.0004743256779868068, - "loss": 0.83, - "step": 21525 - }, - { - "epoch": 5.26, - "learning_rate": 0.0004742951380405571, - "loss": 0.85, - "step": 21550 - }, - { - "epoch": 5.26, - "learning_rate": 0.0004742645980943074, - "loss": 0.8218, - "step": 21575 - }, - { - "epoch": 5.27, - "learning_rate": 0.00047423405814805763, - "loss": 0.8249, - "step": 21600 - }, - { - "epoch": 5.28, - "learning_rate": 0.00047420351820180793, - "loss": 0.8485, - "step": 21625 - }, - { - "epoch": 5.28, - "learning_rate": 0.0004741729782555583, - "loss": 0.8386, - "step": 21650 - }, - { - "epoch": 5.29, - "learning_rate": 0.0004741424383093086, - "loss": 0.797, - "step": 21675 - }, - { - "epoch": 5.3, - "learning_rate": 0.0004741118983630589, - "loss": 0.854, - "step": 21700 - }, - { - "epoch": 5.3, - "learning_rate": 0.0004740813584168092, - "loss": 0.7792, - "step": 21725 - }, - { - "epoch": 5.31, - "learning_rate": 0.00047405081847055945, - "loss": 0.804, - "step": 21750 - }, - { - "epoch": 5.31, - "learning_rate": 0.0004740202785243098, - "loss": 0.7898, - "step": 21775 - }, - { - "epoch": 5.32, - "learning_rate": 0.0004739897385780601, - "loss": 0.7937, - "step": 21800 - }, - { - "epoch": 5.33, - "learning_rate": 0.0004739591986318104, - "loss": 0.8173, - "step": 21825 - }, - { - "epoch": 5.33, - "learning_rate": 0.0004739286586855607, - "loss": 0.8347, - "step": 21850 - }, - { - "epoch": 5.34, - "learning_rate": 0.000473898118739311, - "loss": 0.8076, - "step": 21875 - }, - { - "epoch": 5.34, - "learning_rate": 0.0004738675787930614, - "loss": 0.8352, - "step": 21900 - }, - { - "epoch": 5.35, - "learning_rate": 0.00047383703884681163, - "loss": 0.8279, - "step": 21925 - }, - { - "epoch": 5.36, - "learning_rate": 0.00047380649890056193, - "loss": 0.784, - "step": 21950 - }, - { - "epoch": 5.36, - "learning_rate": 0.00047377595895431224, - "loss": 0.8001, - "step": 21975 - }, - { - "epoch": 5.37, - "learning_rate": 0.00047374541900806254, - "loss": 0.8348, - "step": 22000 - }, - { - "epoch": 5.37, - "eval_cer": 0.1788907939180518, - "eval_loss": 0.5868992805480957, - "eval_runtime": 154.2562, - "eval_samples_per_second": 27.182, - "eval_steps_per_second": 6.8, - "eval_wer": 0.6766068515497553, - "step": 22000 - }, - { - "epoch": 5.37, - "learning_rate": 0.0004737148790618129, - "loss": 0.8137, - "step": 22025 - }, - { - "epoch": 5.38, - "learning_rate": 0.0004736843391155632, - "loss": 0.8458, - "step": 22050 - }, - { - "epoch": 5.39, - "learning_rate": 0.00047365379916931345, - "loss": 0.8318, - "step": 22075 - }, - { - "epoch": 5.39, - "learning_rate": 0.00047362325922306375, - "loss": 0.8083, - "step": 22100 - }, - { - "epoch": 5.4, - "learning_rate": 0.00047359271927681406, - "loss": 0.7662, - "step": 22125 - }, - { - "epoch": 5.41, - "learning_rate": 0.0004735621793305644, - "loss": 0.8556, - "step": 22150 - }, - { - "epoch": 5.41, - "learning_rate": 0.0004735316393843147, - "loss": 0.8289, - "step": 22175 - }, - { - "epoch": 5.42, - "learning_rate": 0.000473501099438065, - "loss": 0.7828, - "step": 22200 - }, - { - "epoch": 5.42, - "learning_rate": 0.00047347055949181527, - "loss": 0.7481, - "step": 22225 - }, - { - "epoch": 5.43, - "learning_rate": 0.00047344001954556557, - "loss": 0.8216, - "step": 22250 - }, - { - "epoch": 5.44, - "learning_rate": 0.00047340947959931593, - "loss": 0.8051, - "step": 22275 - }, - { - "epoch": 5.44, - "learning_rate": 0.00047337893965306623, - "loss": 0.7921, - "step": 22300 - }, - { - "epoch": 5.45, - "learning_rate": 0.00047334839970681654, - "loss": 0.8073, - "step": 22325 - }, - { - "epoch": 5.45, - "learning_rate": 0.00047331785976056684, - "loss": 0.8664, - "step": 22350 - }, - { - "epoch": 5.46, - "learning_rate": 0.00047328731981431714, - "loss": 0.8147, - "step": 22375 - }, - { - "epoch": 5.47, - "learning_rate": 0.00047325677986806745, - "loss": 0.8146, - "step": 22400 - }, - { - "epoch": 5.47, - "learning_rate": 0.00047322623992181775, - "loss": 0.7966, - "step": 22425 - }, - { - "epoch": 5.48, - "learning_rate": 0.00047319569997556805, - "loss": 0.8359, - "step": 22450 - }, - { - "epoch": 5.48, - "learning_rate": 0.00047316516002931836, - "loss": 0.8292, - "step": 22475 - }, - { - "epoch": 5.49, - "learning_rate": 0.00047313462008306866, - "loss": 0.7843, - "step": 22500 - }, - { - "epoch": 5.49, - "eval_cer": 0.1750356765192037, - "eval_loss": 0.5732399821281433, - "eval_runtime": 154.5633, - "eval_samples_per_second": 27.128, - "eval_steps_per_second": 6.787, - "eval_wer": 0.6731810766721044, - "step": 22500 - }, - { - "epoch": 5.5, - "learning_rate": 0.000473104080136819, - "loss": 0.7897, - "step": 22525 - }, - { - "epoch": 5.5, - "learning_rate": 0.00047307354019056927, - "loss": 0.7618, - "step": 22550 - }, - { - "epoch": 5.51, - "learning_rate": 0.00047304300024431957, - "loss": 0.8309, - "step": 22575 - }, - { - "epoch": 5.51, - "learning_rate": 0.0004730124602980699, - "loss": 0.7635, - "step": 22600 - }, - { - "epoch": 5.52, - "learning_rate": 0.0004729819203518202, - "loss": 0.818, - "step": 22625 - }, - { - "epoch": 5.53, - "learning_rate": 0.00047295138040557053, - "loss": 0.8215, - "step": 22650 - }, - { - "epoch": 5.53, - "learning_rate": 0.00047292084045932084, - "loss": 0.8412, - "step": 22675 - }, - { - "epoch": 5.54, - "learning_rate": 0.0004728903005130711, - "loss": 0.7867, - "step": 22700 - }, - { - "epoch": 5.55, - "learning_rate": 0.0004728597605668214, - "loss": 0.7692, - "step": 22725 - }, - { - "epoch": 5.55, - "learning_rate": 0.0004728292206205717, - "loss": 0.8446, - "step": 22750 - }, - { - "epoch": 5.56, - "learning_rate": 0.00047279868067432205, - "loss": 0.8351, - "step": 22775 - }, - { - "epoch": 5.56, - "learning_rate": 0.00047276814072807235, - "loss": 0.7931, - "step": 22800 - }, - { - "epoch": 5.57, - "learning_rate": 0.00047273760078182266, - "loss": 0.862, - "step": 22825 - }, - { - "epoch": 5.58, - "learning_rate": 0.00047270706083557296, - "loss": 0.88, - "step": 22850 - }, - { - "epoch": 5.58, - "learning_rate": 0.0004726765208893232, - "loss": 0.785, - "step": 22875 - }, - { - "epoch": 5.59, - "learning_rate": 0.0004726459809430735, - "loss": 0.8098, - "step": 22900 - }, - { - "epoch": 5.59, - "learning_rate": 0.00047261544099682387, - "loss": 0.7932, - "step": 22925 - }, - { - "epoch": 5.6, - "learning_rate": 0.0004725849010505742, - "loss": 0.8176, - "step": 22950 - }, - { - "epoch": 5.61, - "learning_rate": 0.0004725543611043245, - "loss": 0.8033, - "step": 22975 - }, - { - "epoch": 5.61, - "learning_rate": 0.0004725250427559248, - "loss": 0.855, - "step": 23000 - }, - { - "epoch": 5.61, - "eval_cer": 0.1686601028715748, - "eval_loss": 0.5447995662689209, - "eval_runtime": 154.9215, - "eval_samples_per_second": 27.065, - "eval_steps_per_second": 6.771, - "eval_wer": 0.6520065252854812, - "step": 23000 - }, - { - "epoch": 5.62, - "learning_rate": 0.00047249450280967503, - "loss": 0.7908, - "step": 23025 - }, - { - "epoch": 5.62, - "learning_rate": 0.00047246396286342534, - "loss": 0.8381, - "step": 23050 - }, - { - "epoch": 5.63, - "learning_rate": 0.0004724334229171757, - "loss": 0.8155, - "step": 23075 - }, - { - "epoch": 5.64, - "learning_rate": 0.000472402882970926, - "loss": 0.8471, - "step": 23100 - }, - { - "epoch": 5.64, - "learning_rate": 0.0004723723430246763, - "loss": 0.8259, - "step": 23125 - }, - { - "epoch": 5.65, - "learning_rate": 0.0004723418030784266, - "loss": 0.8709, - "step": 23150 - }, - { - "epoch": 5.66, - "learning_rate": 0.00047231126313217685, - "loss": 0.7902, - "step": 23175 - }, - { - "epoch": 5.66, - "learning_rate": 0.0004722807231859272, - "loss": 0.8795, - "step": 23200 - }, - { - "epoch": 5.67, - "learning_rate": 0.0004722501832396775, - "loss": 0.8107, - "step": 23225 - }, - { - "epoch": 5.67, - "learning_rate": 0.0004722196432934278, - "loss": 0.7959, - "step": 23250 - }, - { - "epoch": 5.68, - "learning_rate": 0.0004721891033471781, - "loss": 0.7615, - "step": 23275 - }, - { - "epoch": 5.69, - "learning_rate": 0.0004721585634009284, - "loss": 0.8344, - "step": 23300 - }, - { - "epoch": 5.69, - "learning_rate": 0.0004721280234546788, - "loss": 0.8545, - "step": 23325 - }, - { - "epoch": 5.7, - "learning_rate": 0.00047209748350842903, - "loss": 0.8713, - "step": 23350 - }, - { - "epoch": 5.7, - "learning_rate": 0.00047206694356217933, - "loss": 0.7914, - "step": 23375 - }, - { - "epoch": 5.71, - "learning_rate": 0.00047203640361592964, - "loss": 0.8725, - "step": 23400 - }, - { - "epoch": 5.72, - "learning_rate": 0.00047200586366967994, - "loss": 0.834, - "step": 23425 - }, - { - "epoch": 5.72, - "learning_rate": 0.0004719753237234303, - "loss": 0.8515, - "step": 23450 - }, - { - "epoch": 5.73, - "learning_rate": 0.0004719447837771806, - "loss": 0.7854, - "step": 23475 - }, - { - "epoch": 5.73, - "learning_rate": 0.00047191424383093085, - "loss": 0.7774, - "step": 23500 - }, - { - "epoch": 5.73, - "eval_cer": 0.17590320626674744, - "eval_loss": 0.5685146450996399, - "eval_runtime": 150.6401, - "eval_samples_per_second": 27.835, - "eval_steps_per_second": 6.964, - "eval_wer": 0.6818270799347471, - "step": 23500 - }, - { - "epoch": 5.74, - "learning_rate": 0.00047188370388468115, - "loss": 0.8371, - "step": 23525 - }, - { - "epoch": 5.75, - "learning_rate": 0.00047185316393843146, - "loss": 0.7747, - "step": 23550 - }, - { - "epoch": 5.75, - "learning_rate": 0.00047182262399218176, - "loss": 0.801, - "step": 23575 - }, - { - "epoch": 5.76, - "learning_rate": 0.0004717920840459321, - "loss": 0.7689, - "step": 23600 - }, - { - "epoch": 5.77, - "learning_rate": 0.0004717615440996824, - "loss": 0.8017, - "step": 23625 - }, - { - "epoch": 5.77, - "learning_rate": 0.00047173100415343267, - "loss": 0.849, - "step": 23650 - }, - { - "epoch": 5.78, - "learning_rate": 0.000471700464207183, - "loss": 0.7922, - "step": 23675 - }, - { - "epoch": 5.78, - "learning_rate": 0.0004716699242609333, - "loss": 0.849, - "step": 23700 - }, - { - "epoch": 5.79, - "learning_rate": 0.00047163938431468364, - "loss": 0.8138, - "step": 23725 - }, - { - "epoch": 5.8, - "learning_rate": 0.00047160884436843394, - "loss": 0.8949, - "step": 23750 - }, - { - "epoch": 5.8, - "learning_rate": 0.00047157830442218424, - "loss": 0.8182, - "step": 23775 - }, - { - "epoch": 5.81, - "learning_rate": 0.00047154776447593455, - "loss": 0.8002, - "step": 23800 - }, - { - "epoch": 5.81, - "learning_rate": 0.0004715172245296848, - "loss": 0.825, - "step": 23825 - }, - { - "epoch": 5.82, - "learning_rate": 0.00047148668458343515, - "loss": 0.8962, - "step": 23850 - }, - { - "epoch": 5.83, - "learning_rate": 0.00047145614463718546, - "loss": 0.816, - "step": 23875 - }, - { - "epoch": 5.83, - "learning_rate": 0.00047142560469093576, - "loss": 0.7518, - "step": 23900 - }, - { - "epoch": 5.84, - "learning_rate": 0.00047139506474468606, - "loss": 0.812, - "step": 23925 - }, - { - "epoch": 5.84, - "learning_rate": 0.00047136452479843637, - "loss": 0.8034, - "step": 23950 - }, - { - "epoch": 5.85, - "learning_rate": 0.00047133398485218667, - "loss": 0.8022, - "step": 23975 - }, - { - "epoch": 5.86, - "learning_rate": 0.00047130344490593697, - "loss": 0.8622, - "step": 24000 - }, - { - "epoch": 5.86, - "eval_cer": 0.17418868002012258, - "eval_loss": 0.5598137378692627, - "eval_runtime": 151.7552, - "eval_samples_per_second": 27.63, - "eval_steps_per_second": 6.912, - "eval_wer": 0.6687438825448614, - "step": 24000 - }, - { - "epoch": 5.86, - "learning_rate": 0.0004712729049596873, - "loss": 0.8301, - "step": 24025 - }, - { - "epoch": 5.87, - "learning_rate": 0.0004712423650134376, - "loss": 0.7974, - "step": 24050 - }, - { - "epoch": 5.87, - "learning_rate": 0.0004712118250671879, - "loss": 0.788, - "step": 24075 - }, - { - "epoch": 5.88, - "learning_rate": 0.00047118128512093824, - "loss": 0.8011, - "step": 24100 - }, - { - "epoch": 5.89, - "learning_rate": 0.0004711507451746885, - "loss": 0.8189, - "step": 24125 - }, - { - "epoch": 5.89, - "learning_rate": 0.0004711202052284388, - "loss": 0.8521, - "step": 24150 - }, - { - "epoch": 5.9, - "learning_rate": 0.0004710896652821891, - "loss": 0.832, - "step": 24175 - }, - { - "epoch": 5.91, - "learning_rate": 0.0004710591253359394, - "loss": 0.8306, - "step": 24200 - }, - { - "epoch": 5.91, - "learning_rate": 0.00047102858538968976, - "loss": 0.8189, - "step": 24225 - }, - { - "epoch": 5.92, - "learning_rate": 0.00047099804544344006, - "loss": 0.8372, - "step": 24250 - }, - { - "epoch": 5.92, - "learning_rate": 0.0004709675054971903, - "loss": 0.8268, - "step": 24275 - }, - { - "epoch": 5.93, - "learning_rate": 0.0004709369655509406, - "loss": 0.8726, - "step": 24300 - }, - { - "epoch": 5.94, - "learning_rate": 0.0004709064256046909, - "loss": 0.816, - "step": 24325 - }, - { - "epoch": 5.94, - "learning_rate": 0.0004708758856584413, - "loss": 0.8516, - "step": 24350 - }, - { - "epoch": 5.95, - "learning_rate": 0.0004708453457121916, - "loss": 0.7799, - "step": 24375 - }, - { - "epoch": 5.95, - "learning_rate": 0.0004708148057659419, - "loss": 0.825, - "step": 24400 - }, - { - "epoch": 5.96, - "learning_rate": 0.0004707842658196922, - "loss": 0.767, - "step": 24425 - }, - { - "epoch": 5.97, - "learning_rate": 0.00047075372587344243, - "loss": 0.8352, - "step": 24450 - }, - { - "epoch": 5.97, - "learning_rate": 0.0004707231859271928, - "loss": 0.8106, - "step": 24475 - }, - { - "epoch": 5.98, - "learning_rate": 0.0004706926459809431, - "loss": 0.7968, - "step": 24500 - }, - { - "epoch": 5.98, - "eval_cer": 0.16986643121875097, - "eval_loss": 0.5589384436607361, - "eval_runtime": 150.8942, - "eval_samples_per_second": 27.788, - "eval_steps_per_second": 6.952, - "eval_wer": 0.657716150081566, - "step": 24500 - }, - { - "epoch": 5.98, - "learning_rate": 0.0004706621060346934, - "loss": 0.8186, - "step": 24525 - }, - { - "epoch": 5.99, - "learning_rate": 0.0004706315660884437, - "loss": 0.8581, - "step": 24550 - }, - { - "epoch": 6.0, - "learning_rate": 0.000470601026142194, - "loss": 0.7809, - "step": 24575 - }, - { - "epoch": 6.0, - "learning_rate": 0.0004705704861959443, - "loss": 0.8235, - "step": 24600 - }, - { - "epoch": 6.01, - "learning_rate": 0.0004705399462496946, - "loss": 0.8245, - "step": 24625 - }, - { - "epoch": 6.02, - "learning_rate": 0.0004705094063034449, - "loss": 0.8341, - "step": 24650 - }, - { - "epoch": 6.02, - "learning_rate": 0.0004704788663571952, - "loss": 0.7669, - "step": 24675 - }, - { - "epoch": 6.03, - "learning_rate": 0.0004704483264109455, - "loss": 0.775, - "step": 24700 - }, - { - "epoch": 6.03, - "learning_rate": 0.0004704177864646959, - "loss": 0.7697, - "step": 24725 - }, - { - "epoch": 6.04, - "learning_rate": 0.0004703872465184461, - "loss": 0.775, - "step": 24750 - }, - { - "epoch": 6.05, - "learning_rate": 0.00047035670657219643, - "loss": 0.7845, - "step": 24775 - }, - { - "epoch": 6.05, - "learning_rate": 0.00047032616662594673, - "loss": 0.8577, - "step": 24800 - }, - { - "epoch": 6.06, - "learning_rate": 0.00047029562667969704, - "loss": 0.7583, - "step": 24825 - }, - { - "epoch": 6.06, - "learning_rate": 0.0004702650867334474, - "loss": 0.777, - "step": 24850 - }, - { - "epoch": 6.07, - "learning_rate": 0.0004702345467871977, - "loss": 0.7411, - "step": 24875 - }, - { - "epoch": 6.08, - "learning_rate": 0.000470204006840948, - "loss": 0.7703, - "step": 24900 - }, - { - "epoch": 6.08, - "learning_rate": 0.00047017346689469825, - "loss": 0.7881, - "step": 24925 - }, - { - "epoch": 6.09, - "learning_rate": 0.00047014292694844855, - "loss": 0.7471, - "step": 24950 - }, - { - "epoch": 6.09, - "learning_rate": 0.00047011238700219886, - "loss": 0.8077, - "step": 24975 - }, - { - "epoch": 6.1, - "learning_rate": 0.0004700818470559492, - "loss": 0.8253, - "step": 25000 - }, - { - "epoch": 6.1, - "eval_cer": 0.16891676847735695, - "eval_loss": 0.5600982308387756, - "eval_runtime": 152.7105, - "eval_samples_per_second": 27.457, - "eval_steps_per_second": 6.869, - "eval_wer": 0.6617292006525285, - "step": 25000 - }, - { - "epoch": 6.11, - "learning_rate": 0.0004700513071096995, - "loss": 0.774, - "step": 25025 - }, - { - "epoch": 6.11, - "learning_rate": 0.0004700207671634498, - "loss": 0.7965, - "step": 25050 - }, - { - "epoch": 6.12, - "learning_rate": 0.00046999022721720007, - "loss": 0.7859, - "step": 25075 - }, - { - "epoch": 6.12, - "learning_rate": 0.0004699596872709504, - "loss": 0.7834, - "step": 25100 - }, - { - "epoch": 6.13, - "learning_rate": 0.00046992914732470073, - "loss": 0.7398, - "step": 25125 - }, - { - "epoch": 6.14, - "learning_rate": 0.00046989860737845103, - "loss": 0.8568, - "step": 25150 - }, - { - "epoch": 6.14, - "learning_rate": 0.00046986806743220134, - "loss": 0.783, - "step": 25175 - }, - { - "epoch": 6.15, - "learning_rate": 0.00046983752748595164, - "loss": 0.8308, - "step": 25200 - }, - { - "epoch": 6.16, - "learning_rate": 0.0004698069875397019, - "loss": 0.7543, - "step": 25225 - }, - { - "epoch": 6.16, - "learning_rate": 0.00046977644759345225, - "loss": 0.8413, - "step": 25250 - }, - { - "epoch": 6.17, - "learning_rate": 0.00046974590764720255, - "loss": 0.7851, - "step": 25275 - }, - { - "epoch": 6.17, - "learning_rate": 0.00046971536770095285, - "loss": 0.7815, - "step": 25300 - }, - { - "epoch": 6.18, - "learning_rate": 0.00046968482775470316, - "loss": 0.7607, - "step": 25325 - }, - { - "epoch": 6.19, - "learning_rate": 0.00046965428780845346, - "loss": 0.7827, - "step": 25350 - }, - { - "epoch": 6.19, - "learning_rate": 0.0004696237478622038, - "loss": 0.7891, - "step": 25375 - }, - { - "epoch": 6.2, - "learning_rate": 0.00046959320791595407, - "loss": 0.7708, - "step": 25400 - }, - { - "epoch": 6.2, - "learning_rate": 0.00046956266796970437, - "loss": 0.7806, - "step": 25425 - }, - { - "epoch": 6.21, - "learning_rate": 0.0004695321280234547, - "loss": 0.8272, - "step": 25450 - }, - { - "epoch": 6.22, - "learning_rate": 0.000469501588077205, - "loss": 0.7922, - "step": 25475 - }, - { - "epoch": 6.22, - "learning_rate": 0.00046947104813095534, - "loss": 0.7947, - "step": 25500 - }, - { - "epoch": 6.22, - "eval_cer": 0.16775663993922157, - "eval_loss": 0.5526652932167053, - "eval_runtime": 153.2005, - "eval_samples_per_second": 27.369, - "eval_steps_per_second": 6.847, - "eval_wer": 0.6471778140293638, - "step": 25500 - }, - { - "epoch": 6.23, - "learning_rate": 0.00046944050818470564, - "loss": 0.7896, - "step": 25525 - }, - { - "epoch": 6.23, - "learning_rate": 0.0004694099682384559, - "loss": 0.7802, - "step": 25550 - }, - { - "epoch": 6.24, - "learning_rate": 0.0004693806498900562, - "loss": 0.7681, - "step": 25575 - }, - { - "epoch": 6.25, - "learning_rate": 0.0004693501099438065, - "loss": 0.7726, - "step": 25600 - }, - { - "epoch": 6.25, - "learning_rate": 0.0004693207915954068, - "loss": 0.7731, - "step": 25625 - }, - { - "epoch": 6.26, - "learning_rate": 0.0004692902516491571, - "loss": 0.7475, - "step": 25650 - }, - { - "epoch": 6.27, - "learning_rate": 0.0004692597117029074, - "loss": 0.7772, - "step": 25675 - }, - { - "epoch": 6.27, - "learning_rate": 0.0004692291717566577, - "loss": 0.7563, - "step": 25700 - }, - { - "epoch": 6.28, - "learning_rate": 0.000469198631810408, - "loss": 0.7887, - "step": 25725 - }, - { - "epoch": 6.28, - "learning_rate": 0.0004691680918641583, - "loss": 0.8447, - "step": 25750 - }, - { - "epoch": 6.29, - "learning_rate": 0.0004691375519179086, - "loss": 0.7684, - "step": 25775 - }, - { - "epoch": 6.3, - "learning_rate": 0.00046910701197165893, - "loss": 0.8256, - "step": 25800 - }, - { - "epoch": 6.3, - "learning_rate": 0.0004690764720254093, - "loss": 0.7834, - "step": 25825 - }, - { - "epoch": 6.31, - "learning_rate": 0.0004690459320791596, - "loss": 0.7856, - "step": 25850 - }, - { - "epoch": 6.31, - "learning_rate": 0.00046901539213290984, - "loss": 0.7571, - "step": 25875 - }, - { - "epoch": 6.32, - "learning_rate": 0.00046898485218666014, - "loss": 0.8078, - "step": 25900 - }, - { - "epoch": 6.33, - "learning_rate": 0.00046895431224041044, - "loss": 0.7851, - "step": 25925 - }, - { - "epoch": 6.33, - "learning_rate": 0.0004689237722941608, - "loss": 0.8066, - "step": 25950 - }, - { - "epoch": 6.34, - "learning_rate": 0.0004688932323479111, - "loss": 0.7699, - "step": 25975 - }, - { - "epoch": 6.34, - "learning_rate": 0.0004688626924016614, - "loss": 0.8273, - "step": 26000 - }, - { - "epoch": 6.34, - "eval_cer": 0.17227908791310328, - "eval_loss": 0.5425549745559692, - "eval_runtime": 153.5111, - "eval_samples_per_second": 27.314, - "eval_steps_per_second": 6.833, - "eval_wer": 0.6673083197389886, - "step": 26000 - }, - { - "epoch": 6.35, - "learning_rate": 0.00046883215245541166, - "loss": 0.8126, - "step": 26025 - }, - { - "epoch": 6.36, - "learning_rate": 0.00046880161250916196, - "loss": 0.8578, - "step": 26050 - }, - { - "epoch": 6.36, - "learning_rate": 0.0004687710725629123, - "loss": 0.7734, - "step": 26075 - }, - { - "epoch": 6.37, - "learning_rate": 0.0004687405326166626, - "loss": 0.7617, - "step": 26100 - }, - { - "epoch": 6.38, - "learning_rate": 0.0004687099926704129, - "loss": 0.7766, - "step": 26125 - }, - { - "epoch": 6.38, - "learning_rate": 0.00046867945272416323, - "loss": 0.8196, - "step": 26150 - }, - { - "epoch": 6.39, - "learning_rate": 0.0004686489127779135, - "loss": 0.7303, - "step": 26175 - }, - { - "epoch": 6.39, - "learning_rate": 0.00046861837283166384, - "loss": 0.7622, - "step": 26200 - }, - { - "epoch": 6.4, - "learning_rate": 0.00046858783288541414, - "loss": 0.7714, - "step": 26225 - }, - { - "epoch": 6.41, - "learning_rate": 0.00046855729293916444, - "loss": 0.7608, - "step": 26250 - }, - { - "epoch": 6.41, - "learning_rate": 0.00046852675299291475, - "loss": 0.8122, - "step": 26275 - }, - { - "epoch": 6.42, - "learning_rate": 0.00046849621304666505, - "loss": 0.7717, - "step": 26300 - }, - { - "epoch": 6.42, - "learning_rate": 0.0004684656731004154, - "loss": 0.741, - "step": 26325 - }, - { - "epoch": 6.43, - "learning_rate": 0.00046843513315416566, - "loss": 0.7665, - "step": 26350 - }, - { - "epoch": 6.44, - "learning_rate": 0.00046840459320791596, - "loss": 0.81, - "step": 26375 - }, - { - "epoch": 6.44, - "learning_rate": 0.00046837405326166626, - "loss": 0.8025, - "step": 26400 - }, - { - "epoch": 6.45, - "learning_rate": 0.00046834351331541657, - "loss": 0.7949, - "step": 26425 - }, - { - "epoch": 6.45, - "learning_rate": 0.00046831297336916687, - "loss": 0.8085, - "step": 26450 - }, - { - "epoch": 6.46, - "learning_rate": 0.0004682824334229172, - "loss": 0.8072, - "step": 26475 - }, - { - "epoch": 6.47, - "learning_rate": 0.0004682518934766675, - "loss": 0.8085, - "step": 26500 - }, - { - "epoch": 6.47, - "eval_cer": 0.1681621715963574, - "eval_loss": 0.5464115142822266, - "eval_runtime": 151.2701, - "eval_samples_per_second": 27.719, - "eval_steps_per_second": 6.935, - "eval_wer": 0.6475693311582382, - "step": 26500 - }, - { - "epoch": 6.47, - "learning_rate": 0.0004682213535304178, - "loss": 0.7243, - "step": 26525 - }, - { - "epoch": 6.48, - "learning_rate": 0.0004681908135841681, - "loss": 0.8214, - "step": 26550 - }, - { - "epoch": 6.48, - "learning_rate": 0.0004681602736379184, - "loss": 0.7823, - "step": 26575 - }, - { - "epoch": 6.49, - "learning_rate": 0.00046812973369166874, - "loss": 0.7737, - "step": 26600 - }, - { - "epoch": 6.5, - "learning_rate": 0.00046809919374541905, - "loss": 0.7714, - "step": 26625 - }, - { - "epoch": 6.5, - "learning_rate": 0.0004680686537991693, - "loss": 0.7848, - "step": 26650 - }, - { - "epoch": 6.51, - "learning_rate": 0.0004680381138529196, - "loss": 0.8329, - "step": 26675 - }, - { - "epoch": 6.52, - "learning_rate": 0.0004680075739066699, - "loss": 0.802, - "step": 26700 - }, - { - "epoch": 6.52, - "learning_rate": 0.00046797703396042026, - "loss": 0.8132, - "step": 26725 - }, - { - "epoch": 6.53, - "learning_rate": 0.00046794649401417056, - "loss": 0.8287, - "step": 26750 - }, - { - "epoch": 6.53, - "learning_rate": 0.00046791595406792087, - "loss": 0.7784, - "step": 26775 - }, - { - "epoch": 6.54, - "learning_rate": 0.00046788541412167117, - "loss": 0.803, - "step": 26800 - }, - { - "epoch": 6.55, - "learning_rate": 0.0004678548741754214, - "loss": 0.7928, - "step": 26825 - }, - { - "epoch": 6.55, - "learning_rate": 0.0004678243342291718, - "loss": 0.8156, - "step": 26850 - }, - { - "epoch": 6.56, - "learning_rate": 0.0004677937942829221, - "loss": 0.7577, - "step": 26875 - }, - { - "epoch": 6.56, - "learning_rate": 0.0004677632543366724, - "loss": 0.7651, - "step": 26900 - }, - { - "epoch": 6.57, - "learning_rate": 0.0004677327143904227, - "loss": 0.7585, - "step": 26925 - }, - { - "epoch": 6.58, - "learning_rate": 0.000467702174444173, - "loss": 0.8167, - "step": 26950 - }, - { - "epoch": 6.58, - "learning_rate": 0.0004676716344979233, - "loss": 0.7781, - "step": 26975 - }, - { - "epoch": 6.59, - "learning_rate": 0.0004676410945516736, - "loss": 0.8164, - "step": 27000 - }, - { - "epoch": 6.59, - "eval_cer": 0.1653131833721754, - "eval_loss": 0.5459656715393066, - "eval_runtime": 153.5643, - "eval_samples_per_second": 27.305, - "eval_steps_per_second": 6.831, - "eval_wer": 0.6328548123980424, - "step": 27000 - }, - { - "epoch": 6.59, - "learning_rate": 0.0004676105546054239, - "loss": 0.7949, - "step": 27025 - }, - { - "epoch": 6.6, - "learning_rate": 0.0004675800146591742, - "loss": 0.7673, - "step": 27050 - }, - { - "epoch": 6.61, - "learning_rate": 0.0004675494747129245, - "loss": 0.7335, - "step": 27075 - }, - { - "epoch": 6.61, - "learning_rate": 0.00046751893476667486, - "loss": 0.8251, - "step": 27100 - }, - { - "epoch": 6.62, - "learning_rate": 0.0004674883948204251, - "loss": 0.7464, - "step": 27125 - }, - { - "epoch": 6.63, - "learning_rate": 0.0004674578548741754, - "loss": 0.8075, - "step": 27150 - }, - { - "epoch": 6.63, - "learning_rate": 0.0004674273149279257, - "loss": 0.7601, - "step": 27175 - }, - { - "epoch": 6.64, - "learning_rate": 0.000467396774981676, - "loss": 0.8107, - "step": 27200 - }, - { - "epoch": 6.64, - "learning_rate": 0.0004673662350354264, - "loss": 0.7774, - "step": 27225 - }, - { - "epoch": 6.65, - "learning_rate": 0.0004673356950891767, - "loss": 0.8015, - "step": 27250 - }, - { - "epoch": 6.66, - "learning_rate": 0.000467305155142927, - "loss": 0.7453, - "step": 27275 - }, - { - "epoch": 6.66, - "learning_rate": 0.00046727461519667724, - "loss": 0.8042, - "step": 27300 - }, - { - "epoch": 6.67, - "learning_rate": 0.00046724407525042754, - "loss": 0.7639, - "step": 27325 - }, - { - "epoch": 6.67, - "learning_rate": 0.0004672135353041779, - "loss": 0.7875, - "step": 27350 - }, - { - "epoch": 6.68, - "learning_rate": 0.0004671829953579282, - "loss": 0.7677, - "step": 27375 - }, - { - "epoch": 6.69, - "learning_rate": 0.0004671524554116785, - "loss": 0.8096, - "step": 27400 - }, - { - "epoch": 6.69, - "learning_rate": 0.0004671219154654288, - "loss": 0.7775, - "step": 27425 - }, - { - "epoch": 6.7, - "learning_rate": 0.00046709137551917906, - "loss": 0.8353, - "step": 27450 - }, - { - "epoch": 6.7, - "learning_rate": 0.0004670608355729294, - "loss": 0.8382, - "step": 27475 - }, - { - "epoch": 6.71, - "learning_rate": 0.0004670302956266797, - "loss": 0.755, - "step": 27500 - }, - { - "epoch": 6.71, - "eval_cer": 0.16939929981622742, - "eval_loss": 0.5419759154319763, - "eval_runtime": 152.9956, - "eval_samples_per_second": 27.406, - "eval_steps_per_second": 6.856, - "eval_wer": 0.6614355628058728, - "step": 27500 - }, - { - "epoch": 6.72, - "learning_rate": 0.00046699975568043, - "loss": 0.7685, - "step": 27525 - }, - { - "epoch": 6.72, - "learning_rate": 0.0004669692157341803, - "loss": 0.7839, - "step": 27550 - }, - { - "epoch": 6.73, - "learning_rate": 0.00046693867578793063, - "loss": 0.7775, - "step": 27575 - }, - { - "epoch": 6.73, - "learning_rate": 0.0004669081358416809, - "loss": 0.8121, - "step": 27600 - }, - { - "epoch": 6.74, - "learning_rate": 0.00046687759589543123, - "loss": 0.765, - "step": 27625 - }, - { - "epoch": 6.75, - "learning_rate": 0.00046684705594918154, - "loss": 0.8056, - "step": 27650 - }, - { - "epoch": 6.75, - "learning_rate": 0.00046681651600293184, - "loss": 0.733, - "step": 27675 - }, - { - "epoch": 6.76, - "learning_rate": 0.00046678597605668214, - "loss": 0.8103, - "step": 27700 - }, - { - "epoch": 6.77, - "learning_rate": 0.00046675543611043245, - "loss": 0.7478, - "step": 27725 - }, - { - "epoch": 6.77, - "learning_rate": 0.0004667248961641828, - "loss": 0.7973, - "step": 27750 - }, - { - "epoch": 6.78, - "learning_rate": 0.00046669435621793305, - "loss": 0.7877, - "step": 27775 - }, - { - "epoch": 6.78, - "learning_rate": 0.00046666381627168336, - "loss": 0.8024, - "step": 27800 - }, - { - "epoch": 6.79, - "learning_rate": 0.00046663327632543366, - "loss": 0.7701, - "step": 27825 - }, - { - "epoch": 6.8, - "learning_rate": 0.00046660273637918396, - "loss": 0.8046, - "step": 27850 - }, - { - "epoch": 6.8, - "learning_rate": 0.0004665721964329343, - "loss": 0.7917, - "step": 27875 - }, - { - "epoch": 6.81, - "learning_rate": 0.0004665416564866846, - "loss": 0.8223, - "step": 27900 - }, - { - "epoch": 6.81, - "learning_rate": 0.0004665111165404349, - "loss": 0.7697, - "step": 27925 - }, - { - "epoch": 6.82, - "learning_rate": 0.0004664805765941852, - "loss": 0.8104, - "step": 27950 - }, - { - "epoch": 6.83, - "learning_rate": 0.0004664500366479355, - "loss": 0.7723, - "step": 27975 - }, - { - "epoch": 6.83, - "learning_rate": 0.00046641949670168584, - "loss": 0.822, - "step": 28000 - }, - { - "epoch": 6.83, - "eval_cer": 0.1698561645945197, - "eval_loss": 0.5540247559547424, - "eval_runtime": 153.0638, - "eval_samples_per_second": 27.394, - "eval_steps_per_second": 6.853, - "eval_wer": 0.6492985318107667, - "step": 28000 - }, - { - "epoch": 6.84, - "learning_rate": 0.00046638895675543614, - "loss": 0.7624, - "step": 28025 - }, - { - "epoch": 6.84, - "learning_rate": 0.00046635841680918645, - "loss": 0.8005, - "step": 28050 - }, - { - "epoch": 6.85, - "learning_rate": 0.0004663278768629367, - "loss": 0.7542, - "step": 28075 - }, - { - "epoch": 6.86, - "learning_rate": 0.000466297336916687, - "loss": 0.8048, - "step": 28100 - }, - { - "epoch": 6.86, - "learning_rate": 0.00046626679697043736, - "loss": 0.7846, - "step": 28125 - }, - { - "epoch": 6.87, - "learning_rate": 0.00046623625702418766, - "loss": 0.7999, - "step": 28150 - }, - { - "epoch": 6.88, - "learning_rate": 0.00046620571707793796, - "loss": 0.7547, - "step": 28175 - }, - { - "epoch": 6.88, - "learning_rate": 0.00046617517713168827, - "loss": 0.7975, - "step": 28200 - }, - { - "epoch": 6.89, - "learning_rate": 0.0004661446371854385, - "loss": 0.7271, - "step": 28225 - }, - { - "epoch": 6.89, - "learning_rate": 0.00046611409723918887, - "loss": 0.8168, - "step": 28250 - }, - { - "epoch": 6.9, - "learning_rate": 0.0004660835572929392, - "loss": 0.7559, - "step": 28275 - }, - { - "epoch": 6.91, - "learning_rate": 0.0004660530173466895, - "loss": 0.7618, - "step": 28300 - }, - { - "epoch": 6.91, - "learning_rate": 0.0004660224774004398, - "loss": 0.811, - "step": 28325 - }, - { - "epoch": 6.92, - "learning_rate": 0.0004659919374541901, - "loss": 0.7985, - "step": 28350 - }, - { - "epoch": 6.92, - "learning_rate": 0.00046596139750794044, - "loss": 0.779, - "step": 28375 - }, - { - "epoch": 6.93, - "learning_rate": 0.0004659308575616907, - "loss": 0.8269, - "step": 28400 - }, - { - "epoch": 6.94, - "learning_rate": 0.000465900317615441, - "loss": 0.7372, - "step": 28425 - }, - { - "epoch": 6.94, - "learning_rate": 0.0004658697776691913, - "loss": 0.8145, - "step": 28450 - }, - { - "epoch": 6.95, - "learning_rate": 0.0004658392377229416, - "loss": 0.7761, - "step": 28475 - }, - { - "epoch": 6.95, - "learning_rate": 0.00046580869777669196, - "loss": 0.7957, - "step": 28500 - }, - { - "epoch": 6.95, - "eval_cer": 0.16304425941706108, - "eval_loss": 0.5358180403709412, - "eval_runtime": 151.3883, - "eval_samples_per_second": 27.697, - "eval_steps_per_second": 6.929, - "eval_wer": 0.6373246329526917, - "step": 28500 - }, - { - "epoch": 6.96, - "learning_rate": 0.00046577815783044226, - "loss": 0.7879, - "step": 28525 - }, - { - "epoch": 6.97, - "learning_rate": 0.0004657476178841925, - "loss": 0.8106, - "step": 28550 - }, - { - "epoch": 6.97, - "learning_rate": 0.0004657170779379428, - "loss": 0.7716, - "step": 28575 - }, - { - "epoch": 6.98, - "learning_rate": 0.0004656877595895431, - "loss": 0.7921, - "step": 28600 - }, - { - "epoch": 6.99, - "learning_rate": 0.0004656572196432934, - "loss": 0.7744, - "step": 28625 - }, - { - "epoch": 6.99, - "learning_rate": 0.00046562667969704373, - "loss": 0.7707, - "step": 28650 - }, - { - "epoch": 7.0, - "learning_rate": 0.0004655961397507941, - "loss": 0.7645, - "step": 28675 - }, - { - "epoch": 7.0, - "learning_rate": 0.00046556559980454434, - "loss": 0.8178, - "step": 28700 - }, - { - "epoch": 7.01, - "learning_rate": 0.00046553505985829464, - "loss": 0.7335, - "step": 28725 - }, - { - "epoch": 7.02, - "learning_rate": 0.00046550451991204494, - "loss": 0.7847, - "step": 28750 - }, - { - "epoch": 7.02, - "learning_rate": 0.00046547397996579525, - "loss": 0.7395, - "step": 28775 - }, - { - "epoch": 7.03, - "learning_rate": 0.0004654434400195456, - "loss": 0.7532, - "step": 28800 - }, - { - "epoch": 7.03, - "learning_rate": 0.0004654129000732959, - "loss": 0.7882, - "step": 28825 - }, - { - "epoch": 7.04, - "learning_rate": 0.0004653823601270462, - "loss": 0.7519, - "step": 28850 - }, - { - "epoch": 7.05, - "learning_rate": 0.00046535182018079646, - "loss": 0.6923, - "step": 28875 - }, - { - "epoch": 7.05, - "learning_rate": 0.00046532128023454676, - "loss": 0.7965, - "step": 28900 - }, - { - "epoch": 7.06, - "learning_rate": 0.0004652907402882971, - "loss": 0.703, - "step": 28925 - }, - { - "epoch": 7.06, - "learning_rate": 0.0004652602003420474, - "loss": 0.752, - "step": 28950 - }, - { - "epoch": 7.07, - "learning_rate": 0.0004652296603957977, - "loss": 0.6877, - "step": 28975 - }, - { - "epoch": 7.08, - "learning_rate": 0.00046519912044954803, - "loss": 0.7739, - "step": 29000 - }, - { - "epoch": 7.08, - "eval_cer": 0.17274621931562684, - "eval_loss": 0.5662298202514648, - "eval_runtime": 153.6801, - "eval_samples_per_second": 27.284, - "eval_steps_per_second": 6.826, - "eval_wer": 0.6695595432300163, - "step": 29000 - }, - { - "epoch": 7.08, - "learning_rate": 0.0004651685805032983, - "loss": 0.7574, - "step": 29025 - }, - { - "epoch": 7.09, - "learning_rate": 0.00046513804055704864, - "loss": 0.8008, - "step": 29050 - }, - { - "epoch": 7.09, - "learning_rate": 0.00046510750061079894, - "loss": 0.7341, - "step": 29075 - }, - { - "epoch": 7.1, - "learning_rate": 0.00046507696066454924, - "loss": 0.7556, - "step": 29100 - }, - { - "epoch": 7.11, - "learning_rate": 0.00046504642071829955, - "loss": 0.7353, - "step": 29125 - }, - { - "epoch": 7.11, - "learning_rate": 0.00046501588077204985, - "loss": 0.7788, - "step": 29150 - }, - { - "epoch": 7.12, - "learning_rate": 0.00046498534082580015, - "loss": 0.75, - "step": 29175 - }, - { - "epoch": 7.13, - "learning_rate": 0.00046495480087955046, - "loss": 0.7361, - "step": 29200 - }, - { - "epoch": 7.13, - "learning_rate": 0.00046492426093330076, - "loss": 0.7574, - "step": 29225 - }, - { - "epoch": 7.14, - "learning_rate": 0.00046489372098705106, - "loss": 0.7727, - "step": 29250 - }, - { - "epoch": 7.14, - "learning_rate": 0.00046486318104080137, - "loss": 0.74, - "step": 29275 - }, - { - "epoch": 7.15, - "learning_rate": 0.0004648326410945517, - "loss": 0.7178, - "step": 29300 - }, - { - "epoch": 7.16, - "learning_rate": 0.00046480210114830203, - "loss": 0.7438, - "step": 29325 - }, - { - "epoch": 7.16, - "learning_rate": 0.0004647715612020523, - "loss": 0.7835, - "step": 29350 - }, - { - "epoch": 7.17, - "learning_rate": 0.0004647410212558026, - "loss": 0.7028, - "step": 29375 - }, - { - "epoch": 7.17, - "learning_rate": 0.0004647104813095529, - "loss": 0.784, - "step": 29400 - }, - { - "epoch": 7.18, - "learning_rate": 0.00046467994136330324, - "loss": 0.7249, - "step": 29425 - }, - { - "epoch": 7.19, - "learning_rate": 0.00046464940141705354, - "loss": 0.7371, - "step": 29450 - }, - { - "epoch": 7.19, - "learning_rate": 0.00046461886147080385, - "loss": 0.7614, - "step": 29475 - }, - { - "epoch": 7.2, - "learning_rate": 0.0004645883215245541, - "loss": 0.7833, - "step": 29500 - }, - { - "epoch": 7.2, - "eval_cer": 0.15938420787860744, - "eval_loss": 0.5323081016540527, - "eval_runtime": 153.6339, - "eval_samples_per_second": 27.292, - "eval_steps_per_second": 6.828, - "eval_wer": 0.6227079934747145, - "step": 29500 - }, - { - "epoch": 7.2, - "learning_rate": 0.0004645577815783044, - "loss": 0.7305, - "step": 29525 - }, - { - "epoch": 7.21, - "learning_rate": 0.00046452724163205476, - "loss": 0.7645, - "step": 29550 - }, - { - "epoch": 7.22, - "learning_rate": 0.00046449670168580506, - "loss": 0.7863, - "step": 29575 - }, - { - "epoch": 7.22, - "learning_rate": 0.00046446616173955536, - "loss": 0.7635, - "step": 29600 - }, - { - "epoch": 7.23, - "learning_rate": 0.00046443562179330567, - "loss": 0.7263, - "step": 29625 - }, - { - "epoch": 7.24, - "learning_rate": 0.0004644050818470559, - "loss": 0.7765, - "step": 29650 - }, - { - "epoch": 7.24, - "learning_rate": 0.0004643745419008062, - "loss": 0.7977, - "step": 29675 - }, - { - "epoch": 7.25, - "learning_rate": 0.0004643440019545566, - "loss": 0.7765, - "step": 29700 - }, - { - "epoch": 7.25, - "learning_rate": 0.0004643134620083069, - "loss": 0.7449, - "step": 29725 - }, - { - "epoch": 7.26, - "learning_rate": 0.0004642829220620572, - "loss": 0.7772, - "step": 29750 - }, - { - "epoch": 7.27, - "learning_rate": 0.0004642523821158075, - "loss": 0.7407, - "step": 29775 - }, - { - "epoch": 7.27, - "learning_rate": 0.0004642218421695578, - "loss": 0.7405, - "step": 29800 - }, - { - "epoch": 7.28, - "learning_rate": 0.0004641913022233081, - "loss": 0.7628, - "step": 29825 - }, - { - "epoch": 7.28, - "learning_rate": 0.0004641607622770584, - "loss": 0.7384, - "step": 29850 - }, - { - "epoch": 7.29, - "learning_rate": 0.0004641302223308087, - "loss": 0.7202, - "step": 29875 - }, - { - "epoch": 7.3, - "learning_rate": 0.000464099682384559, - "loss": 0.8118, - "step": 29900 - }, - { - "epoch": 7.3, - "learning_rate": 0.0004640691424383093, - "loss": 0.7478, - "step": 29925 - }, - { - "epoch": 7.31, - "learning_rate": 0.00046403860249205967, - "loss": 0.7712, - "step": 29950 - }, - { - "epoch": 7.31, - "learning_rate": 0.0004640080625458099, - "loss": 0.729, - "step": 29975 - }, - { - "epoch": 7.32, - "learning_rate": 0.0004639775225995602, - "loss": 0.7737, - "step": 30000 - }, - { - "epoch": 7.32, - "eval_cer": 0.1612784000492798, - "eval_loss": 0.5348503589630127, - "eval_runtime": 151.5191, - "eval_samples_per_second": 27.673, - "eval_steps_per_second": 6.923, - "eval_wer": 0.6303425774877651, - "step": 30000 - }, - { - "epoch": 7.33, - "learning_rate": 0.0004639469826533105, - "loss": 0.7539, - "step": 30025 - }, - { - "epoch": 7.33, - "learning_rate": 0.0004639164427070608, - "loss": 0.7372, - "step": 30050 - }, - { - "epoch": 7.34, - "learning_rate": 0.0004638859027608112, - "loss": 0.7137, - "step": 30075 - }, - { - "epoch": 7.35, - "learning_rate": 0.0004638553628145615, - "loss": 0.7689, - "step": 30100 - }, - { - "epoch": 7.35, - "learning_rate": 0.00046382482286831173, - "loss": 0.7584, - "step": 30125 - }, - { - "epoch": 7.36, - "learning_rate": 0.00046379428292206204, - "loss": 0.7275, - "step": 30150 - }, - { - "epoch": 7.36, - "learning_rate": 0.00046376374297581234, - "loss": 0.7524, - "step": 30175 - }, - { - "epoch": 7.37, - "learning_rate": 0.0004637332030295627, - "loss": 0.7609, - "step": 30200 - }, - { - "epoch": 7.38, - "learning_rate": 0.000463702663083313, - "loss": 0.6847, - "step": 30225 - }, - { - "epoch": 7.38, - "learning_rate": 0.0004636721231370633, - "loss": 0.7438, - "step": 30250 - }, - { - "epoch": 7.39, - "learning_rate": 0.0004636415831908136, - "loss": 0.7237, - "step": 30275 - }, - { - "epoch": 7.39, - "learning_rate": 0.00046361104324456386, - "loss": 0.8116, - "step": 30300 - }, - { - "epoch": 7.4, - "learning_rate": 0.0004635805032983142, - "loss": 0.7247, - "step": 30325 - }, - { - "epoch": 7.41, - "learning_rate": 0.0004635499633520645, - "loss": 0.8259, - "step": 30350 - }, - { - "epoch": 7.41, - "learning_rate": 0.0004635194234058148, - "loss": 0.7375, - "step": 30375 - }, - { - "epoch": 7.42, - "learning_rate": 0.0004634888834595651, - "loss": 0.7721, - "step": 30400 - }, - { - "epoch": 7.42, - "learning_rate": 0.00046345834351331543, - "loss": 0.7388, - "step": 30425 - }, - { - "epoch": 7.43, - "learning_rate": 0.00046342780356706573, - "loss": 0.7617, - "step": 30450 - }, - { - "epoch": 7.44, - "learning_rate": 0.00046339726362081604, - "loss": 0.7408, - "step": 30475 - }, - { - "epoch": 7.44, - "learning_rate": 0.00046336672367456634, - "loss": 0.7697, - "step": 30500 - }, - { - "epoch": 7.44, - "eval_cer": 0.1623358623451023, - "eval_loss": 0.531502366065979, - "eval_runtime": 153.2868, - "eval_samples_per_second": 27.354, - "eval_steps_per_second": 6.843, - "eval_wer": 0.6386296900489397, - "step": 30500 - }, - { - "epoch": 7.45, - "learning_rate": 0.00046333618372831664, - "loss": 0.7369, - "step": 30525 - }, - { - "epoch": 7.45, - "learning_rate": 0.00046330564378206695, - "loss": 0.7767, - "step": 30550 - }, - { - "epoch": 7.46, - "learning_rate": 0.0004632751038358173, - "loss": 0.7329, - "step": 30575 - }, - { - "epoch": 7.47, - "learning_rate": 0.00046324456388956755, - "loss": 0.7998, - "step": 30600 - }, - { - "epoch": 7.47, - "learning_rate": 0.00046321402394331786, - "loss": 0.7511, - "step": 30625 - }, - { - "epoch": 7.48, - "learning_rate": 0.00046318348399706816, - "loss": 0.775, - "step": 30650 - }, - { - "epoch": 7.49, - "learning_rate": 0.00046315294405081846, - "loss": 0.7321, - "step": 30675 - }, - { - "epoch": 7.49, - "learning_rate": 0.0004631224041045688, - "loss": 0.7492, - "step": 30700 - }, - { - "epoch": 7.5, - "learning_rate": 0.0004630918641583191, - "loss": 0.7255, - "step": 30725 - }, - { - "epoch": 7.5, - "learning_rate": 0.0004630613242120694, - "loss": 0.8, - "step": 30750 - }, - { - "epoch": 7.51, - "learning_rate": 0.0004630307842658197, - "loss": 0.7936, - "step": 30775 - }, - { - "epoch": 7.52, - "learning_rate": 0.00046300024431957, - "loss": 0.8171, - "step": 30800 - }, - { - "epoch": 7.52, - "learning_rate": 0.00046296970437332034, - "loss": 0.7838, - "step": 30825 - }, - { - "epoch": 7.53, - "learning_rate": 0.00046293916442707064, - "loss": 0.7683, - "step": 30850 - }, - { - "epoch": 7.53, - "learning_rate": 0.00046290862448082094, - "loss": 0.754, - "step": 30875 - }, - { - "epoch": 7.54, - "learning_rate": 0.00046287808453457125, - "loss": 0.723, - "step": 30900 - }, - { - "epoch": 7.55, - "learning_rate": 0.0004628475445883215, - "loss": 0.7296, - "step": 30925 - }, - { - "epoch": 7.55, - "learning_rate": 0.0004628170046420718, - "loss": 0.7375, - "step": 30950 - }, - { - "epoch": 7.56, - "learning_rate": 0.00046278646469582216, - "loss": 0.7338, - "step": 30975 - }, - { - "epoch": 7.56, - "learning_rate": 0.00046275592474957246, - "loss": 0.7647, - "step": 31000 - }, - { - "epoch": 7.56, - "eval_cer": 0.16078560208617804, - "eval_loss": 0.5345603823661804, - "eval_runtime": 152.8664, - "eval_samples_per_second": 27.429, - "eval_steps_per_second": 6.862, - "eval_wer": 0.6219249592169658, - "step": 31000 - }, - { - "epoch": 7.57, - "learning_rate": 0.00046272538480332276, - "loss": 0.7339, - "step": 31025 - }, - { - "epoch": 7.58, - "learning_rate": 0.00046269484485707307, - "loss": 0.8613, - "step": 31050 - }, - { - "epoch": 7.58, - "learning_rate": 0.0004626643049108233, - "loss": 0.7179, - "step": 31075 - }, - { - "epoch": 7.59, - "learning_rate": 0.0004626337649645737, - "loss": 0.8002, - "step": 31100 - }, - { - "epoch": 7.6, - "learning_rate": 0.000462603225018324, - "loss": 0.7486, - "step": 31125 - }, - { - "epoch": 7.6, - "learning_rate": 0.0004625726850720743, - "loss": 0.7804, - "step": 31150 - }, - { - "epoch": 7.61, - "learning_rate": 0.0004625421451258246, - "loss": 0.7206, - "step": 31175 - }, - { - "epoch": 7.61, - "learning_rate": 0.0004625116051795749, - "loss": 0.7351, - "step": 31200 - }, - { - "epoch": 7.62, - "learning_rate": 0.00046248106523332524, - "loss": 0.7299, - "step": 31225 - }, - { - "epoch": 7.63, - "learning_rate": 0.0004624505252870755, - "loss": 0.776, - "step": 31250 - }, - { - "epoch": 7.63, - "learning_rate": 0.0004624199853408258, - "loss": 0.753, - "step": 31275 - }, - { - "epoch": 7.64, - "learning_rate": 0.0004623894453945761, - "loss": 0.7613, - "step": 31300 - }, - { - "epoch": 7.64, - "learning_rate": 0.0004623589054483264, - "loss": 0.7381, - "step": 31325 - }, - { - "epoch": 7.65, - "learning_rate": 0.00046232836550207676, - "loss": 0.7744, - "step": 31350 - }, - { - "epoch": 7.66, - "learning_rate": 0.00046229782555582706, - "loss": 0.7205, - "step": 31375 - }, - { - "epoch": 7.66, - "learning_rate": 0.0004622672856095773, - "loss": 0.7958, - "step": 31400 - }, - { - "epoch": 7.67, - "learning_rate": 0.0004622367456633276, - "loss": 0.8055, - "step": 31425 - }, - { - "epoch": 7.67, - "learning_rate": 0.0004622062057170779, - "loss": 0.8087, - "step": 31450 - }, - { - "epoch": 7.68, - "learning_rate": 0.0004621756657708283, - "loss": 0.7123, - "step": 31475 - }, - { - "epoch": 7.69, - "learning_rate": 0.0004621451258245786, - "loss": 0.7123, - "step": 31500 - }, - { - "epoch": 7.69, - "eval_cer": 0.15610915474882703, - "eval_loss": 0.5194910764694214, - "eval_runtime": 154.4911, - "eval_samples_per_second": 27.141, - "eval_steps_per_second": 6.79, - "eval_wer": 0.6110277324632952, - "step": 31500 - }, - { - "epoch": 7.69, - "learning_rate": 0.0004621145858783289, - "loss": 0.7202, - "step": 31525 - }, - { - "epoch": 7.7, - "learning_rate": 0.00046208404593207913, - "loss": 0.7416, - "step": 31550 - }, - { - "epoch": 7.7, - "learning_rate": 0.00046205350598582944, - "loss": 0.7489, - "step": 31575 - }, - { - "epoch": 7.71, - "learning_rate": 0.0004620229660395798, - "loss": 0.7806, - "step": 31600 - }, - { - "epoch": 7.72, - "learning_rate": 0.0004619924260933301, - "loss": 0.7351, - "step": 31625 - }, - { - "epoch": 7.72, - "learning_rate": 0.0004619618861470804, - "loss": 0.7592, - "step": 31650 - }, - { - "epoch": 7.73, - "learning_rate": 0.0004619313462008307, - "loss": 0.7057, - "step": 31675 - }, - { - "epoch": 7.74, - "learning_rate": 0.00046190080625458095, - "loss": 0.7845, - "step": 31700 - }, - { - "epoch": 7.74, - "learning_rate": 0.0004618702663083313, - "loss": 0.7061, - "step": 31725 - }, - { - "epoch": 7.75, - "learning_rate": 0.0004618397263620816, - "loss": 0.7245, - "step": 31750 - }, - { - "epoch": 7.75, - "learning_rate": 0.0004618091864158319, - "loss": 0.7343, - "step": 31775 - }, - { - "epoch": 7.76, - "learning_rate": 0.0004617786464695822, - "loss": 0.7688, - "step": 31800 - }, - { - "epoch": 7.77, - "learning_rate": 0.0004617481065233325, - "loss": 0.7333, - "step": 31825 - }, - { - "epoch": 7.77, - "learning_rate": 0.0004617175665770829, - "loss": 0.7634, - "step": 31850 - }, - { - "epoch": 7.78, - "learning_rate": 0.00046168702663083313, - "loss": 0.781, - "step": 31875 - }, - { - "epoch": 7.78, - "learning_rate": 0.00046165648668458343, - "loss": 0.8163, - "step": 31900 - }, - { - "epoch": 7.79, - "learning_rate": 0.00046162594673833374, - "loss": 0.7101, - "step": 31925 - }, - { - "epoch": 7.8, - "learning_rate": 0.00046159540679208404, - "loss": 0.7749, - "step": 31950 - }, - { - "epoch": 7.8, - "learning_rate": 0.0004615648668458344, - "loss": 0.7374, - "step": 31975 - }, - { - "epoch": 7.81, - "learning_rate": 0.0004615343268995847, - "loss": 0.7412, - "step": 32000 - }, - { - "epoch": 7.81, - "eval_cer": 0.1613245998583206, - "eval_loss": 0.5384941697120667, - "eval_runtime": 151.6218, - "eval_samples_per_second": 27.654, - "eval_steps_per_second": 6.919, - "eval_wer": 0.6256117455138662, - "step": 32000 - }, - { - "epoch": 7.81, - "learning_rate": 0.00046150378695333495, - "loss": 0.7464, - "step": 32025 - }, - { - "epoch": 7.82, - "learning_rate": 0.00046147324700708525, - "loss": 0.789, - "step": 32050 - }, - { - "epoch": 7.83, - "learning_rate": 0.00046144270706083556, - "loss": 0.7565, - "step": 32075 - }, - { - "epoch": 7.83, - "learning_rate": 0.0004614121671145859, - "loss": 0.7613, - "step": 32100 - }, - { - "epoch": 7.84, - "learning_rate": 0.0004613816271683362, - "loss": 0.732, - "step": 32125 - }, - { - "epoch": 7.85, - "learning_rate": 0.0004613510872220865, - "loss": 0.7272, - "step": 32150 - }, - { - "epoch": 7.85, - "learning_rate": 0.00046132054727583677, - "loss": 0.7103, - "step": 32175 - }, - { - "epoch": 7.86, - "learning_rate": 0.0004612900073295871, - "loss": 0.7953, - "step": 32200 - }, - { - "epoch": 7.86, - "learning_rate": 0.00046125946738333743, - "loss": 0.7259, - "step": 32225 - }, - { - "epoch": 7.87, - "learning_rate": 0.00046122892743708774, - "loss": 0.7467, - "step": 32250 - }, - { - "epoch": 7.88, - "learning_rate": 0.00046119838749083804, - "loss": 0.7153, - "step": 32275 - }, - { - "epoch": 7.88, - "learning_rate": 0.00046116784754458834, - "loss": 0.6801, - "step": 32300 - }, - { - "epoch": 7.89, - "learning_rate": 0.00046113730759833865, - "loss": 0.6988, - "step": 32325 - }, - { - "epoch": 7.89, - "learning_rate": 0.0004611067676520889, - "loss": 0.8216, - "step": 32350 - }, - { - "epoch": 7.9, - "learning_rate": 0.00046107622770583925, - "loss": 0.7436, - "step": 32375 - }, - { - "epoch": 7.91, - "learning_rate": 0.00046104568775958956, - "loss": 0.802, - "step": 32400 - }, - { - "epoch": 7.91, - "learning_rate": 0.00046101514781333986, - "loss": 0.7254, - "step": 32425 - }, - { - "epoch": 7.92, - "learning_rate": 0.00046098460786709016, - "loss": 0.7719, - "step": 32450 - }, - { - "epoch": 7.92, - "learning_rate": 0.00046095406792084047, - "loss": 0.7155, - "step": 32475 - }, - { - "epoch": 7.93, - "learning_rate": 0.00046092352797459077, - "loss": 0.7702, - "step": 32500 - }, - { - "epoch": 7.93, - "eval_cer": 0.16136053304313008, - "eval_loss": 0.5290741920471191, - "eval_runtime": 152.6414, - "eval_samples_per_second": 27.47, - "eval_steps_per_second": 6.872, - "eval_wer": 0.6342903752039152, - "step": 32500 - }, - { - "epoch": 7.94, - "learning_rate": 0.00045748786240159785, - "loss": 0.7358, - "step": 32525 - }, - { - "epoch": 7.94, - "learning_rate": 0.0004574546632812417, - "loss": 0.8072, - "step": 32550 - }, - { - "epoch": 7.95, - "learning_rate": 0.0004574214641608856, - "loss": 0.7435, - "step": 32575 - }, - { - "epoch": 7.96, - "learning_rate": 0.0004573882650405295, - "loss": 0.7616, - "step": 32600 - }, - { - "epoch": 7.96, - "learning_rate": 0.0004573550659201734, - "loss": 0.75, - "step": 32625 - }, - { - "epoch": 7.97, - "learning_rate": 0.0004573218667998173, - "loss": 0.7756, - "step": 32650 - }, - { - "epoch": 7.97, - "learning_rate": 0.0004572886676794612, - "loss": 0.7521, - "step": 32675 - }, - { - "epoch": 7.98, - "learning_rate": 0.0004572567965239193, - "loss": 0.7256, - "step": 32700 - }, - { - "epoch": 7.99, - "learning_rate": 0.00045722359740356323, - "loss": 0.7392, - "step": 32725 - }, - { - "epoch": 7.99, - "learning_rate": 0.0004571903982832071, - "loss": 0.7464, - "step": 32750 - }, - { - "epoch": 8.0, - "learning_rate": 0.00045715719916285095, - "loss": 0.71, - "step": 32775 - }, - { - "epoch": 8.0, - "learning_rate": 0.00045712400004249487, - "loss": 0.7379, - "step": 32800 - }, - { - "epoch": 8.01, - "learning_rate": 0.0004570908009221388, - "loss": 0.69, - "step": 32825 - }, - { - "epoch": 8.02, - "learning_rate": 0.0004570576018017827, - "loss": 0.7467, - "step": 32850 - }, - { - "epoch": 8.02, - "learning_rate": 0.0004570244026814266, - "loss": 0.6749, - "step": 32875 - }, - { - "epoch": 8.03, - "learning_rate": 0.0004569912035610704, - "loss": 0.7433, - "step": 32900 - }, - { - "epoch": 8.03, - "learning_rate": 0.00045695800444071433, - "loss": 0.6778, - "step": 32925 - }, - { - "epoch": 8.04, - "learning_rate": 0.00045692480532035824, - "loss": 0.7142, - "step": 32950 - }, - { - "epoch": 8.05, - "learning_rate": 0.00045689160620000216, - "loss": 0.683, - "step": 32975 - }, - { - "epoch": 8.05, - "learning_rate": 0.00045685840707964607, - "loss": 0.7561, - "step": 33000 - }, - { - "epoch": 8.05, - "eval_cer": 0.1552724248739772, - "eval_loss": 0.5043615102767944, - "eval_runtime": 142.7702, - "eval_samples_per_second": 29.369, - "eval_steps_per_second": 7.347, - "eval_wer": 0.6138336052202283, - "step": 33000 - }, - { - "epoch": 8.06, - "learning_rate": 0.00045682520795928993, - "loss": 0.6955, - "step": 33025 - }, - { - "epoch": 8.06, - "learning_rate": 0.0004567920088389338, - "loss": 0.7009, - "step": 33050 - }, - { - "epoch": 8.07, - "learning_rate": 0.0004567588097185777, - "loss": 0.6887, - "step": 33075 - }, - { - "epoch": 8.08, - "learning_rate": 0.0004567256105982216, - "loss": 0.7224, - "step": 33100 - }, - { - "epoch": 8.08, - "learning_rate": 0.0004566924114778655, - "loss": 0.7305, - "step": 33125 - }, - { - "epoch": 8.09, - "learning_rate": 0.0004566592123575094, - "loss": 0.7314, - "step": 33150 - }, - { - "epoch": 8.1, - "learning_rate": 0.0004566260132371533, - "loss": 0.7016, - "step": 33175 - }, - { - "epoch": 8.1, - "learning_rate": 0.00045659281411679716, - "loss": 0.7451, - "step": 33200 - }, - { - "epoch": 8.11, - "learning_rate": 0.0004565596149964411, - "loss": 0.7097, - "step": 33225 - }, - { - "epoch": 8.11, - "learning_rate": 0.00045652641587608494, - "loss": 0.6997, - "step": 33250 - }, - { - "epoch": 8.12, - "learning_rate": 0.00045649321675572885, - "loss": 0.6959, - "step": 33275 - }, - { - "epoch": 8.13, - "learning_rate": 0.00045646001763537277, - "loss": 0.7657, - "step": 33300 - }, - { - "epoch": 8.13, - "learning_rate": 0.0004564268185150167, - "loss": 0.7058, - "step": 33325 - }, - { - "epoch": 8.14, - "learning_rate": 0.0004563936193946605, - "loss": 0.7508, - "step": 33350 - }, - { - "epoch": 8.14, - "learning_rate": 0.0004563604202743044, - "loss": 0.6738, - "step": 33375 - }, - { - "epoch": 8.15, - "learning_rate": 0.0004563272211539483, - "loss": 0.7368, - "step": 33400 - }, - { - "epoch": 8.16, - "learning_rate": 0.00045629402203359223, - "loss": 0.7343, - "step": 33425 - }, - { - "epoch": 8.16, - "learning_rate": 0.00045626082291323614, - "loss": 0.709, - "step": 33450 - }, - { - "epoch": 8.17, - "learning_rate": 0.00045622762379288, - "loss": 0.7208, - "step": 33475 - }, - { - "epoch": 8.17, - "learning_rate": 0.00045619442467252386, - "loss": 0.7045, - "step": 33500 - }, - { - "epoch": 8.18, - "learning_rate": 0.0004561612255521678, - "loss": 0.7289, - "step": 33525 - }, - { - "epoch": 8.19, - "learning_rate": 0.0004561280264318117, - "loss": 0.7799, - "step": 33550 - }, - { - "epoch": 8.19, - "learning_rate": 0.00045609482731145555, - "loss": 0.7295, - "step": 33575 - }, - { - "epoch": 8.2, - "learning_rate": 0.00045606162819109946, - "loss": 0.7468, - "step": 33600 - }, - { - "epoch": 8.21, - "learning_rate": 0.0004560284290707434, - "loss": 0.711, - "step": 33625 - }, - { - "epoch": 8.21, - "learning_rate": 0.00045599522995038724, - "loss": 0.7462, - "step": 33650 - }, - { - "epoch": 8.22, - "learning_rate": 0.00045596203083003115, - "loss": 0.6793, - "step": 33675 - }, - { - "epoch": 8.22, - "learning_rate": 0.000455928831709675, - "loss": 0.7026, - "step": 33700 - }, - { - "epoch": 8.23, - "learning_rate": 0.0004558956325893189, - "loss": 0.707, - "step": 33725 - }, - { - "epoch": 8.24, - "learning_rate": 0.00045586243346896284, - "loss": 0.7465, - "step": 33750 - }, - { - "epoch": 8.24, - "learning_rate": 0.00045582923434860675, - "loss": 0.7105, - "step": 33775 - }, - { - "epoch": 8.25, - "learning_rate": 0.00045579603522825056, - "loss": 0.7257, - "step": 33800 - }, - { - "epoch": 8.25, - "learning_rate": 0.00045576283610789447, - "loss": 0.6767, - "step": 33825 - }, - { - "epoch": 8.26, - "learning_rate": 0.0004557296369875384, - "loss": 0.7343, - "step": 33850 - }, - { - "epoch": 8.27, - "learning_rate": 0.0004556964378671823, - "loss": 0.6389, - "step": 33875 - }, - { - "epoch": 8.27, - "learning_rate": 0.0004556632387468262, - "loss": 0.7362, - "step": 33900 - }, - { - "epoch": 8.28, - "learning_rate": 0.0004556300396264701, - "loss": 0.66, - "step": 33925 - }, - { - "epoch": 8.28, - "learning_rate": 0.00045559684050611393, - "loss": 0.7329, - "step": 33950 - }, - { - "epoch": 8.29, - "learning_rate": 0.00045556364138575785, - "loss": 0.6778, - "step": 33975 - }, - { - "epoch": 8.3, - "learning_rate": 0.00045553044226540176, - "loss": 0.7017, - "step": 34000 - }, - { - "epoch": 8.3, - "learning_rate": 0.0004554972431450456, - "loss": 0.6709, - "step": 34025 - }, - { - "epoch": 8.31, - "learning_rate": 0.00045546404402468954, - "loss": 0.7861, - "step": 34050 - }, - { - "epoch": 8.32, - "learning_rate": 0.0004554308449043334, - "loss": 0.7241, - "step": 34075 - }, - { - "epoch": 8.32, - "learning_rate": 0.0004553976457839773, - "loss": 0.6993, - "step": 34100 - }, - { - "epoch": 8.33, - "learning_rate": 0.0004553644466636212, - "loss": 0.6818, - "step": 34125 - }, - { - "epoch": 8.33, - "learning_rate": 0.0004553312475432651, - "loss": 0.7136, - "step": 34150 - }, - { - "epoch": 8.34, - "learning_rate": 0.000455298048422909, - "loss": 0.725, - "step": 34175 - }, - { - "epoch": 8.35, - "learning_rate": 0.0004552648493025529, - "loss": 0.7254, - "step": 34200 - }, - { - "epoch": 8.35, - "learning_rate": 0.00045523165018219677, - "loss": 0.7135, - "step": 34225 - }, - { - "epoch": 8.36, - "learning_rate": 0.00045519845106184063, - "loss": 0.7367, - "step": 34250 - }, - { - "epoch": 8.36, - "learning_rate": 0.00045516525194148454, - "loss": 0.7019, - "step": 34275 - }, - { - "epoch": 8.37, - "learning_rate": 0.00045513205282112846, - "loss": 0.7287, - "step": 34300 - }, - { - "epoch": 8.38, - "learning_rate": 0.00045509885370077237, - "loss": 0.7241, - "step": 34325 - }, - { - "epoch": 8.38, - "learning_rate": 0.0004550656545804163, - "loss": 0.749, - "step": 34350 - }, - { - "epoch": 8.39, - "learning_rate": 0.0004550324554600601, - "loss": 0.7361, - "step": 34375 - }, - { - "epoch": 8.39, - "learning_rate": 0.000454999256339704, - "loss": 0.7496, - "step": 34400 - }, - { - "epoch": 8.4, - "learning_rate": 0.0004549660572193479, - "loss": 0.6714, - "step": 34425 - }, - { - "epoch": 8.41, - "learning_rate": 0.00045493285809899183, - "loss": 0.7154, - "step": 34450 - }, - { - "epoch": 8.41, - "learning_rate": 0.00045489965897863575, - "loss": 0.7159, - "step": 34475 - }, - { - "epoch": 8.42, - "learning_rate": 0.0004548664598582796, - "loss": 0.6873, - "step": 34500 - }, - { - "epoch": 8.42, - "learning_rate": 0.00045483326073792347, - "loss": 0.7398, - "step": 34525 - }, - { - "epoch": 8.43, - "learning_rate": 0.0004548000616175674, - "loss": 0.7187, - "step": 34550 - }, - { - "epoch": 8.44, - "learning_rate": 0.0004547668624972113, - "loss": 0.7376, - "step": 34575 - }, - { - "epoch": 8.44, - "learning_rate": 0.00045473366337685515, - "loss": 0.7299, - "step": 34600 - }, - { - "epoch": 8.45, - "learning_rate": 0.00045470046425649907, - "loss": 0.7037, - "step": 34625 - }, - { - "epoch": 8.46, - "learning_rate": 0.000454667265136143, - "loss": 0.7256, - "step": 34650 - }, - { - "epoch": 8.46, - "learning_rate": 0.00045463406601578684, - "loss": 0.6814, - "step": 34675 - }, - { - "epoch": 8.47, - "learning_rate": 0.00045460086689543076, - "loss": 0.7661, - "step": 34700 - }, - { - "epoch": 8.47, - "learning_rate": 0.0004545676677750746, - "loss": 0.7051, - "step": 34725 - }, - { - "epoch": 8.48, - "learning_rate": 0.00045453446865471853, - "loss": 0.7034, - "step": 34750 - }, - { - "epoch": 8.49, - "learning_rate": 0.00045450126953436244, - "loss": 0.6999, - "step": 34775 - }, - { - "epoch": 8.49, - "learning_rate": 0.00045446807041400636, - "loss": 0.7787, - "step": 34800 - }, - { - "epoch": 8.5, - "learning_rate": 0.00045443487129365016, - "loss": 0.6958, - "step": 34825 - }, - { - "epoch": 8.5, - "learning_rate": 0.0004544016721732941, - "loss": 0.7198, - "step": 34850 - }, - { - "epoch": 8.51, - "learning_rate": 0.000454368473052938, - "loss": 0.7049, - "step": 34875 - }, - { - "epoch": 8.52, - "learning_rate": 0.0004543352739325819, - "loss": 0.7153, - "step": 34900 - }, - { - "epoch": 8.52, - "learning_rate": 0.0004543020748122258, - "loss": 0.6683, - "step": 34925 - }, - { - "epoch": 8.53, - "learning_rate": 0.0004542688756918697, - "loss": 0.7465, - "step": 34950 - }, - { - "epoch": 8.53, - "learning_rate": 0.0004542370045363278, - "loss": 0.7218, - "step": 34975 - }, - { - "epoch": 8.54, - "learning_rate": 0.00045420380541597174, - "loss": 0.7668, - "step": 35000 - }, - { - "epoch": 8.55, - "learning_rate": 0.0004541706062956156, - "loss": 0.7447, - "step": 35025 - }, - { - "epoch": 8.55, - "learning_rate": 0.00045413740717525946, - "loss": 0.7514, - "step": 35050 - }, - { - "epoch": 8.56, - "learning_rate": 0.00045410420805490337, - "loss": 0.6962, - "step": 35075 - }, - { - "epoch": 8.57, - "learning_rate": 0.0004540710089345473, - "loss": 0.7447, - "step": 35100 - }, - { - "epoch": 8.57, - "learning_rate": 0.0004540378098141912, - "loss": 0.6955, - "step": 35125 - }, - { - "epoch": 8.58, - "learning_rate": 0.00045400461069383506, - "loss": 0.7442, - "step": 35150 - }, - { - "epoch": 8.58, - "learning_rate": 0.0004539714115734789, - "loss": 0.7125, - "step": 35175 - }, - { - "epoch": 8.59, - "learning_rate": 0.00045393821245312283, - "loss": 0.6657, - "step": 35200 - }, - { - "epoch": 8.6, - "learning_rate": 0.00045390501333276675, - "loss": 0.7187, - "step": 35225 - }, - { - "epoch": 8.6, - "learning_rate": 0.00045387181421241066, - "loss": 0.7508, - "step": 35250 - }, - { - "epoch": 8.61, - "learning_rate": 0.0004538386150920545, - "loss": 0.6859, - "step": 35275 - }, - { - "epoch": 8.61, - "learning_rate": 0.00045380541597169843, - "loss": 0.735, - "step": 35300 - }, - { - "epoch": 8.62, - "learning_rate": 0.0004537722168513423, - "loss": 0.7471, - "step": 35325 - }, - { - "epoch": 8.63, - "learning_rate": 0.0004537390177309862, - "loss": 0.7225, - "step": 35350 - }, - { - "epoch": 8.63, - "learning_rate": 0.00045370581861063007, - "loss": 0.6906, - "step": 35375 - }, - { - "epoch": 8.64, - "learning_rate": 0.000453672619490274, - "loss": 0.7514, - "step": 35400 - }, - { - "epoch": 8.64, - "learning_rate": 0.0004536394203699179, - "loss": 0.6694, - "step": 35425 - }, - { - "epoch": 8.65, - "learning_rate": 0.0004536062212495618, - "loss": 0.7746, - "step": 35450 - }, - { - "epoch": 8.66, - "learning_rate": 0.00045357302212920567, - "loss": 0.701, - "step": 35475 - }, - { - "epoch": 8.66, - "learning_rate": 0.00045353982300884953, - "loss": 0.7392, - "step": 35500 - }, - { - "epoch": 8.67, - "learning_rate": 0.00045350662388849344, - "loss": 0.6876, - "step": 35525 - }, - { - "epoch": 8.67, - "learning_rate": 0.00045347342476813736, - "loss": 0.7694, - "step": 35550 - }, - { - "epoch": 8.68, - "learning_rate": 0.00045344022564778127, - "loss": 0.7055, - "step": 35575 - }, - { - "epoch": 8.69, - "learning_rate": 0.0004534070265274252, - "loss": 0.7324, - "step": 35600 - }, - { - "epoch": 8.69, - "learning_rate": 0.000453373827407069, - "loss": 0.6626, - "step": 35625 - }, - { - "epoch": 8.7, - "learning_rate": 0.0004533406282867129, - "loss": 0.7154, - "step": 35650 - }, - { - "epoch": 8.71, - "learning_rate": 0.0004533074291663568, - "loss": 0.6535, - "step": 35675 - }, - { - "epoch": 8.71, - "learning_rate": 0.00045327423004600073, - "loss": 0.7425, - "step": 35700 - }, - { - "epoch": 8.72, - "learning_rate": 0.0004532410309256446, - "loss": 0.6725, - "step": 35725 - }, - { - "epoch": 8.72, - "learning_rate": 0.0004532078318052885, - "loss": 0.7673, - "step": 35750 - }, - { - "epoch": 8.73, - "learning_rate": 0.00045317463268493237, - "loss": 0.7024, - "step": 35775 - }, - { - "epoch": 8.74, - "learning_rate": 0.0004531414335645763, - "loss": 0.7646, - "step": 35800 - }, - { - "epoch": 8.74, - "learning_rate": 0.0004531082344442202, - "loss": 0.6934, - "step": 35825 - }, - { - "epoch": 8.75, - "learning_rate": 0.00045307503532386405, - "loss": 0.7679, - "step": 35850 - }, - { - "epoch": 8.75, - "learning_rate": 0.00045304183620350797, - "loss": 0.7127, - "step": 35875 - }, - { - "epoch": 8.76, - "learning_rate": 0.0004530086370831519, - "loss": 0.7156, - "step": 35900 - }, - { - "epoch": 8.77, - "learning_rate": 0.00045297543796279574, - "loss": 0.7257, - "step": 35925 - }, - { - "epoch": 8.77, - "learning_rate": 0.0004529422388424396, - "loss": 0.7511, - "step": 35950 - }, - { - "epoch": 8.78, - "learning_rate": 0.0004529090397220835, - "loss": 0.716, - "step": 35975 - }, - { - "epoch": 8.78, - "learning_rate": 0.00045287584060172743, - "loss": 0.6707, - "step": 36000 - }, - { - "epoch": 8.78, - "eval_cer": 0.1483578534542057, - "eval_loss": 0.4949270784854889, - "eval_runtime": 144.1661, - "eval_samples_per_second": 29.085, - "eval_steps_per_second": 7.276, - "eval_wer": 0.5880587275693312, - "step": 36000 - }, - { - "epoch": 8.79, - "learning_rate": 0.00045284264148137134, - "loss": 0.7008, - "step": 36025 - }, - { - "epoch": 8.8, - "learning_rate": 0.00045280944236101526, - "loss": 0.7192, - "step": 36050 - }, - { - "epoch": 8.8, - "learning_rate": 0.00045277624324065906, - "loss": 0.6832, - "step": 36075 - }, - { - "epoch": 8.81, - "learning_rate": 0.000452743044120303, - "loss": 0.6916, - "step": 36100 - }, - { - "epoch": 8.82, - "learning_rate": 0.0004527098449999469, - "loss": 0.7466, - "step": 36125 - }, - { - "epoch": 8.82, - "learning_rate": 0.0004526766458795908, - "loss": 0.7268, - "step": 36150 - }, - { - "epoch": 8.83, - "learning_rate": 0.0004526447747240489, - "loss": 0.7509, - "step": 36175 - }, - { - "epoch": 8.83, - "learning_rate": 0.0004526115756036928, - "loss": 0.7412, - "step": 36200 - }, - { - "epoch": 8.84, - "learning_rate": 0.0004525783764833367, - "loss": 0.7099, - "step": 36225 - }, - { - "epoch": 8.85, - "learning_rate": 0.00045254517736298064, - "loss": 0.7817, - "step": 36250 - }, - { - "epoch": 8.85, - "learning_rate": 0.00045251197824262444, - "loss": 0.7181, - "step": 36275 - }, - { - "epoch": 8.86, - "learning_rate": 0.00045247877912226836, - "loss": 0.7417, - "step": 36300 - }, - { - "epoch": 8.86, - "learning_rate": 0.00045244558000191227, - "loss": 0.7523, - "step": 36325 - }, - { - "epoch": 8.87, - "learning_rate": 0.0004524123808815562, - "loss": 0.7523, - "step": 36350 - }, - { - "epoch": 8.88, - "learning_rate": 0.0004523791817612001, - "loss": 0.6954, - "step": 36375 - }, - { - "epoch": 8.88, - "learning_rate": 0.00045234598264084396, - "loss": 0.7373, - "step": 36400 - }, - { - "epoch": 8.89, - "learning_rate": 0.0004523127835204878, - "loss": 0.6966, - "step": 36425 - }, - { - "epoch": 8.89, - "learning_rate": 0.00045227958440013173, - "loss": 0.7854, - "step": 36450 - }, - { - "epoch": 8.9, - "learning_rate": 0.00045224638527977565, - "loss": 0.7014, - "step": 36475 - }, - { - "epoch": 8.91, - "learning_rate": 0.0004522131861594195, - "loss": 0.6959, - "step": 36500 - }, - { - "epoch": 8.91, - "learning_rate": 0.0004521799870390634, - "loss": 0.6655, - "step": 36525 - }, - { - "epoch": 8.92, - "learning_rate": 0.00045214678791870733, - "loss": 0.7365, - "step": 36550 - }, - { - "epoch": 8.93, - "learning_rate": 0.0004521135887983512, - "loss": 0.7066, - "step": 36575 - }, - { - "epoch": 8.93, - "learning_rate": 0.0004520803896779951, - "loss": 0.7764, - "step": 36600 - }, - { - "epoch": 8.94, - "learning_rate": 0.00045204719055763897, - "loss": 0.7355, - "step": 36625 - }, - { - "epoch": 8.94, - "learning_rate": 0.0004520139914372829, - "loss": 0.737, - "step": 36650 - }, - { - "epoch": 8.95, - "learning_rate": 0.0004519807923169268, - "loss": 0.6743, - "step": 36675 - }, - { - "epoch": 8.96, - "learning_rate": 0.0004519475931965707, - "loss": 0.7412, - "step": 36700 - }, - { - "epoch": 8.96, - "learning_rate": 0.0004519143940762145, - "loss": 0.6972, - "step": 36725 - }, - { - "epoch": 8.97, - "learning_rate": 0.00045188119495585843, - "loss": 0.6959, - "step": 36750 - }, - { - "epoch": 8.97, - "learning_rate": 0.00045184799583550234, - "loss": 0.7406, - "step": 36775 - }, - { - "epoch": 8.98, - "learning_rate": 0.00045181479671514626, - "loss": 0.7489, - "step": 36800 - }, - { - "epoch": 8.99, - "learning_rate": 0.00045178159759479017, - "loss": 0.7189, - "step": 36825 - }, - { - "epoch": 8.99, - "learning_rate": 0.00045174839847443403, - "loss": 0.7095, - "step": 36850 - }, - { - "epoch": 9.0, - "learning_rate": 0.0004517151993540779, - "loss": 0.6805, - "step": 36875 - }, - { - "epoch": 9.0, - "learning_rate": 0.0004516820002337218, - "loss": 0.7752, - "step": 36900 - }, - { - "epoch": 9.01, - "learning_rate": 0.0004516488011133657, - "loss": 0.6744, - "step": 36925 - }, - { - "epoch": 9.02, - "learning_rate": 0.00045161560199300963, - "loss": 0.7001, - "step": 36950 - }, - { - "epoch": 9.02, - "learning_rate": 0.0004515824028726535, - "loss": 0.6452, - "step": 36975 - }, - { - "epoch": 9.03, - "learning_rate": 0.0004515492037522974, - "loss": 0.7344, - "step": 37000 - }, - { - "epoch": 9.03, - "learning_rate": 0.00045151600463194127, - "loss": 0.6445, - "step": 37025 - }, - { - "epoch": 9.04, - "learning_rate": 0.0004514828055115852, - "loss": 0.7017, - "step": 37050 - }, - { - "epoch": 9.05, - "learning_rate": 0.00045144960639122904, - "loss": 0.6833, - "step": 37075 - }, - { - "epoch": 9.05, - "learning_rate": 0.00045141640727087295, - "loss": 0.724, - "step": 37100 - }, - { - "epoch": 9.06, - "learning_rate": 0.00045138320815051687, - "loss": 0.7056, - "step": 37125 - }, - { - "epoch": 9.07, - "learning_rate": 0.0004513500090301608, - "loss": 0.7139, - "step": 37150 - }, - { - "epoch": 9.07, - "learning_rate": 0.00045131680990980464, - "loss": 0.6972, - "step": 37175 - }, - { - "epoch": 9.08, - "learning_rate": 0.0004512836107894485, - "loss": 0.6807, - "step": 37200 - }, - { - "epoch": 9.08, - "learning_rate": 0.0004512504116690924, - "loss": 0.7068, - "step": 37225 - }, - { - "epoch": 9.09, - "learning_rate": 0.00045121721254873633, - "loss": 0.763, - "step": 37250 - }, - { - "epoch": 9.1, - "learning_rate": 0.00045118401342838024, - "loss": 0.6558, - "step": 37275 - }, - { - "epoch": 9.1, - "learning_rate": 0.0004511508143080241, - "loss": 0.7469, - "step": 37300 - }, - { - "epoch": 9.11, - "learning_rate": 0.00045111761518766796, - "loss": 0.6294, - "step": 37325 - }, - { - "epoch": 9.11, - "learning_rate": 0.0004510844160673119, - "loss": 0.7112, - "step": 37350 - }, - { - "epoch": 9.12, - "learning_rate": 0.0004510512169469558, - "loss": 0.6873, - "step": 37375 - }, - { - "epoch": 9.13, - "learning_rate": 0.0004510180178265997, - "loss": 0.7776, - "step": 37400 - }, - { - "epoch": 9.13, - "learning_rate": 0.00045098481870624356, - "loss": 0.6728, - "step": 37425 - }, - { - "epoch": 9.14, - "learning_rate": 0.0004509516195858875, - "loss": 0.747, - "step": 37450 - }, - { - "epoch": 9.14, - "learning_rate": 0.00045091842046553134, - "loss": 0.6623, - "step": 37475 - }, - { - "epoch": 9.15, - "learning_rate": 0.00045088522134517525, - "loss": 0.7196, - "step": 37500 - }, - { - "epoch": 9.16, - "learning_rate": 0.0004508520222248191, - "loss": 0.7017, - "step": 37525 - }, - { - "epoch": 9.16, - "learning_rate": 0.000450818823104463, - "loss": 0.723, - "step": 37550 - }, - { - "epoch": 9.17, - "learning_rate": 0.00045078562398410694, - "loss": 0.66, - "step": 37575 - }, - { - "epoch": 9.18, - "learning_rate": 0.00045075242486375085, - "loss": 0.7111, - "step": 37600 - }, - { - "epoch": 9.18, - "learning_rate": 0.0004507192257433947, - "loss": 0.7159, - "step": 37625 - }, - { - "epoch": 9.19, - "learning_rate": 0.0004506860266230386, - "loss": 0.7171, - "step": 37650 - }, - { - "epoch": 9.19, - "learning_rate": 0.0004506528275026825, - "loss": 0.6743, - "step": 37675 - }, - { - "epoch": 9.2, - "learning_rate": 0.0004506196283823264, - "loss": 0.7218, - "step": 37700 - }, - { - "epoch": 9.21, - "learning_rate": 0.0004505864292619703, - "loss": 0.6664, - "step": 37725 - }, - { - "epoch": 9.21, - "learning_rate": 0.0004505532301416142, - "loss": 0.7363, - "step": 37750 - }, - { - "epoch": 9.22, - "learning_rate": 0.00045052003102125803, - "loss": 0.6426, - "step": 37775 - }, - { - "epoch": 9.22, - "learning_rate": 0.00045048683190090195, - "loss": 0.664, - "step": 37800 - }, - { - "epoch": 9.23, - "learning_rate": 0.00045045363278054586, - "loss": 0.7016, - "step": 37825 - }, - { - "epoch": 9.24, - "learning_rate": 0.0004504204336601898, - "loss": 0.6749, - "step": 37850 - }, - { - "epoch": 9.24, - "learning_rate": 0.00045038723453983364, - "loss": 0.6577, - "step": 37875 - }, - { - "epoch": 9.25, - "learning_rate": 0.00045035403541947755, - "loss": 0.744, - "step": 37900 - }, - { - "epoch": 9.25, - "learning_rate": 0.0004503208362991214, - "loss": 0.6835, - "step": 37925 - }, - { - "epoch": 9.26, - "learning_rate": 0.0004502876371787653, - "loss": 0.7322, - "step": 37950 - }, - { - "epoch": 9.27, - "learning_rate": 0.0004502544380584092, - "loss": 0.708, - "step": 37975 - }, - { - "epoch": 9.27, - "learning_rate": 0.0004502212389380531, - "loss": 0.7195, - "step": 38000 - }, - { - "epoch": 9.28, - "learning_rate": 0.000450188039817697, - "loss": 0.6804, - "step": 38025 - }, - { - "epoch": 9.29, - "learning_rate": 0.0004501548406973409, - "loss": 0.7341, - "step": 38050 - }, - { - "epoch": 9.29, - "learning_rate": 0.0004501216415769848, - "loss": 0.7179, - "step": 38075 - }, - { - "epoch": 9.3, - "learning_rate": 0.00045008844245662865, - "loss": 0.7163, - "step": 38100 - }, - { - "epoch": 9.3, - "learning_rate": 0.00045005524333627256, - "loss": 0.6866, - "step": 38125 - }, - { - "epoch": 9.31, - "learning_rate": 0.0004500220442159165, - "loss": 0.7201, - "step": 38150 - }, - { - "epoch": 9.32, - "learning_rate": 0.0004499888450955604, - "loss": 0.6692, - "step": 38175 - }, - { - "epoch": 9.32, - "learning_rate": 0.0004499556459752043, - "loss": 0.6772, - "step": 38200 - }, - { - "epoch": 9.33, - "learning_rate": 0.0004499224468548481, - "loss": 0.6355, - "step": 38225 - }, - { - "epoch": 9.33, - "learning_rate": 0.000449889247734492, - "loss": 0.7786, - "step": 38250 - }, - { - "epoch": 9.34, - "learning_rate": 0.00044985604861413593, - "loss": 0.691, - "step": 38275 - }, - { - "epoch": 9.35, - "learning_rate": 0.00044982284949377985, - "loss": 0.6757, - "step": 38300 - }, - { - "epoch": 9.35, - "learning_rate": 0.0004497896503734237, - "loss": 0.6706, - "step": 38325 - }, - { - "epoch": 9.36, - "learning_rate": 0.0004497564512530676, - "loss": 0.709, - "step": 38350 - }, - { - "epoch": 9.36, - "learning_rate": 0.0004497232521327115, - "loss": 0.6798, - "step": 38375 - }, - { - "epoch": 9.37, - "learning_rate": 0.0004496900530123554, - "loss": 0.7252, - "step": 38400 - }, - { - "epoch": 9.38, - "learning_rate": 0.0004496568538919993, - "loss": 0.6908, - "step": 38425 - }, - { - "epoch": 9.38, - "learning_rate": 0.00044962365477164317, - "loss": 0.7345, - "step": 38450 - }, - { - "epoch": 9.39, - "learning_rate": 0.0004495904556512871, - "loss": 0.7017, - "step": 38475 - }, - { - "epoch": 9.39, - "learning_rate": 0.000449557256530931, - "loss": 0.7145, - "step": 38500 - }, - { - "epoch": 9.4, - "learning_rate": 0.00044952405741057486, - "loss": 0.6815, - "step": 38525 - }, - { - "epoch": 9.41, - "learning_rate": 0.0004494908582902187, - "loss": 0.7273, - "step": 38550 - }, - { - "epoch": 9.41, - "learning_rate": 0.00044945765916986263, - "loss": 0.6296, - "step": 38575 - }, - { - "epoch": 9.42, - "learning_rate": 0.00044942446004950655, - "loss": 0.7299, - "step": 38600 - }, - { - "epoch": 9.43, - "learning_rate": 0.00044939126092915046, - "loss": 0.6673, - "step": 38625 - }, - { - "epoch": 9.43, - "learning_rate": 0.0004493580618087944, - "loss": 0.6781, - "step": 38650 - }, - { - "epoch": 9.44, - "learning_rate": 0.0004493248626884382, - "loss": 0.6999, - "step": 38675 - }, - { - "epoch": 9.44, - "learning_rate": 0.0004492916635680821, - "loss": 0.6705, - "step": 38700 - }, - { - "epoch": 9.45, - "learning_rate": 0.000449258464447726, - "loss": 0.6873, - "step": 38725 - }, - { - "epoch": 9.46, - "learning_rate": 0.0004492252653273699, - "loss": 0.7198, - "step": 38750 - }, - { - "epoch": 9.46, - "learning_rate": 0.0004491920662070138, - "loss": 0.6728, - "step": 38775 - }, - { - "epoch": 9.47, - "learning_rate": 0.0004491588670866577, - "loss": 0.7017, - "step": 38800 - }, - { - "epoch": 9.47, - "learning_rate": 0.00044912566796630155, - "loss": 0.7148, - "step": 38825 - }, - { - "epoch": 9.48, - "learning_rate": 0.00044909246884594547, - "loss": 0.7188, - "step": 38850 - }, - { - "epoch": 9.49, - "learning_rate": 0.0004490592697255894, - "loss": 0.6564, - "step": 38875 - }, - { - "epoch": 9.49, - "learning_rate": 0.00044902607060523324, - "loss": 0.6816, - "step": 38900 - }, - { - "epoch": 9.5, - "learning_rate": 0.00044899287148487716, - "loss": 0.6847, - "step": 38925 - }, - { - "epoch": 9.5, - "learning_rate": 0.00044895967236452107, - "loss": 0.6948, - "step": 38950 - }, - { - "epoch": 9.51, - "learning_rate": 0.00044892647324416493, - "loss": 0.7111, - "step": 38975 - }, - { - "epoch": 9.52, - "learning_rate": 0.0004488932741238088, - "loss": 0.719, - "step": 39000 - }, - { - "epoch": 9.52, - "eval_cer": 0.15075511021221114, - "eval_loss": 0.5013872385025024, - "eval_runtime": 145.9791, - "eval_samples_per_second": 28.723, - "eval_steps_per_second": 7.186, - "eval_wer": 0.5959216965742251, - "step": 39000 - }, - { - "epoch": 9.52, - "learning_rate": 0.0004488600750034527, - "loss": 0.6854, - "step": 39025 - }, - { - "epoch": 9.53, - "learning_rate": 0.0004488268758830966, - "loss": 0.678, - "step": 39050 - }, - { - "epoch": 9.54, - "learning_rate": 0.00044879367676274053, - "loss": 0.6631, - "step": 39075 - }, - { - "epoch": 9.54, - "learning_rate": 0.00044876047764238445, - "loss": 0.7081, - "step": 39100 - }, - { - "epoch": 9.55, - "learning_rate": 0.00044872727852202825, - "loss": 0.6705, - "step": 39125 - }, - { - "epoch": 9.55, - "learning_rate": 0.00044869407940167216, - "loss": 0.729, - "step": 39150 - }, - { - "epoch": 9.56, - "learning_rate": 0.0004486608802813161, - "loss": 0.7027, - "step": 39175 - }, - { - "epoch": 9.57, - "learning_rate": 0.00044862768116096, - "loss": 0.7308, - "step": 39200 - }, - { - "epoch": 9.57, - "learning_rate": 0.0004485944820406039, - "loss": 0.7288, - "step": 39225 - }, - { - "epoch": 9.58, - "learning_rate": 0.00044856128292024777, - "loss": 0.7452, - "step": 39250 - }, - { - "epoch": 9.58, - "learning_rate": 0.0004485280837998916, - "loss": 0.6672, - "step": 39275 - }, - { - "epoch": 9.59, - "learning_rate": 0.00044849488467953554, - "loss": 0.7339, - "step": 39300 - }, - { - "epoch": 9.6, - "learning_rate": 0.00044846168555917945, - "loss": 0.6634, - "step": 39325 - }, - { - "epoch": 9.6, - "learning_rate": 0.0004484284864388233, - "loss": 0.753, - "step": 39350 - }, - { - "epoch": 9.61, - "learning_rate": 0.00044839528731846723, - "loss": 0.7163, - "step": 39375 - }, - { - "epoch": 9.61, - "learning_rate": 0.00044836208819811114, - "loss": 0.688, - "step": 39400 - }, - { - "epoch": 9.62, - "learning_rate": 0.000448328889077755, - "loss": 0.6879, - "step": 39425 - }, - { - "epoch": 9.63, - "learning_rate": 0.00044829701792221315, - "loss": 0.6762, - "step": 39450 - }, - { - "epoch": 9.63, - "learning_rate": 0.000448263818801857, - "loss": 0.6697, - "step": 39475 - }, - { - "epoch": 9.64, - "learning_rate": 0.0004482306196815009, - "loss": 0.7131, - "step": 39500 - }, - { - "epoch": 9.64, - "learning_rate": 0.00044819742056114483, - "loss": 0.6714, - "step": 39525 - }, - { - "epoch": 9.65, - "learning_rate": 0.00044816422144078875, - "loss": 0.7331, - "step": 39550 - }, - { - "epoch": 9.66, - "learning_rate": 0.0004481310223204326, - "loss": 0.669, - "step": 39575 - }, - { - "epoch": 9.66, - "learning_rate": 0.0004480978232000765, - "loss": 0.7278, - "step": 39600 - }, - { - "epoch": 9.67, - "learning_rate": 0.0004480646240797204, - "loss": 0.71, - "step": 39625 - }, - { - "epoch": 9.68, - "learning_rate": 0.0004480314249593643, - "loss": 0.7189, - "step": 39650 - }, - { - "epoch": 9.68, - "learning_rate": 0.00044799822583900815, - "loss": 0.6807, - "step": 39675 - }, - { - "epoch": 9.69, - "learning_rate": 0.00044796502671865207, - "loss": 0.7424, - "step": 39700 - }, - { - "epoch": 9.69, - "learning_rate": 0.000447931827598296, - "loss": 0.6599, - "step": 39725 - }, - { - "epoch": 9.7, - "learning_rate": 0.0004478986284779399, - "loss": 0.7126, - "step": 39750 - }, - { - "epoch": 9.71, - "learning_rate": 0.00044786542935758376, - "loss": 0.6809, - "step": 39775 - }, - { - "epoch": 9.71, - "learning_rate": 0.0004478322302372276, - "loss": 0.7082, - "step": 39800 - }, - { - "epoch": 9.72, - "learning_rate": 0.00044779903111687153, - "loss": 0.6746, - "step": 39825 - }, - { - "epoch": 9.72, - "learning_rate": 0.00044776583199651544, - "loss": 0.7128, - "step": 39850 - }, - { - "epoch": 9.73, - "learning_rate": 0.00044773263287615936, - "loss": 0.6563, - "step": 39875 - }, - { - "epoch": 9.74, - "learning_rate": 0.0004476994337558032, - "loss": 0.7062, - "step": 39900 - }, - { - "epoch": 9.74, - "learning_rate": 0.0004476662346354471, - "loss": 0.7103, - "step": 39925 - }, - { - "epoch": 9.75, - "learning_rate": 0.000447633035515091, - "loss": 0.7658, - "step": 39950 - }, - { - "epoch": 9.75, - "learning_rate": 0.0004475998363947349, - "loss": 0.71, - "step": 39975 - }, - { - "epoch": 9.76, - "learning_rate": 0.0004475666372743788, - "loss": 0.7136, - "step": 40000 - }, - { - "epoch": 9.77, - "learning_rate": 0.0004475334381540227, - "loss": 0.6374, - "step": 40025 - }, - { - "epoch": 9.77, - "learning_rate": 0.0004475002390336666, - "loss": 0.7416, - "step": 40050 - }, - { - "epoch": 9.78, - "learning_rate": 0.00044746703991331045, - "loss": 0.6768, - "step": 40075 - }, - { - "epoch": 9.79, - "learning_rate": 0.00044743384079295437, - "loss": 0.7113, - "step": 40100 - }, - { - "epoch": 9.79, - "learning_rate": 0.0004474006416725982, - "loss": 0.7097, - "step": 40125 - }, - { - "epoch": 9.8, - "learning_rate": 0.00044736744255224214, - "loss": 0.73, - "step": 40150 - }, - { - "epoch": 9.8, - "learning_rate": 0.00044733424343188606, - "loss": 0.6649, - "step": 40175 - }, - { - "epoch": 9.81, - "learning_rate": 0.0004473010443115299, - "loss": 0.7055, - "step": 40200 - }, - { - "epoch": 9.82, - "learning_rate": 0.00044726784519117383, - "loss": 0.7035, - "step": 40225 - }, - { - "epoch": 9.82, - "learning_rate": 0.0004472346460708177, - "loss": 0.6875, - "step": 40250 - }, - { - "epoch": 9.83, - "learning_rate": 0.0004472014469504616, - "loss": 0.6591, - "step": 40275 - }, - { - "epoch": 9.83, - "learning_rate": 0.0004471682478301055, - "loss": 0.7477, - "step": 40300 - }, - { - "epoch": 9.84, - "learning_rate": 0.00044713504870974943, - "loss": 0.6654, - "step": 40325 - }, - { - "epoch": 9.85, - "learning_rate": 0.00044710184958939324, - "loss": 0.7281, - "step": 40350 - }, - { - "epoch": 9.85, - "learning_rate": 0.00044706865046903715, - "loss": 0.7106, - "step": 40375 - }, - { - "epoch": 9.86, - "learning_rate": 0.00044703545134868106, - "loss": 0.6784, - "step": 40400 - }, - { - "epoch": 9.86, - "learning_rate": 0.000447002252228325, - "loss": 0.7191, - "step": 40425 - }, - { - "epoch": 9.87, - "learning_rate": 0.0004469690531079689, - "loss": 0.7231, - "step": 40450 - }, - { - "epoch": 9.88, - "learning_rate": 0.00044693585398761275, - "loss": 0.6801, - "step": 40475 - }, - { - "epoch": 9.88, - "learning_rate": 0.0004469026548672566, - "loss": 0.7126, - "step": 40500 - }, - { - "epoch": 9.89, - "learning_rate": 0.0004468694557469005, - "loss": 0.6579, - "step": 40525 - }, - { - "epoch": 9.9, - "learning_rate": 0.00044683625662654444, - "loss": 0.7128, - "step": 40550 - }, - { - "epoch": 9.9, - "learning_rate": 0.0004468030575061883, - "loss": 0.677, - "step": 40575 - }, - { - "epoch": 9.91, - "learning_rate": 0.0004467698583858322, - "loss": 0.707, - "step": 40600 - }, - { - "epoch": 9.91, - "learning_rate": 0.00044673665926547613, - "loss": 0.6787, - "step": 40625 - }, - { - "epoch": 9.92, - "learning_rate": 0.00044670346014512, - "loss": 0.7532, - "step": 40650 - }, - { - "epoch": 9.93, - "learning_rate": 0.0004466702610247639, - "loss": 0.6928, - "step": 40675 - }, - { - "epoch": 9.93, - "learning_rate": 0.00044663706190440776, - "loss": 0.7258, - "step": 40700 - }, - { - "epoch": 9.94, - "learning_rate": 0.0004466038627840517, - "loss": 0.6488, - "step": 40725 - }, - { - "epoch": 9.94, - "learning_rate": 0.0004465706636636956, - "loss": 0.731, - "step": 40750 - }, - { - "epoch": 9.95, - "learning_rate": 0.0004465374645433395, - "loss": 0.6426, - "step": 40775 - }, - { - "epoch": 9.96, - "learning_rate": 0.00044650426542298336, - "loss": 0.7102, - "step": 40800 - }, - { - "epoch": 9.96, - "learning_rate": 0.0004464710663026272, - "loss": 0.6771, - "step": 40825 - }, - { - "epoch": 9.97, - "learning_rate": 0.00044643786718227114, - "loss": 0.7049, - "step": 40850 - }, - { - "epoch": 9.97, - "learning_rate": 0.00044640466806191505, - "loss": 0.6875, - "step": 40875 - }, - { - "epoch": 9.98, - "learning_rate": 0.00044637146894155896, - "loss": 0.7471, - "step": 40900 - }, - { - "epoch": 9.99, - "learning_rate": 0.0004463382698212028, - "loss": 0.6649, - "step": 40925 - }, - { - "epoch": 9.99, - "learning_rate": 0.0004463050707008467, - "loss": 0.7104, - "step": 40950 - }, - { - "epoch": 10.0, - "learning_rate": 0.0004462718715804906, - "loss": 0.6589, - "step": 40975 - }, - { - "epoch": 10.0, - "learning_rate": 0.0004462386724601345, - "loss": 0.7005, - "step": 41000 - }, - { - "epoch": 10.01, - "learning_rate": 0.0004462054733397784, - "loss": 0.661, - "step": 41025 - }, - { - "epoch": 10.02, - "learning_rate": 0.0004461722742194223, - "loss": 0.6775, - "step": 41050 - }, - { - "epoch": 10.02, - "learning_rate": 0.0004461390750990662, - "loss": 0.6869, - "step": 41075 - }, - { - "epoch": 10.03, - "learning_rate": 0.00044610587597871006, - "loss": 0.6901, - "step": 41100 - }, - { - "epoch": 10.04, - "learning_rate": 0.000446072676858354, - "loss": 0.6488, - "step": 41125 - }, - { - "epoch": 10.04, - "learning_rate": 0.00044603947773799783, - "loss": 0.6936, - "step": 41150 - }, - { - "epoch": 10.05, - "learning_rate": 0.00044600627861764175, - "loss": 0.6753, - "step": 41175 - }, - { - "epoch": 10.05, - "learning_rate": 0.00044597307949728566, - "loss": 0.6729, - "step": 41200 - }, - { - "epoch": 10.06, - "learning_rate": 0.0004459398803769296, - "loss": 0.6251, - "step": 41225 - }, - { - "epoch": 10.07, - "learning_rate": 0.00044590668125657343, - "loss": 0.6957, - "step": 41250 - }, - { - "epoch": 10.07, - "learning_rate": 0.0004458734821362173, - "loss": 0.6599, - "step": 41275 - }, - { - "epoch": 10.08, - "learning_rate": 0.0004458402830158612, - "loss": 0.6987, - "step": 41300 - }, - { - "epoch": 10.08, - "learning_rate": 0.0004458070838955051, - "loss": 0.6458, - "step": 41325 - }, - { - "epoch": 10.09, - "learning_rate": 0.00044577388477514904, - "loss": 0.6997, - "step": 41350 - }, - { - "epoch": 10.1, - "learning_rate": 0.0004457406856547929, - "loss": 0.6358, - "step": 41375 - }, - { - "epoch": 10.1, - "learning_rate": 0.00044570748653443676, - "loss": 0.6762, - "step": 41400 - }, - { - "epoch": 10.11, - "learning_rate": 0.00044567428741408067, - "loss": 0.65, - "step": 41425 - }, - { - "epoch": 10.11, - "learning_rate": 0.0004456410882937246, - "loss": 0.6963, - "step": 41450 - }, - { - "epoch": 10.12, - "learning_rate": 0.0004456078891733685, - "loss": 0.6206, - "step": 41475 - }, - { - "epoch": 10.13, - "learning_rate": 0.00044557469005301236, - "loss": 0.7114, - "step": 41500 - }, - { - "epoch": 10.13, - "learning_rate": 0.00044554149093265627, - "loss": 0.6766, - "step": 41525 - }, - { - "epoch": 10.14, - "learning_rate": 0.00044550829181230013, - "loss": 0.6714, - "step": 41550 - }, - { - "epoch": 10.15, - "learning_rate": 0.00044547509269194405, - "loss": 0.6488, - "step": 41575 - }, - { - "epoch": 10.15, - "learning_rate": 0.0004454418935715879, - "loss": 0.689, - "step": 41600 - }, - { - "epoch": 10.16, - "learning_rate": 0.0004454086944512318, - "loss": 0.6763, - "step": 41625 - }, - { - "epoch": 10.16, - "learning_rate": 0.00044537549533087573, - "loss": 0.6771, - "step": 41650 - }, - { - "epoch": 10.17, - "learning_rate": 0.00044534229621051965, - "loss": 0.6449, - "step": 41675 - }, - { - "epoch": 10.18, - "learning_rate": 0.0004453090970901635, - "loss": 0.7202, - "step": 41700 - }, - { - "epoch": 10.18, - "learning_rate": 0.00044527589796980737, - "loss": 0.6936, - "step": 41725 - }, - { - "epoch": 10.19, - "learning_rate": 0.0004452426988494513, - "loss": 0.7044, - "step": 41750 - }, - { - "epoch": 10.19, - "learning_rate": 0.0004452094997290952, - "loss": 0.6643, - "step": 41775 - }, - { - "epoch": 10.2, - "learning_rate": 0.0004451763006087391, - "loss": 0.6966, - "step": 41800 - }, - { - "epoch": 10.21, - "learning_rate": 0.000445143101488383, - "loss": 0.6873, - "step": 41825 - }, - { - "epoch": 10.21, - "learning_rate": 0.00044510990236802683, - "loss": 0.7328, - "step": 41850 - }, - { - "epoch": 10.22, - "learning_rate": 0.00044507670324767074, - "loss": 0.6346, - "step": 41875 - }, - { - "epoch": 10.22, - "learning_rate": 0.00044504350412731466, - "loss": 0.6716, - "step": 41900 - }, - { - "epoch": 10.23, - "learning_rate": 0.00044501030500695857, - "loss": 0.6719, - "step": 41925 - }, - { - "epoch": 10.24, - "learning_rate": 0.00044497710588660243, - "loss": 0.7415, - "step": 41950 - }, - { - "epoch": 10.24, - "learning_rate": 0.00044494390676624634, - "loss": 0.6444, - "step": 41975 - }, - { - "epoch": 10.25, - "learning_rate": 0.0004449107076458902, - "loss": 0.6563, - "step": 42000 - }, - { - "epoch": 10.25, - "eval_cer": 0.14417420407995646, - "eval_loss": 0.4852425754070282, - "eval_runtime": 146.8969, - "eval_samples_per_second": 28.544, - "eval_steps_per_second": 7.141, - "eval_wer": 0.5690701468189233, - "step": 42000 - }, - { - "epoch": 10.26, - "learning_rate": 0.0004448775085255341, - "loss": 0.6437, - "step": 42025 - }, - { - "epoch": 10.26, - "learning_rate": 0.00044484430940517803, - "loss": 0.7146, - "step": 42050 - }, - { - "epoch": 10.27, - "learning_rate": 0.0004448111102848219, - "loss": 0.6791, - "step": 42075 - }, - { - "epoch": 10.27, - "learning_rate": 0.0004447779111644658, - "loss": 0.7027, - "step": 42100 - }, - { - "epoch": 10.28, - "learning_rate": 0.0004447447120441097, - "loss": 0.6643, - "step": 42125 - }, - { - "epoch": 10.29, - "learning_rate": 0.0004447115129237536, - "loss": 0.693, - "step": 42150 - }, - { - "epoch": 10.29, - "learning_rate": 0.00044467831380339744, - "loss": 0.6317, - "step": 42175 - }, - { - "epoch": 10.3, - "learning_rate": 0.00044464511468304135, - "loss": 0.72, - "step": 42200 - }, - { - "epoch": 10.3, - "learning_rate": 0.00044461191556268527, - "loss": 0.6405, - "step": 42225 - }, - { - "epoch": 10.31, - "learning_rate": 0.0004445787164423292, - "loss": 0.7249, - "step": 42250 - }, - { - "epoch": 10.32, - "learning_rate": 0.0004445455173219731, - "loss": 0.7042, - "step": 42275 - }, - { - "epoch": 10.32, - "learning_rate": 0.0004445123182016169, - "loss": 0.7549, - "step": 42300 - }, - { - "epoch": 10.33, - "learning_rate": 0.0004444791190812608, - "loss": 0.6494, - "step": 42325 - }, - { - "epoch": 10.33, - "learning_rate": 0.00044444591996090473, - "loss": 0.6912, - "step": 42350 - }, - { - "epoch": 10.34, - "learning_rate": 0.00044441272084054864, - "loss": 0.6709, - "step": 42375 - }, - { - "epoch": 10.35, - "learning_rate": 0.0004443795217201925, - "loss": 0.6731, - "step": 42400 - }, - { - "epoch": 10.35, - "learning_rate": 0.0004443463225998364, - "loss": 0.6616, - "step": 42425 - }, - { - "epoch": 10.36, - "learning_rate": 0.0004443131234794803, - "loss": 0.6595, - "step": 42450 - }, - { - "epoch": 10.36, - "learning_rate": 0.0004442799243591242, - "loss": 0.671, - "step": 42475 - }, - { - "epoch": 10.37, - "learning_rate": 0.0004442467252387681, - "loss": 0.7151, - "step": 42500 - }, - { - "epoch": 10.38, - "learning_rate": 0.00044421352611841196, - "loss": 0.7016, - "step": 42525 - }, - { - "epoch": 10.38, - "learning_rate": 0.0004441803269980559, - "loss": 0.6729, - "step": 42550 - }, - { - "epoch": 10.39, - "learning_rate": 0.0004441471278776998, - "loss": 0.6412, - "step": 42575 - }, - { - "epoch": 10.4, - "learning_rate": 0.00044411392875734365, - "loss": 0.6664, - "step": 42600 - }, - { - "epoch": 10.4, - "learning_rate": 0.0004440807296369875, - "loss": 0.6066, - "step": 42625 - }, - { - "epoch": 10.41, - "learning_rate": 0.0004440475305166314, - "loss": 0.7433, - "step": 42650 - }, - { - "epoch": 10.41, - "learning_rate": 0.00044401433139627534, - "loss": 0.6678, - "step": 42675 - }, - { - "epoch": 10.42, - "learning_rate": 0.00044398113227591925, - "loss": 0.7147, - "step": 42700 - }, - { - "epoch": 10.43, - "learning_rate": 0.00044394793315556317, - "loss": 0.6558, - "step": 42725 - }, - { - "epoch": 10.43, - "learning_rate": 0.00044391473403520697, - "loss": 0.7616, - "step": 42750 - }, - { - "epoch": 10.44, - "learning_rate": 0.0004438815349148509, - "loss": 0.6852, - "step": 42775 - }, - { - "epoch": 10.44, - "learning_rate": 0.0004438483357944948, - "loss": 0.6825, - "step": 42800 - }, - { - "epoch": 10.45, - "learning_rate": 0.0004438151366741387, - "loss": 0.6371, - "step": 42825 - }, - { - "epoch": 10.46, - "learning_rate": 0.0004437819375537826, - "loss": 0.6984, - "step": 42850 - }, - { - "epoch": 10.46, - "learning_rate": 0.0004437487384334265, - "loss": 0.64, - "step": 42875 - }, - { - "epoch": 10.47, - "learning_rate": 0.00044371553931307035, - "loss": 0.6893, - "step": 42900 - }, - { - "epoch": 10.47, - "learning_rate": 0.00044368234019271426, - "loss": 0.6656, - "step": 42925 - }, - { - "epoch": 10.48, - "learning_rate": 0.0004436491410723582, - "loss": 0.6727, - "step": 42950 - }, - { - "epoch": 10.49, - "learning_rate": 0.00044361594195200204, - "loss": 0.5953, - "step": 42975 - }, - { - "epoch": 10.49, - "learning_rate": 0.00044358274283164595, - "loss": 0.7229, - "step": 43000 - }, - { - "epoch": 10.5, - "learning_rate": 0.00044354954371128986, - "loss": 0.6533, - "step": 43025 - }, - { - "epoch": 10.51, - "learning_rate": 0.0004435163445909337, - "loss": 0.6537, - "step": 43050 - }, - { - "epoch": 10.51, - "learning_rate": 0.0004434831454705776, - "loss": 0.6482, - "step": 43075 - }, - { - "epoch": 10.52, - "learning_rate": 0.0004434499463502215, - "loss": 0.684, - "step": 43100 - }, - { - "epoch": 10.52, - "learning_rate": 0.0004434167472298654, - "loss": 0.5997, - "step": 43125 - }, - { - "epoch": 10.53, - "learning_rate": 0.0004433835481095093, - "loss": 0.6668, - "step": 43150 - }, - { - "epoch": 10.54, - "learning_rate": 0.00044335034898915324, - "loss": 0.6491, - "step": 43175 - }, - { - "epoch": 10.54, - "learning_rate": 0.00044331714986879704, - "loss": 0.7128, - "step": 43200 - }, - { - "epoch": 10.55, - "learning_rate": 0.00044328395074844096, - "loss": 0.6342, - "step": 43225 - }, - { - "epoch": 10.55, - "learning_rate": 0.00044325075162808487, - "loss": 0.6943, - "step": 43250 - }, - { - "epoch": 10.56, - "learning_rate": 0.0004432175525077288, - "loss": 0.6803, - "step": 43275 - }, - { - "epoch": 10.57, - "learning_rate": 0.0004431843533873727, - "loss": 0.7371, - "step": 43300 - }, - { - "epoch": 10.57, - "learning_rate": 0.00044315115426701656, - "loss": 0.6904, - "step": 43325 - }, - { - "epoch": 10.58, - "learning_rate": 0.0004431179551466604, - "loss": 0.6995, - "step": 43350 - }, - { - "epoch": 10.58, - "learning_rate": 0.00044308475602630433, - "loss": 0.6529, - "step": 43375 - }, - { - "epoch": 10.59, - "learning_rate": 0.00044305155690594825, - "loss": 0.7138, - "step": 43400 - }, - { - "epoch": 10.6, - "learning_rate": 0.0004430183577855921, - "loss": 0.6653, - "step": 43425 - }, - { - "epoch": 10.6, - "learning_rate": 0.000442985158665236, - "loss": 0.6868, - "step": 43450 - }, - { - "epoch": 10.61, - "learning_rate": 0.00044295195954487994, - "loss": 0.6545, - "step": 43475 - }, - { - "epoch": 10.61, - "learning_rate": 0.0004429187604245238, - "loss": 0.696, - "step": 43500 - }, - { - "epoch": 10.62, - "learning_rate": 0.0004428855613041677, - "loss": 0.6071, - "step": 43525 - }, - { - "epoch": 10.63, - "learning_rate": 0.00044285236218381157, - "loss": 0.6957, - "step": 43550 - }, - { - "epoch": 10.63, - "learning_rate": 0.0004428191630634555, - "loss": 0.6626, - "step": 43575 - }, - { - "epoch": 10.64, - "learning_rate": 0.0004427859639430994, - "loss": 0.706, - "step": 43600 - }, - { - "epoch": 10.65, - "learning_rate": 0.0004427527648227433, - "loss": 0.6271, - "step": 43625 - }, - { - "epoch": 10.65, - "learning_rate": 0.0004427195657023871, - "loss": 0.6782, - "step": 43650 - }, - { - "epoch": 10.66, - "learning_rate": 0.00044268636658203103, - "loss": 0.6682, - "step": 43675 - }, - { - "epoch": 10.66, - "learning_rate": 0.00044265316746167494, - "loss": 0.6901, - "step": 43700 - }, - { - "epoch": 10.67, - "learning_rate": 0.00044261996834131886, - "loss": 0.6317, - "step": 43725 - }, - { - "epoch": 10.68, - "learning_rate": 0.00044258676922096277, - "loss": 0.6766, - "step": 43750 - }, - { - "epoch": 10.68, - "learning_rate": 0.00044255357010060663, - "loss": 0.5699, - "step": 43775 - }, - { - "epoch": 10.69, - "learning_rate": 0.0004425203709802505, - "loss": 0.72, - "step": 43800 - }, - { - "epoch": 10.69, - "learning_rate": 0.0004424871718598944, - "loss": 0.635, - "step": 43825 - }, - { - "epoch": 10.7, - "learning_rate": 0.0004424539727395383, - "loss": 0.7373, - "step": 43850 - }, - { - "epoch": 10.71, - "learning_rate": 0.0004424207736191822, - "loss": 0.6996, - "step": 43875 - }, - { - "epoch": 10.71, - "learning_rate": 0.0004423875744988261, - "loss": 0.6847, - "step": 43900 - }, - { - "epoch": 10.72, - "learning_rate": 0.00044235570334328424, - "loss": 0.6777, - "step": 43925 - }, - { - "epoch": 10.72, - "learning_rate": 0.00044232250422292815, - "loss": 0.7208, - "step": 43950 - }, - { - "epoch": 10.73, - "learning_rate": 0.000442289305102572, - "loss": 0.6545, - "step": 43975 - }, - { - "epoch": 10.74, - "learning_rate": 0.00044225610598221587, - "loss": 0.6631, - "step": 44000 - }, - { - "epoch": 10.74, - "learning_rate": 0.0004422229068618598, - "loss": 0.6274, - "step": 44025 - }, - { - "epoch": 10.75, - "learning_rate": 0.0004421897077415037, - "loss": 0.688, - "step": 44050 - }, - { - "epoch": 10.76, - "learning_rate": 0.0004421565086211476, - "loss": 0.6188, - "step": 44075 - }, - { - "epoch": 10.76, - "learning_rate": 0.00044212330950079147, - "loss": 0.6948, - "step": 44100 - }, - { - "epoch": 10.77, - "learning_rate": 0.0004420901103804354, - "loss": 0.6858, - "step": 44125 - }, - { - "epoch": 10.77, - "learning_rate": 0.00044205691126007925, - "loss": 0.7341, - "step": 44150 - }, - { - "epoch": 10.78, - "learning_rate": 0.00044202371213972316, - "loss": 0.6184, - "step": 44175 - }, - { - "epoch": 10.79, - "learning_rate": 0.000441990513019367, - "loss": 0.6862, - "step": 44200 - }, - { - "epoch": 10.79, - "learning_rate": 0.00044195731389901093, - "loss": 0.6461, - "step": 44225 - }, - { - "epoch": 10.8, - "learning_rate": 0.00044192411477865485, - "loss": 0.7194, - "step": 44250 - }, - { - "epoch": 10.8, - "learning_rate": 0.00044189091565829876, - "loss": 0.6877, - "step": 44275 - }, - { - "epoch": 10.81, - "learning_rate": 0.0004418577165379426, - "loss": 0.7203, - "step": 44300 - }, - { - "epoch": 10.82, - "learning_rate": 0.0004418245174175865, - "loss": 0.6138, - "step": 44325 - }, - { - "epoch": 10.82, - "learning_rate": 0.0004417913182972304, - "loss": 0.7073, - "step": 44350 - }, - { - "epoch": 10.83, - "learning_rate": 0.0004417581191768743, - "loss": 0.6408, - "step": 44375 - }, - { - "epoch": 10.83, - "learning_rate": 0.0004417249200565182, - "loss": 0.6973, - "step": 44400 - }, - { - "epoch": 10.84, - "learning_rate": 0.00044169172093616214, - "loss": 0.6758, - "step": 44425 - }, - { - "epoch": 10.85, - "learning_rate": 0.00044165852181580594, - "loss": 0.717, - "step": 44450 - }, - { - "epoch": 10.85, - "learning_rate": 0.00044162532269544986, - "loss": 0.6669, - "step": 44475 - }, - { - "epoch": 10.86, - "learning_rate": 0.00044159212357509377, - "loss": 0.7094, - "step": 44500 - }, - { - "epoch": 10.87, - "learning_rate": 0.0004415589244547377, - "loss": 0.6459, - "step": 44525 - }, - { - "epoch": 10.87, - "learning_rate": 0.00044152572533438154, - "loss": 0.6706, - "step": 44550 - }, - { - "epoch": 10.88, - "learning_rate": 0.00044149252621402546, - "loss": 0.6072, - "step": 44575 - }, - { - "epoch": 10.88, - "learning_rate": 0.0004414593270936693, - "loss": 0.7027, - "step": 44600 - }, - { - "epoch": 10.89, - "learning_rate": 0.00044142612797331323, - "loss": 0.637, - "step": 44625 - }, - { - "epoch": 10.9, - "learning_rate": 0.00044139292885295715, - "loss": 0.7063, - "step": 44650 - }, - { - "epoch": 10.9, - "learning_rate": 0.000441359729732601, - "loss": 0.7203, - "step": 44675 - }, - { - "epoch": 10.91, - "learning_rate": 0.0004413265306122449, - "loss": 0.6884, - "step": 44700 - }, - { - "epoch": 10.91, - "learning_rate": 0.00044129333149188883, - "loss": 0.6446, - "step": 44725 - }, - { - "epoch": 10.92, - "learning_rate": 0.0004412601323715327, - "loss": 0.739, - "step": 44750 - }, - { - "epoch": 10.93, - "learning_rate": 0.00044122693325117655, - "loss": 0.6525, - "step": 44775 - }, - { - "epoch": 10.93, - "learning_rate": 0.00044119373413082047, - "loss": 0.7124, - "step": 44800 - }, - { - "epoch": 10.94, - "learning_rate": 0.0004411605350104644, - "loss": 0.6768, - "step": 44825 - }, - { - "epoch": 10.94, - "learning_rate": 0.0004411273358901083, - "loss": 0.7047, - "step": 44850 - }, - { - "epoch": 10.95, - "learning_rate": 0.00044109413676975216, - "loss": 0.6307, - "step": 44875 - }, - { - "epoch": 10.96, - "learning_rate": 0.000441060937649396, - "loss": 0.6887, - "step": 44900 - }, - { - "epoch": 10.96, - "learning_rate": 0.00044102773852903993, - "loss": 0.6407, - "step": 44925 - }, - { - "epoch": 10.97, - "learning_rate": 0.00044099453940868384, - "loss": 0.7153, - "step": 44950 - }, - { - "epoch": 10.97, - "learning_rate": 0.00044096134028832776, - "loss": 0.6612, - "step": 44975 - }, - { - "epoch": 10.98, - "learning_rate": 0.0004409281411679716, - "loss": 0.7166, - "step": 45000 - }, - { - "epoch": 10.98, - "eval_cer": 0.14372247261377985, - "eval_loss": 0.4731488525867462, - "eval_runtime": 144.4871, - "eval_samples_per_second": 29.02, - "eval_steps_per_second": 7.26, - "eval_wer": 0.5718433931484502, - "step": 45000 - }, - { - "epoch": 10.99, - "learning_rate": 0.0004408949420476155, - "loss": 0.6463, - "step": 45025 - }, - { - "epoch": 10.99, - "learning_rate": 0.0004408617429272594, - "loss": 0.7169, - "step": 45050 - }, - { - "epoch": 11.0, - "learning_rate": 0.0004408285438069033, - "loss": 0.6929, - "step": 45075 - }, - { - "epoch": 11.01, - "learning_rate": 0.0004407953446865472, - "loss": 0.7587, - "step": 45100 - }, - { - "epoch": 11.01, - "learning_rate": 0.0004407621455661911, - "loss": 0.6414, - "step": 45125 - }, - { - "epoch": 11.02, - "learning_rate": 0.000440728946445835, - "loss": 0.7008, - "step": 45150 - }, - { - "epoch": 11.02, - "learning_rate": 0.00044069574732547885, - "loss": 0.6039, - "step": 45175 - }, - { - "epoch": 11.03, - "learning_rate": 0.00044066254820512277, - "loss": 0.6642, - "step": 45200 - }, - { - "epoch": 11.04, - "learning_rate": 0.0004406293490847666, - "loss": 0.5708, - "step": 45225 - }, - { - "epoch": 11.04, - "learning_rate": 0.00044059614996441054, - "loss": 0.6622, - "step": 45250 - }, - { - "epoch": 11.05, - "learning_rate": 0.00044056295084405445, - "loss": 0.6563, - "step": 45275 - }, - { - "epoch": 11.05, - "learning_rate": 0.00044052975172369837, - "loss": 0.682, - "step": 45300 - }, - { - "epoch": 11.06, - "learning_rate": 0.00044049655260334223, - "loss": 0.6252, - "step": 45325 - }, - { - "epoch": 11.07, - "learning_rate": 0.0004404633534829861, - "loss": 0.6542, - "step": 45350 - }, - { - "epoch": 11.07, - "learning_rate": 0.00044043015436263, - "loss": 0.6675, - "step": 45375 - }, - { - "epoch": 11.08, - "learning_rate": 0.0004403969552422739, - "loss": 0.6733, - "step": 45400 - }, - { - "epoch": 11.08, - "learning_rate": 0.00044036375612191783, - "loss": 0.603, - "step": 45425 - }, - { - "epoch": 11.09, - "learning_rate": 0.0004403305570015617, - "loss": 0.6562, - "step": 45450 - }, - { - "epoch": 11.1, - "learning_rate": 0.00044029735788120555, - "loss": 0.6738, - "step": 45475 - }, - { - "epoch": 11.1, - "learning_rate": 0.00044026415876084946, - "loss": 0.6869, - "step": 45500 - }, - { - "epoch": 11.11, - "learning_rate": 0.0004402309596404934, - "loss": 0.639, - "step": 45525 - }, - { - "epoch": 11.12, - "learning_rate": 0.0004401977605201373, - "loss": 0.6751, - "step": 45550 - }, - { - "epoch": 11.12, - "learning_rate": 0.00044016456139978115, - "loss": 0.5983, - "step": 45575 - }, - { - "epoch": 11.13, - "learning_rate": 0.00044013136227942506, - "loss": 0.6827, - "step": 45600 - }, - { - "epoch": 11.13, - "learning_rate": 0.0004400981631590689, - "loss": 0.6128, - "step": 45625 - }, - { - "epoch": 11.14, - "learning_rate": 0.00044006496403871284, - "loss": 0.6782, - "step": 45650 - }, - { - "epoch": 11.15, - "learning_rate": 0.0004400317649183567, - "loss": 0.6196, - "step": 45675 - }, - { - "epoch": 11.15, - "learning_rate": 0.0004399985657980006, - "loss": 0.6424, - "step": 45700 - }, - { - "epoch": 11.16, - "learning_rate": 0.0004399653666776445, - "loss": 0.5857, - "step": 45725 - }, - { - "epoch": 11.16, - "learning_rate": 0.00043993216755728844, - "loss": 0.6674, - "step": 45750 - }, - { - "epoch": 11.17, - "learning_rate": 0.0004398989684369323, - "loss": 0.6245, - "step": 45775 - }, - { - "epoch": 11.18, - "learning_rate": 0.00043986576931657616, - "loss": 0.6766, - "step": 45800 - }, - { - "epoch": 11.18, - "learning_rate": 0.0004398325701962201, - "loss": 0.64, - "step": 45825 - }, - { - "epoch": 11.19, - "learning_rate": 0.000439799371075864, - "loss": 0.6693, - "step": 45850 - }, - { - "epoch": 11.19, - "learning_rate": 0.00043976749992032213, - "loss": 0.654, - "step": 45875 - }, - { - "epoch": 11.2, - "learning_rate": 0.000439734300799966, - "loss": 0.6695, - "step": 45900 - }, - { - "epoch": 11.21, - "learning_rate": 0.0004397011016796099, - "loss": 0.6548, - "step": 45925 - }, - { - "epoch": 11.21, - "learning_rate": 0.0004396679025592538, - "loss": 0.6577, - "step": 45950 - }, - { - "epoch": 11.22, - "learning_rate": 0.0004396347034388977, - "loss": 0.5869, - "step": 45975 - }, - { - "epoch": 11.22, - "learning_rate": 0.0004396015043185416, - "loss": 0.6876, - "step": 46000 - }, - { - "epoch": 11.23, - "learning_rate": 0.00043956830519818545, - "loss": 0.5679, - "step": 46025 - }, - { - "epoch": 11.24, - "learning_rate": 0.00043953510607782937, - "loss": 0.6973, - "step": 46050 - }, - { - "epoch": 11.24, - "learning_rate": 0.0004395019069574733, - "loss": 0.6237, - "step": 46075 - }, - { - "epoch": 11.25, - "learning_rate": 0.0004394687078371172, - "loss": 0.6779, - "step": 46100 - }, - { - "epoch": 11.26, - "learning_rate": 0.000439435508716761, - "loss": 0.6205, - "step": 46125 - }, - { - "epoch": 11.26, - "learning_rate": 0.0004394023095964049, - "loss": 0.6393, - "step": 46150 - }, - { - "epoch": 11.27, - "learning_rate": 0.00043936911047604883, - "loss": 0.6353, - "step": 46175 - }, - { - "epoch": 11.27, - "learning_rate": 0.00043933591135569274, - "loss": 0.6752, - "step": 46200 - }, - { - "epoch": 11.28, - "learning_rate": 0.00043930271223533666, - "loss": 0.6567, - "step": 46225 - }, - { - "epoch": 11.29, - "learning_rate": 0.0004392695131149805, - "loss": 0.6625, - "step": 46250 - }, - { - "epoch": 11.29, - "learning_rate": 0.0004392363139946244, - "loss": 0.6082, - "step": 46275 - }, - { - "epoch": 11.3, - "learning_rate": 0.0004392031148742683, - "loss": 0.6796, - "step": 46300 - }, - { - "epoch": 11.3, - "learning_rate": 0.0004391699157539122, - "loss": 0.6016, - "step": 46325 - }, - { - "epoch": 11.31, - "learning_rate": 0.00043913671663355606, - "loss": 0.6826, - "step": 46350 - }, - { - "epoch": 11.32, - "learning_rate": 0.0004391035175132, - "loss": 0.6277, - "step": 46375 - }, - { - "epoch": 11.32, - "learning_rate": 0.0004390703183928439, - "loss": 0.705, - "step": 46400 - }, - { - "epoch": 11.33, - "learning_rate": 0.00043903711927248775, - "loss": 0.6284, - "step": 46425 - }, - { - "epoch": 11.33, - "learning_rate": 0.00043900392015213167, - "loss": 0.6422, - "step": 46450 - }, - { - "epoch": 11.34, - "learning_rate": 0.0004389707210317755, - "loss": 0.6124, - "step": 46475 - }, - { - "epoch": 11.35, - "learning_rate": 0.00043893752191141944, - "loss": 0.7005, - "step": 46500 - }, - { - "epoch": 11.35, - "learning_rate": 0.00043890432279106335, - "loss": 0.638, - "step": 46525 - }, - { - "epoch": 11.36, - "learning_rate": 0.00043887112367070727, - "loss": 0.6668, - "step": 46550 - }, - { - "epoch": 11.37, - "learning_rate": 0.00043883792455035107, - "loss": 0.629, - "step": 46575 - }, - { - "epoch": 11.37, - "learning_rate": 0.000438804725429995, - "loss": 0.6606, - "step": 46600 - }, - { - "epoch": 11.38, - "learning_rate": 0.0004387715263096389, - "loss": 0.622, - "step": 46625 - }, - { - "epoch": 11.38, - "learning_rate": 0.0004387383271892828, - "loss": 0.6692, - "step": 46650 - }, - { - "epoch": 11.39, - "learning_rate": 0.00043870512806892673, - "loss": 0.6024, - "step": 46675 - }, - { - "epoch": 11.4, - "learning_rate": 0.0004386719289485706, - "loss": 0.6572, - "step": 46700 - }, - { - "epoch": 11.4, - "learning_rate": 0.00043863872982821445, - "loss": 0.6421, - "step": 46725 - }, - { - "epoch": 11.41, - "learning_rate": 0.00043860553070785836, - "loss": 0.6752, - "step": 46750 - }, - { - "epoch": 11.41, - "learning_rate": 0.0004385723315875023, - "loss": 0.6175, - "step": 46775 - }, - { - "epoch": 11.42, - "learning_rate": 0.00043853913246714614, - "loss": 0.7093, - "step": 46800 - }, - { - "epoch": 11.43, - "learning_rate": 0.00043850593334679005, - "loss": 0.6018, - "step": 46825 - }, - { - "epoch": 11.43, - "learning_rate": 0.00043847273422643396, - "loss": 0.7242, - "step": 46850 - }, - { - "epoch": 11.44, - "learning_rate": 0.0004384395351060778, - "loss": 0.6118, - "step": 46875 - }, - { - "epoch": 11.44, - "learning_rate": 0.00043840633598572174, - "loss": 0.6412, - "step": 46900 - }, - { - "epoch": 11.45, - "learning_rate": 0.0004383731368653656, - "loss": 0.6692, - "step": 46925 - }, - { - "epoch": 11.46, - "learning_rate": 0.0004383399377450095, - "loss": 0.6875, - "step": 46950 - }, - { - "epoch": 11.46, - "learning_rate": 0.0004383067386246534, - "loss": 0.6527, - "step": 46975 - }, - { - "epoch": 11.47, - "learning_rate": 0.00043827353950429734, - "loss": 0.6862, - "step": 47000 - }, - { - "epoch": 11.48, - "learning_rate": 0.00043824034038394114, - "loss": 0.6665, - "step": 47025 - }, - { - "epoch": 11.48, - "learning_rate": 0.00043820714126358506, - "loss": 0.6639, - "step": 47050 - }, - { - "epoch": 11.49, - "learning_rate": 0.00043817394214322897, - "loss": 0.6384, - "step": 47075 - }, - { - "epoch": 11.49, - "learning_rate": 0.0004381407430228729, - "loss": 0.6528, - "step": 47100 - }, - { - "epoch": 11.5, - "learning_rate": 0.0004381075439025168, - "loss": 0.6745, - "step": 47125 - }, - { - "epoch": 11.51, - "learning_rate": 0.00043807434478216066, - "loss": 0.671, - "step": 47150 - }, - { - "epoch": 11.51, - "learning_rate": 0.0004380411456618045, - "loss": 0.6352, - "step": 47175 - }, - { - "epoch": 11.52, - "learning_rate": 0.00043800794654144843, - "loss": 0.645, - "step": 47200 - }, - { - "epoch": 11.52, - "learning_rate": 0.00043797474742109235, - "loss": 0.6738, - "step": 47225 - }, - { - "epoch": 11.53, - "learning_rate": 0.00043794154830073626, - "loss": 0.6946, - "step": 47250 - }, - { - "epoch": 11.54, - "learning_rate": 0.0004379083491803801, - "loss": 0.6427, - "step": 47275 - }, - { - "epoch": 11.54, - "learning_rate": 0.00043787515006002404, - "loss": 0.6668, - "step": 47300 - }, - { - "epoch": 11.55, - "learning_rate": 0.0004378419509396679, - "loss": 0.6233, - "step": 47325 - }, - { - "epoch": 11.55, - "learning_rate": 0.0004378087518193118, - "loss": 0.6855, - "step": 47350 - }, - { - "epoch": 11.56, - "learning_rate": 0.00043777555269895567, - "loss": 0.6396, - "step": 47375 - }, - { - "epoch": 11.57, - "learning_rate": 0.0004377423535785996, - "loss": 0.6812, - "step": 47400 - }, - { - "epoch": 11.57, - "learning_rate": 0.0004377091544582435, - "loss": 0.626, - "step": 47425 - }, - { - "epoch": 11.58, - "learning_rate": 0.0004376759553378874, - "loss": 0.655, - "step": 47450 - }, - { - "epoch": 11.58, - "learning_rate": 0.00043764275621753127, - "loss": 0.6244, - "step": 47475 - }, - { - "epoch": 11.59, - "learning_rate": 0.00043760955709717513, - "loss": 0.6704, - "step": 47500 - }, - { - "epoch": 11.6, - "learning_rate": 0.00043757635797681904, - "loss": 0.6312, - "step": 47525 - }, - { - "epoch": 11.6, - "learning_rate": 0.00043754315885646296, - "loss": 0.7087, - "step": 47550 - }, - { - "epoch": 11.61, - "learning_rate": 0.00043750995973610687, - "loss": 0.5872, - "step": 47575 - }, - { - "epoch": 11.62, - "learning_rate": 0.00043747676061575073, - "loss": 0.655, - "step": 47600 - }, - { - "epoch": 11.62, - "learning_rate": 0.0004374435614953946, - "loss": 0.6432, - "step": 47625 - }, - { - "epoch": 11.63, - "learning_rate": 0.0004374103623750385, - "loss": 0.6731, - "step": 47650 - }, - { - "epoch": 11.63, - "learning_rate": 0.0004373771632546824, - "loss": 0.6227, - "step": 47675 - }, - { - "epoch": 11.64, - "learning_rate": 0.00043734396413432633, - "loss": 0.7036, - "step": 47700 - }, - { - "epoch": 11.65, - "learning_rate": 0.0004373107650139702, - "loss": 0.6288, - "step": 47725 - }, - { - "epoch": 11.65, - "learning_rate": 0.0004372775658936141, - "loss": 0.659, - "step": 47750 - }, - { - "epoch": 11.66, - "learning_rate": 0.00043724436677325797, - "loss": 0.6138, - "step": 47775 - }, - { - "epoch": 11.66, - "learning_rate": 0.0004372111676529019, - "loss": 0.6878, - "step": 47800 - }, - { - "epoch": 11.67, - "learning_rate": 0.00043717796853254574, - "loss": 0.6326, - "step": 47825 - }, - { - "epoch": 11.68, - "learning_rate": 0.00043714476941218966, - "loss": 0.6692, - "step": 47850 - }, - { - "epoch": 11.68, - "learning_rate": 0.00043711157029183357, - "loss": 0.6122, - "step": 47875 - }, - { - "epoch": 11.69, - "learning_rate": 0.0004370783711714775, - "loss": 0.7086, - "step": 47900 - }, - { - "epoch": 11.69, - "learning_rate": 0.00043704517205112134, - "loss": 0.6116, - "step": 47925 - }, - { - "epoch": 11.7, - "learning_rate": 0.0004370119729307652, - "loss": 0.6945, - "step": 47950 - }, - { - "epoch": 11.71, - "learning_rate": 0.0004369787738104091, - "loss": 0.5723, - "step": 47975 - }, - { - "epoch": 11.71, - "learning_rate": 0.00043694557469005303, - "loss": 0.6627, - "step": 48000 - }, - { - "epoch": 11.71, - "eval_cer": 0.14209521267312095, - "eval_loss": 0.47871026396751404, - "eval_runtime": 145.6062, - "eval_samples_per_second": 28.797, - "eval_steps_per_second": 7.204, - "eval_wer": 0.559510603588907, - "step": 48000 - }, - { - "epoch": 11.72, - "learning_rate": 0.00043691237556969694, - "loss": 0.5936, - "step": 48025 - }, - { - "epoch": 11.73, - "learning_rate": 0.0004368791764493408, - "loss": 0.6948, - "step": 48050 - }, - { - "epoch": 11.73, - "learning_rate": 0.00043684597732898466, - "loss": 0.6084, - "step": 48075 - }, - { - "epoch": 11.74, - "learning_rate": 0.0004368127782086286, - "loss": 0.6846, - "step": 48100 - }, - { - "epoch": 11.74, - "learning_rate": 0.0004367795790882725, - "loss": 0.6348, - "step": 48125 - }, - { - "epoch": 11.75, - "learning_rate": 0.0004367463799679164, - "loss": 0.6736, - "step": 48150 - }, - { - "epoch": 11.76, - "learning_rate": 0.00043671318084756027, - "loss": 0.6213, - "step": 48175 - }, - { - "epoch": 11.76, - "learning_rate": 0.0004366799817272042, - "loss": 0.7163, - "step": 48200 - }, - { - "epoch": 11.77, - "learning_rate": 0.00043664678260684804, - "loss": 0.6381, - "step": 48225 - }, - { - "epoch": 11.77, - "learning_rate": 0.00043661358348649195, - "loss": 0.7344, - "step": 48250 - }, - { - "epoch": 11.78, - "learning_rate": 0.00043658038436613587, - "loss": 0.6165, - "step": 48275 - }, - { - "epoch": 11.79, - "learning_rate": 0.00043654718524577973, - "loss": 0.6836, - "step": 48300 - }, - { - "epoch": 11.79, - "learning_rate": 0.00043651398612542364, - "loss": 0.6184, - "step": 48325 - }, - { - "epoch": 11.8, - "learning_rate": 0.00043648078700506756, - "loss": 0.7038, - "step": 48350 - }, - { - "epoch": 11.8, - "learning_rate": 0.0004364475878847114, - "loss": 0.6353, - "step": 48375 - }, - { - "epoch": 11.81, - "learning_rate": 0.0004364143887643553, - "loss": 0.6672, - "step": 48400 - }, - { - "epoch": 11.82, - "learning_rate": 0.0004363811896439992, - "loss": 0.613, - "step": 48425 - }, - { - "epoch": 11.82, - "learning_rate": 0.0004363479905236431, - "loss": 0.7012, - "step": 48450 - }, - { - "epoch": 11.83, - "learning_rate": 0.000436314791403287, - "loss": 0.6223, - "step": 48475 - }, - { - "epoch": 11.84, - "learning_rate": 0.00043628159228293093, - "loss": 0.6902, - "step": 48500 - }, - { - "epoch": 11.84, - "learning_rate": 0.00043624839316257474, - "loss": 0.5867, - "step": 48525 - }, - { - "epoch": 11.85, - "learning_rate": 0.00043621519404221865, - "loss": 0.6947, - "step": 48550 - }, - { - "epoch": 11.85, - "learning_rate": 0.00043618199492186256, - "loss": 0.6178, - "step": 48575 - }, - { - "epoch": 11.86, - "learning_rate": 0.0004361487958015065, - "loss": 0.6746, - "step": 48600 - }, - { - "epoch": 11.87, - "learning_rate": 0.00043611559668115034, - "loss": 0.6568, - "step": 48625 - }, - { - "epoch": 11.87, - "learning_rate": 0.00043608239756079425, - "loss": 0.6817, - "step": 48650 - }, - { - "epoch": 11.88, - "learning_rate": 0.0004360491984404381, - "loss": 0.6562, - "step": 48675 - }, - { - "epoch": 11.88, - "learning_rate": 0.000436015999320082, - "loss": 0.6814, - "step": 48700 - }, - { - "epoch": 11.89, - "learning_rate": 0.0004359841281645401, - "loss": 0.6593, - "step": 48725 - }, - { - "epoch": 11.9, - "learning_rate": 0.00043595092904418403, - "loss": 0.7107, - "step": 48750 - }, - { - "epoch": 11.9, - "learning_rate": 0.00043591772992382794, - "loss": 0.6651, - "step": 48775 - }, - { - "epoch": 11.91, - "learning_rate": 0.00043588453080347186, - "loss": 0.7025, - "step": 48800 - }, - { - "epoch": 11.91, - "learning_rate": 0.00043585133168311577, - "loss": 0.638, - "step": 48825 - }, - { - "epoch": 11.92, - "learning_rate": 0.00043581813256275963, - "loss": 0.6696, - "step": 48850 - }, - { - "epoch": 11.93, - "learning_rate": 0.0004357849334424035, - "loss": 0.6291, - "step": 48875 - }, - { - "epoch": 11.93, - "learning_rate": 0.0004357517343220474, - "loss": 0.6475, - "step": 48900 - }, - { - "epoch": 11.94, - "learning_rate": 0.0004357185352016913, - "loss": 0.6309, - "step": 48925 - }, - { - "epoch": 11.94, - "learning_rate": 0.0004356853360813352, - "loss": 0.6623, - "step": 48950 - }, - { - "epoch": 11.95, - "learning_rate": 0.0004356521369609791, - "loss": 0.6565, - "step": 48975 - }, - { - "epoch": 11.96, - "learning_rate": 0.000435618937840623, - "loss": 0.6518, - "step": 49000 - }, - { - "epoch": 11.96, - "learning_rate": 0.00043558573872026687, - "loss": 0.6328, - "step": 49025 - }, - { - "epoch": 11.97, - "learning_rate": 0.0004355525395999108, - "loss": 0.6526, - "step": 49050 - }, - { - "epoch": 11.98, - "learning_rate": 0.00043551934047955464, - "loss": 0.6355, - "step": 49075 - }, - { - "epoch": 11.98, - "learning_rate": 0.00043548614135919855, - "loss": 0.7023, - "step": 49100 - }, - { - "epoch": 11.99, - "learning_rate": 0.00043545294223884247, - "loss": 0.6291, - "step": 49125 - }, - { - "epoch": 11.99, - "learning_rate": 0.0004354197431184864, - "loss": 0.6556, - "step": 49150 - }, - { - "epoch": 12.0, - "learning_rate": 0.0004353865439981302, - "loss": 0.631, - "step": 49175 - }, - { - "epoch": 12.01, - "learning_rate": 0.0004353533448777741, - "loss": 0.69, - "step": 49200 - }, - { - "epoch": 12.01, - "learning_rate": 0.000435320145757418, - "loss": 0.5947, - "step": 49225 - }, - { - "epoch": 12.02, - "learning_rate": 0.00043528694663706193, - "loss": 0.6668, - "step": 49250 - }, - { - "epoch": 12.02, - "learning_rate": 0.00043525374751670584, - "loss": 0.6321, - "step": 49275 - }, - { - "epoch": 12.03, - "learning_rate": 0.0004352205483963497, - "loss": 0.644, - "step": 49300 - }, - { - "epoch": 12.04, - "learning_rate": 0.00043518734927599356, - "loss": 0.628, - "step": 49325 - }, - { - "epoch": 12.04, - "learning_rate": 0.0004351541501556375, - "loss": 0.639, - "step": 49350 - }, - { - "epoch": 12.05, - "learning_rate": 0.0004351209510352814, - "loss": 0.5915, - "step": 49375 - }, - { - "epoch": 12.05, - "learning_rate": 0.00043508775191492525, - "loss": 0.6678, - "step": 49400 - }, - { - "epoch": 12.06, - "learning_rate": 0.00043505455279456917, - "loss": 0.6273, - "step": 49425 - }, - { - "epoch": 12.07, - "learning_rate": 0.0004350213536742131, - "loss": 0.6117, - "step": 49450 - }, - { - "epoch": 12.07, - "learning_rate": 0.00043498815455385694, - "loss": 0.5568, - "step": 49475 - }, - { - "epoch": 12.08, - "learning_rate": 0.00043495495543350085, - "loss": 0.6563, - "step": 49500 - }, - { - "epoch": 12.09, - "learning_rate": 0.0004349217563131447, - "loss": 0.5866, - "step": 49525 - }, - { - "epoch": 12.09, - "learning_rate": 0.0004348885571927886, - "loss": 0.6908, - "step": 49550 - }, - { - "epoch": 12.1, - "learning_rate": 0.00043485535807243254, - "loss": 0.6039, - "step": 49575 - }, - { - "epoch": 12.1, - "learning_rate": 0.00043482215895207645, - "loss": 0.6675, - "step": 49600 - }, - { - "epoch": 12.11, - "learning_rate": 0.0004347889598317203, - "loss": 0.5785, - "step": 49625 - }, - { - "epoch": 12.12, - "learning_rate": 0.0004347557607113642, - "loss": 0.6426, - "step": 49650 - }, - { - "epoch": 12.12, - "learning_rate": 0.0004347225615910081, - "loss": 0.658, - "step": 49675 - }, - { - "epoch": 12.13, - "learning_rate": 0.000434689362470652, - "loss": 0.6528, - "step": 49700 - }, - { - "epoch": 12.13, - "learning_rate": 0.0004346561633502959, - "loss": 0.5638, - "step": 49725 - }, - { - "epoch": 12.14, - "learning_rate": 0.0004346229642299398, - "loss": 0.6568, - "step": 49750 - }, - { - "epoch": 12.15, - "learning_rate": 0.00043458976510958364, - "loss": 0.6403, - "step": 49775 - }, - { - "epoch": 12.15, - "learning_rate": 0.00043455656598922755, - "loss": 0.6668, - "step": 49800 - }, - { - "epoch": 12.16, - "learning_rate": 0.00043452336686887146, - "loss": 0.6377, - "step": 49825 - }, - { - "epoch": 12.16, - "learning_rate": 0.0004344901677485154, - "loss": 0.6156, - "step": 49850 - }, - { - "epoch": 12.17, - "learning_rate": 0.00043445696862815924, - "loss": 0.5868, - "step": 49875 - }, - { - "epoch": 12.18, - "learning_rate": 0.00043442376950780315, - "loss": 0.6497, - "step": 49900 - }, - { - "epoch": 12.18, - "learning_rate": 0.000434390570387447, - "loss": 0.618, - "step": 49925 - }, - { - "epoch": 12.19, - "learning_rate": 0.0004343573712670909, - "loss": 0.6685, - "step": 49950 - }, - { - "epoch": 12.19, - "learning_rate": 0.0004343241721467348, - "loss": 0.6276, - "step": 49975 - }, - { - "epoch": 12.2, - "learning_rate": 0.0004342909730263787, - "loss": 0.6609, - "step": 50000 - }, - { - "epoch": 12.21, - "learning_rate": 0.0004342577739060226, - "loss": 0.5746, - "step": 50025 - }, - { - "epoch": 12.21, - "learning_rate": 0.0004342245747856665, - "loss": 0.6416, - "step": 50050 - }, - { - "epoch": 12.22, - "learning_rate": 0.0004341913756653104, - "loss": 0.5834, - "step": 50075 - }, - { - "epoch": 12.23, - "learning_rate": 0.00043415817654495425, - "loss": 0.6515, - "step": 50100 - }, - { - "epoch": 12.23, - "learning_rate": 0.00043412497742459816, - "loss": 0.5516, - "step": 50125 - }, - { - "epoch": 12.24, - "learning_rate": 0.0004340917783042421, - "loss": 0.6494, - "step": 50150 - }, - { - "epoch": 12.24, - "learning_rate": 0.000434058579183886, - "loss": 0.5935, - "step": 50175 - }, - { - "epoch": 12.25, - "learning_rate": 0.00043402538006352985, - "loss": 0.6556, - "step": 50200 - }, - { - "epoch": 12.26, - "learning_rate": 0.0004339921809431737, - "loss": 0.6083, - "step": 50225 - }, - { - "epoch": 12.26, - "learning_rate": 0.0004339589818228176, - "loss": 0.6471, - "step": 50250 - }, - { - "epoch": 12.27, - "learning_rate": 0.00043392711066727577, - "loss": 0.5967, - "step": 50275 - }, - { - "epoch": 12.27, - "learning_rate": 0.0004338939115469196, - "loss": 0.6667, - "step": 50300 - }, - { - "epoch": 12.28, - "learning_rate": 0.00043386071242656354, - "loss": 0.5851, - "step": 50325 - }, - { - "epoch": 12.29, - "learning_rate": 0.00043382751330620745, - "loss": 0.683, - "step": 50350 - }, - { - "epoch": 12.29, - "learning_rate": 0.00043379431418585137, - "loss": 0.6329, - "step": 50375 - }, - { - "epoch": 12.3, - "learning_rate": 0.0004337611150654953, - "loss": 0.64, - "step": 50400 - }, - { - "epoch": 12.3, - "learning_rate": 0.0004337279159451391, - "loss": 0.6474, - "step": 50425 - }, - { - "epoch": 12.31, - "learning_rate": 0.000433694716824783, - "loss": 0.6692, - "step": 50450 - }, - { - "epoch": 12.32, - "learning_rate": 0.0004336615177044269, - "loss": 0.6072, - "step": 50475 - }, - { - "epoch": 12.32, - "learning_rate": 0.00043362831858407083, - "loss": 0.6352, - "step": 50500 - }, - { - "epoch": 12.33, - "learning_rate": 0.0004335951194637147, - "loss": 0.5983, - "step": 50525 - }, - { - "epoch": 12.34, - "learning_rate": 0.0004335619203433586, - "loss": 0.6722, - "step": 50550 - }, - { - "epoch": 12.34, - "learning_rate": 0.00043352872122300246, - "loss": 0.6317, - "step": 50575 - }, - { - "epoch": 12.35, - "learning_rate": 0.0004334955221026464, - "loss": 0.6641, - "step": 50600 - }, - { - "epoch": 12.35, - "learning_rate": 0.0004334623229822903, - "loss": 0.613, - "step": 50625 - }, - { - "epoch": 12.36, - "learning_rate": 0.00043342912386193415, - "loss": 0.638, - "step": 50650 - }, - { - "epoch": 12.37, - "learning_rate": 0.00043339592474157806, - "loss": 0.5691, - "step": 50675 - }, - { - "epoch": 12.37, - "learning_rate": 0.000433362725621222, - "loss": 0.638, - "step": 50700 - }, - { - "epoch": 12.38, - "learning_rate": 0.00043332952650086584, - "loss": 0.6625, - "step": 50725 - }, - { - "epoch": 12.38, - "learning_rate": 0.0004332963273805097, - "loss": 0.6371, - "step": 50750 - }, - { - "epoch": 12.39, - "learning_rate": 0.0004332631282601536, - "loss": 0.5906, - "step": 50775 - }, - { - "epoch": 12.4, - "learning_rate": 0.0004332299291397975, - "loss": 0.6377, - "step": 50800 - }, - { - "epoch": 12.4, - "learning_rate": 0.00043319673001944144, - "loss": 0.5568, - "step": 50825 - }, - { - "epoch": 12.41, - "learning_rate": 0.00043316353089908535, - "loss": 0.6468, - "step": 50850 - }, - { - "epoch": 12.41, - "learning_rate": 0.00043313033177872916, - "loss": 0.5864, - "step": 50875 - }, - { - "epoch": 12.42, - "learning_rate": 0.0004330971326583731, - "loss": 0.6945, - "step": 50900 - }, - { - "epoch": 12.43, - "learning_rate": 0.000433063933538017, - "loss": 0.6353, - "step": 50925 - }, - { - "epoch": 12.43, - "learning_rate": 0.0004330307344176609, - "loss": 0.689, - "step": 50950 - }, - { - "epoch": 12.44, - "learning_rate": 0.0004329975352973048, - "loss": 0.6057, - "step": 50975 - }, - { - "epoch": 12.45, - "learning_rate": 0.0004329643361769487, - "loss": 0.6642, - "step": 51000 - }, - { - "epoch": 12.45, - "eval_cer": 0.135288440807778, - "eval_loss": 0.4786597192287445, - "eval_runtime": 145.9643, - "eval_samples_per_second": 28.726, - "eval_steps_per_second": 7.187, - "eval_wer": 0.5417292006525285, - "step": 51000 - }, - { - "epoch": 12.45, - "learning_rate": 0.00043293113705659254, - "loss": 0.5972, - "step": 51025 - }, - { - "epoch": 12.46, - "learning_rate": 0.00043289793793623645, - "loss": 0.6796, - "step": 51050 - }, - { - "epoch": 12.46, - "learning_rate": 0.00043286473881588036, - "loss": 0.5829, - "step": 51075 - }, - { - "epoch": 12.47, - "learning_rate": 0.0004328315396955242, - "loss": 0.6555, - "step": 51100 - }, - { - "epoch": 12.48, - "learning_rate": 0.00043279834057516814, - "loss": 0.638, - "step": 51125 - }, - { - "epoch": 12.48, - "learning_rate": 0.000432765141454812, - "loss": 0.6506, - "step": 51150 - }, - { - "epoch": 12.49, - "learning_rate": 0.0004327319423344559, - "loss": 0.5731, - "step": 51175 - }, - { - "epoch": 12.49, - "learning_rate": 0.0004326987432140998, - "loss": 0.6235, - "step": 51200 - }, - { - "epoch": 12.5, - "learning_rate": 0.0004326655440937437, - "loss": 0.6339, - "step": 51225 - }, - { - "epoch": 12.51, - "learning_rate": 0.0004326323449733876, - "loss": 0.6643, - "step": 51250 - }, - { - "epoch": 12.51, - "learning_rate": 0.0004325991458530315, - "loss": 0.6002, - "step": 51275 - }, - { - "epoch": 12.52, - "learning_rate": 0.00043256594673267537, - "loss": 0.6213, - "step": 51300 - }, - { - "epoch": 12.52, - "learning_rate": 0.00043253274761231923, - "loss": 0.6105, - "step": 51325 - }, - { - "epoch": 12.53, - "learning_rate": 0.00043249954849196315, - "loss": 0.6795, - "step": 51350 - }, - { - "epoch": 12.54, - "learning_rate": 0.00043246634937160706, - "loss": 0.6539, - "step": 51375 - }, - { - "epoch": 12.54, - "learning_rate": 0.000432433150251251, - "loss": 0.6513, - "step": 51400 - }, - { - "epoch": 12.55, - "learning_rate": 0.0004323999511308949, - "loss": 0.6141, - "step": 51425 - }, - { - "epoch": 12.55, - "learning_rate": 0.0004323667520105387, - "loss": 0.6625, - "step": 51450 - }, - { - "epoch": 12.56, - "learning_rate": 0.0004323335528901826, - "loss": 0.601, - "step": 51475 - }, - { - "epoch": 12.57, - "learning_rate": 0.0004323003537698265, - "loss": 0.6888, - "step": 51500 - }, - { - "epoch": 12.57, - "learning_rate": 0.00043226715464947044, - "loss": 0.6562, - "step": 51525 - }, - { - "epoch": 12.58, - "learning_rate": 0.0004322339555291143, - "loss": 0.6252, - "step": 51550 - }, - { - "epoch": 12.59, - "learning_rate": 0.0004322007564087582, - "loss": 0.6727, - "step": 51575 - }, - { - "epoch": 12.59, - "learning_rate": 0.00043216755728840207, - "loss": 0.6696, - "step": 51600 - }, - { - "epoch": 12.6, - "learning_rate": 0.000432134358168046, - "loss": 0.5774, - "step": 51625 - }, - { - "epoch": 12.6, - "learning_rate": 0.0004321011590476899, - "loss": 0.6587, - "step": 51650 - }, - { - "epoch": 12.61, - "learning_rate": 0.00043206795992733376, - "loss": 0.5901, - "step": 51675 - }, - { - "epoch": 12.62, - "learning_rate": 0.00043203476080697767, - "loss": 0.66, - "step": 51700 - }, - { - "epoch": 12.62, - "learning_rate": 0.0004320015616866216, - "loss": 0.6307, - "step": 51725 - }, - { - "epoch": 12.63, - "learning_rate": 0.00043196836256626544, - "loss": 0.6557, - "step": 51750 - }, - { - "epoch": 12.63, - "learning_rate": 0.0004319351634459093, - "loss": 0.6062, - "step": 51775 - }, - { - "epoch": 12.64, - "learning_rate": 0.0004319019643255532, - "loss": 0.6771, - "step": 51800 - }, - { - "epoch": 12.65, - "learning_rate": 0.00043186876520519713, - "loss": 0.5835, - "step": 51825 - }, - { - "epoch": 12.65, - "learning_rate": 0.00043183556608484105, - "loss": 0.6817, - "step": 51850 - }, - { - "epoch": 12.66, - "learning_rate": 0.00043180236696448496, - "loss": 0.5813, - "step": 51875 - }, - { - "epoch": 12.66, - "learning_rate": 0.00043176916784412877, - "loss": 0.6822, - "step": 51900 - }, - { - "epoch": 12.67, - "learning_rate": 0.0004317359687237727, - "loss": 0.624, - "step": 51925 - }, - { - "epoch": 12.68, - "learning_rate": 0.0004317027696034166, - "loss": 0.6184, - "step": 51950 - }, - { - "epoch": 12.68, - "learning_rate": 0.0004316695704830605, - "loss": 0.5797, - "step": 51975 - }, - { - "epoch": 12.69, - "learning_rate": 0.0004316363713627044, - "loss": 0.6656, - "step": 52000 - }, - { - "epoch": 12.7, - "learning_rate": 0.0004316031722423483, - "loss": 0.6369, - "step": 52025 - }, - { - "epoch": 12.7, - "learning_rate": 0.00043156997312199214, - "loss": 0.6581, - "step": 52050 - }, - { - "epoch": 12.71, - "learning_rate": 0.00043153677400163605, - "loss": 0.6149, - "step": 52075 - }, - { - "epoch": 12.71, - "learning_rate": 0.00043150357488127997, - "loss": 0.6381, - "step": 52100 - }, - { - "epoch": 12.72, - "learning_rate": 0.00043147037576092383, - "loss": 0.6081, - "step": 52125 - }, - { - "epoch": 12.73, - "learning_rate": 0.00043143717664056774, - "loss": 0.6467, - "step": 52150 - }, - { - "epoch": 12.73, - "learning_rate": 0.00043140397752021166, - "loss": 0.6111, - "step": 52175 - }, - { - "epoch": 12.74, - "learning_rate": 0.0004313707783998555, - "loss": 0.6133, - "step": 52200 - }, - { - "epoch": 12.74, - "learning_rate": 0.00043133757927949943, - "loss": 0.6808, - "step": 52225 - }, - { - "epoch": 12.75, - "learning_rate": 0.0004313043801591433, - "loss": 0.6614, - "step": 52250 - }, - { - "epoch": 12.76, - "learning_rate": 0.0004312711810387872, - "loss": 0.6509, - "step": 52275 - }, - { - "epoch": 12.76, - "learning_rate": 0.0004312379819184311, - "loss": 0.6602, - "step": 52300 - }, - { - "epoch": 12.77, - "learning_rate": 0.00043120478279807503, - "loss": 0.6146, - "step": 52325 - }, - { - "epoch": 12.77, - "learning_rate": 0.00043117158367771884, - "loss": 0.6843, - "step": 52350 - }, - { - "epoch": 12.78, - "learning_rate": 0.00043113838455736275, - "loss": 0.6288, - "step": 52375 - }, - { - "epoch": 12.79, - "learning_rate": 0.00043110518543700667, - "loss": 0.6445, - "step": 52400 - }, - { - "epoch": 12.79, - "learning_rate": 0.0004310719863166506, - "loss": 0.5682, - "step": 52425 - }, - { - "epoch": 12.8, - "learning_rate": 0.0004310387871962945, - "loss": 0.7003, - "step": 52450 - }, - { - "epoch": 12.81, - "learning_rate": 0.00043100558807593835, - "loss": 0.5748, - "step": 52475 - }, - { - "epoch": 12.81, - "learning_rate": 0.0004309723889555822, - "loss": 0.6869, - "step": 52500 - }, - { - "epoch": 12.82, - "learning_rate": 0.0004309391898352261, - "loss": 0.5552, - "step": 52525 - }, - { - "epoch": 12.82, - "learning_rate": 0.00043090599071487004, - "loss": 0.6504, - "step": 52550 - }, - { - "epoch": 12.83, - "learning_rate": 0.0004308727915945139, - "loss": 0.6439, - "step": 52575 - }, - { - "epoch": 12.84, - "learning_rate": 0.0004308395924741578, - "loss": 0.6415, - "step": 52600 - }, - { - "epoch": 12.84, - "learning_rate": 0.00043080639335380173, - "loss": 0.6279, - "step": 52625 - }, - { - "epoch": 12.85, - "learning_rate": 0.0004307731942334456, - "loss": 0.6609, - "step": 52650 - }, - { - "epoch": 12.85, - "learning_rate": 0.0004307399951130895, - "loss": 0.628, - "step": 52675 - }, - { - "epoch": 12.86, - "learning_rate": 0.00043070679599273336, - "loss": 0.6844, - "step": 52700 - }, - { - "epoch": 12.87, - "learning_rate": 0.0004306735968723773, - "loss": 0.6197, - "step": 52725 - }, - { - "epoch": 12.87, - "learning_rate": 0.0004306403977520212, - "loss": 0.6395, - "step": 52750 - }, - { - "epoch": 12.88, - "learning_rate": 0.0004306071986316651, - "loss": 0.6112, - "step": 52775 - }, - { - "epoch": 12.88, - "learning_rate": 0.0004305739995113089, - "loss": 0.6495, - "step": 52800 - }, - { - "epoch": 12.89, - "learning_rate": 0.0004305408003909528, - "loss": 0.5714, - "step": 52825 - }, - { - "epoch": 12.9, - "learning_rate": 0.00043050760127059674, - "loss": 0.6368, - "step": 52850 - }, - { - "epoch": 12.9, - "learning_rate": 0.00043047440215024065, - "loss": 0.6219, - "step": 52875 - }, - { - "epoch": 12.91, - "learning_rate": 0.00043044120302988457, - "loss": 0.6374, - "step": 52900 - }, - { - "epoch": 12.91, - "learning_rate": 0.0004304080039095284, - "loss": 0.6305, - "step": 52925 - }, - { - "epoch": 12.92, - "learning_rate": 0.0004303748047891723, - "loss": 0.6444, - "step": 52950 - }, - { - "epoch": 12.93, - "learning_rate": 0.0004303416056688162, - "loss": 0.6064, - "step": 52975 - }, - { - "epoch": 12.93, - "learning_rate": 0.0004303084065484601, - "loss": 0.6849, - "step": 53000 - }, - { - "epoch": 12.94, - "learning_rate": 0.00043027520742810397, - "loss": 0.6103, - "step": 53025 - }, - { - "epoch": 12.95, - "learning_rate": 0.0004302420083077479, - "loss": 0.6676, - "step": 53050 - }, - { - "epoch": 12.95, - "learning_rate": 0.0004302088091873918, - "loss": 0.6101, - "step": 53075 - }, - { - "epoch": 12.96, - "learning_rate": 0.00043017561006703566, - "loss": 0.6528, - "step": 53100 - }, - { - "epoch": 12.96, - "learning_rate": 0.0004301424109466796, - "loss": 0.6113, - "step": 53125 - }, - { - "epoch": 12.97, - "learning_rate": 0.00043010921182632343, - "loss": 0.6564, - "step": 53150 - }, - { - "epoch": 12.98, - "learning_rate": 0.00043007601270596735, - "loss": 0.6153, - "step": 53175 - }, - { - "epoch": 12.98, - "learning_rate": 0.00043004281358561126, - "loss": 0.6683, - "step": 53200 - }, - { - "epoch": 12.99, - "learning_rate": 0.0004300096144652552, - "loss": 0.616, - "step": 53225 - }, - { - "epoch": 12.99, - "learning_rate": 0.000429976415344899, - "loss": 0.6465, - "step": 53250 - }, - { - "epoch": 13.0, - "learning_rate": 0.0004299432162245429, - "loss": 0.6009, - "step": 53275 - }, - { - "epoch": 13.01, - "learning_rate": 0.0004299100171041868, - "loss": 0.5988, - "step": 53300 - }, - { - "epoch": 13.01, - "learning_rate": 0.0004298768179838307, - "loss": 0.6029, - "step": 53325 - }, - { - "epoch": 13.02, - "learning_rate": 0.00042984361886347464, - "loss": 0.6456, - "step": 53350 - }, - { - "epoch": 13.02, - "learning_rate": 0.0004298104197431185, - "loss": 0.5629, - "step": 53375 - }, - { - "epoch": 13.03, - "learning_rate": 0.00042977722062276236, - "loss": 0.6884, - "step": 53400 - }, - { - "epoch": 13.04, - "learning_rate": 0.00042974402150240627, - "loss": 0.5485, - "step": 53425 - }, - { - "epoch": 13.04, - "learning_rate": 0.0004297108223820502, - "loss": 0.6364, - "step": 53450 - }, - { - "epoch": 13.05, - "learning_rate": 0.0004296776232616941, - "loss": 0.6216, - "step": 53475 - }, - { - "epoch": 13.06, - "learning_rate": 0.00042964442414133796, - "loss": 0.6327, - "step": 53500 - }, - { - "epoch": 13.06, - "learning_rate": 0.00042961122502098187, - "loss": 0.5482, - "step": 53525 - }, - { - "epoch": 13.07, - "learning_rate": 0.00042957802590062573, - "loss": 0.6113, - "step": 53550 - }, - { - "epoch": 13.07, - "learning_rate": 0.00042954482678026965, - "loss": 0.6428, - "step": 53575 - }, - { - "epoch": 13.08, - "learning_rate": 0.0004295116276599135, - "loss": 0.6235, - "step": 53600 - }, - { - "epoch": 13.09, - "learning_rate": 0.0004294784285395574, - "loss": 0.5614, - "step": 53625 - }, - { - "epoch": 13.09, - "learning_rate": 0.00042944522941920133, - "loss": 0.6227, - "step": 53650 - }, - { - "epoch": 13.1, - "learning_rate": 0.00042941203029884525, - "loss": 0.6198, - "step": 53675 - }, - { - "epoch": 13.1, - "learning_rate": 0.0004293788311784891, - "loss": 0.6465, - "step": 53700 - }, - { - "epoch": 13.11, - "learning_rate": 0.00042934563205813297, - "loss": 0.5627, - "step": 53725 - }, - { - "epoch": 13.12, - "learning_rate": 0.0004293124329377769, - "loss": 0.5748, - "step": 53750 - }, - { - "epoch": 13.12, - "learning_rate": 0.0004292792338174208, - "loss": 0.6012, - "step": 53775 - }, - { - "epoch": 13.13, - "learning_rate": 0.0004292460346970647, - "loss": 0.6468, - "step": 53800 - }, - { - "epoch": 13.13, - "learning_rate": 0.00042921283557670857, - "loss": 0.5995, - "step": 53825 - }, - { - "epoch": 13.14, - "learning_rate": 0.00042917963645635243, - "loss": 0.6065, - "step": 53850 - }, - { - "epoch": 13.15, - "learning_rate": 0.00042914643733599634, - "loss": 0.5887, - "step": 53875 - }, - { - "epoch": 13.15, - "learning_rate": 0.00042911323821564026, - "loss": 0.63, - "step": 53900 - }, - { - "epoch": 13.16, - "learning_rate": 0.00042908003909528417, - "loss": 0.5393, - "step": 53925 - }, - { - "epoch": 13.16, - "learning_rate": 0.00042904683997492803, - "loss": 0.5984, - "step": 53950 - }, - { - "epoch": 13.17, - "learning_rate": 0.00042901364085457194, - "loss": 0.626, - "step": 53975 - }, - { - "epoch": 13.18, - "learning_rate": 0.0004289804417342158, - "loss": 0.615, - "step": 54000 - }, - { - "epoch": 13.18, - "eval_cer": 0.13237785283820827, - "eval_loss": 0.4704066812992096, - "eval_runtime": 146.2141, - "eval_samples_per_second": 28.677, - "eval_steps_per_second": 7.174, - "eval_wer": 0.5296900489396411, - "step": 54000 - }, - { - "epoch": 13.18, - "learning_rate": 0.0004289472426138597, - "loss": 0.5829, - "step": 54025 - }, - { - "epoch": 13.19, - "learning_rate": 0.0004289140434935036, - "loss": 0.6365, - "step": 54050 - }, - { - "epoch": 13.2, - "learning_rate": 0.0004288808443731475, - "loss": 0.6134, - "step": 54075 - }, - { - "epoch": 13.2, - "learning_rate": 0.0004288476452527914, - "loss": 0.6517, - "step": 54100 - }, - { - "epoch": 13.21, - "learning_rate": 0.0004288144461324353, - "loss": 0.5775, - "step": 54125 - }, - { - "epoch": 13.21, - "learning_rate": 0.0004287812470120792, - "loss": 0.6561, - "step": 54150 - }, - { - "epoch": 13.22, - "learning_rate": 0.00042874804789172304, - "loss": 0.5299, - "step": 54175 - }, - { - "epoch": 13.23, - "learning_rate": 0.00042871484877136695, - "loss": 0.608, - "step": 54200 - }, - { - "epoch": 13.23, - "learning_rate": 0.00042868164965101087, - "loss": 0.5702, - "step": 54225 - }, - { - "epoch": 13.24, - "learning_rate": 0.0004286484505306548, - "loss": 0.6428, - "step": 54250 - }, - { - "epoch": 13.24, - "learning_rate": 0.00042861525141029864, - "loss": 0.5802, - "step": 54275 - }, - { - "epoch": 13.25, - "learning_rate": 0.0004285820522899425, - "loss": 0.5996, - "step": 54300 - }, - { - "epoch": 13.26, - "learning_rate": 0.0004285488531695864, - "loss": 0.5291, - "step": 54325 - }, - { - "epoch": 13.26, - "learning_rate": 0.00042851565404923033, - "loss": 0.6271, - "step": 54350 - }, - { - "epoch": 13.27, - "learning_rate": 0.00042848245492887424, - "loss": 0.5607, - "step": 54375 - }, - { - "epoch": 13.27, - "learning_rate": 0.0004284492558085181, - "loss": 0.6246, - "step": 54400 - }, - { - "epoch": 13.28, - "learning_rate": 0.000428416056688162, - "loss": 0.5731, - "step": 54425 - }, - { - "epoch": 13.29, - "learning_rate": 0.0004283828575678059, - "loss": 0.6058, - "step": 54450 - }, - { - "epoch": 13.29, - "learning_rate": 0.0004283496584474498, - "loss": 0.5722, - "step": 54475 - }, - { - "epoch": 13.3, - "learning_rate": 0.00042831645932709365, - "loss": 0.614, - "step": 54500 - }, - { - "epoch": 13.31, - "learning_rate": 0.00042828326020673756, - "loss": 0.6, - "step": 54525 - }, - { - "epoch": 13.31, - "learning_rate": 0.0004282500610863815, - "loss": 0.6331, - "step": 54550 - }, - { - "epoch": 13.32, - "learning_rate": 0.0004282168619660254, - "loss": 0.6208, - "step": 54575 - }, - { - "epoch": 13.32, - "learning_rate": 0.00042818366284566925, - "loss": 0.6295, - "step": 54600 - }, - { - "epoch": 13.33, - "learning_rate": 0.0004281504637253131, - "loss": 0.6451, - "step": 54625 - }, - { - "epoch": 13.34, - "learning_rate": 0.000428117264604957, - "loss": 0.6238, - "step": 54650 - }, - { - "epoch": 13.34, - "learning_rate": 0.00042808406548460094, - "loss": 0.5815, - "step": 54675 - }, - { - "epoch": 13.35, - "learning_rate": 0.00042805086636424485, - "loss": 0.6429, - "step": 54700 - }, - { - "epoch": 13.35, - "learning_rate": 0.00042801766724388877, - "loss": 0.6381, - "step": 54725 - }, - { - "epoch": 13.36, - "learning_rate": 0.0004279844681235326, - "loss": 0.5901, - "step": 54750 - }, - { - "epoch": 13.37, - "learning_rate": 0.0004279512690031765, - "loss": 0.5912, - "step": 54775 - }, - { - "epoch": 13.37, - "learning_rate": 0.0004279180698828204, - "loss": 0.6324, - "step": 54800 - }, - { - "epoch": 13.38, - "learning_rate": 0.0004278848707624643, - "loss": 0.6042, - "step": 54825 - }, - { - "epoch": 13.38, - "learning_rate": 0.0004278516716421082, - "loss": 0.653, - "step": 54850 - }, - { - "epoch": 13.39, - "learning_rate": 0.0004278184725217521, - "loss": 0.5603, - "step": 54875 - }, - { - "epoch": 13.4, - "learning_rate": 0.00042778527340139595, - "loss": 0.6358, - "step": 54900 - }, - { - "epoch": 13.4, - "learning_rate": 0.00042775207428103986, - "loss": 0.5259, - "step": 54925 - }, - { - "epoch": 13.41, - "learning_rate": 0.0004277188751606838, - "loss": 0.6624, - "step": 54950 - }, - { - "epoch": 13.42, - "learning_rate": 0.00042768567604032764, - "loss": 0.5836, - "step": 54975 - }, - { - "epoch": 13.42, - "learning_rate": 0.00042765247691997155, - "loss": 0.659, - "step": 55000 - }, - { - "epoch": 13.43, - "learning_rate": 0.0004276192777996154, - "loss": 0.5618, - "step": 55025 - }, - { - "epoch": 13.43, - "learning_rate": 0.0004275860786792593, - "loss": 0.6365, - "step": 55050 - }, - { - "epoch": 13.44, - "learning_rate": 0.0004275528795589032, - "loss": 0.596, - "step": 55075 - }, - { - "epoch": 13.45, - "learning_rate": 0.0004275196804385471, - "loss": 0.6246, - "step": 55100 - }, - { - "epoch": 13.45, - "learning_rate": 0.000427486481318191, - "loss": 0.6119, - "step": 55125 - }, - { - "epoch": 13.46, - "learning_rate": 0.0004274532821978349, - "loss": 0.6495, - "step": 55150 - }, - { - "epoch": 13.46, - "learning_rate": 0.0004274200830774788, - "loss": 0.5684, - "step": 55175 - }, - { - "epoch": 13.47, - "learning_rate": 0.00042738688395712265, - "loss": 0.6245, - "step": 55200 - }, - { - "epoch": 13.48, - "learning_rate": 0.00042735501280158084, - "loss": 0.5476, - "step": 55225 - }, - { - "epoch": 13.48, - "learning_rate": 0.0004273218136812247, - "loss": 0.6062, - "step": 55250 - }, - { - "epoch": 13.49, - "learning_rate": 0.0004272886145608686, - "loss": 0.5916, - "step": 55275 - }, - { - "epoch": 13.49, - "learning_rate": 0.0004272554154405125, - "loss": 0.6337, - "step": 55300 - }, - { - "epoch": 13.5, - "learning_rate": 0.0004272222163201564, - "loss": 0.5957, - "step": 55325 - }, - { - "epoch": 13.51, - "learning_rate": 0.0004271890171998003, - "loss": 0.6467, - "step": 55350 - }, - { - "epoch": 13.51, - "learning_rate": 0.0004271558180794442, - "loss": 0.5772, - "step": 55375 - }, - { - "epoch": 13.52, - "learning_rate": 0.000427122618959088, - "loss": 0.649, - "step": 55400 - }, - { - "epoch": 13.52, - "learning_rate": 0.00042708941983873194, - "loss": 0.5464, - "step": 55425 - }, - { - "epoch": 13.53, - "learning_rate": 0.00042705622071837585, - "loss": 0.6423, - "step": 55450 - }, - { - "epoch": 13.54, - "learning_rate": 0.00042702302159801977, - "loss": 0.6658, - "step": 55475 - }, - { - "epoch": 13.54, - "learning_rate": 0.0004269898224776637, - "loss": 0.6415, - "step": 55500 - }, - { - "epoch": 13.55, - "learning_rate": 0.00042695662335730754, - "loss": 0.5512, - "step": 55525 - }, - { - "epoch": 13.56, - "learning_rate": 0.0004269234242369514, - "loss": 0.6279, - "step": 55550 - }, - { - "epoch": 13.56, - "learning_rate": 0.0004268902251165953, - "loss": 0.6403, - "step": 55575 - }, - { - "epoch": 13.57, - "learning_rate": 0.00042685702599623923, - "loss": 0.6368, - "step": 55600 - }, - { - "epoch": 13.57, - "learning_rate": 0.0004268238268758831, - "loss": 0.6262, - "step": 55625 - }, - { - "epoch": 13.58, - "learning_rate": 0.000426790627755527, - "loss": 0.6254, - "step": 55650 - }, - { - "epoch": 13.59, - "learning_rate": 0.0004267574286351709, - "loss": 0.5924, - "step": 55675 - }, - { - "epoch": 13.59, - "learning_rate": 0.0004267242295148148, - "loss": 0.6158, - "step": 55700 - }, - { - "epoch": 13.6, - "learning_rate": 0.0004266910303944587, - "loss": 0.6169, - "step": 55725 - }, - { - "epoch": 13.6, - "learning_rate": 0.00042665783127410255, - "loss": 0.617, - "step": 55750 - }, - { - "epoch": 13.61, - "learning_rate": 0.00042662463215374646, - "loss": 0.5882, - "step": 55775 - }, - { - "epoch": 13.62, - "learning_rate": 0.0004265914330333904, - "loss": 0.6228, - "step": 55800 - }, - { - "epoch": 13.62, - "learning_rate": 0.00042655823391303424, - "loss": 0.5645, - "step": 55825 - }, - { - "epoch": 13.63, - "learning_rate": 0.0004265250347926781, - "loss": 0.6124, - "step": 55850 - }, - { - "epoch": 13.63, - "learning_rate": 0.000426491835672322, - "loss": 0.6378, - "step": 55875 - }, - { - "epoch": 13.64, - "learning_rate": 0.0004264586365519659, - "loss": 0.6315, - "step": 55900 - }, - { - "epoch": 13.65, - "learning_rate": 0.00042642543743160984, - "loss": 0.5701, - "step": 55925 - }, - { - "epoch": 13.65, - "learning_rate": 0.00042639223831125375, - "loss": 0.6325, - "step": 55950 - }, - { - "epoch": 13.66, - "learning_rate": 0.00042635903919089756, - "loss": 0.5678, - "step": 55975 - }, - { - "epoch": 13.67, - "learning_rate": 0.00042632584007054147, - "loss": 0.6605, - "step": 56000 - }, - { - "epoch": 13.67, - "learning_rate": 0.0004262926409501854, - "loss": 0.5455, - "step": 56025 - }, - { - "epoch": 13.68, - "learning_rate": 0.0004262594418298293, - "loss": 0.6301, - "step": 56050 - }, - { - "epoch": 13.68, - "learning_rate": 0.0004262262427094732, - "loss": 0.6023, - "step": 56075 - }, - { - "epoch": 13.69, - "learning_rate": 0.0004261930435891171, - "loss": 0.6524, - "step": 56100 - }, - { - "epoch": 13.7, - "learning_rate": 0.00042615984446876093, - "loss": 0.5723, - "step": 56125 - }, - { - "epoch": 13.7, - "learning_rate": 0.00042612664534840485, - "loss": 0.6332, - "step": 56150 - }, - { - "epoch": 13.71, - "learning_rate": 0.00042609344622804876, - "loss": 0.4887, - "step": 56175 - }, - { - "epoch": 13.71, - "learning_rate": 0.0004260602471076926, - "loss": 0.6688, - "step": 56200 - }, - { - "epoch": 13.72, - "learning_rate": 0.00042602704798733654, - "loss": 0.6288, - "step": 56225 - }, - { - "epoch": 13.73, - "learning_rate": 0.00042599384886698045, - "loss": 0.6548, - "step": 56250 - }, - { - "epoch": 13.73, - "learning_rate": 0.0004259606497466243, - "loss": 0.6337, - "step": 56275 - }, - { - "epoch": 13.74, - "learning_rate": 0.0004259274506262682, - "loss": 0.6278, - "step": 56300 - }, - { - "epoch": 13.74, - "learning_rate": 0.0004258942515059121, - "loss": 0.6219, - "step": 56325 - }, - { - "epoch": 13.75, - "learning_rate": 0.000425861052385556, - "loss": 0.6294, - "step": 56350 - }, - { - "epoch": 13.76, - "learning_rate": 0.0004258278532651999, - "loss": 0.5719, - "step": 56375 - }, - { - "epoch": 13.76, - "learning_rate": 0.0004257946541448438, - "loss": 0.6342, - "step": 56400 - }, - { - "epoch": 13.77, - "learning_rate": 0.00042576145502448763, - "loss": 0.6385, - "step": 56425 - }, - { - "epoch": 13.78, - "learning_rate": 0.00042572825590413154, - "loss": 0.6423, - "step": 56450 - }, - { - "epoch": 13.78, - "learning_rate": 0.00042569505678377546, - "loss": 0.5712, - "step": 56475 - }, - { - "epoch": 13.79, - "learning_rate": 0.00042566185766341937, - "loss": 0.5906, - "step": 56500 - }, - { - "epoch": 13.79, - "learning_rate": 0.0004256286585430633, - "loss": 0.6113, - "step": 56525 - }, - { - "epoch": 13.8, - "learning_rate": 0.00042559545942270715, - "loss": 0.6131, - "step": 56550 - }, - { - "epoch": 13.81, - "learning_rate": 0.000425562260302351, - "loss": 0.5752, - "step": 56575 - }, - { - "epoch": 13.81, - "learning_rate": 0.0004255290611819949, - "loss": 0.6672, - "step": 56600 - }, - { - "epoch": 13.82, - "learning_rate": 0.00042549586206163883, - "loss": 0.6447, - "step": 56625 - }, - { - "epoch": 13.82, - "learning_rate": 0.0004254626629412827, - "loss": 0.611, - "step": 56650 - }, - { - "epoch": 13.83, - "learning_rate": 0.0004254294638209266, - "loss": 0.5499, - "step": 56675 - }, - { - "epoch": 13.84, - "learning_rate": 0.0004253962647005705, - "loss": 0.6201, - "step": 56700 - }, - { - "epoch": 13.84, - "learning_rate": 0.0004253630655802144, - "loss": 0.6202, - "step": 56725 - }, - { - "epoch": 13.85, - "learning_rate": 0.0004253298664598583, - "loss": 0.6132, - "step": 56750 - }, - { - "epoch": 13.85, - "learning_rate": 0.00042529666733950216, - "loss": 0.5538, - "step": 56775 - }, - { - "epoch": 13.86, - "learning_rate": 0.00042526346821914607, - "loss": 0.6536, - "step": 56800 - }, - { - "epoch": 13.87, - "learning_rate": 0.00042523026909879, - "loss": 0.5926, - "step": 56825 - }, - { - "epoch": 13.87, - "learning_rate": 0.0004251970699784339, - "loss": 0.6069, - "step": 56850 - }, - { - "epoch": 13.88, - "learning_rate": 0.0004251638708580777, - "loss": 0.5366, - "step": 56875 - }, - { - "epoch": 13.88, - "learning_rate": 0.0004251306717377216, - "loss": 0.6103, - "step": 56900 - }, - { - "epoch": 13.89, - "learning_rate": 0.00042509747261736553, - "loss": 0.6493, - "step": 56925 - }, - { - "epoch": 13.9, - "learning_rate": 0.00042506427349700944, - "loss": 0.6284, - "step": 56950 - }, - { - "epoch": 13.9, - "learning_rate": 0.00042503107437665336, - "loss": 0.6125, - "step": 56975 - }, - { - "epoch": 13.91, - "learning_rate": 0.0004249978752562972, - "loss": 0.6308, - "step": 57000 - }, - { - "epoch": 13.91, - "eval_cer": 0.1298163300925023, - "eval_loss": 0.4570181965827942, - "eval_runtime": 145.5018, - "eval_samples_per_second": 28.818, - "eval_steps_per_second": 7.21, - "eval_wer": 0.5181402936378466, - "step": 57000 - }, - { - "epoch": 13.92, - "learning_rate": 0.0004249646761359411, - "loss": 0.591, - "step": 57025 - }, - { - "epoch": 13.92, - "learning_rate": 0.000424931477015585, - "loss": 0.6476, - "step": 57050 - }, - { - "epoch": 13.93, - "learning_rate": 0.0004248982778952289, - "loss": 0.6229, - "step": 57075 - }, - { - "epoch": 13.93, - "learning_rate": 0.00042486507877487277, - "loss": 0.6675, - "step": 57100 - }, - { - "epoch": 13.94, - "learning_rate": 0.0004248318796545167, - "loss": 0.6594, - "step": 57125 - }, - { - "epoch": 13.95, - "learning_rate": 0.0004247986805341606, - "loss": 0.623, - "step": 57150 - }, - { - "epoch": 13.95, - "learning_rate": 0.00042476548141380445, - "loss": 0.5794, - "step": 57175 - }, - { - "epoch": 13.96, - "learning_rate": 0.00042473228229344837, - "loss": 0.6319, - "step": 57200 - }, - { - "epoch": 13.96, - "learning_rate": 0.00042469908317309223, - "loss": 0.5749, - "step": 57225 - }, - { - "epoch": 13.97, - "learning_rate": 0.00042466588405273614, - "loss": 0.6396, - "step": 57250 - }, - { - "epoch": 13.98, - "learning_rate": 0.00042463268493238006, - "loss": 0.5968, - "step": 57275 - }, - { - "epoch": 13.98, - "learning_rate": 0.00042459948581202397, - "loss": 0.6442, - "step": 57300 - }, - { - "epoch": 13.99, - "learning_rate": 0.00042456628669166783, - "loss": 0.561, - "step": 57325 - }, - { - "epoch": 13.99, - "learning_rate": 0.0004245330875713117, - "loss": 0.617, - "step": 57350 - }, - { - "epoch": 14.0, - "learning_rate": 0.0004244998884509556, - "loss": 0.5744, - "step": 57375 - }, - { - "epoch": 14.01, - "learning_rate": 0.0004244666893305995, - "loss": 0.6043, - "step": 57400 - }, - { - "epoch": 14.01, - "learning_rate": 0.00042443349021024343, - "loss": 0.5643, - "step": 57425 - }, - { - "epoch": 14.02, - "learning_rate": 0.0004244002910898873, - "loss": 0.6069, - "step": 57450 - }, - { - "epoch": 14.03, - "learning_rate": 0.00042436709196953115, - "loss": 0.5898, - "step": 57475 - }, - { - "epoch": 14.03, - "learning_rate": 0.00042433389284917506, - "loss": 0.5904, - "step": 57500 - }, - { - "epoch": 14.04, - "learning_rate": 0.000424300693728819, - "loss": 0.5918, - "step": 57525 - }, - { - "epoch": 14.04, - "learning_rate": 0.0004242674946084629, - "loss": 0.5941, - "step": 57550 - }, - { - "epoch": 14.05, - "learning_rate": 0.00042423429548810675, - "loss": 0.6079, - "step": 57575 - }, - { - "epoch": 14.06, - "learning_rate": 0.00042420109636775067, - "loss": 0.5946, - "step": 57600 - }, - { - "epoch": 14.06, - "learning_rate": 0.0004241678972473945, - "loss": 0.6464, - "step": 57625 - }, - { - "epoch": 14.07, - "learning_rate": 0.00042413469812703844, - "loss": 0.6279, - "step": 57650 - }, - { - "epoch": 14.07, - "learning_rate": 0.00042410282697149653, - "loss": 0.5383, - "step": 57675 - }, - { - "epoch": 14.08, - "learning_rate": 0.00042406962785114044, - "loss": 0.5984, - "step": 57700 - }, - { - "epoch": 14.09, - "learning_rate": 0.00042403642873078436, - "loss": 0.588, - "step": 57725 - }, - { - "epoch": 14.09, - "learning_rate": 0.00042400322961042827, - "loss": 0.6184, - "step": 57750 - }, - { - "epoch": 14.1, - "learning_rate": 0.00042397003049007213, - "loss": 0.5526, - "step": 57775 - }, - { - "epoch": 14.1, - "learning_rate": 0.00042393683136971605, - "loss": 0.6482, - "step": 57800 - }, - { - "epoch": 14.11, - "learning_rate": 0.0004239036322493599, - "loss": 0.5692, - "step": 57825 - }, - { - "epoch": 14.12, - "learning_rate": 0.0004238704331290038, - "loss": 0.5955, - "step": 57850 - }, - { - "epoch": 14.12, - "learning_rate": 0.00042383723400864773, - "loss": 0.6025, - "step": 57875 - }, - { - "epoch": 14.13, - "learning_rate": 0.0004238040348882916, - "loss": 0.6018, - "step": 57900 - }, - { - "epoch": 14.13, - "learning_rate": 0.0004237708357679355, - "loss": 0.5857, - "step": 57925 - }, - { - "epoch": 14.14, - "learning_rate": 0.0004237376366475794, - "loss": 0.5763, - "step": 57950 - }, - { - "epoch": 14.15, - "learning_rate": 0.0004237044375272233, - "loss": 0.6155, - "step": 57975 - }, - { - "epoch": 14.15, - "learning_rate": 0.00042367123840686714, - "loss": 0.6198, - "step": 58000 - }, - { - "epoch": 14.16, - "learning_rate": 0.00042363803928651105, - "loss": 0.5932, - "step": 58025 - }, - { - "epoch": 14.17, - "learning_rate": 0.00042360484016615497, - "loss": 0.5814, - "step": 58050 - }, - { - "epoch": 14.17, - "learning_rate": 0.0004235716410457989, - "loss": 0.5931, - "step": 58075 - }, - { - "epoch": 14.18, - "learning_rate": 0.0004235384419254428, - "loss": 0.5842, - "step": 58100 - }, - { - "epoch": 14.18, - "learning_rate": 0.0004235052428050866, - "loss": 0.5457, - "step": 58125 - }, - { - "epoch": 14.19, - "learning_rate": 0.0004234720436847305, - "loss": 0.6123, - "step": 58150 - }, - { - "epoch": 14.2, - "learning_rate": 0.00042343884456437443, - "loss": 0.5326, - "step": 58175 - }, - { - "epoch": 14.2, - "learning_rate": 0.00042340564544401834, - "loss": 0.5919, - "step": 58200 - }, - { - "epoch": 14.21, - "learning_rate": 0.0004233724463236622, - "loss": 0.5965, - "step": 58225 - }, - { - "epoch": 14.21, - "learning_rate": 0.0004233392472033061, - "loss": 0.5863, - "step": 58250 - }, - { - "epoch": 14.22, - "learning_rate": 0.00042330604808295, - "loss": 0.5605, - "step": 58275 - }, - { - "epoch": 14.23, - "learning_rate": 0.0004232728489625939, - "loss": 0.614, - "step": 58300 - }, - { - "epoch": 14.23, - "learning_rate": 0.0004232396498422378, - "loss": 0.5654, - "step": 58325 - }, - { - "epoch": 14.24, - "learning_rate": 0.00042320645072188167, - "loss": 0.5933, - "step": 58350 - }, - { - "epoch": 14.24, - "learning_rate": 0.0004231732516015256, - "loss": 0.5873, - "step": 58375 - }, - { - "epoch": 14.25, - "learning_rate": 0.0004231400524811695, - "loss": 0.5915, - "step": 58400 - }, - { - "epoch": 14.26, - "learning_rate": 0.00042310685336081335, - "loss": 0.6126, - "step": 58425 - }, - { - "epoch": 14.26, - "learning_rate": 0.0004230736542404572, - "loss": 0.6042, - "step": 58450 - }, - { - "epoch": 14.27, - "learning_rate": 0.0004230404551201011, - "loss": 0.5961, - "step": 58475 - }, - { - "epoch": 14.28, - "learning_rate": 0.00042300725599974504, - "loss": 0.6288, - "step": 58500 - }, - { - "epoch": 14.28, - "learning_rate": 0.00042297405687938895, - "loss": 0.4981, - "step": 58525 - }, - { - "epoch": 14.29, - "learning_rate": 0.00042294085775903287, - "loss": 0.5907, - "step": 58550 - }, - { - "epoch": 14.29, - "learning_rate": 0.0004229076586386767, - "loss": 0.5619, - "step": 58575 - }, - { - "epoch": 14.3, - "learning_rate": 0.0004228744595183206, - "loss": 0.6181, - "step": 58600 - }, - { - "epoch": 14.31, - "learning_rate": 0.0004228412603979645, - "loss": 0.5144, - "step": 58625 - }, - { - "epoch": 14.31, - "learning_rate": 0.0004228080612776084, - "loss": 0.6199, - "step": 58650 - }, - { - "epoch": 14.32, - "learning_rate": 0.00042277486215725233, - "loss": 0.6018, - "step": 58675 - }, - { - "epoch": 14.32, - "learning_rate": 0.0004227416630368962, - "loss": 0.5986, - "step": 58700 - }, - { - "epoch": 14.33, - "learning_rate": 0.00042270846391654005, - "loss": 0.5543, - "step": 58725 - }, - { - "epoch": 14.34, - "learning_rate": 0.00042267526479618396, - "loss": 0.6112, - "step": 58750 - }, - { - "epoch": 14.34, - "learning_rate": 0.0004226420656758279, - "loss": 0.5911, - "step": 58775 - }, - { - "epoch": 14.35, - "learning_rate": 0.00042260886655547174, - "loss": 0.6487, - "step": 58800 - }, - { - "epoch": 14.35, - "learning_rate": 0.00042257566743511565, - "loss": 0.5668, - "step": 58825 - }, - { - "epoch": 14.36, - "learning_rate": 0.00042254246831475957, - "loss": 0.5784, - "step": 58850 - }, - { - "epoch": 14.37, - "learning_rate": 0.0004225092691944034, - "loss": 0.5174, - "step": 58875 - }, - { - "epoch": 14.37, - "learning_rate": 0.00042247607007404734, - "loss": 0.5878, - "step": 58900 - }, - { - "epoch": 14.38, - "learning_rate": 0.0004224428709536912, - "loss": 0.5745, - "step": 58925 - }, - { - "epoch": 14.39, - "learning_rate": 0.0004224096718333351, - "loss": 0.6411, - "step": 58950 - }, - { - "epoch": 14.39, - "learning_rate": 0.000422376472712979, - "loss": 0.5667, - "step": 58975 - }, - { - "epoch": 14.4, - "learning_rate": 0.00042234327359262294, - "loss": 0.6156, - "step": 59000 - }, - { - "epoch": 14.4, - "learning_rate": 0.00042231007447226675, - "loss": 0.5767, - "step": 59025 - }, - { - "epoch": 14.41, - "learning_rate": 0.00042227687535191066, - "loss": 0.6067, - "step": 59050 - }, - { - "epoch": 14.42, - "learning_rate": 0.0004222436762315546, - "loss": 0.5967, - "step": 59075 - }, - { - "epoch": 14.42, - "learning_rate": 0.0004222104771111985, - "loss": 0.6227, - "step": 59100 - }, - { - "epoch": 14.43, - "learning_rate": 0.0004221772779908424, - "loss": 0.5626, - "step": 59125 - }, - { - "epoch": 14.43, - "learning_rate": 0.00042214407887048626, - "loss": 0.6133, - "step": 59150 - }, - { - "epoch": 14.44, - "learning_rate": 0.0004221108797501301, - "loss": 0.5761, - "step": 59175 - }, - { - "epoch": 14.45, - "learning_rate": 0.00042207768062977404, - "loss": 0.5861, - "step": 59200 - }, - { - "epoch": 14.45, - "learning_rate": 0.00042204448150941795, - "loss": 0.5882, - "step": 59225 - }, - { - "epoch": 14.46, - "learning_rate": 0.0004220112823890618, - "loss": 0.6155, - "step": 59250 - }, - { - "epoch": 14.46, - "learning_rate": 0.0004219780832687057, - "loss": 0.5599, - "step": 59275 - }, - { - "epoch": 14.47, - "learning_rate": 0.00042194488414834964, - "loss": 0.5907, - "step": 59300 - }, - { - "epoch": 14.48, - "learning_rate": 0.0004219116850279935, - "loss": 0.5632, - "step": 59325 - }, - { - "epoch": 14.48, - "learning_rate": 0.0004218784859076374, - "loss": 0.6302, - "step": 59350 - }, - { - "epoch": 14.49, - "learning_rate": 0.00042184528678728127, - "loss": 0.5725, - "step": 59375 - }, - { - "epoch": 14.49, - "learning_rate": 0.0004218120876669252, - "loss": 0.639, - "step": 59400 - }, - { - "epoch": 14.5, - "learning_rate": 0.0004217788885465691, - "loss": 0.5299, - "step": 59425 - }, - { - "epoch": 14.51, - "learning_rate": 0.000421745689426213, - "loss": 0.6035, - "step": 59450 - }, - { - "epoch": 14.51, - "learning_rate": 0.0004217124903058568, - "loss": 0.5558, - "step": 59475 - }, - { - "epoch": 14.52, - "learning_rate": 0.00042167929118550073, - "loss": 0.6101, - "step": 59500 - }, - { - "epoch": 14.53, - "learning_rate": 0.00042164609206514465, - "loss": 0.6208, - "step": 59525 - }, - { - "epoch": 14.53, - "learning_rate": 0.00042161289294478856, - "loss": 0.6033, - "step": 59550 - }, - { - "epoch": 14.54, - "learning_rate": 0.0004215796938244325, - "loss": 0.598, - "step": 59575 - }, - { - "epoch": 14.54, - "learning_rate": 0.00042154649470407633, - "loss": 0.6098, - "step": 59600 - }, - { - "epoch": 14.55, - "learning_rate": 0.0004215132955837202, - "loss": 0.5855, - "step": 59625 - }, - { - "epoch": 14.56, - "learning_rate": 0.0004214800964633641, - "loss": 0.5699, - "step": 59650 - }, - { - "epoch": 14.56, - "learning_rate": 0.000421446897343008, - "loss": 0.5767, - "step": 59675 - }, - { - "epoch": 14.57, - "learning_rate": 0.00042141369822265194, - "loss": 0.6179, - "step": 59700 - }, - { - "epoch": 14.57, - "learning_rate": 0.0004213804991022958, - "loss": 0.5859, - "step": 59725 - }, - { - "epoch": 14.58, - "learning_rate": 0.0004213472999819397, - "loss": 0.6002, - "step": 59750 - }, - { - "epoch": 14.59, - "learning_rate": 0.00042131410086158357, - "loss": 0.6104, - "step": 59775 - }, - { - "epoch": 14.59, - "learning_rate": 0.0004212809017412275, - "loss": 0.6178, - "step": 59800 - }, - { - "epoch": 14.6, - "learning_rate": 0.00042124770262087134, - "loss": 0.6554, - "step": 59825 - }, - { - "epoch": 14.6, - "learning_rate": 0.00042121450350051526, - "loss": 0.6093, - "step": 59850 - }, - { - "epoch": 14.61, - "learning_rate": 0.00042118130438015917, - "loss": 0.5681, - "step": 59875 - }, - { - "epoch": 14.62, - "learning_rate": 0.0004211481052598031, - "loss": 0.5955, - "step": 59900 - }, - { - "epoch": 14.62, - "learning_rate": 0.00042111490613944694, - "loss": 0.5824, - "step": 59925 - }, - { - "epoch": 14.63, - "learning_rate": 0.0004210817070190908, - "loss": 0.5922, - "step": 59950 - }, - { - "epoch": 14.64, - "learning_rate": 0.0004210485078987347, - "loss": 0.6048, - "step": 59975 - }, - { - "epoch": 14.64, - "learning_rate": 0.00042101530877837863, - "loss": 0.6169, - "step": 60000 - }, - { - "epoch": 14.64, - "eval_cer": 0.12906173321150272, - "eval_loss": 0.45141759514808655, - "eval_runtime": 146.1787, - "eval_samples_per_second": 28.684, - "eval_steps_per_second": 7.176, - "eval_wer": 0.5106362153344208, - "step": 60000 - }, - { - "epoch": 14.65, - "learning_rate": 0.00042098210965802255, - "loss": 0.5448, - "step": 60025 - }, - { - "epoch": 14.65, - "learning_rate": 0.0004209489105376664, - "loss": 0.5884, - "step": 60050 - }, - { - "epoch": 14.66, - "learning_rate": 0.00042091571141731027, - "loss": 0.6039, - "step": 60075 - }, - { - "epoch": 14.67, - "learning_rate": 0.0004208825122969542, - "loss": 0.5554, - "step": 60100 - }, - { - "epoch": 14.67, - "learning_rate": 0.0004208493131765981, - "loss": 0.5541, - "step": 60125 - }, - { - "epoch": 14.68, - "learning_rate": 0.000420816114056242, - "loss": 0.6163, - "step": 60150 - }, - { - "epoch": 14.68, - "learning_rate": 0.00042078291493588587, - "loss": 0.5741, - "step": 60175 - }, - { - "epoch": 14.69, - "learning_rate": 0.0004207497158155298, - "loss": 0.6034, - "step": 60200 - }, - { - "epoch": 14.7, - "learning_rate": 0.00042071651669517364, - "loss": 0.6086, - "step": 60225 - }, - { - "epoch": 14.7, - "learning_rate": 0.00042068331757481756, - "loss": 0.5983, - "step": 60250 - }, - { - "epoch": 14.71, - "learning_rate": 0.0004206501184544614, - "loss": 0.5811, - "step": 60275 - }, - { - "epoch": 14.71, - "learning_rate": 0.00042061691933410533, - "loss": 0.629, - "step": 60300 - }, - { - "epoch": 14.72, - "learning_rate": 0.00042058372021374924, - "loss": 0.5687, - "step": 60325 - }, - { - "epoch": 14.73, - "learning_rate": 0.00042055052109339316, - "loss": 0.5759, - "step": 60350 - }, - { - "epoch": 14.73, - "learning_rate": 0.000420517321973037, - "loss": 0.6268, - "step": 60375 - }, - { - "epoch": 14.74, - "learning_rate": 0.0004204841228526809, - "loss": 0.6366, - "step": 60400 - }, - { - "epoch": 14.74, - "learning_rate": 0.0004204509237323248, - "loss": 0.5926, - "step": 60425 - }, - { - "epoch": 14.75, - "learning_rate": 0.0004204177246119687, - "loss": 0.5949, - "step": 60450 - }, - { - "epoch": 14.76, - "learning_rate": 0.0004203845254916126, - "loss": 0.5102, - "step": 60475 - }, - { - "epoch": 14.76, - "learning_rate": 0.0004203513263712564, - "loss": 0.5873, - "step": 60500 - }, - { - "epoch": 14.77, - "learning_rate": 0.00042031812725090034, - "loss": 0.5693, - "step": 60525 - }, - { - "epoch": 14.78, - "learning_rate": 0.00042028492813054425, - "loss": 0.6257, - "step": 60550 - }, - { - "epoch": 14.78, - "learning_rate": 0.00042025172901018817, - "loss": 0.6004, - "step": 60575 - }, - { - "epoch": 14.79, - "learning_rate": 0.0004202185298898321, - "loss": 0.6049, - "step": 60600 - }, - { - "epoch": 14.79, - "learning_rate": 0.00042018533076947594, - "loss": 0.5733, - "step": 60625 - }, - { - "epoch": 14.8, - "learning_rate": 0.0004201521316491198, - "loss": 0.6075, - "step": 60650 - }, - { - "epoch": 14.81, - "learning_rate": 0.0004201189325287637, - "loss": 0.5729, - "step": 60675 - }, - { - "epoch": 14.81, - "learning_rate": 0.00042008573340840763, - "loss": 0.6376, - "step": 60700 - }, - { - "epoch": 14.82, - "learning_rate": 0.0004200525342880515, - "loss": 0.5921, - "step": 60725 - }, - { - "epoch": 14.82, - "learning_rate": 0.0004200193351676954, - "loss": 0.6365, - "step": 60750 - }, - { - "epoch": 14.83, - "learning_rate": 0.0004199861360473393, - "loss": 0.5834, - "step": 60775 - }, - { - "epoch": 14.84, - "learning_rate": 0.0004199529369269832, - "loss": 0.6236, - "step": 60800 - }, - { - "epoch": 14.84, - "learning_rate": 0.0004199197378066271, - "loss": 0.5911, - "step": 60825 - }, - { - "epoch": 14.85, - "learning_rate": 0.00041988653868627095, - "loss": 0.597, - "step": 60850 - }, - { - "epoch": 14.85, - "learning_rate": 0.00041985333956591486, - "loss": 0.5702, - "step": 60875 - }, - { - "epoch": 14.86, - "learning_rate": 0.0004198201404455588, - "loss": 0.5864, - "step": 60900 - }, - { - "epoch": 14.87, - "learning_rate": 0.0004197869413252027, - "loss": 0.5568, - "step": 60925 - }, - { - "epoch": 14.87, - "learning_rate": 0.0004197537422048465, - "loss": 0.6031, - "step": 60950 - }, - { - "epoch": 14.88, - "learning_rate": 0.0004197205430844904, - "loss": 0.6211, - "step": 60975 - }, - { - "epoch": 14.89, - "learning_rate": 0.0004196873439641343, - "loss": 0.624, - "step": 61000 - }, - { - "epoch": 14.89, - "learning_rate": 0.00041965414484377824, - "loss": 0.5962, - "step": 61025 - }, - { - "epoch": 14.9, - "learning_rate": 0.00041962094572342215, - "loss": 0.6123, - "step": 61050 - }, - { - "epoch": 14.9, - "learning_rate": 0.000419587746603066, - "loss": 0.5665, - "step": 61075 - }, - { - "epoch": 14.91, - "learning_rate": 0.00041955454748270987, - "loss": 0.623, - "step": 61100 - }, - { - "epoch": 14.92, - "learning_rate": 0.0004195213483623538, - "loss": 0.5411, - "step": 61125 - }, - { - "epoch": 14.92, - "learning_rate": 0.0004194881492419977, - "loss": 0.6203, - "step": 61150 - }, - { - "epoch": 14.93, - "learning_rate": 0.0004194549501216416, - "loss": 0.5577, - "step": 61175 - }, - { - "epoch": 14.93, - "learning_rate": 0.0004194217510012855, - "loss": 0.6094, - "step": 61200 - }, - { - "epoch": 14.94, - "learning_rate": 0.0004193885518809294, - "loss": 0.6089, - "step": 61225 - }, - { - "epoch": 14.95, - "learning_rate": 0.00041935535276057325, - "loss": 0.6125, - "step": 61250 - }, - { - "epoch": 14.95, - "learning_rate": 0.00041932215364021716, - "loss": 0.5804, - "step": 61275 - }, - { - "epoch": 14.96, - "learning_rate": 0.000419288954519861, - "loss": 0.5942, - "step": 61300 - }, - { - "epoch": 14.96, - "learning_rate": 0.00041925575539950493, - "loss": 0.6231, - "step": 61325 - }, - { - "epoch": 14.97, - "learning_rate": 0.00041922255627914885, - "loss": 0.6048, - "step": 61350 - }, - { - "epoch": 14.98, - "learning_rate": 0.00041918935715879276, - "loss": 0.5772, - "step": 61375 - }, - { - "epoch": 14.98, - "learning_rate": 0.0004191561580384366, - "loss": 0.6248, - "step": 61400 - }, - { - "epoch": 14.99, - "learning_rate": 0.0004191229589180805, - "loss": 0.6252, - "step": 61425 - }, - { - "epoch": 15.0, - "learning_rate": 0.0004190897597977244, - "loss": 0.6205, - "step": 61450 - }, - { - "epoch": 15.0, - "learning_rate": 0.0004190565606773683, - "loss": 0.5726, - "step": 61475 - }, - { - "epoch": 15.01, - "learning_rate": 0.0004190233615570122, - "loss": 0.5984, - "step": 61500 - }, - { - "epoch": 15.01, - "learning_rate": 0.0004189901624366561, - "loss": 0.5569, - "step": 61525 - }, - { - "epoch": 15.02, - "learning_rate": 0.00041895696331629994, - "loss": 0.6261, - "step": 61550 - }, - { - "epoch": 15.03, - "learning_rate": 0.00041892376419594386, - "loss": 0.5558, - "step": 61575 - }, - { - "epoch": 15.03, - "learning_rate": 0.00041889056507558777, - "loss": 0.5589, - "step": 61600 - }, - { - "epoch": 15.04, - "learning_rate": 0.0004188573659552317, - "loss": 0.6264, - "step": 61625 - }, - { - "epoch": 15.04, - "learning_rate": 0.00041882416683487555, - "loss": 0.5598, - "step": 61650 - }, - { - "epoch": 15.05, - "learning_rate": 0.0004187922956793337, - "loss": 0.5917, - "step": 61675 - }, - { - "epoch": 15.06, - "learning_rate": 0.0004187590965589776, - "loss": 0.6053, - "step": 61700 - }, - { - "epoch": 15.06, - "learning_rate": 0.0004187258974386215, - "loss": 0.5212, - "step": 61725 - }, - { - "epoch": 15.07, - "learning_rate": 0.0004186926983182653, - "loss": 0.6262, - "step": 61750 - }, - { - "epoch": 15.07, - "learning_rate": 0.00041865949919790924, - "loss": 0.5495, - "step": 61775 - }, - { - "epoch": 15.08, - "learning_rate": 0.00041862630007755315, - "loss": 0.6077, - "step": 61800 - }, - { - "epoch": 15.09, - "learning_rate": 0.00041859310095719707, - "loss": 0.5933, - "step": 61825 - }, - { - "epoch": 15.09, - "learning_rate": 0.0004185599018368409, - "loss": 0.5604, - "step": 61850 - }, - { - "epoch": 15.1, - "learning_rate": 0.00041852670271648484, - "loss": 0.5932, - "step": 61875 - }, - { - "epoch": 15.1, - "learning_rate": 0.0004184935035961287, - "loss": 0.5503, - "step": 61900 - }, - { - "epoch": 15.11, - "learning_rate": 0.0004184603044757726, - "loss": 0.5703, - "step": 61925 - }, - { - "epoch": 15.12, - "learning_rate": 0.0004184271053554165, - "loss": 0.5733, - "step": 61950 - }, - { - "epoch": 15.12, - "learning_rate": 0.0004183939062350604, - "loss": 0.5573, - "step": 61975 - }, - { - "epoch": 15.13, - "learning_rate": 0.0004183607071147043, - "loss": 0.598, - "step": 62000 - }, - { - "epoch": 15.14, - "learning_rate": 0.0004183275079943482, - "loss": 0.579, - "step": 62025 - }, - { - "epoch": 15.14, - "learning_rate": 0.0004182943088739921, - "loss": 0.572, - "step": 62050 - }, - { - "epoch": 15.15, - "learning_rate": 0.00041826110975363593, - "loss": 0.5451, - "step": 62075 - }, - { - "epoch": 15.15, - "learning_rate": 0.00041822791063327985, - "loss": 0.5816, - "step": 62100 - }, - { - "epoch": 15.16, - "learning_rate": 0.00041819471151292376, - "loss": 0.5448, - "step": 62125 - }, - { - "epoch": 15.17, - "learning_rate": 0.0004181615123925677, - "loss": 0.5673, - "step": 62150 - }, - { - "epoch": 15.17, - "learning_rate": 0.0004181283132722116, - "loss": 0.5592, - "step": 62175 - }, - { - "epoch": 15.18, - "learning_rate": 0.0004180951141518554, - "loss": 0.5821, - "step": 62200 - }, - { - "epoch": 15.18, - "learning_rate": 0.0004180619150314993, - "loss": 0.5912, - "step": 62225 - }, - { - "epoch": 15.19, - "learning_rate": 0.0004180287159111432, - "loss": 0.5935, - "step": 62250 - }, - { - "epoch": 15.2, - "learning_rate": 0.00041799551679078714, - "loss": 0.5177, - "step": 62275 - }, - { - "epoch": 15.2, - "learning_rate": 0.00041796231767043105, - "loss": 0.6028, - "step": 62300 - }, - { - "epoch": 15.21, - "learning_rate": 0.0004179291185500749, - "loss": 0.5421, - "step": 62325 - }, - { - "epoch": 15.21, - "learning_rate": 0.00041789591942971877, - "loss": 0.5825, - "step": 62350 - }, - { - "epoch": 15.22, - "learning_rate": 0.0004178627203093627, - "loss": 0.5568, - "step": 62375 - }, - { - "epoch": 15.23, - "learning_rate": 0.0004178295211890066, - "loss": 0.5786, - "step": 62400 - }, - { - "epoch": 15.23, - "learning_rate": 0.00041779632206865046, - "loss": 0.59, - "step": 62425 - }, - { - "epoch": 15.24, - "learning_rate": 0.00041776312294829437, - "loss": 0.5885, - "step": 62450 - }, - { - "epoch": 15.25, - "learning_rate": 0.0004177299238279383, - "loss": 0.5425, - "step": 62475 - }, - { - "epoch": 15.25, - "learning_rate": 0.00041769672470758215, - "loss": 0.5888, - "step": 62500 - }, - { - "epoch": 15.26, - "learning_rate": 0.00041766352558722606, - "loss": 0.5933, - "step": 62525 - }, - { - "epoch": 15.26, - "learning_rate": 0.0004176303264668699, - "loss": 0.5985, - "step": 62550 - }, - { - "epoch": 15.27, - "learning_rate": 0.00041759712734651383, - "loss": 0.5137, - "step": 62575 - }, - { - "epoch": 15.28, - "learning_rate": 0.00041756392822615775, - "loss": 0.5934, - "step": 62600 - }, - { - "epoch": 15.28, - "learning_rate": 0.00041753072910580166, - "loss": 0.5218, - "step": 62625 - }, - { - "epoch": 15.29, - "learning_rate": 0.00041749752998544547, - "loss": 0.6012, - "step": 62650 - }, - { - "epoch": 15.29, - "learning_rate": 0.0004174643308650894, - "loss": 0.6265, - "step": 62675 - }, - { - "epoch": 15.3, - "learning_rate": 0.0004174311317447333, - "loss": 0.5904, - "step": 62700 - }, - { - "epoch": 15.31, - "learning_rate": 0.0004173979326243772, - "loss": 0.582, - "step": 62725 - }, - { - "epoch": 15.31, - "learning_rate": 0.0004173647335040211, - "loss": 0.5837, - "step": 62750 - }, - { - "epoch": 15.32, - "learning_rate": 0.000417331534383665, - "loss": 0.5676, - "step": 62775 - }, - { - "epoch": 15.32, - "learning_rate": 0.00041729833526330884, - "loss": 0.5988, - "step": 62800 - }, - { - "epoch": 15.33, - "learning_rate": 0.00041726513614295276, - "loss": 0.5467, - "step": 62825 - }, - { - "epoch": 15.34, - "learning_rate": 0.00041723193702259667, - "loss": 0.5601, - "step": 62850 - }, - { - "epoch": 15.34, - "learning_rate": 0.00041719873790224053, - "loss": 0.5655, - "step": 62875 - }, - { - "epoch": 15.35, - "learning_rate": 0.00041716553878188444, - "loss": 0.5704, - "step": 62900 - }, - { - "epoch": 15.36, - "learning_rate": 0.00041713233966152836, - "loss": 0.555, - "step": 62925 - }, - { - "epoch": 15.36, - "learning_rate": 0.0004170991405411722, - "loss": 0.5744, - "step": 62950 - }, - { - "epoch": 15.37, - "learning_rate": 0.00041706594142081613, - "loss": 0.5445, - "step": 62975 - }, - { - "epoch": 15.37, - "learning_rate": 0.00041703274230046, - "loss": 0.5731, - "step": 63000 - }, - { - "epoch": 15.37, - "eval_cer": 0.12588421301191954, - "eval_loss": 0.44619035720825195, - "eval_runtime": 146.3854, - "eval_samples_per_second": 28.644, - "eval_steps_per_second": 7.166, - "eval_wer": 0.5028058727569331, - "step": 63000 - }, - { - "epoch": 15.38, - "learning_rate": 0.0004169995431801039, - "loss": 0.5442, - "step": 63025 - }, - { - "epoch": 15.39, - "learning_rate": 0.0004169663440597478, - "loss": 0.6078, - "step": 63050 - }, - { - "epoch": 15.39, - "learning_rate": 0.00041693314493939173, - "loss": 0.575, - "step": 63075 - }, - { - "epoch": 15.4, - "learning_rate": 0.00041689994581903554, - "loss": 0.5903, - "step": 63100 - }, - { - "epoch": 15.4, - "learning_rate": 0.00041686674669867945, - "loss": 0.5715, - "step": 63125 - }, - { - "epoch": 15.41, - "learning_rate": 0.00041683354757832337, - "loss": 0.6195, - "step": 63150 - }, - { - "epoch": 15.42, - "learning_rate": 0.0004168003484579673, - "loss": 0.5652, - "step": 63175 - }, - { - "epoch": 15.42, - "learning_rate": 0.0004167671493376112, - "loss": 0.5955, - "step": 63200 - }, - { - "epoch": 15.43, - "learning_rate": 0.00041673395021725506, - "loss": 0.5727, - "step": 63225 - }, - { - "epoch": 15.43, - "learning_rate": 0.0004167007510968989, - "loss": 0.6131, - "step": 63250 - }, - { - "epoch": 15.44, - "learning_rate": 0.00041666755197654283, - "loss": 0.5705, - "step": 63275 - }, - { - "epoch": 15.45, - "learning_rate": 0.00041663435285618674, - "loss": 0.6169, - "step": 63300 - }, - { - "epoch": 15.45, - "learning_rate": 0.0004166011537358306, - "loss": 0.6131, - "step": 63325 - }, - { - "epoch": 15.46, - "learning_rate": 0.0004165679546154745, - "loss": 0.5592, - "step": 63350 - }, - { - "epoch": 15.46, - "learning_rate": 0.00041653475549511843, - "loss": 0.5564, - "step": 63375 - }, - { - "epoch": 15.47, - "learning_rate": 0.0004165028843395766, - "loss": 0.5988, - "step": 63400 - }, - { - "epoch": 15.48, - "learning_rate": 0.0004164696852192205, - "loss": 0.5358, - "step": 63425 - }, - { - "epoch": 15.48, - "learning_rate": 0.0004164364860988643, - "loss": 0.5594, - "step": 63450 - }, - { - "epoch": 15.49, - "learning_rate": 0.0004164032869785082, - "loss": 0.5878, - "step": 63475 - }, - { - "epoch": 15.5, - "learning_rate": 0.0004163700878581521, - "loss": 0.606, - "step": 63500 - }, - { - "epoch": 15.5, - "learning_rate": 0.00041633688873779604, - "loss": 0.5355, - "step": 63525 - }, - { - "epoch": 15.51, - "learning_rate": 0.0004163036896174399, - "loss": 0.6155, - "step": 63550 - }, - { - "epoch": 15.51, - "learning_rate": 0.0004162704904970838, - "loss": 0.5276, - "step": 63575 - }, - { - "epoch": 15.52, - "learning_rate": 0.00041623729137672767, - "loss": 0.569, - "step": 63600 - }, - { - "epoch": 15.53, - "learning_rate": 0.0004162040922563716, - "loss": 0.5634, - "step": 63625 - }, - { - "epoch": 15.53, - "learning_rate": 0.0004161708931360155, - "loss": 0.5897, - "step": 63650 - }, - { - "epoch": 15.54, - "learning_rate": 0.00041613769401565936, - "loss": 0.5776, - "step": 63675 - }, - { - "epoch": 15.54, - "learning_rate": 0.00041610449489530327, - "loss": 0.5752, - "step": 63700 - }, - { - "epoch": 15.55, - "learning_rate": 0.0004160712957749472, - "loss": 0.5591, - "step": 63725 - }, - { - "epoch": 15.56, - "learning_rate": 0.00041603809665459105, - "loss": 0.6018, - "step": 63750 - }, - { - "epoch": 15.56, - "learning_rate": 0.0004160048975342349, - "loss": 0.5902, - "step": 63775 - }, - { - "epoch": 15.57, - "learning_rate": 0.0004159716984138788, - "loss": 0.5798, - "step": 63800 - }, - { - "epoch": 15.57, - "learning_rate": 0.00041593849929352273, - "loss": 0.5805, - "step": 63825 - }, - { - "epoch": 15.58, - "learning_rate": 0.00041590530017316665, - "loss": 0.5771, - "step": 63850 - }, - { - "epoch": 15.59, - "learning_rate": 0.00041587210105281056, - "loss": 0.5451, - "step": 63875 - }, - { - "epoch": 15.59, - "learning_rate": 0.00041583890193245437, - "loss": 0.5912, - "step": 63900 - }, - { - "epoch": 15.6, - "learning_rate": 0.0004158057028120983, - "loss": 0.5415, - "step": 63925 - }, - { - "epoch": 15.61, - "learning_rate": 0.0004157725036917422, - "loss": 0.5909, - "step": 63950 - }, - { - "epoch": 15.61, - "learning_rate": 0.0004157393045713861, - "loss": 0.6075, - "step": 63975 - }, - { - "epoch": 15.62, - "learning_rate": 0.00041570610545102997, - "loss": 0.5866, - "step": 64000 - }, - { - "epoch": 15.62, - "learning_rate": 0.0004156729063306739, - "loss": 0.548, - "step": 64025 - }, - { - "epoch": 15.63, - "learning_rate": 0.00041563970721031774, - "loss": 0.566, - "step": 64050 - }, - { - "epoch": 15.64, - "learning_rate": 0.00041560650808996166, - "loss": 0.5828, - "step": 64075 - }, - { - "epoch": 15.64, - "learning_rate": 0.00041557330896960557, - "loss": 0.6185, - "step": 64100 - }, - { - "epoch": 15.65, - "learning_rate": 0.00041554010984924943, - "loss": 0.5782, - "step": 64125 - }, - { - "epoch": 15.65, - "learning_rate": 0.00041550691072889334, - "loss": 0.6042, - "step": 64150 - }, - { - "epoch": 15.66, - "learning_rate": 0.00041547371160853726, - "loss": 0.5636, - "step": 64175 - }, - { - "epoch": 15.67, - "learning_rate": 0.0004154405124881811, - "loss": 0.6106, - "step": 64200 - }, - { - "epoch": 15.67, - "learning_rate": 0.000415407313367825, - "loss": 0.5675, - "step": 64225 - }, - { - "epoch": 15.68, - "learning_rate": 0.0004153741142474689, - "loss": 0.5768, - "step": 64250 - }, - { - "epoch": 15.68, - "learning_rate": 0.0004153409151271128, - "loss": 0.5954, - "step": 64275 - }, - { - "epoch": 15.69, - "learning_rate": 0.0004153077160067567, - "loss": 0.5635, - "step": 64300 - }, - { - "epoch": 15.7, - "learning_rate": 0.00041527451688640063, - "loss": 0.5603, - "step": 64325 - }, - { - "epoch": 15.7, - "learning_rate": 0.00041524131776604444, - "loss": 0.5893, - "step": 64350 - }, - { - "epoch": 15.71, - "learning_rate": 0.00041520811864568835, - "loss": 0.5608, - "step": 64375 - }, - { - "epoch": 15.71, - "learning_rate": 0.00041517491952533227, - "loss": 0.5534, - "step": 64400 - }, - { - "epoch": 15.72, - "learning_rate": 0.0004151417204049762, - "loss": 0.5961, - "step": 64425 - }, - { - "epoch": 15.73, - "learning_rate": 0.00041510852128462004, - "loss": 0.5614, - "step": 64450 - }, - { - "epoch": 15.73, - "learning_rate": 0.00041507532216426395, - "loss": 0.5431, - "step": 64475 - }, - { - "epoch": 15.74, - "learning_rate": 0.0004150421230439078, - "loss": 0.588, - "step": 64500 - }, - { - "epoch": 15.75, - "learning_rate": 0.00041500892392355173, - "loss": 0.616, - "step": 64525 - }, - { - "epoch": 15.75, - "learning_rate": 0.00041497572480319564, - "loss": 0.6145, - "step": 64550 - }, - { - "epoch": 15.76, - "learning_rate": 0.0004149425256828395, - "loss": 0.5783, - "step": 64575 - }, - { - "epoch": 15.76, - "learning_rate": 0.0004149093265624834, - "loss": 0.5769, - "step": 64600 - }, - { - "epoch": 15.77, - "learning_rate": 0.00041487612744212733, - "loss": 0.6041, - "step": 64625 - }, - { - "epoch": 15.78, - "learning_rate": 0.0004148429283217712, - "loss": 0.5768, - "step": 64650 - }, - { - "epoch": 15.78, - "learning_rate": 0.00041480972920141505, - "loss": 0.5923, - "step": 64675 - }, - { - "epoch": 15.79, - "learning_rate": 0.00041477653008105896, - "loss": 0.5551, - "step": 64700 - }, - { - "epoch": 15.79, - "learning_rate": 0.0004147433309607029, - "loss": 0.5495, - "step": 64725 - }, - { - "epoch": 15.8, - "learning_rate": 0.0004147101318403468, - "loss": 0.6238, - "step": 64750 - }, - { - "epoch": 15.81, - "learning_rate": 0.0004146769327199907, - "loss": 0.5442, - "step": 64775 - }, - { - "epoch": 15.81, - "learning_rate": 0.0004146437335996345, - "loss": 0.5986, - "step": 64800 - }, - { - "epoch": 15.82, - "learning_rate": 0.0004146105344792784, - "loss": 0.6223, - "step": 64825 - }, - { - "epoch": 15.82, - "learning_rate": 0.00041457733535892234, - "loss": 0.5737, - "step": 64850 - }, - { - "epoch": 15.83, - "learning_rate": 0.00041454413623856625, - "loss": 0.528, - "step": 64875 - }, - { - "epoch": 15.84, - "learning_rate": 0.00041451093711821017, - "loss": 0.615, - "step": 64900 - }, - { - "epoch": 15.84, - "learning_rate": 0.000414477737997854, - "loss": 0.5476, - "step": 64925 - }, - { - "epoch": 15.85, - "learning_rate": 0.0004144445388774979, - "loss": 0.603, - "step": 64950 - }, - { - "epoch": 15.86, - "learning_rate": 0.0004144113397571418, - "loss": 0.5325, - "step": 64975 - }, - { - "epoch": 15.86, - "learning_rate": 0.0004143781406367857, - "loss": 0.6006, - "step": 65000 - }, - { - "epoch": 15.87, - "learning_rate": 0.0004143449415164296, - "loss": 0.5636, - "step": 65025 - }, - { - "epoch": 15.87, - "learning_rate": 0.0004143117423960735, - "loss": 0.6104, - "step": 65050 - }, - { - "epoch": 15.88, - "learning_rate": 0.0004142785432757174, - "loss": 0.5742, - "step": 65075 - }, - { - "epoch": 15.89, - "learning_rate": 0.00041424534415536126, - "loss": 0.5944, - "step": 65100 - }, - { - "epoch": 15.89, - "learning_rate": 0.0004142121450350052, - "loss": 0.6145, - "step": 65125 - }, - { - "epoch": 15.9, - "learning_rate": 0.00041417894591464904, - "loss": 0.5822, - "step": 65150 - }, - { - "epoch": 15.9, - "learning_rate": 0.00041414574679429295, - "loss": 0.6058, - "step": 65175 - }, - { - "epoch": 15.91, - "learning_rate": 0.00041411254767393686, - "loss": 0.6146, - "step": 65200 - }, - { - "epoch": 15.92, - "learning_rate": 0.0004140793485535808, - "loss": 0.5819, - "step": 65225 - }, - { - "epoch": 15.92, - "learning_rate": 0.0004140461494332246, - "loss": 0.5744, - "step": 65250 - }, - { - "epoch": 15.93, - "learning_rate": 0.0004140129503128685, - "loss": 0.5917, - "step": 65275 - }, - { - "epoch": 15.93, - "learning_rate": 0.0004139797511925124, - "loss": 0.5648, - "step": 65300 - }, - { - "epoch": 15.94, - "learning_rate": 0.0004139465520721563, - "loss": 0.6056, - "step": 65325 - }, - { - "epoch": 15.95, - "learning_rate": 0.00041391335295180024, - "loss": 0.5887, - "step": 65350 - }, - { - "epoch": 15.95, - "learning_rate": 0.0004138801538314441, - "loss": 0.5744, - "step": 65375 - }, - { - "epoch": 15.96, - "learning_rate": 0.00041384695471108796, - "loss": 0.5921, - "step": 65400 - }, - { - "epoch": 15.97, - "learning_rate": 0.00041381375559073187, - "loss": 0.5323, - "step": 65425 - }, - { - "epoch": 15.97, - "learning_rate": 0.0004137805564703758, - "loss": 0.5728, - "step": 65450 - }, - { - "epoch": 15.98, - "learning_rate": 0.00041374735735001965, - "loss": 0.5658, - "step": 65475 - }, - { - "epoch": 15.98, - "learning_rate": 0.00041371415822966356, - "loss": 0.6099, - "step": 65500 - }, - { - "epoch": 15.99, - "learning_rate": 0.0004136809591093075, - "loss": 0.5746, - "step": 65525 - }, - { - "epoch": 16.0, - "learning_rate": 0.00041364775998895133, - "loss": 0.6292, - "step": 65550 - }, - { - "epoch": 16.0, - "learning_rate": 0.00041361456086859525, - "loss": 0.5792, - "step": 65575 - }, - { - "epoch": 16.01, - "learning_rate": 0.0004135813617482391, - "loss": 0.5845, - "step": 65600 - }, - { - "epoch": 16.01, - "learning_rate": 0.000413548162627883, - "loss": 0.5785, - "step": 65625 - }, - { - "epoch": 16.02, - "learning_rate": 0.00041351496350752694, - "loss": 0.5528, - "step": 65650 - }, - { - "epoch": 16.03, - "learning_rate": 0.00041348176438717085, - "loss": 0.5395, - "step": 65675 - }, - { - "epoch": 16.03, - "learning_rate": 0.00041344856526681466, - "loss": 0.5619, - "step": 65700 - }, - { - "epoch": 16.04, - "learning_rate": 0.00041341536614645857, - "loss": 0.5891, - "step": 65725 - }, - { - "epoch": 16.04, - "learning_rate": 0.0004133821670261025, - "loss": 0.5549, - "step": 65750 - }, - { - "epoch": 16.05, - "learning_rate": 0.0004133489679057464, - "loss": 0.5421, - "step": 65775 - }, - { - "epoch": 16.06, - "learning_rate": 0.0004133157687853903, - "loss": 0.5779, - "step": 65800 - }, - { - "epoch": 16.06, - "learning_rate": 0.00041328256966503417, - "loss": 0.5777, - "step": 65825 - }, - { - "epoch": 16.07, - "learning_rate": 0.00041324937054467803, - "loss": 0.5473, - "step": 65850 - }, - { - "epoch": 16.07, - "learning_rate": 0.00041321617142432194, - "loss": 0.5424, - "step": 65875 - }, - { - "epoch": 16.08, - "learning_rate": 0.00041318297230396586, - "loss": 0.5444, - "step": 65900 - }, - { - "epoch": 16.09, - "learning_rate": 0.0004131497731836097, - "loss": 0.5406, - "step": 65925 - }, - { - "epoch": 16.09, - "learning_rate": 0.00041311657406325363, - "loss": 0.5825, - "step": 65950 - }, - { - "epoch": 16.1, - "learning_rate": 0.0004130833749428975, - "loss": 0.5226, - "step": 65975 - }, - { - "epoch": 16.11, - "learning_rate": 0.0004130501758225414, - "loss": 0.5328, - "step": 66000 - }, - { - "epoch": 16.11, - "eval_cer": 0.12461115160724003, - "eval_loss": 0.45345035195350647, - "eval_runtime": 146.1861, - "eval_samples_per_second": 28.683, - "eval_steps_per_second": 7.176, - "eval_wer": 0.5022512234910277, - "step": 66000 - }, - { - "epoch": 16.11, - "learning_rate": 0.0004130169767021853, - "loss": 0.5759, - "step": 66025 - }, - { - "epoch": 16.12, - "learning_rate": 0.0004129837775818292, - "loss": 0.6023, - "step": 66050 - }, - { - "epoch": 16.12, - "learning_rate": 0.0004129505784614731, - "loss": 0.5949, - "step": 66075 - }, - { - "epoch": 16.13, - "learning_rate": 0.000412917379341117, - "loss": 0.5579, - "step": 66100 - }, - { - "epoch": 16.14, - "learning_rate": 0.00041288418022076087, - "loss": 0.5562, - "step": 66125 - }, - { - "epoch": 16.14, - "learning_rate": 0.0004128509811004048, - "loss": 0.5863, - "step": 66150 - }, - { - "epoch": 16.15, - "learning_rate": 0.00041281778198004864, - "loss": 0.5399, - "step": 66175 - }, - { - "epoch": 16.15, - "learning_rate": 0.00041278458285969256, - "loss": 0.5882, - "step": 66200 - }, - { - "epoch": 16.16, - "learning_rate": 0.00041275138373933647, - "loss": 0.5625, - "step": 66225 - }, - { - "epoch": 16.17, - "learning_rate": 0.0004127181846189804, - "loss": 0.5508, - "step": 66250 - }, - { - "epoch": 16.17, - "learning_rate": 0.0004126849854986242, - "loss": 0.5435, - "step": 66275 - }, - { - "epoch": 16.18, - "learning_rate": 0.0004126517863782681, - "loss": 0.5725, - "step": 66300 - }, - { - "epoch": 16.18, - "learning_rate": 0.000412618587257912, - "loss": 0.5654, - "step": 66325 - }, - { - "epoch": 16.19, - "learning_rate": 0.00041258538813755593, - "loss": 0.5876, - "step": 66350 - }, - { - "epoch": 16.2, - "learning_rate": 0.00041255218901719984, - "loss": 0.5763, - "step": 66375 - }, - { - "epoch": 16.2, - "learning_rate": 0.0004125189898968437, - "loss": 0.5609, - "step": 66400 - }, - { - "epoch": 16.21, - "learning_rate": 0.00041248579077648756, - "loss": 0.5789, - "step": 66425 - }, - { - "epoch": 16.22, - "learning_rate": 0.0004124525916561315, - "loss": 0.5859, - "step": 66450 - }, - { - "epoch": 16.22, - "learning_rate": 0.0004124193925357754, - "loss": 0.5816, - "step": 66475 - }, - { - "epoch": 16.23, - "learning_rate": 0.00041238619341541925, - "loss": 0.5813, - "step": 66500 - }, - { - "epoch": 16.23, - "learning_rate": 0.00041235299429506317, - "loss": 0.512, - "step": 66525 - }, - { - "epoch": 16.24, - "learning_rate": 0.0004123197951747071, - "loss": 0.5868, - "step": 66550 - }, - { - "epoch": 16.25, - "learning_rate": 0.00041228659605435094, - "loss": 0.5437, - "step": 66575 - }, - { - "epoch": 16.25, - "learning_rate": 0.00041225339693399485, - "loss": 0.5212, - "step": 66600 - }, - { - "epoch": 16.26, - "learning_rate": 0.0004122201978136387, - "loss": 0.542, - "step": 66625 - }, - { - "epoch": 16.26, - "learning_rate": 0.00041218699869328263, - "loss": 0.5695, - "step": 66650 - }, - { - "epoch": 16.27, - "learning_rate": 0.00041215379957292654, - "loss": 0.5057, - "step": 66675 - }, - { - "epoch": 16.28, - "learning_rate": 0.00041212060045257046, - "loss": 0.5713, - "step": 66700 - }, - { - "epoch": 16.28, - "learning_rate": 0.00041208740133221426, - "loss": 0.5371, - "step": 66725 - }, - { - "epoch": 16.29, - "learning_rate": 0.0004120542022118582, - "loss": 0.5522, - "step": 66750 - }, - { - "epoch": 16.29, - "learning_rate": 0.0004120210030915021, - "loss": 0.5789, - "step": 66775 - }, - { - "epoch": 16.3, - "learning_rate": 0.000411987803971146, - "loss": 0.5469, - "step": 66800 - }, - { - "epoch": 16.31, - "learning_rate": 0.0004119546048507899, - "loss": 0.5718, - "step": 66825 - }, - { - "epoch": 16.31, - "learning_rate": 0.0004119214057304338, - "loss": 0.5656, - "step": 66850 - }, - { - "epoch": 16.32, - "learning_rate": 0.00041188820661007764, - "loss": 0.5515, - "step": 66875 - }, - { - "epoch": 16.33, - "learning_rate": 0.00041185500748972155, - "loss": 0.5725, - "step": 66900 - }, - { - "epoch": 16.33, - "learning_rate": 0.00041182180836936546, - "loss": 0.5504, - "step": 66925 - }, - { - "epoch": 16.34, - "learning_rate": 0.0004117886092490093, - "loss": 0.5304, - "step": 66950 - }, - { - "epoch": 16.34, - "learning_rate": 0.00041175541012865324, - "loss": 0.5575, - "step": 66975 - }, - { - "epoch": 16.35, - "learning_rate": 0.00041172221100829715, - "loss": 0.5828, - "step": 67000 - }, - { - "epoch": 16.36, - "learning_rate": 0.000411689011887941, - "loss": 0.5903, - "step": 67025 - }, - { - "epoch": 16.36, - "learning_rate": 0.0004116558127675849, - "loss": 0.5894, - "step": 67050 - }, - { - "epoch": 16.37, - "learning_rate": 0.0004116226136472288, - "loss": 0.5657, - "step": 67075 - }, - { - "epoch": 16.37, - "learning_rate": 0.0004115894145268727, - "loss": 0.5672, - "step": 67100 - }, - { - "epoch": 16.38, - "learning_rate": 0.0004115562154065166, - "loss": 0.5476, - "step": 67125 - }, - { - "epoch": 16.39, - "learning_rate": 0.00041152301628616053, - "loss": 0.5779, - "step": 67150 - }, - { - "epoch": 16.39, - "learning_rate": 0.00041148981716580433, - "loss": 0.5328, - "step": 67175 - }, - { - "epoch": 16.4, - "learning_rate": 0.00041145661804544825, - "loss": 0.5777, - "step": 67200 - }, - { - "epoch": 16.4, - "learning_rate": 0.00041142341892509216, - "loss": 0.5645, - "step": 67225 - }, - { - "epoch": 16.41, - "learning_rate": 0.0004113902198047361, - "loss": 0.582, - "step": 67250 - }, - { - "epoch": 16.42, - "learning_rate": 0.00041135702068438, - "loss": 0.5448, - "step": 67275 - }, - { - "epoch": 16.42, - "learning_rate": 0.00041132382156402385, - "loss": 0.557, - "step": 67300 - }, - { - "epoch": 16.43, - "learning_rate": 0.0004112906224436677, - "loss": 0.5427, - "step": 67325 - }, - { - "epoch": 16.43, - "learning_rate": 0.0004112574233233116, - "loss": 0.553, - "step": 67350 - }, - { - "epoch": 16.44, - "learning_rate": 0.00041122422420295554, - "loss": 0.5965, - "step": 67375 - }, - { - "epoch": 16.45, - "learning_rate": 0.00041119102508259945, - "loss": 0.5488, - "step": 67400 - }, - { - "epoch": 16.45, - "learning_rate": 0.0004111578259622433, - "loss": 0.5309, - "step": 67425 - }, - { - "epoch": 16.46, - "learning_rate": 0.0004111246268418872, - "loss": 0.599, - "step": 67450 - }, - { - "epoch": 16.47, - "learning_rate": 0.0004110914277215311, - "loss": 0.5384, - "step": 67475 - }, - { - "epoch": 16.47, - "learning_rate": 0.000411058228601175, - "loss": 0.5998, - "step": 67500 - }, - { - "epoch": 16.48, - "learning_rate": 0.00041102502948081886, - "loss": 0.545, - "step": 67525 - }, - { - "epoch": 16.48, - "learning_rate": 0.00041099183036046277, - "loss": 0.5732, - "step": 67550 - }, - { - "epoch": 16.49, - "learning_rate": 0.0004109586312401067, - "loss": 0.5608, - "step": 67575 - }, - { - "epoch": 16.5, - "learning_rate": 0.0004109254321197506, - "loss": 0.5466, - "step": 67600 - }, - { - "epoch": 16.5, - "learning_rate": 0.00041089223299939446, - "loss": 0.5771, - "step": 67625 - }, - { - "epoch": 16.51, - "learning_rate": 0.0004108590338790383, - "loss": 0.5959, - "step": 67650 - }, - { - "epoch": 16.51, - "learning_rate": 0.00041082583475868223, - "loss": 0.5573, - "step": 67675 - }, - { - "epoch": 16.52, - "learning_rate": 0.00041079263563832615, - "loss": 0.5681, - "step": 67700 - }, - { - "epoch": 16.53, - "learning_rate": 0.00041075943651797006, - "loss": 0.5956, - "step": 67725 - }, - { - "epoch": 16.53, - "learning_rate": 0.0004107262373976139, - "loss": 0.5685, - "step": 67750 - }, - { - "epoch": 16.54, - "learning_rate": 0.0004106930382772578, - "loss": 0.5794, - "step": 67775 - }, - { - "epoch": 16.54, - "learning_rate": 0.0004106598391569017, - "loss": 0.5751, - "step": 67800 - }, - { - "epoch": 16.55, - "learning_rate": 0.0004106266400365456, - "loss": 0.5426, - "step": 67825 - }, - { - "epoch": 16.56, - "learning_rate": 0.0004105934409161895, - "loss": 0.5655, - "step": 67850 - }, - { - "epoch": 16.56, - "learning_rate": 0.0004105615697606476, - "loss": 0.5888, - "step": 67875 - }, - { - "epoch": 16.57, - "learning_rate": 0.0004105283706402915, - "loss": 0.5562, - "step": 67900 - }, - { - "epoch": 16.58, - "learning_rate": 0.00041049517151993544, - "loss": 0.5631, - "step": 67925 - }, - { - "epoch": 16.58, - "learning_rate": 0.00041046197239957935, - "loss": 0.563, - "step": 67950 - }, - { - "epoch": 16.59, - "learning_rate": 0.00041042877327922316, - "loss": 0.5945, - "step": 67975 - }, - { - "epoch": 16.59, - "learning_rate": 0.0004103955741588671, - "loss": 0.5984, - "step": 68000 - }, - { - "epoch": 16.6, - "learning_rate": 0.000410362375038511, - "loss": 0.5718, - "step": 68025 - }, - { - "epoch": 16.61, - "learning_rate": 0.0004103291759181549, - "loss": 0.5531, - "step": 68050 - }, - { - "epoch": 16.61, - "learning_rate": 0.00041029597679779876, - "loss": 0.5585, - "step": 68075 - }, - { - "epoch": 16.62, - "learning_rate": 0.0004102627776774427, - "loss": 0.6041, - "step": 68100 - }, - { - "epoch": 16.62, - "learning_rate": 0.00041022957855708654, - "loss": 0.5161, - "step": 68125 - }, - { - "epoch": 16.63, - "learning_rate": 0.00041019637943673045, - "loss": 0.576, - "step": 68150 - }, - { - "epoch": 16.64, - "learning_rate": 0.00041016318031637436, - "loss": 0.5904, - "step": 68175 - }, - { - "epoch": 16.64, - "learning_rate": 0.0004101299811960182, - "loss": 0.5504, - "step": 68200 - }, - { - "epoch": 16.65, - "learning_rate": 0.00041009678207566214, - "loss": 0.5495, - "step": 68225 - }, - { - "epoch": 16.65, - "learning_rate": 0.00041006358295530605, - "loss": 0.5813, - "step": 68250 - }, - { - "epoch": 16.66, - "learning_rate": 0.0004100303838349499, - "loss": 0.5604, - "step": 68275 - }, - { - "epoch": 16.67, - "learning_rate": 0.00040999718471459377, - "loss": 0.5899, - "step": 68300 - }, - { - "epoch": 16.67, - "learning_rate": 0.0004099639855942377, - "loss": 0.5665, - "step": 68325 - }, - { - "epoch": 16.68, - "learning_rate": 0.0004099307864738816, - "loss": 0.5539, - "step": 68350 - }, - { - "epoch": 16.68, - "learning_rate": 0.0004098975873535255, - "loss": 0.5938, - "step": 68375 - }, - { - "epoch": 16.69, - "learning_rate": 0.0004098643882331694, - "loss": 0.5765, - "step": 68400 - }, - { - "epoch": 16.7, - "learning_rate": 0.00040983118911281323, - "loss": 0.5873, - "step": 68425 - }, - { - "epoch": 16.7, - "learning_rate": 0.00040979798999245715, - "loss": 0.5986, - "step": 68450 - }, - { - "epoch": 16.71, - "learning_rate": 0.00040976479087210106, - "loss": 0.5746, - "step": 68475 - }, - { - "epoch": 16.72, - "learning_rate": 0.000409731591751745, - "loss": 0.5931, - "step": 68500 - }, - { - "epoch": 16.72, - "learning_rate": 0.0004096983926313889, - "loss": 0.5582, - "step": 68525 - }, - { - "epoch": 16.73, - "learning_rate": 0.00040966519351103275, - "loss": 0.5683, - "step": 68550 - }, - { - "epoch": 16.73, - "learning_rate": 0.0004096319943906766, - "loss": 0.5985, - "step": 68575 - }, - { - "epoch": 16.74, - "learning_rate": 0.0004095987952703205, - "loss": 0.5949, - "step": 68600 - }, - { - "epoch": 16.75, - "learning_rate": 0.00040956559614996444, - "loss": 0.5495, - "step": 68625 - }, - { - "epoch": 16.75, - "learning_rate": 0.0004095323970296083, - "loss": 0.5408, - "step": 68650 - }, - { - "epoch": 16.76, - "learning_rate": 0.0004094991979092522, - "loss": 0.5318, - "step": 68675 - }, - { - "epoch": 16.76, - "learning_rate": 0.0004094659987888961, - "loss": 0.5701, - "step": 68700 - }, - { - "epoch": 16.77, - "learning_rate": 0.00040943279966854, - "loss": 0.5707, - "step": 68725 - }, - { - "epoch": 16.78, - "learning_rate": 0.0004093996005481839, - "loss": 0.5885, - "step": 68750 - }, - { - "epoch": 16.78, - "learning_rate": 0.00040936640142782776, - "loss": 0.5422, - "step": 68775 - }, - { - "epoch": 16.79, - "learning_rate": 0.00040933320230747167, - "loss": 0.598, - "step": 68800 - }, - { - "epoch": 16.79, - "learning_rate": 0.0004093000031871156, - "loss": 0.5318, - "step": 68825 - }, - { - "epoch": 16.8, - "learning_rate": 0.0004092668040667595, - "loss": 0.5587, - "step": 68850 - }, - { - "epoch": 16.81, - "learning_rate": 0.0004092336049464033, - "loss": 0.5803, - "step": 68875 - }, - { - "epoch": 16.81, - "learning_rate": 0.0004092004058260472, - "loss": 0.5688, - "step": 68900 - }, - { - "epoch": 16.82, - "learning_rate": 0.00040916720670569113, - "loss": 0.5538, - "step": 68925 - }, - { - "epoch": 16.83, - "learning_rate": 0.00040913400758533505, - "loss": 0.58, - "step": 68950 - }, - { - "epoch": 16.83, - "learning_rate": 0.00040910080846497896, - "loss": 0.5765, - "step": 68975 - }, - { - "epoch": 16.84, - "learning_rate": 0.0004090676093446228, - "loss": 0.5743, - "step": 69000 - }, - { - "epoch": 16.84, - "eval_cer": 0.1254632814184368, - "eval_loss": 0.45550015568733215, - "eval_runtime": 147.0347, - "eval_samples_per_second": 28.517, - "eval_steps_per_second": 7.134, - "eval_wer": 0.5069168026101142, - "step": 69000 - }, - { - "epoch": 16.84, - "learning_rate": 0.0004090344102242667, - "loss": 0.518, - "step": 69025 - }, - { - "epoch": 16.85, - "learning_rate": 0.0004090012111039106, - "loss": 0.5542, - "step": 69050 - }, - { - "epoch": 16.86, - "learning_rate": 0.0004089680119835545, - "loss": 0.5315, - "step": 69075 - }, - { - "epoch": 16.86, - "learning_rate": 0.00040893481286319837, - "loss": 0.5702, - "step": 69100 - }, - { - "epoch": 16.87, - "learning_rate": 0.0004089016137428423, - "loss": 0.5372, - "step": 69125 - }, - { - "epoch": 16.87, - "learning_rate": 0.0004088684146224862, - "loss": 0.5451, - "step": 69150 - }, - { - "epoch": 16.88, - "learning_rate": 0.00040883521550213006, - "loss": 0.5251, - "step": 69175 - }, - { - "epoch": 16.89, - "learning_rate": 0.00040880201638177397, - "loss": 0.5762, - "step": 69200 - }, - { - "epoch": 16.89, - "learning_rate": 0.00040876881726141783, - "loss": 0.5446, - "step": 69225 - }, - { - "epoch": 16.9, - "learning_rate": 0.00040873561814106174, - "loss": 0.5725, - "step": 69250 - }, - { - "epoch": 16.9, - "learning_rate": 0.00040870241902070566, - "loss": 0.5888, - "step": 69275 - }, - { - "epoch": 16.91, - "learning_rate": 0.00040866921990034957, - "loss": 0.5712, - "step": 69300 - }, - { - "epoch": 16.92, - "learning_rate": 0.0004086360207799934, - "loss": 0.6126, - "step": 69325 - }, - { - "epoch": 16.92, - "learning_rate": 0.0004086028216596373, - "loss": 0.5406, - "step": 69350 - }, - { - "epoch": 16.93, - "learning_rate": 0.0004085696225392812, - "loss": 0.5716, - "step": 69375 - }, - { - "epoch": 16.94, - "learning_rate": 0.0004085364234189251, - "loss": 0.5786, - "step": 69400 - }, - { - "epoch": 16.94, - "learning_rate": 0.00040850322429856903, - "loss": 0.5627, - "step": 69425 - }, - { - "epoch": 16.95, - "learning_rate": 0.0004084700251782129, - "loss": 0.565, - "step": 69450 - }, - { - "epoch": 16.95, - "learning_rate": 0.00040843682605785675, - "loss": 0.55, - "step": 69475 - }, - { - "epoch": 16.96, - "learning_rate": 0.00040840362693750067, - "loss": 0.591, - "step": 69500 - }, - { - "epoch": 16.97, - "learning_rate": 0.0004083704278171446, - "loss": 0.5239, - "step": 69525 - }, - { - "epoch": 16.97, - "learning_rate": 0.00040833722869678844, - "loss": 0.5663, - "step": 69550 - }, - { - "epoch": 16.98, - "learning_rate": 0.00040830402957643235, - "loss": 0.5758, - "step": 69575 - }, - { - "epoch": 16.98, - "learning_rate": 0.00040827083045607627, - "loss": 0.5516, - "step": 69600 - }, - { - "epoch": 16.99, - "learning_rate": 0.00040823763133572013, - "loss": 0.5874, - "step": 69625 - }, - { - "epoch": 17.0, - "learning_rate": 0.00040820443221536404, - "loss": 0.5773, - "step": 69650 - }, - { - "epoch": 17.0, - "learning_rate": 0.00040817256105982213, - "loss": 0.6173, - "step": 69675 - }, - { - "epoch": 17.01, - "learning_rate": 0.00040813936193946605, - "loss": 0.5685, - "step": 69700 - }, - { - "epoch": 17.01, - "learning_rate": 0.00040810616281910996, - "loss": 0.5947, - "step": 69725 - }, - { - "epoch": 17.02, - "learning_rate": 0.0004080729636987539, - "loss": 0.5506, - "step": 69750 - }, - { - "epoch": 17.03, - "learning_rate": 0.00040803976457839773, - "loss": 0.5246, - "step": 69775 - }, - { - "epoch": 17.03, - "learning_rate": 0.00040800656545804165, - "loss": 0.5586, - "step": 69800 - }, - { - "epoch": 17.04, - "learning_rate": 0.0004079733663376855, - "loss": 0.5482, - "step": 69825 - }, - { - "epoch": 17.04, - "learning_rate": 0.0004079401672173294, - "loss": 0.5213, - "step": 69850 - }, - { - "epoch": 17.05, - "learning_rate": 0.00040790696809697333, - "loss": 0.578, - "step": 69875 - }, - { - "epoch": 17.06, - "learning_rate": 0.0004078737689766172, - "loss": 0.5675, - "step": 69900 - }, - { - "epoch": 17.06, - "learning_rate": 0.0004078405698562611, - "loss": 0.5336, - "step": 69925 - }, - { - "epoch": 17.07, - "learning_rate": 0.000407807370735905, - "loss": 0.549, - "step": 69950 - }, - { - "epoch": 17.08, - "learning_rate": 0.0004077741716155489, - "loss": 0.5888, - "step": 69975 - }, - { - "epoch": 17.08, - "learning_rate": 0.00040774097249519274, - "loss": 0.546, - "step": 70000 - }, - { - "epoch": 17.09, - "learning_rate": 0.00040770777337483666, - "loss": 0.5392, - "step": 70025 - }, - { - "epoch": 17.09, - "learning_rate": 0.00040767457425448057, - "loss": 0.5331, - "step": 70050 - }, - { - "epoch": 17.1, - "learning_rate": 0.0004076413751341245, - "loss": 0.4992, - "step": 70075 - }, - { - "epoch": 17.11, - "learning_rate": 0.0004076081760137684, - "loss": 0.5935, - "step": 70100 - }, - { - "epoch": 17.11, - "learning_rate": 0.0004075749768934122, - "loss": 0.5448, - "step": 70125 - }, - { - "epoch": 17.12, - "learning_rate": 0.0004075417777730561, - "loss": 0.5383, - "step": 70150 - }, - { - "epoch": 17.12, - "learning_rate": 0.00040750857865270003, - "loss": 0.5574, - "step": 70175 - }, - { - "epoch": 17.13, - "learning_rate": 0.00040747537953234395, - "loss": 0.5287, - "step": 70200 - }, - { - "epoch": 17.14, - "learning_rate": 0.0004074421804119878, - "loss": 0.5176, - "step": 70225 - }, - { - "epoch": 17.14, - "learning_rate": 0.0004074089812916317, - "loss": 0.514, - "step": 70250 - }, - { - "epoch": 17.15, - "learning_rate": 0.0004073757821712756, - "loss": 0.5223, - "step": 70275 - }, - { - "epoch": 17.15, - "learning_rate": 0.0004073425830509195, - "loss": 0.5599, - "step": 70300 - }, - { - "epoch": 17.16, - "learning_rate": 0.0004073093839305634, - "loss": 0.5492, - "step": 70325 - }, - { - "epoch": 17.17, - "learning_rate": 0.00040727618481020727, - "loss": 0.5432, - "step": 70350 - }, - { - "epoch": 17.17, - "learning_rate": 0.0004072429856898512, - "loss": 0.5706, - "step": 70375 - }, - { - "epoch": 17.18, - "learning_rate": 0.0004072097865694951, - "loss": 0.5642, - "step": 70400 - }, - { - "epoch": 17.19, - "learning_rate": 0.00040717658744913895, - "loss": 0.5706, - "step": 70425 - }, - { - "epoch": 17.19, - "learning_rate": 0.0004071433883287828, - "loss": 0.4991, - "step": 70450 - }, - { - "epoch": 17.2, - "learning_rate": 0.00040711018920842673, - "loss": 0.5495, - "step": 70475 - }, - { - "epoch": 17.2, - "learning_rate": 0.00040707699008807064, - "loss": 0.5227, - "step": 70500 - }, - { - "epoch": 17.21, - "learning_rate": 0.00040704379096771456, - "loss": 0.5789, - "step": 70525 - }, - { - "epoch": 17.22, - "learning_rate": 0.00040701059184735847, - "loss": 0.5442, - "step": 70550 - }, - { - "epoch": 17.22, - "learning_rate": 0.0004069773927270023, - "loss": 0.5567, - "step": 70575 - }, - { - "epoch": 17.23, - "learning_rate": 0.0004069441936066462, - "loss": 0.5408, - "step": 70600 - }, - { - "epoch": 17.23, - "learning_rate": 0.0004069109944862901, - "loss": 0.557, - "step": 70625 - }, - { - "epoch": 17.24, - "learning_rate": 0.000406877795365934, - "loss": 0.5338, - "step": 70650 - }, - { - "epoch": 17.25, - "learning_rate": 0.0004068445962455779, - "loss": 0.5138, - "step": 70675 - }, - { - "epoch": 17.25, - "learning_rate": 0.0004068113971252218, - "loss": 0.5655, - "step": 70700 - }, - { - "epoch": 17.26, - "learning_rate": 0.00040677819800486565, - "loss": 0.5419, - "step": 70725 - }, - { - "epoch": 17.26, - "learning_rate": 0.00040674499888450956, - "loss": 0.5177, - "step": 70750 - }, - { - "epoch": 17.27, - "learning_rate": 0.0004067117997641535, - "loss": 0.5388, - "step": 70775 - }, - { - "epoch": 17.28, - "learning_rate": 0.00040667860064379734, - "loss": 0.5382, - "step": 70800 - }, - { - "epoch": 17.28, - "learning_rate": 0.00040664540152344125, - "loss": 0.5697, - "step": 70825 - }, - { - "epoch": 17.29, - "learning_rate": 0.00040661220240308517, - "loss": 0.5452, - "step": 70850 - }, - { - "epoch": 17.3, - "learning_rate": 0.000406579003282729, - "loss": 0.5611, - "step": 70875 - }, - { - "epoch": 17.3, - "learning_rate": 0.0004065458041623729, - "loss": 0.5321, - "step": 70900 - }, - { - "epoch": 17.31, - "learning_rate": 0.0004065126050420168, - "loss": 0.546, - "step": 70925 - }, - { - "epoch": 17.31, - "learning_rate": 0.0004064794059216607, - "loss": 0.5901, - "step": 70950 - }, - { - "epoch": 17.32, - "learning_rate": 0.00040644620680130463, - "loss": 0.5018, - "step": 70975 - }, - { - "epoch": 17.33, - "learning_rate": 0.00040641300768094854, - "loss": 0.5433, - "step": 71000 - }, - { - "epoch": 17.33, - "learning_rate": 0.00040637980856059235, - "loss": 0.5856, - "step": 71025 - }, - { - "epoch": 17.34, - "learning_rate": 0.00040634660944023626, - "loss": 0.5445, - "step": 71050 - }, - { - "epoch": 17.34, - "learning_rate": 0.0004063134103198802, - "loss": 0.5376, - "step": 71075 - }, - { - "epoch": 17.35, - "learning_rate": 0.0004062802111995241, - "loss": 0.5303, - "step": 71100 - }, - { - "epoch": 17.36, - "learning_rate": 0.000406247012079168, - "loss": 0.5202, - "step": 71125 - }, - { - "epoch": 17.36, - "learning_rate": 0.00040621381295881186, - "loss": 0.5504, - "step": 71150 - }, - { - "epoch": 17.37, - "learning_rate": 0.0004061806138384557, - "loss": 0.5456, - "step": 71175 - }, - { - "epoch": 17.37, - "learning_rate": 0.00040614741471809964, - "loss": 0.565, - "step": 71200 - }, - { - "epoch": 17.38, - "learning_rate": 0.00040611421559774355, - "loss": 0.5316, - "step": 71225 - }, - { - "epoch": 17.39, - "learning_rate": 0.0004060810164773874, - "loss": 0.5479, - "step": 71250 - }, - { - "epoch": 17.39, - "learning_rate": 0.0004060478173570313, - "loss": 0.5441, - "step": 71275 - }, - { - "epoch": 17.4, - "learning_rate": 0.00040601461823667524, - "loss": 0.5295, - "step": 71300 - }, - { - "epoch": 17.4, - "learning_rate": 0.0004059814191163191, - "loss": 0.5384, - "step": 71325 - }, - { - "epoch": 17.41, - "learning_rate": 0.000405948219995963, - "loss": 0.5691, - "step": 71350 - }, - { - "epoch": 17.42, - "learning_rate": 0.00040591502087560687, - "loss": 0.6323, - "step": 71375 - }, - { - "epoch": 17.42, - "learning_rate": 0.0004058818217552508, - "loss": 0.584, - "step": 71400 - }, - { - "epoch": 17.43, - "learning_rate": 0.0004058486226348947, - "loss": 0.5904, - "step": 71425 - }, - { - "epoch": 17.44, - "learning_rate": 0.00040581542351453856, - "loss": 0.56, - "step": 71450 - }, - { - "epoch": 17.44, - "learning_rate": 0.0004057822243941824, - "loss": 0.5599, - "step": 71475 - }, - { - "epoch": 17.45, - "learning_rate": 0.00040574902527382633, - "loss": 0.5294, - "step": 71500 - }, - { - "epoch": 17.45, - "learning_rate": 0.00040571582615347025, - "loss": 0.5451, - "step": 71525 - }, - { - "epoch": 17.46, - "learning_rate": 0.00040568262703311416, - "loss": 0.5828, - "step": 71550 - }, - { - "epoch": 17.47, - "learning_rate": 0.0004056494279127581, - "loss": 0.5037, - "step": 71575 - }, - { - "epoch": 17.47, - "learning_rate": 0.0004056162287924019, - "loss": 0.5308, - "step": 71600 - }, - { - "epoch": 17.48, - "learning_rate": 0.0004055830296720458, - "loss": 0.5456, - "step": 71625 - }, - { - "epoch": 17.48, - "learning_rate": 0.0004055498305516897, - "loss": 0.5405, - "step": 71650 - }, - { - "epoch": 17.49, - "learning_rate": 0.0004055166314313336, - "loss": 0.5725, - "step": 71675 - }, - { - "epoch": 17.5, - "learning_rate": 0.0004054834323109775, - "loss": 0.5379, - "step": 71700 - }, - { - "epoch": 17.5, - "learning_rate": 0.0004054502331906214, - "loss": 0.5498, - "step": 71725 - }, - { - "epoch": 17.51, - "learning_rate": 0.00040541703407026526, - "loss": 0.5228, - "step": 71750 - }, - { - "epoch": 17.51, - "learning_rate": 0.00040538383494990917, - "loss": 0.5078, - "step": 71775 - }, - { - "epoch": 17.52, - "learning_rate": 0.0004053506358295531, - "loss": 0.5552, - "step": 71800 - }, - { - "epoch": 17.53, - "learning_rate": 0.00040531743670919694, - "loss": 0.574, - "step": 71825 - }, - { - "epoch": 17.53, - "learning_rate": 0.00040528423758884086, - "loss": 0.5456, - "step": 71850 - }, - { - "epoch": 17.54, - "learning_rate": 0.00040525103846848477, - "loss": 0.5166, - "step": 71875 - }, - { - "epoch": 17.55, - "learning_rate": 0.00040521783934812863, - "loss": 0.5637, - "step": 71900 - }, - { - "epoch": 17.55, - "learning_rate": 0.0004051846402277725, - "loss": 0.5762, - "step": 71925 - }, - { - "epoch": 17.56, - "learning_rate": 0.0004051514411074164, - "loss": 0.5937, - "step": 71950 - }, - { - "epoch": 17.56, - "learning_rate": 0.0004051182419870603, - "loss": 0.5883, - "step": 71975 - }, - { - "epoch": 17.57, - "learning_rate": 0.00040508504286670423, - "loss": 0.5363, - "step": 72000 - }, - { - "epoch": 17.57, - "eval_cer": 0.12136176503803785, - "eval_loss": 0.4388948678970337, - "eval_runtime": 147.1784, - "eval_samples_per_second": 28.489, - "eval_steps_per_second": 7.127, - "eval_wer": 0.49148450244698205, - "step": 72000 - }, - { - "epoch": 17.58, - "learning_rate": 0.00040505184374634815, - "loss": 0.532, - "step": 72025 - }, - { - "epoch": 17.58, - "learning_rate": 0.00040501864462599195, - "loss": 0.5279, - "step": 72050 - }, - { - "epoch": 17.59, - "learning_rate": 0.00040498544550563587, - "loss": 0.5578, - "step": 72075 - }, - { - "epoch": 17.59, - "learning_rate": 0.0004049522463852798, - "loss": 0.5357, - "step": 72100 - }, - { - "epoch": 17.6, - "learning_rate": 0.0004049190472649237, - "loss": 0.5405, - "step": 72125 - }, - { - "epoch": 17.61, - "learning_rate": 0.00040488584814456755, - "loss": 0.5273, - "step": 72150 - }, - { - "epoch": 17.61, - "learning_rate": 0.00040485264902421147, - "loss": 0.5772, - "step": 72175 - }, - { - "epoch": 17.62, - "learning_rate": 0.00040481944990385533, - "loss": 0.5308, - "step": 72200 - }, - { - "epoch": 17.62, - "learning_rate": 0.00040478625078349924, - "loss": 0.5678, - "step": 72225 - }, - { - "epoch": 17.63, - "learning_rate": 0.00040475305166314316, - "loss": 0.5161, - "step": 72250 - }, - { - "epoch": 17.64, - "learning_rate": 0.000404719852542787, - "loss": 0.5953, - "step": 72275 - }, - { - "epoch": 17.64, - "learning_rate": 0.00040468665342243093, - "loss": 0.5763, - "step": 72300 - }, - { - "epoch": 17.65, - "learning_rate": 0.00040465345430207484, - "loss": 0.545, - "step": 72325 - }, - { - "epoch": 17.65, - "learning_rate": 0.0004046202551817187, - "loss": 0.5738, - "step": 72350 - }, - { - "epoch": 17.66, - "learning_rate": 0.00040458705606136256, - "loss": 0.5208, - "step": 72375 - }, - { - "epoch": 17.67, - "learning_rate": 0.0004045538569410065, - "loss": 0.538, - "step": 72400 - }, - { - "epoch": 17.67, - "learning_rate": 0.0004045206578206504, - "loss": 0.5776, - "step": 72425 - }, - { - "epoch": 17.68, - "learning_rate": 0.0004044874587002943, - "loss": 0.5831, - "step": 72450 - }, - { - "epoch": 17.69, - "learning_rate": 0.0004044542595799382, - "loss": 0.5136, - "step": 72475 - }, - { - "epoch": 17.69, - "learning_rate": 0.000404421060459582, - "loss": 0.5116, - "step": 72500 - }, - { - "epoch": 17.7, - "learning_rate": 0.00040438786133922594, - "loss": 0.5752, - "step": 72525 - }, - { - "epoch": 17.7, - "learning_rate": 0.00040435466221886985, - "loss": 0.5525, - "step": 72550 - }, - { - "epoch": 17.71, - "learning_rate": 0.00040432146309851377, - "loss": 0.5546, - "step": 72575 - }, - { - "epoch": 17.72, - "learning_rate": 0.0004042882639781577, - "loss": 0.5408, - "step": 72600 - }, - { - "epoch": 17.72, - "learning_rate": 0.00040425506485780154, - "loss": 0.5833, - "step": 72625 - }, - { - "epoch": 17.73, - "learning_rate": 0.0004042218657374454, - "loss": 0.565, - "step": 72650 - }, - { - "epoch": 17.73, - "learning_rate": 0.0004041886666170893, - "loss": 0.5366, - "step": 72675 - }, - { - "epoch": 17.74, - "learning_rate": 0.00040415546749673323, - "loss": 0.5232, - "step": 72700 - }, - { - "epoch": 17.75, - "learning_rate": 0.0004041222683763771, - "loss": 0.5818, - "step": 72725 - }, - { - "epoch": 17.75, - "learning_rate": 0.000404089069256021, - "loss": 0.541, - "step": 72750 - }, - { - "epoch": 17.76, - "learning_rate": 0.0004040558701356649, - "loss": 0.5453, - "step": 72775 - }, - { - "epoch": 17.76, - "learning_rate": 0.0004040226710153088, - "loss": 0.5412, - "step": 72800 - }, - { - "epoch": 17.77, - "learning_rate": 0.0004039894718949527, - "loss": 0.5513, - "step": 72825 - }, - { - "epoch": 17.78, - "learning_rate": 0.00040395627277459655, - "loss": 0.5736, - "step": 72850 - }, - { - "epoch": 17.78, - "learning_rate": 0.00040392307365424046, - "loss": 0.5623, - "step": 72875 - }, - { - "epoch": 17.79, - "learning_rate": 0.0004038898745338844, - "loss": 0.5901, - "step": 72900 - }, - { - "epoch": 17.8, - "learning_rate": 0.0004038566754135283, - "loss": 0.5831, - "step": 72925 - }, - { - "epoch": 17.8, - "learning_rate": 0.0004038234762931721, - "loss": 0.5359, - "step": 72950 - }, - { - "epoch": 17.81, - "learning_rate": 0.000403790277172816, - "loss": 0.6014, - "step": 72975 - }, - { - "epoch": 17.81, - "learning_rate": 0.0004037570780524599, - "loss": 0.5446, - "step": 73000 - }, - { - "epoch": 17.82, - "learning_rate": 0.00040372387893210384, - "loss": 0.4802, - "step": 73025 - }, - { - "epoch": 17.83, - "learning_rate": 0.00040369067981174775, - "loss": 0.5288, - "step": 73050 - }, - { - "epoch": 17.83, - "learning_rate": 0.0004036574806913916, - "loss": 0.5275, - "step": 73075 - }, - { - "epoch": 17.84, - "learning_rate": 0.0004036242815710355, - "loss": 0.5719, - "step": 73100 - }, - { - "epoch": 17.84, - "learning_rate": 0.0004035910824506794, - "loss": 0.5496, - "step": 73125 - }, - { - "epoch": 17.85, - "learning_rate": 0.0004035578833303233, - "loss": 0.5475, - "step": 73150 - }, - { - "epoch": 17.86, - "learning_rate": 0.00040352468420996716, - "loss": 0.5142, - "step": 73175 - }, - { - "epoch": 17.86, - "learning_rate": 0.0004034914850896111, - "loss": 0.5324, - "step": 73200 - }, - { - "epoch": 17.87, - "learning_rate": 0.000403458285969255, - "loss": 0.5521, - "step": 73225 - }, - { - "epoch": 17.87, - "learning_rate": 0.00040342508684889885, - "loss": 0.546, - "step": 73250 - }, - { - "epoch": 17.88, - "learning_rate": 0.00040339188772854276, - "loss": 0.5351, - "step": 73275 - }, - { - "epoch": 17.89, - "learning_rate": 0.0004033586886081866, - "loss": 0.5669, - "step": 73300 - }, - { - "epoch": 17.89, - "learning_rate": 0.00040332548948783054, - "loss": 0.5633, - "step": 73325 - }, - { - "epoch": 17.9, - "learning_rate": 0.00040329229036747445, - "loss": 0.5263, - "step": 73350 - }, - { - "epoch": 17.91, - "learning_rate": 0.00040325909124711836, - "loss": 0.5618, - "step": 73375 - }, - { - "epoch": 17.91, - "learning_rate": 0.00040322589212676217, - "loss": 0.545, - "step": 73400 - }, - { - "epoch": 17.92, - "learning_rate": 0.0004031926930064061, - "loss": 0.5756, - "step": 73425 - }, - { - "epoch": 17.92, - "learning_rate": 0.00040315949388605, - "loss": 0.565, - "step": 73450 - }, - { - "epoch": 17.93, - "learning_rate": 0.0004031262947656939, - "loss": 0.5497, - "step": 73475 - }, - { - "epoch": 17.94, - "learning_rate": 0.0004030930956453378, - "loss": 0.558, - "step": 73500 - }, - { - "epoch": 17.94, - "learning_rate": 0.0004030598965249817, - "loss": 0.5668, - "step": 73525 - }, - { - "epoch": 17.95, - "learning_rate": 0.00040302669740462555, - "loss": 0.5363, - "step": 73550 - }, - { - "epoch": 17.95, - "learning_rate": 0.00040299349828426946, - "loss": 0.5227, - "step": 73575 - }, - { - "epoch": 17.96, - "learning_rate": 0.0004029602991639134, - "loss": 0.5817, - "step": 73600 - }, - { - "epoch": 17.97, - "learning_rate": 0.00040292710004355723, - "loss": 0.557, - "step": 73625 - }, - { - "epoch": 17.97, - "learning_rate": 0.00040289390092320115, - "loss": 0.5853, - "step": 73650 - }, - { - "epoch": 17.98, - "learning_rate": 0.00040286070180284506, - "loss": 0.5487, - "step": 73675 - }, - { - "epoch": 17.98, - "learning_rate": 0.0004028275026824889, - "loss": 0.6219, - "step": 73700 - }, - { - "epoch": 17.99, - "learning_rate": 0.00040279430356213283, - "loss": 0.5515, - "step": 73725 - }, - { - "epoch": 18.0, - "learning_rate": 0.0004027611044417767, - "loss": 0.5403, - "step": 73750 - }, - { - "epoch": 18.0, - "learning_rate": 0.0004027279053214206, - "loss": 0.5723, - "step": 73775 - }, - { - "epoch": 18.01, - "learning_rate": 0.0004026947062010645, - "loss": 0.5326, - "step": 73800 - }, - { - "epoch": 18.01, - "learning_rate": 0.00040266150708070844, - "loss": 0.5321, - "step": 73825 - }, - { - "epoch": 18.02, - "learning_rate": 0.0004026283079603523, - "loss": 0.4971, - "step": 73850 - }, - { - "epoch": 18.03, - "learning_rate": 0.00040259510883999616, - "loss": 0.517, - "step": 73875 - }, - { - "epoch": 18.03, - "learning_rate": 0.00040256190971964007, - "loss": 0.4976, - "step": 73900 - }, - { - "epoch": 18.04, - "learning_rate": 0.000402528710599284, - "loss": 0.5843, - "step": 73925 - }, - { - "epoch": 18.05, - "learning_rate": 0.0004024955114789279, - "loss": 0.5477, - "step": 73950 - }, - { - "epoch": 18.05, - "learning_rate": 0.00040246231235857176, - "loss": 0.5345, - "step": 73975 - }, - { - "epoch": 18.06, - "learning_rate": 0.0004024291132382156, - "loss": 0.5536, - "step": 74000 - }, - { - "epoch": 18.06, - "learning_rate": 0.00040239591411785953, - "loss": 0.5754, - "step": 74025 - }, - { - "epoch": 18.07, - "learning_rate": 0.00040236271499750345, - "loss": 0.5296, - "step": 74050 - }, - { - "epoch": 18.08, - "learning_rate": 0.00040232951587714736, - "loss": 0.5145, - "step": 74075 - }, - { - "epoch": 18.08, - "learning_rate": 0.0004022963167567912, - "loss": 0.5274, - "step": 74100 - }, - { - "epoch": 18.09, - "learning_rate": 0.00040226311763643513, - "loss": 0.5229, - "step": 74125 - }, - { - "epoch": 18.09, - "learning_rate": 0.000402229918516079, - "loss": 0.489, - "step": 74150 - }, - { - "epoch": 18.1, - "learning_rate": 0.0004021967193957229, - "loss": 0.5586, - "step": 74175 - }, - { - "epoch": 18.11, - "learning_rate": 0.00040216352027536677, - "loss": 0.5578, - "step": 74200 - }, - { - "epoch": 18.11, - "learning_rate": 0.0004021303211550107, - "loss": 0.5274, - "step": 74225 - }, - { - "epoch": 18.12, - "learning_rate": 0.0004020971220346546, - "loss": 0.5554, - "step": 74250 - }, - { - "epoch": 18.12, - "learning_rate": 0.0004020639229142985, - "loss": 0.5502, - "step": 74275 - }, - { - "epoch": 18.13, - "learning_rate": 0.00040203072379394237, - "loss": 0.5322, - "step": 74300 - }, - { - "epoch": 18.14, - "learning_rate": 0.00040199752467358623, - "loss": 0.4957, - "step": 74325 - }, - { - "epoch": 18.14, - "learning_rate": 0.00040196432555323014, - "loss": 0.483, - "step": 74350 - }, - { - "epoch": 18.15, - "learning_rate": 0.00040193112643287406, - "loss": 0.5155, - "step": 74375 - }, - { - "epoch": 18.16, - "learning_rate": 0.00040189792731251797, - "loss": 0.5262, - "step": 74400 - }, - { - "epoch": 18.16, - "learning_rate": 0.00040186472819216183, - "loss": 0.5277, - "step": 74425 - }, - { - "epoch": 18.17, - "learning_rate": 0.0004018315290718057, - "loss": 0.5151, - "step": 74450 - }, - { - "epoch": 18.17, - "learning_rate": 0.0004017983299514496, - "loss": 0.5304, - "step": 74475 - }, - { - "epoch": 18.18, - "learning_rate": 0.0004017651308310935, - "loss": 0.5293, - "step": 74500 - }, - { - "epoch": 18.19, - "learning_rate": 0.00040173193171073743, - "loss": 0.5295, - "step": 74525 - }, - { - "epoch": 18.19, - "learning_rate": 0.0004016987325903813, - "loss": 0.537, - "step": 74550 - }, - { - "epoch": 18.2, - "learning_rate": 0.0004016655334700252, - "loss": 0.545, - "step": 74575 - }, - { - "epoch": 18.2, - "learning_rate": 0.00040163233434966906, - "loss": 0.5087, - "step": 74600 - }, - { - "epoch": 18.21, - "learning_rate": 0.000401599135229313, - "loss": 0.4987, - "step": 74625 - }, - { - "epoch": 18.22, - "learning_rate": 0.00040156593610895684, - "loss": 0.5241, - "step": 74650 - }, - { - "epoch": 18.22, - "learning_rate": 0.00040153273698860075, - "loss": 0.5354, - "step": 74675 - }, - { - "epoch": 18.23, - "learning_rate": 0.00040149953786824467, - "loss": 0.5366, - "step": 74700 - }, - { - "epoch": 18.23, - "learning_rate": 0.0004014663387478886, - "loss": 0.5404, - "step": 74725 - }, - { - "epoch": 18.24, - "learning_rate": 0.00040143313962753244, - "loss": 0.5026, - "step": 74750 - }, - { - "epoch": 18.25, - "learning_rate": 0.0004013999405071763, - "loss": 0.5621, - "step": 74775 - }, - { - "epoch": 18.25, - "learning_rate": 0.0004013667413868202, - "loss": 0.5328, - "step": 74800 - }, - { - "epoch": 18.26, - "learning_rate": 0.00040133354226646413, - "loss": 0.5611, - "step": 74825 - }, - { - "epoch": 18.27, - "learning_rate": 0.00040130034314610804, - "loss": 0.521, - "step": 74850 - }, - { - "epoch": 18.27, - "learning_rate": 0.00040126714402575196, - "loss": 0.5469, - "step": 74875 - }, - { - "epoch": 18.28, - "learning_rate": 0.00040123394490539576, - "loss": 0.5093, - "step": 74900 - }, - { - "epoch": 18.28, - "learning_rate": 0.0004012007457850397, - "loss": 0.5601, - "step": 74925 - }, - { - "epoch": 18.29, - "learning_rate": 0.0004011675466646836, - "loss": 0.5073, - "step": 74950 - }, - { - "epoch": 18.3, - "learning_rate": 0.0004011343475443275, - "loss": 0.5758, - "step": 74975 - }, - { - "epoch": 18.3, - "learning_rate": 0.0004011024763887856, - "loss": 0.5078, - "step": 75000 - }, - { - "epoch": 18.3, - "eval_cer": 0.12220362822500333, - "eval_loss": 0.45253750681877136, - "eval_runtime": 147.3668, - "eval_samples_per_second": 28.453, - "eval_steps_per_second": 7.118, - "eval_wer": 0.49151712887438825, - "step": 75000 - }, - { - "epoch": 18.31, - "learning_rate": 0.0004010692772684295, - "loss": 0.5379, - "step": 75025 - }, - { - "epoch": 18.31, - "learning_rate": 0.0004010360781480734, - "loss": 0.5546, - "step": 75050 - }, - { - "epoch": 18.32, - "learning_rate": 0.00040100287902771734, - "loss": 0.5149, - "step": 75075 - }, - { - "epoch": 18.33, - "learning_rate": 0.00040096967990736114, - "loss": 0.5255, - "step": 75100 - }, - { - "epoch": 18.33, - "learning_rate": 0.00040093648078700505, - "loss": 0.5352, - "step": 75125 - }, - { - "epoch": 18.34, - "learning_rate": 0.00040090328166664897, - "loss": 0.4802, - "step": 75150 - }, - { - "epoch": 18.34, - "learning_rate": 0.0004008700825462929, - "loss": 0.5256, - "step": 75175 - }, - { - "epoch": 18.35, - "learning_rate": 0.0004008368834259368, - "loss": 0.5439, - "step": 75200 - }, - { - "epoch": 18.36, - "learning_rate": 0.00040080368430558066, - "loss": 0.516, - "step": 75225 - }, - { - "epoch": 18.36, - "learning_rate": 0.0004007704851852245, - "loss": 0.5687, - "step": 75250 - }, - { - "epoch": 18.37, - "learning_rate": 0.00040073728606486843, - "loss": 0.5459, - "step": 75275 - }, - { - "epoch": 18.37, - "learning_rate": 0.00040070408694451234, - "loss": 0.5233, - "step": 75300 - }, - { - "epoch": 18.38, - "learning_rate": 0.0004006708878241562, - "loss": 0.5328, - "step": 75325 - }, - { - "epoch": 18.39, - "learning_rate": 0.0004006376887038001, - "loss": 0.5247, - "step": 75350 - }, - { - "epoch": 18.39, - "learning_rate": 0.00040060448958344403, - "loss": 0.5751, - "step": 75375 - }, - { - "epoch": 18.4, - "learning_rate": 0.0004005712904630879, - "loss": 0.5215, - "step": 75400 - }, - { - "epoch": 18.41, - "learning_rate": 0.0004005380913427318, - "loss": 0.5242, - "step": 75425 - }, - { - "epoch": 18.41, - "learning_rate": 0.00040050489222237567, - "loss": 0.5205, - "step": 75450 - }, - { - "epoch": 18.42, - "learning_rate": 0.0004004716931020196, - "loss": 0.5528, - "step": 75475 - }, - { - "epoch": 18.42, - "learning_rate": 0.0004004384939816635, - "loss": 0.5264, - "step": 75500 - }, - { - "epoch": 18.43, - "learning_rate": 0.0004004052948613074, - "loss": 0.4788, - "step": 75525 - }, - { - "epoch": 18.44, - "learning_rate": 0.0004003720957409512, - "loss": 0.512, - "step": 75550 - }, - { - "epoch": 18.44, - "learning_rate": 0.0004003388966205951, - "loss": 0.5212, - "step": 75575 - }, - { - "epoch": 18.45, - "learning_rate": 0.00040030569750023904, - "loss": 0.5449, - "step": 75600 - }, - { - "epoch": 18.45, - "learning_rate": 0.00040027249837988295, - "loss": 0.5017, - "step": 75625 - }, - { - "epoch": 18.46, - "learning_rate": 0.00040023929925952687, - "loss": 0.5355, - "step": 75650 - }, - { - "epoch": 18.47, - "learning_rate": 0.00040020610013917073, - "loss": 0.5656, - "step": 75675 - }, - { - "epoch": 18.47, - "learning_rate": 0.0004001729010188146, - "loss": 0.5639, - "step": 75700 - }, - { - "epoch": 18.48, - "learning_rate": 0.0004001397018984585, - "loss": 0.5351, - "step": 75725 - }, - { - "epoch": 18.48, - "learning_rate": 0.0004001065027781024, - "loss": 0.506, - "step": 75750 - }, - { - "epoch": 18.49, - "learning_rate": 0.0004000733036577463, - "loss": 0.5343, - "step": 75775 - }, - { - "epoch": 18.5, - "learning_rate": 0.0004000401045373902, - "loss": 0.5089, - "step": 75800 - }, - { - "epoch": 18.5, - "learning_rate": 0.0004000069054170341, - "loss": 0.565, - "step": 75825 - }, - { - "epoch": 18.51, - "learning_rate": 0.00039997370629667796, - "loss": 0.5275, - "step": 75850 - }, - { - "epoch": 18.52, - "learning_rate": 0.0003999405071763219, - "loss": 0.532, - "step": 75875 - }, - { - "epoch": 18.52, - "learning_rate": 0.00039990730805596574, - "loss": 0.5424, - "step": 75900 - }, - { - "epoch": 18.53, - "learning_rate": 0.0003998754369004239, - "loss": 0.5468, - "step": 75925 - }, - { - "epoch": 18.53, - "learning_rate": 0.0003998422377800678, - "loss": 0.5039, - "step": 75950 - }, - { - "epoch": 18.54, - "learning_rate": 0.0003998090386597117, - "loss": 0.5426, - "step": 75975 - }, - { - "epoch": 18.55, - "learning_rate": 0.00039977583953935557, - "loss": 0.5072, - "step": 76000 - }, - { - "epoch": 18.55, - "learning_rate": 0.0003997426404189995, - "loss": 0.5543, - "step": 76025 - }, - { - "epoch": 18.56, - "learning_rate": 0.00039970944129864334, - "loss": 0.5615, - "step": 76050 - }, - { - "epoch": 18.56, - "learning_rate": 0.00039967624217828726, - "loss": 0.5061, - "step": 76075 - }, - { - "epoch": 18.57, - "learning_rate": 0.0003996430430579311, - "loss": 0.5508, - "step": 76100 - }, - { - "epoch": 18.58, - "learning_rate": 0.00039960984393757503, - "loss": 0.5134, - "step": 76125 - }, - { - "epoch": 18.58, - "learning_rate": 0.00039957664481721895, - "loss": 0.5097, - "step": 76150 - }, - { - "epoch": 18.59, - "learning_rate": 0.00039954344569686286, - "loss": 0.4996, - "step": 76175 - }, - { - "epoch": 18.59, - "learning_rate": 0.0003995102465765067, - "loss": 0.4972, - "step": 76200 - }, - { - "epoch": 18.6, - "learning_rate": 0.0003994770474561506, - "loss": 0.562, - "step": 76225 - }, - { - "epoch": 18.61, - "learning_rate": 0.0003994438483357945, - "loss": 0.5387, - "step": 76250 - }, - { - "epoch": 18.61, - "learning_rate": 0.0003994106492154384, - "loss": 0.5599, - "step": 76275 - }, - { - "epoch": 18.62, - "learning_rate": 0.0003993774500950823, - "loss": 0.533, - "step": 76300 - }, - { - "epoch": 18.62, - "learning_rate": 0.00039934425097472623, - "loss": 0.552, - "step": 76325 - }, - { - "epoch": 18.63, - "learning_rate": 0.00039931105185437004, - "loss": 0.5328, - "step": 76350 - }, - { - "epoch": 18.64, - "learning_rate": 0.00039927785273401395, - "loss": 0.5625, - "step": 76375 - }, - { - "epoch": 18.64, - "learning_rate": 0.00039924465361365787, - "loss": 0.5635, - "step": 76400 - }, - { - "epoch": 18.65, - "learning_rate": 0.0003992114544933018, - "loss": 0.5886, - "step": 76425 - }, - { - "epoch": 18.66, - "learning_rate": 0.00039917825537294564, - "loss": 0.5375, - "step": 76450 - }, - { - "epoch": 18.66, - "learning_rate": 0.00039914505625258956, - "loss": 0.5109, - "step": 76475 - }, - { - "epoch": 18.67, - "learning_rate": 0.0003991118571322334, - "loss": 0.5455, - "step": 76500 - }, - { - "epoch": 18.67, - "learning_rate": 0.00039907865801187733, - "loss": 0.5416, - "step": 76525 - }, - { - "epoch": 18.68, - "learning_rate": 0.00039904545889152124, - "loss": 0.5739, - "step": 76550 - }, - { - "epoch": 18.69, - "learning_rate": 0.0003990122597711651, - "loss": 0.5392, - "step": 76575 - }, - { - "epoch": 18.69, - "learning_rate": 0.000398979060650809, - "loss": 0.5753, - "step": 76600 - }, - { - "epoch": 18.7, - "learning_rate": 0.00039894586153045293, - "loss": 0.5331, - "step": 76625 - }, - { - "epoch": 18.7, - "learning_rate": 0.0003989126624100968, - "loss": 0.5166, - "step": 76650 - }, - { - "epoch": 18.71, - "learning_rate": 0.00039887946328974065, - "loss": 0.5217, - "step": 76675 - }, - { - "epoch": 18.72, - "learning_rate": 0.00039884626416938456, - "loss": 0.5389, - "step": 76700 - }, - { - "epoch": 18.72, - "learning_rate": 0.0003988130650490285, - "loss": 0.5295, - "step": 76725 - }, - { - "epoch": 18.73, - "learning_rate": 0.0003987798659286724, - "loss": 0.5699, - "step": 76750 - }, - { - "epoch": 18.73, - "learning_rate": 0.00039874666680831625, - "loss": 0.5373, - "step": 76775 - }, - { - "epoch": 18.74, - "learning_rate": 0.0003987134676879601, - "loss": 0.498, - "step": 76800 - }, - { - "epoch": 18.75, - "learning_rate": 0.000398680268567604, - "loss": 0.5534, - "step": 76825 - }, - { - "epoch": 18.75, - "learning_rate": 0.00039864706944724794, - "loss": 0.5273, - "step": 76850 - }, - { - "epoch": 18.76, - "learning_rate": 0.00039861387032689185, - "loss": 0.5369, - "step": 76875 - }, - { - "epoch": 18.77, - "learning_rate": 0.0003985806712065357, - "loss": 0.5222, - "step": 76900 - }, - { - "epoch": 18.77, - "learning_rate": 0.0003985474720861796, - "loss": 0.5316, - "step": 76925 - }, - { - "epoch": 18.78, - "learning_rate": 0.0003985142729658235, - "loss": 0.5146, - "step": 76950 - }, - { - "epoch": 18.78, - "learning_rate": 0.0003984810738454674, - "loss": 0.5384, - "step": 76975 - }, - { - "epoch": 18.79, - "learning_rate": 0.0003984478747251113, - "loss": 0.5177, - "step": 77000 - }, - { - "epoch": 18.8, - "learning_rate": 0.0003984146756047552, - "loss": 0.5552, - "step": 77025 - }, - { - "epoch": 18.8, - "learning_rate": 0.0003983814764843991, - "loss": 0.5154, - "step": 77050 - }, - { - "epoch": 18.81, - "learning_rate": 0.00039834827736404295, - "loss": 0.5189, - "step": 77075 - }, - { - "epoch": 18.81, - "learning_rate": 0.00039831507824368686, - "loss": 0.5299, - "step": 77100 - }, - { - "epoch": 18.82, - "learning_rate": 0.0003982818791233307, - "loss": 0.4983, - "step": 77125 - }, - { - "epoch": 18.83, - "learning_rate": 0.00039824868000297464, - "loss": 0.5253, - "step": 77150 - }, - { - "epoch": 18.83, - "learning_rate": 0.00039821548088261855, - "loss": 0.5739, - "step": 77175 - }, - { - "epoch": 18.84, - "learning_rate": 0.00039818228176226246, - "loss": 0.5569, - "step": 77200 - }, - { - "epoch": 18.84, - "learning_rate": 0.0003981490826419063, - "loss": 0.5496, - "step": 77225 - }, - { - "epoch": 18.85, - "learning_rate": 0.0003981158835215502, - "loss": 0.5505, - "step": 77250 - }, - { - "epoch": 18.86, - "learning_rate": 0.0003980826844011941, - "loss": 0.5687, - "step": 77275 - }, - { - "epoch": 18.86, - "learning_rate": 0.000398049485280838, - "loss": 0.556, - "step": 77300 - }, - { - "epoch": 18.87, - "learning_rate": 0.0003980162861604819, - "loss": 0.5188, - "step": 77325 - }, - { - "epoch": 18.88, - "learning_rate": 0.0003979830870401258, - "loss": 0.5799, - "step": 77350 - }, - { - "epoch": 18.88, - "learning_rate": 0.00039794988791976965, - "loss": 0.5696, - "step": 77375 - }, - { - "epoch": 18.89, - "learning_rate": 0.00039791668879941356, - "loss": 0.53, - "step": 77400 - }, - { - "epoch": 18.89, - "learning_rate": 0.0003978834896790575, - "loss": 0.5746, - "step": 77425 - }, - { - "epoch": 18.9, - "learning_rate": 0.0003978502905587014, - "loss": 0.5483, - "step": 77450 - }, - { - "epoch": 18.91, - "learning_rate": 0.00039781709143834525, - "loss": 0.5689, - "step": 77475 - }, - { - "epoch": 18.91, - "learning_rate": 0.00039778389231798916, - "loss": 0.5191, - "step": 77500 - }, - { - "epoch": 18.92, - "learning_rate": 0.000397750693197633, - "loss": 0.5588, - "step": 77525 - }, - { - "epoch": 18.92, - "learning_rate": 0.00039771749407727694, - "loss": 0.5028, - "step": 77550 - }, - { - "epoch": 18.93, - "learning_rate": 0.00039768429495692085, - "loss": 0.5064, - "step": 77575 - }, - { - "epoch": 18.94, - "learning_rate": 0.0003976510958365647, - "loss": 0.5281, - "step": 77600 - }, - { - "epoch": 18.94, - "learning_rate": 0.0003976178967162086, - "loss": 0.5584, - "step": 77625 - }, - { - "epoch": 18.95, - "learning_rate": 0.00039758469759585254, - "loss": 0.5377, - "step": 77650 - }, - { - "epoch": 18.95, - "learning_rate": 0.0003975514984754964, - "loss": 0.494, - "step": 77675 - }, - { - "epoch": 18.96, - "learning_rate": 0.00039751829935514026, - "loss": 0.5384, - "step": 77700 - }, - { - "epoch": 18.97, - "learning_rate": 0.00039748510023478417, - "loss": 0.5086, - "step": 77725 - }, - { - "epoch": 18.97, - "learning_rate": 0.0003974519011144281, - "loss": 0.555, - "step": 77750 - }, - { - "epoch": 18.98, - "learning_rate": 0.000397418701994072, - "loss": 0.5202, - "step": 77775 - }, - { - "epoch": 18.98, - "learning_rate": 0.0003973855028737159, - "loss": 0.5353, - "step": 77800 - }, - { - "epoch": 18.99, - "learning_rate": 0.0003973523037533597, - "loss": 0.5747, - "step": 77825 - }, - { - "epoch": 19.0, - "learning_rate": 0.00039731910463300363, - "loss": 0.4983, - "step": 77850 - }, - { - "epoch": 19.0, - "learning_rate": 0.00039728590551264755, - "loss": 0.5076, - "step": 77875 - }, - { - "epoch": 19.01, - "learning_rate": 0.00039725270639229146, - "loss": 0.5359, - "step": 77900 - }, - { - "epoch": 19.02, - "learning_rate": 0.0003972195072719353, - "loss": 0.5673, - "step": 77925 - }, - { - "epoch": 19.02, - "learning_rate": 0.00039718630815157923, - "loss": 0.5096, - "step": 77950 - }, - { - "epoch": 19.03, - "learning_rate": 0.0003971531090312231, - "loss": 0.5204, - "step": 77975 - }, - { - "epoch": 19.03, - "learning_rate": 0.000397119909910867, - "loss": 0.5075, - "step": 78000 - }, - { - "epoch": 19.03, - "eval_cer": 0.12079710070531709, - "eval_loss": 0.45315462350845337, - "eval_runtime": 146.6782, - "eval_samples_per_second": 28.586, - "eval_steps_per_second": 7.152, - "eval_wer": 0.4871451876019576, - "step": 78000 - }, - { - "epoch": 19.04, - "learning_rate": 0.0003970867107905109, - "loss": 0.5106, - "step": 78025 - }, - { - "epoch": 19.05, - "learning_rate": 0.0003970535116701548, - "loss": 0.4838, - "step": 78050 - }, - { - "epoch": 19.05, - "learning_rate": 0.0003970203125497987, - "loss": 0.5528, - "step": 78075 - }, - { - "epoch": 19.06, - "learning_rate": 0.0003969871134294426, - "loss": 0.469, - "step": 78100 - }, - { - "epoch": 19.06, - "learning_rate": 0.00039695391430908647, - "loss": 0.4894, - "step": 78125 - }, - { - "epoch": 19.07, - "learning_rate": 0.00039692071518873033, - "loss": 0.4993, - "step": 78150 - }, - { - "epoch": 19.08, - "learning_rate": 0.00039688751606837424, - "loss": 0.5519, - "step": 78175 - }, - { - "epoch": 19.08, - "learning_rate": 0.00039685431694801816, - "loss": 0.5083, - "step": 78200 - }, - { - "epoch": 19.09, - "learning_rate": 0.00039682111782766207, - "loss": 0.5324, - "step": 78225 - }, - { - "epoch": 19.09, - "learning_rate": 0.000396787918707306, - "loss": 0.4881, - "step": 78250 - }, - { - "epoch": 19.1, - "learning_rate": 0.0003967547195869498, - "loss": 0.5419, - "step": 78275 - }, - { - "epoch": 19.11, - "learning_rate": 0.0003967215204665937, - "loss": 0.5162, - "step": 78300 - }, - { - "epoch": 19.11, - "learning_rate": 0.0003966883213462376, - "loss": 0.5256, - "step": 78325 - }, - { - "epoch": 19.12, - "learning_rate": 0.00039665512222588153, - "loss": 0.4996, - "step": 78350 - }, - { - "epoch": 19.13, - "learning_rate": 0.0003966219231055254, - "loss": 0.5156, - "step": 78375 - }, - { - "epoch": 19.13, - "learning_rate": 0.0003965887239851693, - "loss": 0.4767, - "step": 78400 - }, - { - "epoch": 19.14, - "learning_rate": 0.00039655552486481317, - "loss": 0.4836, - "step": 78425 - }, - { - "epoch": 19.14, - "learning_rate": 0.0003965223257444571, - "loss": 0.5414, - "step": 78450 - }, - { - "epoch": 19.15, - "learning_rate": 0.000396489126624101, - "loss": 0.4985, - "step": 78475 - }, - { - "epoch": 19.16, - "learning_rate": 0.00039645592750374485, - "loss": 0.5329, - "step": 78500 - }, - { - "epoch": 19.16, - "learning_rate": 0.00039642272838338877, - "loss": 0.5244, - "step": 78525 - }, - { - "epoch": 19.17, - "learning_rate": 0.0003963895292630327, - "loss": 0.4926, - "step": 78550 - }, - { - "epoch": 19.17, - "learning_rate": 0.00039635633014267654, - "loss": 0.4931, - "step": 78575 - }, - { - "epoch": 19.18, - "learning_rate": 0.0003963231310223204, - "loss": 0.5234, - "step": 78600 - }, - { - "epoch": 19.19, - "learning_rate": 0.0003962899319019643, - "loss": 0.5165, - "step": 78625 - }, - { - "epoch": 19.19, - "learning_rate": 0.00039625673278160823, - "loss": 0.5369, - "step": 78650 - }, - { - "epoch": 19.2, - "learning_rate": 0.00039622353366125214, - "loss": 0.4852, - "step": 78675 - }, - { - "epoch": 19.2, - "learning_rate": 0.00039619033454089606, - "loss": 0.4958, - "step": 78700 - }, - { - "epoch": 19.21, - "learning_rate": 0.00039615713542053986, - "loss": 0.4935, - "step": 78725 - }, - { - "epoch": 19.22, - "learning_rate": 0.0003961239363001838, - "loss": 0.5221, - "step": 78750 - }, - { - "epoch": 19.22, - "learning_rate": 0.0003960907371798277, - "loss": 0.5487, - "step": 78775 - }, - { - "epoch": 19.23, - "learning_rate": 0.0003960575380594716, - "loss": 0.5195, - "step": 78800 - }, - { - "epoch": 19.23, - "learning_rate": 0.0003960243389391155, - "loss": 0.5316, - "step": 78825 - }, - { - "epoch": 19.24, - "learning_rate": 0.0003959911398187594, - "loss": 0.5014, - "step": 78850 - }, - { - "epoch": 19.25, - "learning_rate": 0.00039595794069840324, - "loss": 0.5431, - "step": 78875 - }, - { - "epoch": 19.25, - "learning_rate": 0.00039592474157804715, - "loss": 0.5156, - "step": 78900 - }, - { - "epoch": 19.26, - "learning_rate": 0.00039589154245769107, - "loss": 0.5367, - "step": 78925 - }, - { - "epoch": 19.27, - "learning_rate": 0.0003958583433373349, - "loss": 0.4882, - "step": 78950 - }, - { - "epoch": 19.27, - "learning_rate": 0.00039582514421697884, - "loss": 0.51, - "step": 78975 - }, - { - "epoch": 19.28, - "learning_rate": 0.00039579194509662275, - "loss": 0.4833, - "step": 79000 - }, - { - "epoch": 19.28, - "learning_rate": 0.0003957587459762666, - "loss": 0.5326, - "step": 79025 - }, - { - "epoch": 19.29, - "learning_rate": 0.0003957255468559105, - "loss": 0.4977, - "step": 79050 - }, - { - "epoch": 19.3, - "learning_rate": 0.0003956923477355544, - "loss": 0.5499, - "step": 79075 - }, - { - "epoch": 19.3, - "learning_rate": 0.0003956591486151983, - "loss": 0.5187, - "step": 79100 - }, - { - "epoch": 19.31, - "learning_rate": 0.0003956259494948422, - "loss": 0.5257, - "step": 79125 - }, - { - "epoch": 19.31, - "learning_rate": 0.00039559275037448613, - "loss": 0.5253, - "step": 79150 - }, - { - "epoch": 19.32, - "learning_rate": 0.00039555955125412993, - "loss": 0.5119, - "step": 79175 - }, - { - "epoch": 19.33, - "learning_rate": 0.00039552635213377385, - "loss": 0.5149, - "step": 79200 - }, - { - "epoch": 19.33, - "learning_rate": 0.00039549315301341776, - "loss": 0.5461, - "step": 79225 - }, - { - "epoch": 19.34, - "learning_rate": 0.0003954599538930617, - "loss": 0.5465, - "step": 79250 - }, - { - "epoch": 19.34, - "learning_rate": 0.0003954267547727056, - "loss": 0.5702, - "step": 79275 - }, - { - "epoch": 19.35, - "learning_rate": 0.00039539355565234945, - "loss": 0.5334, - "step": 79300 - }, - { - "epoch": 19.36, - "learning_rate": 0.0003953603565319933, - "loss": 0.5379, - "step": 79325 - }, - { - "epoch": 19.36, - "learning_rate": 0.0003953271574116372, - "loss": 0.5165, - "step": 79350 - }, - { - "epoch": 19.37, - "learning_rate": 0.00039529395829128114, - "loss": 0.5178, - "step": 79375 - }, - { - "epoch": 19.38, - "learning_rate": 0.000395260759170925, - "loss": 0.5007, - "step": 79400 - }, - { - "epoch": 19.38, - "learning_rate": 0.0003952275600505689, - "loss": 0.5203, - "step": 79425 - }, - { - "epoch": 19.39, - "learning_rate": 0.0003951943609302128, - "loss": 0.4874, - "step": 79450 - }, - { - "epoch": 19.39, - "learning_rate": 0.0003951611618098567, - "loss": 0.5472, - "step": 79475 - }, - { - "epoch": 19.4, - "learning_rate": 0.0003951279626895006, - "loss": 0.5123, - "step": 79500 - }, - { - "epoch": 19.41, - "learning_rate": 0.00039509476356914446, - "loss": 0.5628, - "step": 79525 - }, - { - "epoch": 19.41, - "learning_rate": 0.00039506156444878837, - "loss": 0.5127, - "step": 79550 - }, - { - "epoch": 19.42, - "learning_rate": 0.0003950283653284323, - "loss": 0.5461, - "step": 79575 - }, - { - "epoch": 19.42, - "learning_rate": 0.0003949951662080762, - "loss": 0.5187, - "step": 79600 - }, - { - "epoch": 19.43, - "learning_rate": 0.00039496196708772, - "loss": 0.559, - "step": 79625 - }, - { - "epoch": 19.44, - "learning_rate": 0.0003949287679673639, - "loss": 0.498, - "step": 79650 - }, - { - "epoch": 19.44, - "learning_rate": 0.00039489556884700783, - "loss": 0.4965, - "step": 79675 - }, - { - "epoch": 19.45, - "learning_rate": 0.00039486236972665175, - "loss": 0.4793, - "step": 79700 - }, - { - "epoch": 19.45, - "learning_rate": 0.00039482917060629566, - "loss": 0.4825, - "step": 79725 - }, - { - "epoch": 19.46, - "learning_rate": 0.0003947959714859395, - "loss": 0.4814, - "step": 79750 - }, - { - "epoch": 19.47, - "learning_rate": 0.0003947627723655834, - "loss": 0.4946, - "step": 79775 - }, - { - "epoch": 19.47, - "learning_rate": 0.0003947295732452273, - "loss": 0.4516, - "step": 79800 - }, - { - "epoch": 19.48, - "learning_rate": 0.0003946963741248712, - "loss": 0.5269, - "step": 79825 - }, - { - "epoch": 19.49, - "learning_rate": 0.00039466317500451507, - "loss": 0.5135, - "step": 79850 - }, - { - "epoch": 19.49, - "learning_rate": 0.000394629975884159, - "loss": 0.5563, - "step": 79875 - }, - { - "epoch": 19.5, - "learning_rate": 0.0003945967767638029, - "loss": 0.5172, - "step": 79900 - }, - { - "epoch": 19.5, - "learning_rate": 0.00039456357764344676, - "loss": 0.528, - "step": 79925 - }, - { - "epoch": 19.51, - "learning_rate": 0.00039453037852309067, - "loss": 0.5158, - "step": 79950 - }, - { - "epoch": 19.52, - "learning_rate": 0.00039449717940273453, - "loss": 0.5197, - "step": 79975 - }, - { - "epoch": 19.52, - "learning_rate": 0.00039446398028237844, - "loss": 0.522, - "step": 80000 - }, - { - "epoch": 19.53, - "learning_rate": 0.00039443078116202236, - "loss": 0.533, - "step": 80025 - }, - { - "epoch": 19.53, - "learning_rate": 0.00039439758204166627, - "loss": 0.5262, - "step": 80050 - }, - { - "epoch": 19.54, - "learning_rate": 0.0003943643829213101, - "loss": 0.5267, - "step": 80075 - }, - { - "epoch": 19.55, - "learning_rate": 0.000394331183800954, - "loss": 0.4881, - "step": 80100 - }, - { - "epoch": 19.55, - "learning_rate": 0.0003942979846805979, - "loss": 0.5977, - "step": 80125 - }, - { - "epoch": 19.56, - "learning_rate": 0.0003942647855602418, - "loss": 0.4507, - "step": 80150 - }, - { - "epoch": 19.56, - "learning_rate": 0.00039423291440469996, - "loss": 0.5734, - "step": 80175 - }, - { - "epoch": 19.57, - "learning_rate": 0.0003941997152843438, - "loss": 0.5274, - "step": 80200 - }, - { - "epoch": 19.58, - "learning_rate": 0.00039416651616398774, - "loss": 0.5174, - "step": 80225 - }, - { - "epoch": 19.58, - "learning_rate": 0.00039413331704363165, - "loss": 0.552, - "step": 80250 - }, - { - "epoch": 19.59, - "learning_rate": 0.0003941001179232755, - "loss": 0.5026, - "step": 80275 - }, - { - "epoch": 19.59, - "learning_rate": 0.00039406691880291937, - "loss": 0.5017, - "step": 80300 - }, - { - "epoch": 19.6, - "learning_rate": 0.0003940337196825633, - "loss": 0.5122, - "step": 80325 - }, - { - "epoch": 19.61, - "learning_rate": 0.0003940005205622072, - "loss": 0.5116, - "step": 80350 - }, - { - "epoch": 19.61, - "learning_rate": 0.0003939673214418511, - "loss": 0.5608, - "step": 80375 - }, - { - "epoch": 19.62, - "learning_rate": 0.00039393412232149503, - "loss": 0.4792, - "step": 80400 - }, - { - "epoch": 19.63, - "learning_rate": 0.00039390092320113883, - "loss": 0.5337, - "step": 80425 - }, - { - "epoch": 19.63, - "learning_rate": 0.00039386772408078275, - "loss": 0.4826, - "step": 80450 - }, - { - "epoch": 19.64, - "learning_rate": 0.00039383452496042666, - "loss": 0.5173, - "step": 80475 - }, - { - "epoch": 19.64, - "learning_rate": 0.0003938013258400706, - "loss": 0.4629, - "step": 80500 - }, - { - "epoch": 19.65, - "learning_rate": 0.00039376812671971444, - "loss": 0.5717, - "step": 80525 - }, - { - "epoch": 19.66, - "learning_rate": 0.00039373492759935835, - "loss": 0.499, - "step": 80550 - }, - { - "epoch": 19.66, - "learning_rate": 0.0003937017284790022, - "loss": 0.5233, - "step": 80575 - }, - { - "epoch": 19.67, - "learning_rate": 0.0003936685293586461, - "loss": 0.5131, - "step": 80600 - }, - { - "epoch": 19.67, - "learning_rate": 0.00039363533023829004, - "loss": 0.5343, - "step": 80625 - }, - { - "epoch": 19.68, - "learning_rate": 0.0003936021311179339, - "loss": 0.4978, - "step": 80650 - }, - { - "epoch": 19.69, - "learning_rate": 0.0003935689319975778, - "loss": 0.559, - "step": 80675 - }, - { - "epoch": 19.69, - "learning_rate": 0.0003935357328772217, - "loss": 0.5288, - "step": 80700 - }, - { - "epoch": 19.7, - "learning_rate": 0.0003935025337568656, - "loss": 0.5782, - "step": 80725 - }, - { - "epoch": 19.7, - "learning_rate": 0.00039346933463650944, - "loss": 0.5151, - "step": 80750 - }, - { - "epoch": 19.71, - "learning_rate": 0.00039343613551615336, - "loss": 0.5044, - "step": 80775 - }, - { - "epoch": 19.72, - "learning_rate": 0.00039340293639579727, - "loss": 0.5323, - "step": 80800 - }, - { - "epoch": 19.72, - "learning_rate": 0.0003933697372754412, - "loss": 0.5365, - "step": 80825 - }, - { - "epoch": 19.73, - "learning_rate": 0.0003933365381550851, - "loss": 0.5024, - "step": 80850 - }, - { - "epoch": 19.74, - "learning_rate": 0.0003933033390347289, - "loss": 0.5234, - "step": 80875 - }, - { - "epoch": 19.74, - "learning_rate": 0.0003932701399143728, - "loss": 0.5135, - "step": 80900 - }, - { - "epoch": 19.75, - "learning_rate": 0.00039323694079401673, - "loss": 0.5403, - "step": 80925 - }, - { - "epoch": 19.75, - "learning_rate": 0.00039320374167366065, - "loss": 0.5468, - "step": 80950 - }, - { - "epoch": 19.76, - "learning_rate": 0.0003931705425533045, - "loss": 0.4975, - "step": 80975 - }, - { - "epoch": 19.77, - "learning_rate": 0.0003931373434329484, - "loss": 0.5461, - "step": 81000 - }, - { - "epoch": 19.77, - "eval_cer": 0.11960617229448785, - "eval_loss": 0.4400729238986969, - "eval_runtime": 146.8938, - "eval_samples_per_second": 28.544, - "eval_steps_per_second": 7.141, - "eval_wer": 0.4812724306688418, - "step": 81000 - }, - { - "epoch": 19.77, - "learning_rate": 0.0003931041443125923, - "loss": 0.5305, - "step": 81025 - }, - { - "epoch": 19.78, - "learning_rate": 0.0003930709451922362, - "loss": 0.4784, - "step": 81050 - }, - { - "epoch": 19.78, - "learning_rate": 0.0003930377460718801, - "loss": 0.545, - "step": 81075 - }, - { - "epoch": 19.79, - "learning_rate": 0.00039300454695152397, - "loss": 0.4795, - "step": 81100 - }, - { - "epoch": 19.8, - "learning_rate": 0.0003929713478311679, - "loss": 0.5511, - "step": 81125 - }, - { - "epoch": 19.8, - "learning_rate": 0.0003929381487108118, - "loss": 0.5314, - "step": 81150 - }, - { - "epoch": 19.81, - "learning_rate": 0.00039290494959045566, - "loss": 0.5912, - "step": 81175 - }, - { - "epoch": 19.81, - "learning_rate": 0.0003928717504700995, - "loss": 0.5392, - "step": 81200 - }, - { - "epoch": 19.82, - "learning_rate": 0.00039283855134974343, - "loss": 0.504, - "step": 81225 - }, - { - "epoch": 19.83, - "learning_rate": 0.00039280535222938734, - "loss": 0.4723, - "step": 81250 - }, - { - "epoch": 19.83, - "learning_rate": 0.00039277215310903126, - "loss": 0.5295, - "step": 81275 - }, - { - "epoch": 19.84, - "learning_rate": 0.00039273895398867517, - "loss": 0.521, - "step": 81300 - }, - { - "epoch": 19.85, - "learning_rate": 0.000392705754868319, - "loss": 0.5833, - "step": 81325 - }, - { - "epoch": 19.85, - "learning_rate": 0.0003926725557479629, - "loss": 0.5042, - "step": 81350 - }, - { - "epoch": 19.86, - "learning_rate": 0.0003926393566276068, - "loss": 0.5365, - "step": 81375 - }, - { - "epoch": 19.86, - "learning_rate": 0.0003926061575072507, - "loss": 0.4939, - "step": 81400 - }, - { - "epoch": 19.87, - "learning_rate": 0.00039257295838689463, - "loss": 0.5449, - "step": 81425 - }, - { - "epoch": 19.88, - "learning_rate": 0.00039253975926653844, - "loss": 0.5452, - "step": 81450 - }, - { - "epoch": 19.88, - "learning_rate": 0.00039250656014618235, - "loss": 0.5635, - "step": 81475 - }, - { - "epoch": 19.89, - "learning_rate": 0.00039247336102582627, - "loss": 0.5344, - "step": 81500 - }, - { - "epoch": 19.89, - "learning_rate": 0.0003924401619054702, - "loss": 0.5103, - "step": 81525 - }, - { - "epoch": 19.9, - "learning_rate": 0.00039240696278511404, - "loss": 0.5035, - "step": 81550 - }, - { - "epoch": 19.91, - "learning_rate": 0.00039237376366475795, - "loss": 0.5693, - "step": 81575 - }, - { - "epoch": 19.91, - "learning_rate": 0.0003923405645444018, - "loss": 0.5482, - "step": 81600 - }, - { - "epoch": 19.92, - "learning_rate": 0.00039230736542404573, - "loss": 0.527, - "step": 81625 - }, - { - "epoch": 19.92, - "learning_rate": 0.00039227416630368964, - "loss": 0.5014, - "step": 81650 - }, - { - "epoch": 19.93, - "learning_rate": 0.0003922409671833335, - "loss": 0.5306, - "step": 81675 - }, - { - "epoch": 19.94, - "learning_rate": 0.0003922077680629774, - "loss": 0.5236, - "step": 81700 - }, - { - "epoch": 19.94, - "learning_rate": 0.00039217456894262133, - "loss": 0.5108, - "step": 81725 - }, - { - "epoch": 19.95, - "learning_rate": 0.0003921413698222652, - "loss": 0.4858, - "step": 81750 - }, - { - "epoch": 19.95, - "learning_rate": 0.00039210817070190905, - "loss": 0.4938, - "step": 81775 - }, - { - "epoch": 19.96, - "learning_rate": 0.00039207497158155296, - "loss": 0.5359, - "step": 81800 - }, - { - "epoch": 19.97, - "learning_rate": 0.0003920417724611969, - "loss": 0.533, - "step": 81825 - }, - { - "epoch": 19.97, - "learning_rate": 0.0003920085733408408, - "loss": 0.5, - "step": 81850 - }, - { - "epoch": 19.98, - "learning_rate": 0.0003919753742204847, - "loss": 0.5306, - "step": 81875 - }, - { - "epoch": 19.99, - "learning_rate": 0.0003919421751001285, - "loss": 0.5, - "step": 81900 - }, - { - "epoch": 19.99, - "learning_rate": 0.0003919089759797724, - "loss": 0.5182, - "step": 81925 - }, - { - "epoch": 20.0, - "learning_rate": 0.00039187577685941634, - "loss": 0.5104, - "step": 81950 - }, - { - "epoch": 20.0, - "learning_rate": 0.00039184257773906025, - "loss": 0.4774, - "step": 81975 - }, - { - "epoch": 20.01, - "learning_rate": 0.0003918093786187041, - "loss": 0.5177, - "step": 82000 - }, - { - "epoch": 20.02, - "learning_rate": 0.000391776179498348, - "loss": 0.5224, - "step": 82025 - }, - { - "epoch": 20.02, - "learning_rate": 0.0003917429803779919, - "loss": 0.4828, - "step": 82050 - }, - { - "epoch": 20.03, - "learning_rate": 0.0003917097812576358, - "loss": 0.5423, - "step": 82075 - }, - { - "epoch": 20.03, - "learning_rate": 0.0003916765821372797, - "loss": 0.443, - "step": 82100 - }, - { - "epoch": 20.04, - "learning_rate": 0.0003916433830169236, - "loss": 0.5223, - "step": 82125 - }, - { - "epoch": 20.05, - "learning_rate": 0.0003916101838965675, - "loss": 0.4703, - "step": 82150 - }, - { - "epoch": 20.05, - "learning_rate": 0.0003915769847762114, - "loss": 0.5051, - "step": 82175 - }, - { - "epoch": 20.06, - "learning_rate": 0.00039154378565585526, - "loss": 0.486, - "step": 82200 - }, - { - "epoch": 20.06, - "learning_rate": 0.0003915105865354991, - "loss": 0.4924, - "step": 82225 - }, - { - "epoch": 20.07, - "learning_rate": 0.00039147738741514304, - "loss": 0.4963, - "step": 82250 - }, - { - "epoch": 20.08, - "learning_rate": 0.00039144418829478695, - "loss": 0.4922, - "step": 82275 - }, - { - "epoch": 20.08, - "learning_rate": 0.00039141098917443086, - "loss": 0.4911, - "step": 82300 - }, - { - "epoch": 20.09, - "learning_rate": 0.0003913777900540748, - "loss": 0.5315, - "step": 82325 - }, - { - "epoch": 20.1, - "learning_rate": 0.0003913445909337186, - "loss": 0.4826, - "step": 82350 - }, - { - "epoch": 20.1, - "learning_rate": 0.0003913113918133625, - "loss": 0.5536, - "step": 82375 - }, - { - "epoch": 20.11, - "learning_rate": 0.0003912781926930064, - "loss": 0.4998, - "step": 82400 - }, - { - "epoch": 20.11, - "learning_rate": 0.0003912449935726503, - "loss": 0.5207, - "step": 82425 - }, - { - "epoch": 20.12, - "learning_rate": 0.0003912117944522942, - "loss": 0.5061, - "step": 82450 - }, - { - "epoch": 20.13, - "learning_rate": 0.0003911785953319381, - "loss": 0.4999, - "step": 82475 - }, - { - "epoch": 20.13, - "learning_rate": 0.00039114539621158196, - "loss": 0.4868, - "step": 82500 - }, - { - "epoch": 20.14, - "learning_rate": 0.00039111219709122587, - "loss": 0.5307, - "step": 82525 - }, - { - "epoch": 20.14, - "learning_rate": 0.0003910789979708698, - "loss": 0.455, - "step": 82550 - }, - { - "epoch": 20.15, - "learning_rate": 0.00039104579885051365, - "loss": 0.4881, - "step": 82575 - }, - { - "epoch": 20.16, - "learning_rate": 0.00039101259973015756, - "loss": 0.5058, - "step": 82600 - }, - { - "epoch": 20.16, - "learning_rate": 0.0003909794006098015, - "loss": 0.5035, - "step": 82625 - }, - { - "epoch": 20.17, - "learning_rate": 0.00039094620148944533, - "loss": 0.5044, - "step": 82650 - }, - { - "epoch": 20.17, - "learning_rate": 0.00039091300236908925, - "loss": 0.5321, - "step": 82675 - }, - { - "epoch": 20.18, - "learning_rate": 0.00039088113121354734, - "loss": 0.4867, - "step": 82700 - }, - { - "epoch": 20.19, - "learning_rate": 0.00039084793209319125, - "loss": 0.487, - "step": 82725 - }, - { - "epoch": 20.19, - "learning_rate": 0.00039081473297283517, - "loss": 0.5071, - "step": 82750 - }, - { - "epoch": 20.2, - "learning_rate": 0.0003907815338524791, - "loss": 0.4933, - "step": 82775 - }, - { - "epoch": 20.2, - "learning_rate": 0.00039074833473212294, - "loss": 0.5347, - "step": 82800 - }, - { - "epoch": 20.21, - "learning_rate": 0.00039071513561176685, - "loss": 0.486, - "step": 82825 - }, - { - "epoch": 20.22, - "learning_rate": 0.0003906819364914107, - "loss": 0.4886, - "step": 82850 - }, - { - "epoch": 20.22, - "learning_rate": 0.00039064873737105463, - "loss": 0.5365, - "step": 82875 - }, - { - "epoch": 20.23, - "learning_rate": 0.0003906155382506985, - "loss": 0.4923, - "step": 82900 - }, - { - "epoch": 20.24, - "learning_rate": 0.0003905823391303424, - "loss": 0.555, - "step": 82925 - }, - { - "epoch": 20.24, - "learning_rate": 0.0003905491400099863, - "loss": 0.5232, - "step": 82950 - }, - { - "epoch": 20.25, - "learning_rate": 0.00039051594088963023, - "loss": 0.5658, - "step": 82975 - }, - { - "epoch": 20.25, - "learning_rate": 0.0003904827417692741, - "loss": 0.5183, - "step": 83000 - }, - { - "epoch": 20.26, - "learning_rate": 0.00039044954264891795, - "loss": 0.5532, - "step": 83025 - }, - { - "epoch": 20.27, - "learning_rate": 0.00039041634352856186, - "loss": 0.4787, - "step": 83050 - }, - { - "epoch": 20.27, - "learning_rate": 0.0003903831444082058, - "loss": 0.5197, - "step": 83075 - }, - { - "epoch": 20.28, - "learning_rate": 0.0003903499452878497, - "loss": 0.4716, - "step": 83100 - }, - { - "epoch": 20.28, - "learning_rate": 0.00039031674616749355, - "loss": 0.5227, - "step": 83125 - }, - { - "epoch": 20.29, - "learning_rate": 0.0003902835470471374, - "loss": 0.4727, - "step": 83150 - }, - { - "epoch": 20.3, - "learning_rate": 0.0003902503479267813, - "loss": 0.5607, - "step": 83175 - }, - { - "epoch": 20.3, - "learning_rate": 0.00039021714880642524, - "loss": 0.5176, - "step": 83200 - }, - { - "epoch": 20.31, - "learning_rate": 0.00039018394968606915, - "loss": 0.5077, - "step": 83225 - }, - { - "epoch": 20.31, - "learning_rate": 0.000390150750565713, - "loss": 0.5003, - "step": 83250 - }, - { - "epoch": 20.32, - "learning_rate": 0.0003901175514453569, - "loss": 0.5059, - "step": 83275 - }, - { - "epoch": 20.33, - "learning_rate": 0.0003900843523250008, - "loss": 0.4917, - "step": 83300 - }, - { - "epoch": 20.33, - "learning_rate": 0.0003900511532046447, - "loss": 0.5032, - "step": 83325 - }, - { - "epoch": 20.34, - "learning_rate": 0.00039001795408428856, - "loss": 0.5251, - "step": 83350 - }, - { - "epoch": 20.35, - "learning_rate": 0.0003899847549639325, - "loss": 0.5191, - "step": 83375 - }, - { - "epoch": 20.35, - "learning_rate": 0.0003899515558435764, - "loss": 0.489, - "step": 83400 - }, - { - "epoch": 20.36, - "learning_rate": 0.0003899183567232203, - "loss": 0.5331, - "step": 83425 - }, - { - "epoch": 20.36, - "learning_rate": 0.00038988515760286416, - "loss": 0.4853, - "step": 83450 - }, - { - "epoch": 20.37, - "learning_rate": 0.000389851958482508, - "loss": 0.5296, - "step": 83475 - }, - { - "epoch": 20.38, - "learning_rate": 0.00038981875936215194, - "loss": 0.5222, - "step": 83500 - }, - { - "epoch": 20.38, - "learning_rate": 0.00038978556024179585, - "loss": 0.5363, - "step": 83525 - }, - { - "epoch": 20.39, - "learning_rate": 0.00038975236112143976, - "loss": 0.4851, - "step": 83550 - }, - { - "epoch": 20.39, - "learning_rate": 0.0003897191620010836, - "loss": 0.5469, - "step": 83575 - }, - { - "epoch": 20.4, - "learning_rate": 0.0003896859628807275, - "loss": 0.4488, - "step": 83600 - }, - { - "epoch": 20.41, - "learning_rate": 0.0003896527637603714, - "loss": 0.5445, - "step": 83625 - }, - { - "epoch": 20.41, - "learning_rate": 0.0003896195646400153, - "loss": 0.4996, - "step": 83650 - }, - { - "epoch": 20.42, - "learning_rate": 0.0003895863655196592, - "loss": 0.5022, - "step": 83675 - }, - { - "epoch": 20.42, - "learning_rate": 0.0003895531663993031, - "loss": 0.4456, - "step": 83700 - }, - { - "epoch": 20.43, - "learning_rate": 0.000389519967278947, - "loss": 0.531, - "step": 83725 - }, - { - "epoch": 20.44, - "learning_rate": 0.00038948676815859086, - "loss": 0.4859, - "step": 83750 - }, - { - "epoch": 20.44, - "learning_rate": 0.00038945356903823477, - "loss": 0.5109, - "step": 83775 - }, - { - "epoch": 20.45, - "learning_rate": 0.00038942036991787863, - "loss": 0.518, - "step": 83800 - }, - { - "epoch": 20.46, - "learning_rate": 0.00038938717079752255, - "loss": 0.5039, - "step": 83825 - }, - { - "epoch": 20.46, - "learning_rate": 0.00038935397167716646, - "loss": 0.4744, - "step": 83850 - }, - { - "epoch": 20.47, - "learning_rate": 0.0003893207725568104, - "loss": 0.5653, - "step": 83875 - }, - { - "epoch": 20.47, - "learning_rate": 0.00038928757343645423, - "loss": 0.5311, - "step": 83900 - }, - { - "epoch": 20.48, - "learning_rate": 0.0003892543743160981, - "loss": 0.5306, - "step": 83925 - }, - { - "epoch": 20.49, - "learning_rate": 0.000389221175195742, - "loss": 0.4814, - "step": 83950 - }, - { - "epoch": 20.49, - "learning_rate": 0.0003891879760753859, - "loss": 0.5273, - "step": 83975 - }, - { - "epoch": 20.5, - "learning_rate": 0.00038915477695502984, - "loss": 0.5044, - "step": 84000 - }, - { - "epoch": 20.5, - "eval_cer": 0.11443179368191944, - "eval_loss": 0.42682546377182007, - "eval_runtime": 146.7255, - "eval_samples_per_second": 28.577, - "eval_steps_per_second": 7.149, - "eval_wer": 0.46541598694942904, - "step": 84000 - }, - { - "epoch": 20.5, - "learning_rate": 0.00038912157783467375, - "loss": 0.522, - "step": 84025 - }, - { - "epoch": 20.51, - "learning_rate": 0.00038908837871431755, - "loss": 0.4838, - "step": 84050 - }, - { - "epoch": 20.52, - "learning_rate": 0.00038905517959396147, - "loss": 0.4854, - "step": 84075 - }, - { - "epoch": 20.52, - "learning_rate": 0.0003890219804736054, - "loss": 0.463, - "step": 84100 - }, - { - "epoch": 20.53, - "learning_rate": 0.0003889887813532493, - "loss": 0.5307, - "step": 84125 - }, - { - "epoch": 20.53, - "learning_rate": 0.00038895558223289316, - "loss": 0.4744, - "step": 84150 - }, - { - "epoch": 20.54, - "learning_rate": 0.00038892238311253707, - "loss": 0.595, - "step": 84175 - }, - { - "epoch": 20.55, - "learning_rate": 0.00038888918399218093, - "loss": 0.4853, - "step": 84200 - }, - { - "epoch": 20.55, - "learning_rate": 0.00038885598487182484, - "loss": 0.5554, - "step": 84225 - }, - { - "epoch": 20.56, - "learning_rate": 0.00038882278575146876, - "loss": 0.4629, - "step": 84250 - }, - { - "epoch": 20.56, - "learning_rate": 0.0003887895866311126, - "loss": 0.5226, - "step": 84275 - }, - { - "epoch": 20.57, - "learning_rate": 0.00038875638751075653, - "loss": 0.482, - "step": 84300 - }, - { - "epoch": 20.58, - "learning_rate": 0.00038872318839040045, - "loss": 0.4873, - "step": 84325 - }, - { - "epoch": 20.58, - "learning_rate": 0.0003886899892700443, - "loss": 0.539, - "step": 84350 - }, - { - "epoch": 20.59, - "learning_rate": 0.00038865679014968817, - "loss": 0.5458, - "step": 84375 - }, - { - "epoch": 20.6, - "learning_rate": 0.0003886235910293321, - "loss": 0.4841, - "step": 84400 - }, - { - "epoch": 20.6, - "learning_rate": 0.000388590391908976, - "loss": 0.5369, - "step": 84425 - }, - { - "epoch": 20.61, - "learning_rate": 0.0003885571927886199, - "loss": 0.4676, - "step": 84450 - }, - { - "epoch": 20.61, - "learning_rate": 0.0003885239936682638, - "loss": 0.5472, - "step": 84475 - }, - { - "epoch": 20.62, - "learning_rate": 0.0003884907945479076, - "loss": 0.4976, - "step": 84500 - }, - { - "epoch": 20.63, - "learning_rate": 0.00038845759542755154, - "loss": 0.5668, - "step": 84525 - }, - { - "epoch": 20.63, - "learning_rate": 0.00038842439630719545, - "loss": 0.5263, - "step": 84550 - }, - { - "epoch": 20.64, - "learning_rate": 0.00038839119718683937, - "loss": 0.5336, - "step": 84575 - }, - { - "epoch": 20.64, - "learning_rate": 0.00038835799806648323, - "loss": 0.5053, - "step": 84600 - }, - { - "epoch": 20.65, - "learning_rate": 0.00038832479894612714, - "loss": 0.5443, - "step": 84625 - }, - { - "epoch": 20.66, - "learning_rate": 0.000388291599825771, - "loss": 0.4887, - "step": 84650 - }, - { - "epoch": 20.66, - "learning_rate": 0.0003882584007054149, - "loss": 0.4999, - "step": 84675 - }, - { - "epoch": 20.67, - "learning_rate": 0.00038822520158505883, - "loss": 0.5104, - "step": 84700 - }, - { - "epoch": 20.67, - "learning_rate": 0.0003881920024647027, - "loss": 0.507, - "step": 84725 - }, - { - "epoch": 20.68, - "learning_rate": 0.00038816013130916083, - "loss": 0.5064, - "step": 84750 - }, - { - "epoch": 20.69, - "learning_rate": 0.00038812693218880475, - "loss": 0.5079, - "step": 84775 - }, - { - "epoch": 20.69, - "learning_rate": 0.00038809373306844866, - "loss": 0.5362, - "step": 84800 - }, - { - "epoch": 20.7, - "learning_rate": 0.0003880605339480925, - "loss": 0.5332, - "step": 84825 - }, - { - "epoch": 20.71, - "learning_rate": 0.0003880273348277364, - "loss": 0.5191, - "step": 84850 - }, - { - "epoch": 20.71, - "learning_rate": 0.0003879941357073803, - "loss": 0.5049, - "step": 84875 - }, - { - "epoch": 20.72, - "learning_rate": 0.0003879609365870242, - "loss": 0.4828, - "step": 84900 - }, - { - "epoch": 20.72, - "learning_rate": 0.00038792773746666807, - "loss": 0.5217, - "step": 84925 - }, - { - "epoch": 20.73, - "learning_rate": 0.000387894538346312, - "loss": 0.4909, - "step": 84950 - }, - { - "epoch": 20.74, - "learning_rate": 0.0003878613392259559, - "loss": 0.5039, - "step": 84975 - }, - { - "epoch": 20.74, - "learning_rate": 0.00038782946807041404, - "loss": 0.5085, - "step": 85000 - }, - { - "epoch": 20.75, - "learning_rate": 0.00038779626895005796, - "loss": 0.523, - "step": 85025 - }, - { - "epoch": 20.75, - "learning_rate": 0.00038776306982970176, - "loss": 0.4847, - "step": 85050 - }, - { - "epoch": 20.76, - "learning_rate": 0.0003877298707093457, - "loss": 0.4847, - "step": 85075 - }, - { - "epoch": 20.77, - "learning_rate": 0.0003876966715889896, - "loss": 0.5074, - "step": 85100 - }, - { - "epoch": 20.77, - "learning_rate": 0.0003876634724686335, - "loss": 0.5074, - "step": 85125 - }, - { - "epoch": 20.78, - "learning_rate": 0.00038763027334827736, - "loss": 0.4648, - "step": 85150 - }, - { - "epoch": 20.78, - "learning_rate": 0.0003875970742279213, - "loss": 0.5161, - "step": 85175 - }, - { - "epoch": 20.79, - "learning_rate": 0.00038756387510756514, - "loss": 0.5005, - "step": 85200 - }, - { - "epoch": 20.8, - "learning_rate": 0.00038753067598720905, - "loss": 0.5217, - "step": 85225 - }, - { - "epoch": 20.8, - "learning_rate": 0.00038749747686685296, - "loss": 0.5532, - "step": 85250 - }, - { - "epoch": 20.81, - "learning_rate": 0.0003874642777464968, - "loss": 0.4865, - "step": 85275 - }, - { - "epoch": 20.82, - "learning_rate": 0.00038743107862614074, - "loss": 0.4943, - "step": 85300 - }, - { - "epoch": 20.82, - "learning_rate": 0.00038739787950578465, - "loss": 0.4968, - "step": 85325 - }, - { - "epoch": 20.83, - "learning_rate": 0.0003873646803854285, - "loss": 0.5108, - "step": 85350 - }, - { - "epoch": 20.83, - "learning_rate": 0.00038733148126507237, - "loss": 0.5166, - "step": 85375 - }, - { - "epoch": 20.84, - "learning_rate": 0.0003872982821447163, - "loss": 0.5059, - "step": 85400 - }, - { - "epoch": 20.85, - "learning_rate": 0.0003872650830243602, - "loss": 0.5448, - "step": 85425 - }, - { - "epoch": 20.85, - "learning_rate": 0.0003872318839040041, - "loss": 0.459, - "step": 85450 - }, - { - "epoch": 20.86, - "learning_rate": 0.00038719868478364803, - "loss": 0.5601, - "step": 85475 - }, - { - "epoch": 20.86, - "learning_rate": 0.00038716548566329183, - "loss": 0.5406, - "step": 85500 - }, - { - "epoch": 20.87, - "learning_rate": 0.00038713228654293575, - "loss": 0.5668, - "step": 85525 - }, - { - "epoch": 20.88, - "learning_rate": 0.00038709908742257966, - "loss": 0.5244, - "step": 85550 - }, - { - "epoch": 20.88, - "learning_rate": 0.0003870658883022236, - "loss": 0.5241, - "step": 85575 - }, - { - "epoch": 20.89, - "learning_rate": 0.00038703268918186744, - "loss": 0.51, - "step": 85600 - }, - { - "epoch": 20.89, - "learning_rate": 0.00038699949006151135, - "loss": 0.5241, - "step": 85625 - }, - { - "epoch": 20.9, - "learning_rate": 0.0003869662909411552, - "loss": 0.4852, - "step": 85650 - }, - { - "epoch": 20.91, - "learning_rate": 0.0003869330918207991, - "loss": 0.4979, - "step": 85675 - }, - { - "epoch": 20.91, - "learning_rate": 0.00038689989270044304, - "loss": 0.5292, - "step": 85700 - }, - { - "epoch": 20.92, - "learning_rate": 0.0003868666935800869, - "loss": 0.5465, - "step": 85725 - }, - { - "epoch": 20.92, - "learning_rate": 0.0003868334944597308, - "loss": 0.4996, - "step": 85750 - }, - { - "epoch": 20.93, - "learning_rate": 0.0003868002953393747, - "loss": 0.5401, - "step": 85775 - }, - { - "epoch": 20.94, - "learning_rate": 0.0003867670962190186, - "loss": 0.51, - "step": 85800 - }, - { - "epoch": 20.94, - "learning_rate": 0.00038673389709866244, - "loss": 0.5461, - "step": 85825 - }, - { - "epoch": 20.95, - "learning_rate": 0.00038670069797830636, - "loss": 0.5363, - "step": 85850 - }, - { - "epoch": 20.96, - "learning_rate": 0.00038666749885795027, - "loss": 0.5452, - "step": 85875 - }, - { - "epoch": 20.96, - "learning_rate": 0.0003866342997375942, - "loss": 0.4922, - "step": 85900 - }, - { - "epoch": 20.97, - "learning_rate": 0.0003866011006172381, - "loss": 0.5316, - "step": 85925 - }, - { - "epoch": 20.97, - "learning_rate": 0.0003865679014968819, - "loss": 0.4887, - "step": 85950 - }, - { - "epoch": 20.98, - "learning_rate": 0.0003865347023765258, - "loss": 0.5274, - "step": 85975 - }, - { - "epoch": 20.99, - "learning_rate": 0.00038650150325616973, - "loss": 0.4773, - "step": 86000 - }, - { - "epoch": 20.99, - "learning_rate": 0.00038646830413581365, - "loss": 0.5313, - "step": 86025 - }, - { - "epoch": 21.0, - "learning_rate": 0.0003864351050154575, - "loss": 0.4961, - "step": 86050 - }, - { - "epoch": 21.0, - "learning_rate": 0.0003864019058951014, - "loss": 0.529, - "step": 86075 - }, - { - "epoch": 21.01, - "learning_rate": 0.0003863687067747453, - "loss": 0.4501, - "step": 86100 - }, - { - "epoch": 21.02, - "learning_rate": 0.0003863355076543892, - "loss": 0.5192, - "step": 86125 - }, - { - "epoch": 21.02, - "learning_rate": 0.0003863023085340331, - "loss": 0.5108, - "step": 86150 - }, - { - "epoch": 21.03, - "learning_rate": 0.00038626910941367697, - "loss": 0.4851, - "step": 86175 - }, - { - "epoch": 21.03, - "learning_rate": 0.0003862359102933209, - "loss": 0.5181, - "step": 86200 - }, - { - "epoch": 21.04, - "learning_rate": 0.0003862027111729648, - "loss": 0.4622, - "step": 86225 - }, - { - "epoch": 21.05, - "learning_rate": 0.00038616951205260866, - "loss": 0.481, - "step": 86250 - }, - { - "epoch": 21.05, - "learning_rate": 0.0003861363129322525, - "loss": 0.5097, - "step": 86275 - }, - { - "epoch": 21.06, - "learning_rate": 0.00038610311381189643, - "loss": 0.4656, - "step": 86300 - }, - { - "epoch": 21.07, - "learning_rate": 0.00038606991469154034, - "loss": 0.538, - "step": 86325 - }, - { - "epoch": 21.07, - "learning_rate": 0.00038603671557118426, - "loss": 0.4742, - "step": 86350 - }, - { - "epoch": 21.08, - "learning_rate": 0.00038600351645082817, - "loss": 0.5154, - "step": 86375 - }, - { - "epoch": 21.08, - "learning_rate": 0.000385970317330472, - "loss": 0.4569, - "step": 86400 - }, - { - "epoch": 21.09, - "learning_rate": 0.0003859371182101159, - "loss": 0.5032, - "step": 86425 - }, - { - "epoch": 21.1, - "learning_rate": 0.0003859039190897598, - "loss": 0.4849, - "step": 86450 - }, - { - "epoch": 21.1, - "learning_rate": 0.0003858707199694037, - "loss": 0.5501, - "step": 86475 - }, - { - "epoch": 21.11, - "learning_rate": 0.00038583752084904763, - "loss": 0.4792, - "step": 86500 - }, - { - "epoch": 21.11, - "learning_rate": 0.0003858043217286915, - "loss": 0.5251, - "step": 86525 - }, - { - "epoch": 21.12, - "learning_rate": 0.00038577112260833535, - "loss": 0.475, - "step": 86550 - }, - { - "epoch": 21.13, - "learning_rate": 0.00038573792348797927, - "loss": 0.5294, - "step": 86575 - }, - { - "epoch": 21.13, - "learning_rate": 0.0003857047243676232, - "loss": 0.4167, - "step": 86600 - }, - { - "epoch": 21.14, - "learning_rate": 0.00038567152524726704, - "loss": 0.5099, - "step": 86625 - }, - { - "epoch": 21.14, - "learning_rate": 0.00038563832612691095, - "loss": 0.4696, - "step": 86650 - }, - { - "epoch": 21.15, - "learning_rate": 0.00038560512700655487, - "loss": 0.5457, - "step": 86675 - }, - { - "epoch": 21.16, - "learning_rate": 0.00038557192788619873, - "loss": 0.4737, - "step": 86700 - }, - { - "epoch": 21.16, - "learning_rate": 0.00038553872876584264, - "loss": 0.5073, - "step": 86725 - }, - { - "epoch": 21.17, - "learning_rate": 0.0003855055296454865, - "loss": 0.4881, - "step": 86750 - }, - { - "epoch": 21.17, - "learning_rate": 0.0003854723305251304, - "loss": 0.5053, - "step": 86775 - }, - { - "epoch": 21.18, - "learning_rate": 0.00038543913140477433, - "loss": 0.48, - "step": 86800 - }, - { - "epoch": 21.19, - "learning_rate": 0.00038540593228441824, - "loss": 0.5247, - "step": 86825 - }, - { - "epoch": 21.19, - "learning_rate": 0.00038537273316406205, - "loss": 0.4993, - "step": 86850 - }, - { - "epoch": 21.2, - "learning_rate": 0.00038533953404370596, - "loss": 0.5142, - "step": 86875 - }, - { - "epoch": 21.21, - "learning_rate": 0.0003853063349233499, - "loss": 0.4572, - "step": 86900 - }, - { - "epoch": 21.21, - "learning_rate": 0.0003852731358029938, - "loss": 0.4832, - "step": 86925 - }, - { - "epoch": 21.22, - "learning_rate": 0.0003852399366826377, - "loss": 0.451, - "step": 86950 - }, - { - "epoch": 21.22, - "learning_rate": 0.00038520673756228157, - "loss": 0.5437, - "step": 86975 - }, - { - "epoch": 21.23, - "learning_rate": 0.0003851735384419254, - "loss": 0.4332, - "step": 87000 - }, - { - "epoch": 21.23, - "eval_cer": 0.11381066291592662, - "eval_loss": 0.4382989704608917, - "eval_runtime": 145.5564, - "eval_samples_per_second": 28.807, - "eval_steps_per_second": 7.207, - "eval_wer": 0.4626101141924959, - "step": 87000 - }, - { - "epoch": 21.24, - "learning_rate": 0.00038514033932156934, - "loss": 0.5451, - "step": 87025 - }, - { - "epoch": 21.24, - "learning_rate": 0.00038510714020121325, - "loss": 0.4974, - "step": 87050 - }, - { - "epoch": 21.25, - "learning_rate": 0.0003850739410808571, - "loss": 0.5291, - "step": 87075 - }, - { - "epoch": 21.25, - "learning_rate": 0.000385040741960501, - "loss": 0.4776, - "step": 87100 - }, - { - "epoch": 21.26, - "learning_rate": 0.00038500754284014494, - "loss": 0.5247, - "step": 87125 - }, - { - "epoch": 21.27, - "learning_rate": 0.0003849743437197888, - "loss": 0.4935, - "step": 87150 - }, - { - "epoch": 21.27, - "learning_rate": 0.0003849411445994327, - "loss": 0.4734, - "step": 87175 - }, - { - "epoch": 21.28, - "learning_rate": 0.0003849079454790766, - "loss": 0.4757, - "step": 87200 - }, - { - "epoch": 21.28, - "learning_rate": 0.0003848747463587205, - "loss": 0.5306, - "step": 87225 - }, - { - "epoch": 21.29, - "learning_rate": 0.0003848415472383644, - "loss": 0.4507, - "step": 87250 - }, - { - "epoch": 21.3, - "learning_rate": 0.0003848083481180083, - "loss": 0.5105, - "step": 87275 - }, - { - "epoch": 21.3, - "learning_rate": 0.0003847751489976521, - "loss": 0.4828, - "step": 87300 - }, - { - "epoch": 21.31, - "learning_rate": 0.00038474194987729604, - "loss": 0.5197, - "step": 87325 - }, - { - "epoch": 21.32, - "learning_rate": 0.00038470875075693995, - "loss": 0.4839, - "step": 87350 - }, - { - "epoch": 21.32, - "learning_rate": 0.00038467555163658386, - "loss": 0.5558, - "step": 87375 - }, - { - "epoch": 21.33, - "learning_rate": 0.0003846423525162278, - "loss": 0.4666, - "step": 87400 - }, - { - "epoch": 21.33, - "learning_rate": 0.00038460915339587164, - "loss": 0.4927, - "step": 87425 - }, - { - "epoch": 21.34, - "learning_rate": 0.0003845759542755155, - "loss": 0.4601, - "step": 87450 - }, - { - "epoch": 21.35, - "learning_rate": 0.0003845427551551594, - "loss": 0.5292, - "step": 87475 - }, - { - "epoch": 21.35, - "learning_rate": 0.0003845095560348033, - "loss": 0.4723, - "step": 87500 - }, - { - "epoch": 21.36, - "learning_rate": 0.0003844763569144472, - "loss": 0.4613, - "step": 87525 - }, - { - "epoch": 21.36, - "learning_rate": 0.0003844431577940911, - "loss": 0.484, - "step": 87550 - }, - { - "epoch": 21.37, - "learning_rate": 0.000384409958673735, - "loss": 0.5306, - "step": 87575 - }, - { - "epoch": 21.38, - "learning_rate": 0.00038437675955337887, - "loss": 0.4712, - "step": 87600 - }, - { - "epoch": 21.38, - "learning_rate": 0.0003843435604330228, - "loss": 0.5464, - "step": 87625 - }, - { - "epoch": 21.39, - "learning_rate": 0.00038431036131266665, - "loss": 0.4775, - "step": 87650 - }, - { - "epoch": 21.39, - "learning_rate": 0.00038427716219231056, - "loss": 0.4835, - "step": 87675 - }, - { - "epoch": 21.4, - "learning_rate": 0.0003842439630719545, - "loss": 0.4547, - "step": 87700 - }, - { - "epoch": 21.41, - "learning_rate": 0.00038421076395159833, - "loss": 0.5336, - "step": 87725 - }, - { - "epoch": 21.41, - "learning_rate": 0.0003841775648312422, - "loss": 0.5115, - "step": 87750 - }, - { - "epoch": 21.42, - "learning_rate": 0.0003841443657108861, - "loss": 0.4953, - "step": 87775 - }, - { - "epoch": 21.43, - "learning_rate": 0.00038411116659053, - "loss": 0.4706, - "step": 87800 - }, - { - "epoch": 21.43, - "learning_rate": 0.00038407796747017394, - "loss": 0.4955, - "step": 87825 - }, - { - "epoch": 21.44, - "learning_rate": 0.00038404476834981785, - "loss": 0.494, - "step": 87850 - }, - { - "epoch": 21.44, - "learning_rate": 0.00038401156922946166, - "loss": 0.5419, - "step": 87875 - }, - { - "epoch": 21.45, - "learning_rate": 0.00038397837010910557, - "loss": 0.4793, - "step": 87900 - }, - { - "epoch": 21.46, - "learning_rate": 0.0003839451709887495, - "loss": 0.4904, - "step": 87925 - }, - { - "epoch": 21.46, - "learning_rate": 0.0003839119718683934, - "loss": 0.4811, - "step": 87950 - }, - { - "epoch": 21.47, - "learning_rate": 0.0003838787727480373, - "loss": 0.5167, - "step": 87975 - }, - { - "epoch": 21.47, - "learning_rate": 0.00038384557362768117, - "loss": 0.4956, - "step": 88000 - }, - { - "epoch": 21.48, - "learning_rate": 0.00038381237450732503, - "loss": 0.5186, - "step": 88025 - }, - { - "epoch": 21.49, - "learning_rate": 0.00038377917538696894, - "loss": 0.4889, - "step": 88050 - }, - { - "epoch": 21.49, - "learning_rate": 0.00038374597626661286, - "loss": 0.5104, - "step": 88075 - }, - { - "epoch": 21.5, - "learning_rate": 0.0003837127771462567, - "loss": 0.457, - "step": 88100 - }, - { - "epoch": 21.5, - "learning_rate": 0.00038367957802590063, - "loss": 0.4604, - "step": 88125 - }, - { - "epoch": 21.51, - "learning_rate": 0.00038364637890554455, - "loss": 0.4942, - "step": 88150 - }, - { - "epoch": 21.52, - "learning_rate": 0.0003836131797851884, - "loss": 0.5411, - "step": 88175 - }, - { - "epoch": 21.52, - "learning_rate": 0.0003835799806648323, - "loss": 0.4869, - "step": 88200 - }, - { - "epoch": 21.53, - "learning_rate": 0.0003835467815444762, - "loss": 0.5289, - "step": 88225 - }, - { - "epoch": 21.53, - "learning_rate": 0.0003835135824241201, - "loss": 0.4726, - "step": 88250 - }, - { - "epoch": 21.54, - "learning_rate": 0.000383480383303764, - "loss": 0.4902, - "step": 88275 - }, - { - "epoch": 21.55, - "learning_rate": 0.0003834471841834079, - "loss": 0.4888, - "step": 88300 - }, - { - "epoch": 21.55, - "learning_rate": 0.00038341398506305173, - "loss": 0.5346, - "step": 88325 - }, - { - "epoch": 21.56, - "learning_rate": 0.00038338078594269564, - "loss": 0.4747, - "step": 88350 - }, - { - "epoch": 21.57, - "learning_rate": 0.00038334758682233956, - "loss": 0.5675, - "step": 88375 - }, - { - "epoch": 21.57, - "learning_rate": 0.00038331438770198347, - "loss": 0.5019, - "step": 88400 - }, - { - "epoch": 21.58, - "learning_rate": 0.0003832811885816274, - "loss": 0.5105, - "step": 88425 - }, - { - "epoch": 21.58, - "learning_rate": 0.00038324798946127124, - "loss": 0.4534, - "step": 88450 - }, - { - "epoch": 21.59, - "learning_rate": 0.0003832147903409151, - "loss": 0.472, - "step": 88475 - }, - { - "epoch": 21.6, - "learning_rate": 0.000383181591220559, - "loss": 0.4931, - "step": 88500 - }, - { - "epoch": 21.6, - "learning_rate": 0.00038314839210020293, - "loss": 0.5198, - "step": 88525 - }, - { - "epoch": 21.61, - "learning_rate": 0.0003831151929798468, - "loss": 0.4678, - "step": 88550 - }, - { - "epoch": 21.61, - "learning_rate": 0.0003830819938594907, - "loss": 0.5238, - "step": 88575 - }, - { - "epoch": 21.62, - "learning_rate": 0.0003830487947391346, - "loss": 0.4967, - "step": 88600 - }, - { - "epoch": 21.63, - "learning_rate": 0.0003830155956187785, - "loss": 0.5125, - "step": 88625 - }, - { - "epoch": 21.63, - "learning_rate": 0.0003829823964984224, - "loss": 0.4883, - "step": 88650 - }, - { - "epoch": 21.64, - "learning_rate": 0.00038294919737806625, - "loss": 0.5136, - "step": 88675 - }, - { - "epoch": 21.64, - "learning_rate": 0.00038291599825771017, - "loss": 0.4898, - "step": 88700 - }, - { - "epoch": 21.65, - "learning_rate": 0.0003828827991373541, - "loss": 0.5451, - "step": 88725 - }, - { - "epoch": 21.66, - "learning_rate": 0.000382849600016998, - "loss": 0.464, - "step": 88750 - }, - { - "epoch": 21.66, - "learning_rate": 0.0003828164008966418, - "loss": 0.5639, - "step": 88775 - }, - { - "epoch": 21.67, - "learning_rate": 0.0003827832017762857, - "loss": 0.4639, - "step": 88800 - }, - { - "epoch": 21.68, - "learning_rate": 0.00038275000265592963, - "loss": 0.5164, - "step": 88825 - }, - { - "epoch": 21.68, - "learning_rate": 0.00038271680353557354, - "loss": 0.5242, - "step": 88850 - }, - { - "epoch": 21.69, - "learning_rate": 0.00038268360441521746, - "loss": 0.532, - "step": 88875 - }, - { - "epoch": 21.69, - "learning_rate": 0.0003826504052948613, - "loss": 0.5124, - "step": 88900 - }, - { - "epoch": 21.7, - "learning_rate": 0.0003826172061745052, - "loss": 0.5157, - "step": 88925 - }, - { - "epoch": 21.71, - "learning_rate": 0.0003825840070541491, - "loss": 0.4771, - "step": 88950 - }, - { - "epoch": 21.71, - "learning_rate": 0.000382550807933793, - "loss": 0.5629, - "step": 88975 - }, - { - "epoch": 21.72, - "learning_rate": 0.0003825176088134369, - "loss": 0.473, - "step": 89000 - }, - { - "epoch": 21.72, - "learning_rate": 0.0003824844096930808, - "loss": 0.5363, - "step": 89025 - }, - { - "epoch": 21.73, - "learning_rate": 0.0003824512105727247, - "loss": 0.5015, - "step": 89050 - }, - { - "epoch": 21.74, - "learning_rate": 0.00038241801145236855, - "loss": 0.5072, - "step": 89075 - }, - { - "epoch": 21.74, - "learning_rate": 0.00038238481233201246, - "loss": 0.451, - "step": 89100 - }, - { - "epoch": 21.75, - "learning_rate": 0.0003823516132116563, - "loss": 0.5009, - "step": 89125 - }, - { - "epoch": 21.75, - "learning_rate": 0.00038231841409130024, - "loss": 0.5052, - "step": 89150 - }, - { - "epoch": 21.76, - "learning_rate": 0.00038228521497094415, - "loss": 0.5099, - "step": 89175 - }, - { - "epoch": 21.77, - "learning_rate": 0.00038225201585058807, - "loss": 0.4809, - "step": 89200 - }, - { - "epoch": 21.77, - "learning_rate": 0.0003822188167302319, - "loss": 0.5133, - "step": 89225 - }, - { - "epoch": 21.78, - "learning_rate": 0.0003821856176098758, - "loss": 0.4826, - "step": 89250 - }, - { - "epoch": 21.79, - "learning_rate": 0.0003821524184895197, - "loss": 0.5309, - "step": 89275 - }, - { - "epoch": 21.79, - "learning_rate": 0.0003821192193691636, - "loss": 0.4787, - "step": 89300 - }, - { - "epoch": 21.8, - "learning_rate": 0.00038208602024880753, - "loss": 0.5302, - "step": 89325 - }, - { - "epoch": 21.8, - "learning_rate": 0.0003820528211284514, - "loss": 0.4527, - "step": 89350 - }, - { - "epoch": 21.81, - "learning_rate": 0.00038201962200809525, - "loss": 0.5046, - "step": 89375 - }, - { - "epoch": 21.82, - "learning_rate": 0.00038198642288773916, - "loss": 0.4953, - "step": 89400 - }, - { - "epoch": 21.82, - "learning_rate": 0.0003819532237673831, - "loss": 0.552, - "step": 89425 - }, - { - "epoch": 21.83, - "learning_rate": 0.000381920024647027, - "loss": 0.5051, - "step": 89450 - }, - { - "epoch": 21.83, - "learning_rate": 0.00038188682552667085, - "loss": 0.5126, - "step": 89475 - }, - { - "epoch": 21.84, - "learning_rate": 0.00038185362640631476, - "loss": 0.4988, - "step": 89500 - }, - { - "epoch": 21.85, - "learning_rate": 0.0003912863425360371, - "loss": 0.53, - "step": 89525 - }, - { - "epoch": 21.85, - "learning_rate": 0.0003912570241876374, - "loss": 0.4469, - "step": 89550 - }, - { - "epoch": 21.86, - "learning_rate": 0.00039122648424138776, - "loss": 0.5172, - "step": 89575 - }, - { - "epoch": 21.86, - "learning_rate": 0.00039119594429513807, - "loss": 0.5424, - "step": 89600 - }, - { - "epoch": 21.87, - "learning_rate": 0.00039116540434888837, - "loss": 0.5237, - "step": 89625 - }, - { - "epoch": 21.88, - "learning_rate": 0.0003911348644026387, - "loss": 0.4864, - "step": 89650 - }, - { - "epoch": 21.88, - "learning_rate": 0.0003911043244563889, - "loss": 0.5272, - "step": 89675 - }, - { - "epoch": 21.89, - "learning_rate": 0.0003910737845101392, - "loss": 0.4576, - "step": 89700 - }, - { - "epoch": 21.89, - "learning_rate": 0.0003910432445638896, - "loss": 0.5364, - "step": 89725 - }, - { - "epoch": 21.9, - "learning_rate": 0.0003910127046176399, - "loss": 0.5269, - "step": 89750 - }, - { - "epoch": 21.91, - "learning_rate": 0.0003909821646713902, - "loss": 0.523, - "step": 89775 - }, - { - "epoch": 21.91, - "learning_rate": 0.0003909516247251405, - "loss": 0.444, - "step": 89800 - }, - { - "epoch": 21.92, - "learning_rate": 0.0003909210847788908, - "loss": 0.5496, - "step": 89825 - }, - { - "epoch": 21.93, - "learning_rate": 0.0003908905448326411, - "loss": 0.4531, - "step": 89850 - }, - { - "epoch": 21.93, - "learning_rate": 0.0003908600048863914, - "loss": 0.492, - "step": 89875 - }, - { - "epoch": 21.94, - "learning_rate": 0.0003908294649401417, - "loss": 0.4916, - "step": 89900 - }, - { - "epoch": 21.94, - "learning_rate": 0.000390798924993892, - "loss": 0.5314, - "step": 89925 - }, - { - "epoch": 21.95, - "learning_rate": 0.0003907683850476423, - "loss": 0.469, - "step": 89950 - }, - { - "epoch": 21.96, - "learning_rate": 0.00039073784510139267, - "loss": 0.5014, - "step": 89975 - }, - { - "epoch": 21.96, - "learning_rate": 0.0003907073051551429, - "loss": 0.4671, - "step": 90000 - }, - { - "epoch": 21.96, - "eval_cer": 0.11175220475755367, - "eval_loss": 0.4197826087474823, - "eval_runtime": 144.9411, - "eval_samples_per_second": 28.929, - "eval_steps_per_second": 7.237, - "eval_wer": 0.45471451876019575, - "step": 90000 - }, - { - "epoch": 21.97, - "learning_rate": 0.0003906767652088932, - "loss": 0.5545, - "step": 90025 - }, - { - "epoch": 21.97, - "learning_rate": 0.0003906462252626435, - "loss": 0.4985, - "step": 90050 - }, - { - "epoch": 21.98, - "learning_rate": 0.00039061568531639383, - "loss": 0.5421, - "step": 90075 - }, - { - "epoch": 21.99, - "learning_rate": 0.0003905851453701442, - "loss": 0.4719, - "step": 90100 - }, - { - "epoch": 21.99, - "learning_rate": 0.0003905546054238945, - "loss": 0.4999, - "step": 90125 - }, - { - "epoch": 22.0, - "learning_rate": 0.00039052406547764474, - "loss": 0.4586, - "step": 90150 - }, - { - "epoch": 22.0, - "learning_rate": 0.00039049352553139504, - "loss": 0.5135, - "step": 90175 - }, - { - "epoch": 22.01, - "learning_rate": 0.00039046298558514535, - "loss": 0.4611, - "step": 90200 - }, - { - "epoch": 22.02, - "learning_rate": 0.0003904324456388957, - "loss": 0.4822, - "step": 90225 - }, - { - "epoch": 22.02, - "learning_rate": 0.000390401905692646, - "loss": 0.4451, - "step": 90250 - }, - { - "epoch": 22.03, - "learning_rate": 0.0003903713657463963, - "loss": 0.5283, - "step": 90275 - }, - { - "epoch": 22.04, - "learning_rate": 0.0003903408258001466, - "loss": 0.4192, - "step": 90300 - }, - { - "epoch": 22.04, - "learning_rate": 0.00039031028585389686, - "loss": 0.5237, - "step": 90325 - }, - { - "epoch": 22.05, - "learning_rate": 0.0003902797459076472, - "loss": 0.4501, - "step": 90350 - }, - { - "epoch": 22.05, - "learning_rate": 0.0003902492059613975, - "loss": 0.4873, - "step": 90375 - }, - { - "epoch": 22.06, - "learning_rate": 0.00039021866601514783, - "loss": 0.4595, - "step": 90400 - }, - { - "epoch": 22.07, - "learning_rate": 0.00039018812606889813, - "loss": 0.517, - "step": 90425 - }, - { - "epoch": 22.07, - "learning_rate": 0.00039015758612264843, - "loss": 0.455, - "step": 90450 - }, - { - "epoch": 22.08, - "learning_rate": 0.00039012704617639874, - "loss": 0.5074, - "step": 90475 - }, - { - "epoch": 22.08, - "learning_rate": 0.00039009650623014904, - "loss": 0.4544, - "step": 90500 - }, - { - "epoch": 22.09, - "learning_rate": 0.00039006596628389934, - "loss": 0.4933, - "step": 90525 - }, - { - "epoch": 22.1, - "learning_rate": 0.00039003542633764965, - "loss": 0.4465, - "step": 90550 - }, - { - "epoch": 22.1, - "learning_rate": 0.00039000488639139995, - "loss": 0.4574, - "step": 90575 - }, - { - "epoch": 22.11, - "learning_rate": 0.0003899743464451503, - "loss": 0.4509, - "step": 90600 - }, - { - "epoch": 22.11, - "learning_rate": 0.00038994380649890056, - "loss": 0.5082, - "step": 90625 - }, - { - "epoch": 22.12, - "learning_rate": 0.00038991326655265086, - "loss": 0.4783, - "step": 90650 - }, - { - "epoch": 22.13, - "learning_rate": 0.00038988272660640116, - "loss": 0.4925, - "step": 90675 - }, - { - "epoch": 22.13, - "learning_rate": 0.00038985218666015147, - "loss": 0.4301, - "step": 90700 - }, - { - "epoch": 22.14, - "learning_rate": 0.0003898216467139018, - "loss": 0.5307, - "step": 90725 - }, - { - "epoch": 22.14, - "learning_rate": 0.00038979110676765213, - "loss": 0.4506, - "step": 90750 - }, - { - "epoch": 22.15, - "learning_rate": 0.00038976056682140243, - "loss": 0.4787, - "step": 90775 - }, - { - "epoch": 22.16, - "learning_rate": 0.0003897300268751527, - "loss": 0.4733, - "step": 90800 - }, - { - "epoch": 22.16, - "learning_rate": 0.000389699486928903, - "loss": 0.5464, - "step": 90825 - }, - { - "epoch": 22.17, - "learning_rate": 0.00038966894698265334, - "loss": 0.4397, - "step": 90850 - }, - { - "epoch": 22.18, - "learning_rate": 0.00038963840703640365, - "loss": 0.4903, - "step": 90875 - }, - { - "epoch": 22.18, - "learning_rate": 0.00038960786709015395, - "loss": 0.4126, - "step": 90900 - }, - { - "epoch": 22.19, - "learning_rate": 0.00038957732714390425, - "loss": 0.5237, - "step": 90925 - }, - { - "epoch": 22.19, - "learning_rate": 0.0003895467871976545, - "loss": 0.5362, - "step": 90950 - }, - { - "epoch": 22.2, - "learning_rate": 0.00038951624725140486, - "loss": 0.5327, - "step": 90975 - }, - { - "epoch": 22.21, - "learning_rate": 0.00038948570730515516, - "loss": 0.4644, - "step": 91000 - }, - { - "epoch": 22.21, - "learning_rate": 0.00038945516735890547, - "loss": 0.5763, - "step": 91025 - }, - { - "epoch": 22.22, - "learning_rate": 0.00038942462741265577, - "loss": 0.4837, - "step": 91050 - }, - { - "epoch": 22.22, - "learning_rate": 0.00038939408746640607, - "loss": 0.5277, - "step": 91075 - }, - { - "epoch": 22.23, - "learning_rate": 0.0003893635475201563, - "loss": 0.4429, - "step": 91100 - }, - { - "epoch": 22.24, - "learning_rate": 0.0003893330075739067, - "loss": 0.5015, - "step": 91125 - }, - { - "epoch": 22.24, - "learning_rate": 0.000389302467627657, - "loss": 0.4684, - "step": 91150 - }, - { - "epoch": 22.25, - "learning_rate": 0.0003892719276814073, - "loss": 0.5632, - "step": 91175 - }, - { - "epoch": 22.25, - "learning_rate": 0.0003892413877351576, - "loss": 0.4923, - "step": 91200 - }, - { - "epoch": 22.26, - "learning_rate": 0.0003892108477889079, - "loss": 0.5177, - "step": 91225 - }, - { - "epoch": 22.27, - "learning_rate": 0.00038918030784265825, - "loss": 0.4963, - "step": 91250 - }, - { - "epoch": 22.27, - "learning_rate": 0.0003891497678964085, - "loss": 0.4868, - "step": 91275 - }, - { - "epoch": 22.28, - "learning_rate": 0.0003891192279501588, - "loss": 0.4688, - "step": 91300 - }, - { - "epoch": 22.29, - "learning_rate": 0.0003890886880039091, - "loss": 0.495, - "step": 91325 - }, - { - "epoch": 22.29, - "learning_rate": 0.0003890581480576594, - "loss": 0.4599, - "step": 91350 - }, - { - "epoch": 22.3, - "learning_rate": 0.00038902760811140977, - "loss": 0.4995, - "step": 91375 - }, - { - "epoch": 22.3, - "learning_rate": 0.00038899706816516007, - "loss": 0.4644, - "step": 91400 - }, - { - "epoch": 22.31, - "learning_rate": 0.0003889665282189103, - "loss": 0.5083, - "step": 91425 - }, - { - "epoch": 22.32, - "learning_rate": 0.0003889359882726606, - "loss": 0.4402, - "step": 91450 - }, - { - "epoch": 22.32, - "learning_rate": 0.0003889054483264109, - "loss": 0.4883, - "step": 91475 - }, - { - "epoch": 22.33, - "learning_rate": 0.0003888749083801613, - "loss": 0.4897, - "step": 91500 - }, - { - "epoch": 22.33, - "learning_rate": 0.0003888443684339116, - "loss": 0.5078, - "step": 91525 - }, - { - "epoch": 22.34, - "learning_rate": 0.0003888138284876619, - "loss": 0.4662, - "step": 91550 - }, - { - "epoch": 22.35, - "learning_rate": 0.00038878451013926214, - "loss": 0.5353, - "step": 91575 - }, - { - "epoch": 22.35, - "learning_rate": 0.00038875397019301245, - "loss": 0.4879, - "step": 91600 - }, - { - "epoch": 22.36, - "learning_rate": 0.00038872343024676275, - "loss": 0.5197, - "step": 91625 - }, - { - "epoch": 22.36, - "learning_rate": 0.0003886928903005131, - "loss": 0.4503, - "step": 91650 - }, - { - "epoch": 22.37, - "learning_rate": 0.0003886623503542634, - "loss": 0.5222, - "step": 91675 - }, - { - "epoch": 22.38, - "learning_rate": 0.0003886318104080137, - "loss": 0.4813, - "step": 91700 - }, - { - "epoch": 22.38, - "learning_rate": 0.000388601270461764, - "loss": 0.5059, - "step": 91725 - }, - { - "epoch": 22.39, - "learning_rate": 0.00038857073051551427, - "loss": 0.4764, - "step": 91750 - }, - { - "epoch": 22.4, - "learning_rate": 0.00038854019056926457, - "loss": 0.5375, - "step": 91775 - }, - { - "epoch": 22.4, - "learning_rate": 0.0003885096506230149, - "loss": 0.4988, - "step": 91800 - }, - { - "epoch": 22.41, - "learning_rate": 0.00038847911067676523, - "loss": 0.4746, - "step": 91825 - }, - { - "epoch": 22.41, - "learning_rate": 0.00038844857073051553, - "loss": 0.5125, - "step": 91850 - }, - { - "epoch": 22.42, - "learning_rate": 0.00038841803078426584, - "loss": 0.5544, - "step": 91875 - }, - { - "epoch": 22.43, - "learning_rate": 0.0003883874908380161, - "loss": 0.4323, - "step": 91900 - }, - { - "epoch": 22.43, - "learning_rate": 0.00038835695089176644, - "loss": 0.4781, - "step": 91925 - }, - { - "epoch": 22.44, - "learning_rate": 0.00038832641094551675, - "loss": 0.5042, - "step": 91950 - }, - { - "epoch": 22.44, - "learning_rate": 0.00038829587099926705, - "loss": 0.5044, - "step": 91975 - }, - { - "epoch": 22.45, - "learning_rate": 0.00038826533105301735, - "loss": 0.4864, - "step": 92000 - }, - { - "epoch": 22.46, - "learning_rate": 0.00038823479110676766, - "loss": 0.561, - "step": 92025 - }, - { - "epoch": 22.46, - "learning_rate": 0.00038820425116051796, - "loss": 0.4371, - "step": 92050 - }, - { - "epoch": 22.47, - "learning_rate": 0.00038817371121426826, - "loss": 0.4977, - "step": 92075 - }, - { - "epoch": 22.47, - "learning_rate": 0.00038814317126801857, - "loss": 0.4416, - "step": 92100 - }, - { - "epoch": 22.48, - "learning_rate": 0.00038811263132176887, - "loss": 0.5439, - "step": 92125 - }, - { - "epoch": 22.49, - "learning_rate": 0.0003880820913755192, - "loss": 0.443, - "step": 92150 - }, - { - "epoch": 22.49, - "learning_rate": 0.00038805155142926953, - "loss": 0.533, - "step": 92175 - }, - { - "epoch": 22.5, - "learning_rate": 0.00038802101148301983, - "loss": 0.4652, - "step": 92200 - }, - { - "epoch": 22.5, - "learning_rate": 0.0003879904715367701, - "loss": 0.5629, - "step": 92225 - }, - { - "epoch": 22.51, - "learning_rate": 0.0003879599315905204, - "loss": 0.4605, - "step": 92250 - }, - { - "epoch": 22.52, - "learning_rate": 0.0003879293916442707, - "loss": 0.5329, - "step": 92275 - }, - { - "epoch": 22.52, - "learning_rate": 0.00038789885169802105, - "loss": 0.4571, - "step": 92300 - }, - { - "epoch": 22.53, - "learning_rate": 0.00038786831175177135, - "loss": 0.4795, - "step": 92325 - }, - { - "epoch": 22.54, - "learning_rate": 0.00038783777180552165, - "loss": 0.4904, - "step": 92350 - }, - { - "epoch": 22.54, - "learning_rate": 0.0003878072318592719, - "loss": 0.5605, - "step": 92375 - }, - { - "epoch": 22.55, - "learning_rate": 0.0003877766919130222, - "loss": 0.4585, - "step": 92400 - }, - { - "epoch": 22.55, - "learning_rate": 0.00038774615196677256, - "loss": 0.5349, - "step": 92425 - }, - { - "epoch": 22.56, - "learning_rate": 0.00038771561202052287, - "loss": 0.4769, - "step": 92450 - }, - { - "epoch": 22.57, - "learning_rate": 0.00038768507207427317, - "loss": 0.491, - "step": 92475 - }, - { - "epoch": 22.57, - "learning_rate": 0.0003876545321280235, - "loss": 0.4512, - "step": 92500 - }, - { - "epoch": 22.58, - "learning_rate": 0.0003876239921817737, - "loss": 0.5088, - "step": 92525 - }, - { - "epoch": 22.58, - "learning_rate": 0.0003875934522355241, - "loss": 0.4509, - "step": 92550 - }, - { - "epoch": 22.59, - "learning_rate": 0.0003875629122892744, - "loss": 0.5303, - "step": 92575 - }, - { - "epoch": 22.6, - "learning_rate": 0.0003875323723430247, - "loss": 0.4676, - "step": 92600 - }, - { - "epoch": 22.6, - "learning_rate": 0.000387501832396775, - "loss": 0.4776, - "step": 92625 - }, - { - "epoch": 22.61, - "learning_rate": 0.0003874712924505253, - "loss": 0.4843, - "step": 92650 - }, - { - "epoch": 22.61, - "learning_rate": 0.0003874407525042756, - "loss": 0.504, - "step": 92675 - }, - { - "epoch": 22.62, - "learning_rate": 0.0003874102125580259, - "loss": 0.4525, - "step": 92700 - }, - { - "epoch": 22.63, - "learning_rate": 0.0003873796726117762, - "loss": 0.4874, - "step": 92725 - }, - { - "epoch": 22.63, - "learning_rate": 0.0003873491326655265, - "loss": 0.5024, - "step": 92750 - }, - { - "epoch": 22.64, - "learning_rate": 0.0003873185927192768, - "loss": 0.5104, - "step": 92775 - }, - { - "epoch": 22.65, - "learning_rate": 0.00038728805277302717, - "loss": 0.4292, - "step": 92800 - }, - { - "epoch": 22.65, - "learning_rate": 0.00038725751282677747, - "loss": 0.4798, - "step": 92825 - }, - { - "epoch": 22.66, - "learning_rate": 0.0003872269728805277, - "loss": 0.4755, - "step": 92850 - }, - { - "epoch": 22.66, - "learning_rate": 0.000387196432934278, - "loss": 0.5197, - "step": 92875 - }, - { - "epoch": 22.67, - "learning_rate": 0.00038716589298802833, - "loss": 0.4345, - "step": 92900 - }, - { - "epoch": 22.68, - "learning_rate": 0.0003871353530417787, - "loss": 0.5431, - "step": 92925 - }, - { - "epoch": 22.68, - "learning_rate": 0.000387104813095529, - "loss": 0.4644, - "step": 92950 - }, - { - "epoch": 22.69, - "learning_rate": 0.0003870742731492793, - "loss": 0.4992, - "step": 92975 - }, - { - "epoch": 22.69, - "learning_rate": 0.00038704373320302954, - "loss": 0.4451, - "step": 93000 - }, - { - "epoch": 22.69, - "eval_cer": 0.11186000431198218, - "eval_loss": 0.44263726472854614, - "eval_runtime": 146.1403, - "eval_samples_per_second": 28.692, - "eval_steps_per_second": 7.178, - "eval_wer": 0.4508646003262643, - "step": 93000 - }, - { - "epoch": 22.7, - "learning_rate": 0.00038701319325677984, - "loss": 0.4674, - "step": 93025 - }, - { - "epoch": 22.71, - "learning_rate": 0.0003869826533105302, - "loss": 0.4967, - "step": 93050 - }, - { - "epoch": 22.71, - "learning_rate": 0.0003869521133642805, - "loss": 0.5561, - "step": 93075 - }, - { - "epoch": 22.72, - "learning_rate": 0.0003869215734180308, - "loss": 0.5109, - "step": 93100 - }, - { - "epoch": 22.72, - "learning_rate": 0.0003868910334717811, - "loss": 0.494, - "step": 93125 - }, - { - "epoch": 22.73, - "learning_rate": 0.00038686049352553136, - "loss": 0.4803, - "step": 93150 - }, - { - "epoch": 22.74, - "learning_rate": 0.00038682995357928166, - "loss": 0.523, - "step": 93175 - }, - { - "epoch": 22.74, - "learning_rate": 0.000386799413633032, - "loss": 0.4682, - "step": 93200 - }, - { - "epoch": 22.75, - "learning_rate": 0.0003867688736867823, - "loss": 0.4921, - "step": 93225 - }, - { - "epoch": 22.76, - "learning_rate": 0.00038673833374053263, - "loss": 0.4338, - "step": 93250 - }, - { - "epoch": 22.76, - "learning_rate": 0.00038670779379428293, - "loss": 0.5046, - "step": 93275 - }, - { - "epoch": 22.77, - "learning_rate": 0.00038667725384803324, - "loss": 0.4381, - "step": 93300 - }, - { - "epoch": 22.77, - "learning_rate": 0.00038664671390178354, - "loss": 0.5095, - "step": 93325 - }, - { - "epoch": 22.78, - "learning_rate": 0.00038661617395553384, - "loss": 0.4569, - "step": 93350 - }, - { - "epoch": 22.79, - "learning_rate": 0.00038658563400928415, - "loss": 0.5539, - "step": 93375 - }, - { - "epoch": 22.79, - "learning_rate": 0.00038655509406303445, - "loss": 0.4506, - "step": 93400 - }, - { - "epoch": 22.8, - "learning_rate": 0.00038652455411678475, - "loss": 0.4904, - "step": 93425 - }, - { - "epoch": 22.8, - "learning_rate": 0.0003864940141705351, - "loss": 0.4195, - "step": 93450 - }, - { - "epoch": 22.81, - "learning_rate": 0.00038646347422428536, - "loss": 0.5241, - "step": 93475 - }, - { - "epoch": 22.82, - "learning_rate": 0.00038643293427803566, - "loss": 0.5006, - "step": 93500 - }, - { - "epoch": 22.82, - "learning_rate": 0.00038640239433178597, - "loss": 0.5539, - "step": 93525 - }, - { - "epoch": 22.83, - "learning_rate": 0.00038637185438553627, - "loss": 0.4748, - "step": 93550 - }, - { - "epoch": 22.83, - "learning_rate": 0.0003863413144392866, - "loss": 0.5467, - "step": 93575 - }, - { - "epoch": 22.84, - "learning_rate": 0.00038631077449303693, - "loss": 0.4706, - "step": 93600 - }, - { - "epoch": 22.85, - "learning_rate": 0.0003862802345467872, - "loss": 0.5325, - "step": 93625 - }, - { - "epoch": 22.85, - "learning_rate": 0.0003862496946005375, - "loss": 0.4695, - "step": 93650 - }, - { - "epoch": 22.86, - "learning_rate": 0.0003862191546542878, - "loss": 0.4782, - "step": 93675 - }, - { - "epoch": 22.86, - "learning_rate": 0.00038618861470803814, - "loss": 0.4095, - "step": 93700 - }, - { - "epoch": 22.87, - "learning_rate": 0.00038615807476178845, - "loss": 0.51, - "step": 93725 - }, - { - "epoch": 22.88, - "learning_rate": 0.00038612753481553875, - "loss": 0.4564, - "step": 93750 - }, - { - "epoch": 22.88, - "learning_rate": 0.00038609699486928905, - "loss": 0.5336, - "step": 93775 - }, - { - "epoch": 22.89, - "learning_rate": 0.0003860664549230393, - "loss": 0.5094, - "step": 93800 - }, - { - "epoch": 22.9, - "learning_rate": 0.00038603591497678966, - "loss": 0.5279, - "step": 93825 - }, - { - "epoch": 22.9, - "learning_rate": 0.00038600537503053996, - "loss": 0.5133, - "step": 93850 - }, - { - "epoch": 22.91, - "learning_rate": 0.00038597483508429027, - "loss": 0.4836, - "step": 93875 - }, - { - "epoch": 22.91, - "learning_rate": 0.00038594429513804057, - "loss": 0.4918, - "step": 93900 - }, - { - "epoch": 22.92, - "learning_rate": 0.0003859137551917909, - "loss": 0.5372, - "step": 93925 - }, - { - "epoch": 22.93, - "learning_rate": 0.0003858832152455412, - "loss": 0.4791, - "step": 93950 - }, - { - "epoch": 22.93, - "learning_rate": 0.0003858526752992915, - "loss": 0.5199, - "step": 93975 - }, - { - "epoch": 22.94, - "learning_rate": 0.0003858233569508918, - "loss": 0.4629, - "step": 94000 - }, - { - "epoch": 22.94, - "learning_rate": 0.0003857928170046421, - "loss": 0.5178, - "step": 94025 - }, - { - "epoch": 22.95, - "learning_rate": 0.0003857622770583924, - "loss": 0.5132, - "step": 94050 - }, - { - "epoch": 22.96, - "learning_rate": 0.0003857317371121427, - "loss": 0.5321, - "step": 94075 - }, - { - "epoch": 22.96, - "learning_rate": 0.00038570119716589295, - "loss": 0.4338, - "step": 94100 - }, - { - "epoch": 22.97, - "learning_rate": 0.0003856706572196433, - "loss": 0.4782, - "step": 94125 - }, - { - "epoch": 22.97, - "learning_rate": 0.0003856401172733936, - "loss": 0.5093, - "step": 94150 - }, - { - "epoch": 22.98, - "learning_rate": 0.0003856095773271439, - "loss": 0.4996, - "step": 94175 - }, - { - "epoch": 22.99, - "learning_rate": 0.0003855790373808942, - "loss": 0.4576, - "step": 94200 - }, - { - "epoch": 22.99, - "learning_rate": 0.0003855484974346445, - "loss": 0.5363, - "step": 94225 - }, - { - "epoch": 23.0, - "learning_rate": 0.0003855179574883949, - "loss": 0.4586, - "step": 94250 - }, - { - "epoch": 23.01, - "learning_rate": 0.0003854874175421451, - "loss": 0.5103, - "step": 94275 - }, - { - "epoch": 23.01, - "learning_rate": 0.0003854568775958954, - "loss": 0.4995, - "step": 94300 - }, - { - "epoch": 23.02, - "learning_rate": 0.00038542633764964573, - "loss": 0.4858, - "step": 94325 - }, - { - "epoch": 23.02, - "learning_rate": 0.00038539579770339603, - "loss": 0.4616, - "step": 94350 - }, - { - "epoch": 23.03, - "learning_rate": 0.0003853652577571464, - "loss": 0.4772, - "step": 94375 - }, - { - "epoch": 23.04, - "learning_rate": 0.0003853347178108967, - "loss": 0.4242, - "step": 94400 - }, - { - "epoch": 23.04, - "learning_rate": 0.00038530417786464694, - "loss": 0.4551, - "step": 94425 - }, - { - "epoch": 23.05, - "learning_rate": 0.00038527363791839725, - "loss": 0.4337, - "step": 94450 - }, - { - "epoch": 23.05, - "learning_rate": 0.00038524309797214755, - "loss": 0.5081, - "step": 94475 - }, - { - "epoch": 23.06, - "learning_rate": 0.0003852125580258979, - "loss": 0.4795, - "step": 94500 - }, - { - "epoch": 23.07, - "learning_rate": 0.0003851820180796482, - "loss": 0.4721, - "step": 94525 - }, - { - "epoch": 23.07, - "learning_rate": 0.0003851514781333985, - "loss": 0.4625, - "step": 94550 - }, - { - "epoch": 23.08, - "learning_rate": 0.00038512093818714876, - "loss": 0.5091, - "step": 94575 - }, - { - "epoch": 23.08, - "learning_rate": 0.00038509039824089907, - "loss": 0.4679, - "step": 94600 - }, - { - "epoch": 23.09, - "learning_rate": 0.0003850598582946494, - "loss": 0.4813, - "step": 94625 - }, - { - "epoch": 23.1, - "learning_rate": 0.00038502931834839973, - "loss": 0.4172, - "step": 94650 - }, - { - "epoch": 23.1, - "learning_rate": 0.00038499877840215003, - "loss": 0.4948, - "step": 94675 - }, - { - "epoch": 23.11, - "learning_rate": 0.00038496823845590033, - "loss": 0.4403, - "step": 94700 - }, - { - "epoch": 23.11, - "learning_rate": 0.00038493769850965064, - "loss": 0.4947, - "step": 94725 - }, - { - "epoch": 23.12, - "learning_rate": 0.00038490715856340094, - "loss": 0.44, - "step": 94750 - }, - { - "epoch": 23.13, - "learning_rate": 0.00038487661861715124, - "loss": 0.5244, - "step": 94775 - }, - { - "epoch": 23.13, - "learning_rate": 0.00038484607867090155, - "loss": 0.4809, - "step": 94800 - }, - { - "epoch": 23.14, - "learning_rate": 0.00038481553872465185, - "loss": 0.4803, - "step": 94825 - }, - { - "epoch": 23.15, - "learning_rate": 0.00038478499877840215, - "loss": 0.4412, - "step": 94850 - }, - { - "epoch": 23.15, - "learning_rate": 0.0003847544588321525, - "loss": 0.5365, - "step": 94875 - }, - { - "epoch": 23.16, - "learning_rate": 0.00038472391888590276, - "loss": 0.4305, - "step": 94900 - }, - { - "epoch": 23.16, - "learning_rate": 0.00038469337893965306, - "loss": 0.5242, - "step": 94925 - }, - { - "epoch": 23.17, - "learning_rate": 0.00038466283899340337, - "loss": 0.4683, - "step": 94950 - }, - { - "epoch": 23.18, - "learning_rate": 0.00038463229904715367, - "loss": 0.5065, - "step": 94975 - }, - { - "epoch": 23.18, - "learning_rate": 0.00038460175910090403, - "loss": 0.4666, - "step": 95000 - }, - { - "epoch": 23.19, - "learning_rate": 0.00038457121915465433, - "loss": 0.4901, - "step": 95025 - }, - { - "epoch": 23.19, - "learning_rate": 0.0003845406792084046, - "loss": 0.461, - "step": 95050 - }, - { - "epoch": 23.2, - "learning_rate": 0.0003845101392621549, - "loss": 0.4689, - "step": 95075 - }, - { - "epoch": 23.21, - "learning_rate": 0.0003844795993159052, - "loss": 0.4183, - "step": 95100 - }, - { - "epoch": 23.21, - "learning_rate": 0.0003844490593696555, - "loss": 0.4992, - "step": 95125 - }, - { - "epoch": 23.22, - "learning_rate": 0.00038441851942340585, - "loss": 0.4255, - "step": 95150 - }, - { - "epoch": 23.22, - "learning_rate": 0.00038438797947715615, - "loss": 0.4857, - "step": 95175 - }, - { - "epoch": 23.23, - "learning_rate": 0.00038435743953090646, - "loss": 0.474, - "step": 95200 - }, - { - "epoch": 23.24, - "learning_rate": 0.0003843268995846567, - "loss": 0.4662, - "step": 95225 - }, - { - "epoch": 23.24, - "learning_rate": 0.000384296359638407, - "loss": 0.4002, - "step": 95250 - }, - { - "epoch": 23.25, - "learning_rate": 0.00038426581969215737, - "loss": 0.4931, - "step": 95275 - }, - { - "epoch": 23.26, - "learning_rate": 0.00038423527974590767, - "loss": 0.4502, - "step": 95300 - }, - { - "epoch": 23.26, - "learning_rate": 0.00038420473979965797, - "loss": 0.4826, - "step": 95325 - }, - { - "epoch": 23.27, - "learning_rate": 0.0003841741998534083, - "loss": 0.4563, - "step": 95350 - }, - { - "epoch": 23.27, - "learning_rate": 0.0003841436599071585, - "loss": 0.4959, - "step": 95375 - }, - { - "epoch": 23.28, - "learning_rate": 0.0003841131199609089, - "loss": 0.4783, - "step": 95400 - }, - { - "epoch": 23.29, - "learning_rate": 0.0003840825800146592, - "loss": 0.5152, - "step": 95425 - }, - { - "epoch": 23.29, - "learning_rate": 0.0003840520400684095, - "loss": 0.473, - "step": 95450 - }, - { - "epoch": 23.3, - "learning_rate": 0.0003840215001221598, - "loss": 0.495, - "step": 95475 - }, - { - "epoch": 23.3, - "learning_rate": 0.0003839909601759101, - "loss": 0.4423, - "step": 95500 - }, - { - "epoch": 23.31, - "learning_rate": 0.0003839604202296604, - "loss": 0.5382, - "step": 95525 - }, - { - "epoch": 23.32, - "learning_rate": 0.0003839298802834107, - "loss": 0.4199, - "step": 95550 - }, - { - "epoch": 23.32, - "learning_rate": 0.000383899340337161, - "loss": 0.4925, - "step": 95575 - }, - { - "epoch": 23.33, - "learning_rate": 0.0003838688003909113, - "loss": 0.4474, - "step": 95600 - }, - { - "epoch": 23.33, - "learning_rate": 0.0003838382604446616, - "loss": 0.5181, - "step": 95625 - }, - { - "epoch": 23.34, - "learning_rate": 0.00038380772049841197, - "loss": 0.4751, - "step": 95650 - }, - { - "epoch": 23.35, - "learning_rate": 0.0003837771805521623, - "loss": 0.4907, - "step": 95675 - }, - { - "epoch": 23.35, - "learning_rate": 0.0003837466406059125, - "loss": 0.4483, - "step": 95700 - }, - { - "epoch": 23.36, - "learning_rate": 0.0003837161006596628, - "loss": 0.5041, - "step": 95725 - }, - { - "epoch": 23.37, - "learning_rate": 0.00038368556071341313, - "loss": 0.4663, - "step": 95750 - }, - { - "epoch": 23.37, - "learning_rate": 0.0003836550207671635, - "loss": 0.5671, - "step": 95775 - }, - { - "epoch": 23.38, - "learning_rate": 0.0003836244808209138, - "loss": 0.4279, - "step": 95800 - }, - { - "epoch": 23.38, - "learning_rate": 0.0003835939408746641, - "loss": 0.4945, - "step": 95825 - }, - { - "epoch": 23.39, - "learning_rate": 0.00038356340092841434, - "loss": 0.4691, - "step": 95850 - }, - { - "epoch": 23.4, - "learning_rate": 0.00038353286098216465, - "loss": 0.5027, - "step": 95875 - }, - { - "epoch": 23.4, - "learning_rate": 0.000383502321035915, - "loss": 0.4723, - "step": 95900 - }, - { - "epoch": 23.41, - "learning_rate": 0.0003834717810896653, - "loss": 0.5334, - "step": 95925 - }, - { - "epoch": 23.41, - "learning_rate": 0.0003834412411434156, - "loss": 0.437, - "step": 95950 - }, - { - "epoch": 23.42, - "learning_rate": 0.0003834107011971659, - "loss": 0.4901, - "step": 95975 - }, - { - "epoch": 23.43, - "learning_rate": 0.00038338016125091616, - "loss": 0.4319, - "step": 96000 - }, - { - "epoch": 23.43, - "eval_cer": 0.10958081373263658, - "eval_loss": 0.4272046983242035, - "eval_runtime": 149.2388, - "eval_samples_per_second": 28.096, - "eval_steps_per_second": 7.029, - "eval_wer": 0.4472430668841762, - "step": 96000 - }, - { - "epoch": 23.43, - "learning_rate": 0.0003833496213046665, - "loss": 0.5031, - "step": 96025 - }, - { - "epoch": 23.44, - "learning_rate": 0.0003833190813584168, - "loss": 0.4644, - "step": 96050 - }, - { - "epoch": 23.44, - "learning_rate": 0.0003832885414121671, - "loss": 0.5066, - "step": 96075 - }, - { - "epoch": 23.45, - "learning_rate": 0.00038325800146591743, - "loss": 0.4638, - "step": 96100 - }, - { - "epoch": 23.46, - "learning_rate": 0.00038322746151966773, - "loss": 0.4751, - "step": 96125 - }, - { - "epoch": 23.46, - "learning_rate": 0.00038319692157341804, - "loss": 0.4367, - "step": 96150 - }, - { - "epoch": 23.47, - "learning_rate": 0.0003831676032250183, - "loss": 0.5076, - "step": 96175 - }, - { - "epoch": 23.47, - "learning_rate": 0.00038313706327876865, - "loss": 0.3962, - "step": 96200 - }, - { - "epoch": 23.48, - "learning_rate": 0.00038310652333251895, - "loss": 0.5018, - "step": 96225 - }, - { - "epoch": 23.49, - "learning_rate": 0.00038307598338626925, - "loss": 0.4345, - "step": 96250 - }, - { - "epoch": 23.49, - "learning_rate": 0.00038304544344001956, - "loss": 0.5086, - "step": 96275 - }, - { - "epoch": 23.5, - "learning_rate": 0.00038301490349376986, - "loss": 0.4465, - "step": 96300 - }, - { - "epoch": 23.51, - "learning_rate": 0.00038298436354752016, - "loss": 0.5403, - "step": 96325 - }, - { - "epoch": 23.51, - "learning_rate": 0.00038295382360127047, - "loss": 0.4466, - "step": 96350 - }, - { - "epoch": 23.52, - "learning_rate": 0.00038292328365502077, - "loss": 0.5121, - "step": 96375 - }, - { - "epoch": 23.52, - "learning_rate": 0.0003828927437087711, - "loss": 0.4536, - "step": 96400 - }, - { - "epoch": 23.53, - "learning_rate": 0.0003828622037625214, - "loss": 0.4811, - "step": 96425 - }, - { - "epoch": 23.54, - "learning_rate": 0.00038283166381627173, - "loss": 0.4512, - "step": 96450 - }, - { - "epoch": 23.54, - "learning_rate": 0.000382801123870022, - "loss": 0.5013, - "step": 96475 - }, - { - "epoch": 23.55, - "learning_rate": 0.0003827705839237723, - "loss": 0.4513, - "step": 96500 - }, - { - "epoch": 23.55, - "learning_rate": 0.0003827400439775226, - "loss": 0.4703, - "step": 96525 - }, - { - "epoch": 23.56, - "learning_rate": 0.0003827095040312729, - "loss": 0.4889, - "step": 96550 - }, - { - "epoch": 23.57, - "learning_rate": 0.00038267896408502325, - "loss": 0.4766, - "step": 96575 - }, - { - "epoch": 23.57, - "learning_rate": 0.00038264842413877355, - "loss": 0.4529, - "step": 96600 - }, - { - "epoch": 23.58, - "learning_rate": 0.0003826178841925238, - "loss": 0.493, - "step": 96625 - }, - { - "epoch": 23.58, - "learning_rate": 0.0003825873442462741, - "loss": 0.4478, - "step": 96650 - }, - { - "epoch": 23.59, - "learning_rate": 0.0003825568043000244, - "loss": 0.5043, - "step": 96675 - }, - { - "epoch": 23.6, - "learning_rate": 0.00038252626435377477, - "loss": 0.4583, - "step": 96700 - }, - { - "epoch": 23.6, - "learning_rate": 0.00038249572440752507, - "loss": 0.5067, - "step": 96725 - }, - { - "epoch": 23.61, - "learning_rate": 0.0003824651844612754, - "loss": 0.4689, - "step": 96750 - }, - { - "epoch": 23.62, - "learning_rate": 0.0003824346445150257, - "loss": 0.5348, - "step": 96775 - }, - { - "epoch": 23.62, - "learning_rate": 0.0003824041045687759, - "loss": 0.4366, - "step": 96800 - }, - { - "epoch": 23.63, - "learning_rate": 0.0003823735646225263, - "loss": 0.508, - "step": 96825 - }, - { - "epoch": 23.63, - "learning_rate": 0.0003823430246762766, - "loss": 0.4352, - "step": 96850 - }, - { - "epoch": 23.64, - "learning_rate": 0.0003823124847300269, - "loss": 0.5385, - "step": 96875 - }, - { - "epoch": 23.65, - "learning_rate": 0.0003822819447837772, - "loss": 0.4585, - "step": 96900 - }, - { - "epoch": 23.65, - "learning_rate": 0.0003822514048375275, - "loss": 0.5147, - "step": 96925 - }, - { - "epoch": 23.66, - "learning_rate": 0.0003822208648912778, - "loss": 0.4456, - "step": 96950 - }, - { - "epoch": 23.66, - "learning_rate": 0.0003821903249450281, - "loss": 0.4983, - "step": 96975 - }, - { - "epoch": 23.67, - "learning_rate": 0.0003821597849987784, - "loss": 0.4749, - "step": 97000 - }, - { - "epoch": 23.68, - "learning_rate": 0.0003821292450525287, - "loss": 0.5113, - "step": 97025 - }, - { - "epoch": 23.68, - "learning_rate": 0.000382098705106279, - "loss": 0.5146, - "step": 97050 - }, - { - "epoch": 23.69, - "learning_rate": 0.00038206816516002937, - "loss": 0.495, - "step": 97075 - }, - { - "epoch": 23.69, - "learning_rate": 0.0003820376252137796, - "loss": 0.4706, - "step": 97100 - }, - { - "epoch": 23.7, - "learning_rate": 0.0003820070852675299, - "loss": 0.5337, - "step": 97125 - }, - { - "epoch": 23.71, - "learning_rate": 0.00038197654532128023, - "loss": 0.4133, - "step": 97150 - }, - { - "epoch": 23.71, - "learning_rate": 0.00038194600537503053, - "loss": 0.502, - "step": 97175 - }, - { - "epoch": 23.72, - "learning_rate": 0.00038191546542878083, - "loss": 0.4532, - "step": 97200 - }, - { - "epoch": 23.72, - "learning_rate": 0.0003818849254825312, - "loss": 0.5145, - "step": 97225 - }, - { - "epoch": 23.73, - "learning_rate": 0.0003818543855362815, - "loss": 0.4581, - "step": 97250 - }, - { - "epoch": 23.74, - "learning_rate": 0.00038182384559003174, - "loss": 0.5038, - "step": 97275 - }, - { - "epoch": 23.74, - "learning_rate": 0.00038179330564378205, - "loss": 0.4292, - "step": 97300 - }, - { - "epoch": 23.75, - "learning_rate": 0.00038176276569753235, - "loss": 0.5076, - "step": 97325 - }, - { - "epoch": 23.76, - "learning_rate": 0.0003817322257512827, - "loss": 0.4406, - "step": 97350 - }, - { - "epoch": 23.76, - "learning_rate": 0.000381701685805033, - "loss": 0.5133, - "step": 97375 - }, - { - "epoch": 23.77, - "learning_rate": 0.0003816711458587833, - "loss": 0.4, - "step": 97400 - }, - { - "epoch": 23.77, - "learning_rate": 0.00038164060591253356, - "loss": 0.4934, - "step": 97425 - }, - { - "epoch": 23.78, - "learning_rate": 0.00038161006596628387, - "loss": 0.4434, - "step": 97450 - }, - { - "epoch": 23.79, - "learning_rate": 0.0003815795260200342, - "loss": 0.5085, - "step": 97475 - }, - { - "epoch": 23.79, - "learning_rate": 0.00038154898607378453, - "loss": 0.4546, - "step": 97500 - }, - { - "epoch": 23.8, - "learning_rate": 0.00038151844612753483, - "loss": 0.499, - "step": 97525 - }, - { - "epoch": 23.8, - "learning_rate": 0.00038148790618128514, - "loss": 0.4719, - "step": 97550 - }, - { - "epoch": 23.81, - "learning_rate": 0.0003814573662350354, - "loss": 0.5191, - "step": 97575 - }, - { - "epoch": 23.82, - "learning_rate": 0.00038142682628878574, - "loss": 0.4995, - "step": 97600 - }, - { - "epoch": 23.82, - "learning_rate": 0.00038139628634253605, - "loss": 0.5225, - "step": 97625 - }, - { - "epoch": 23.83, - "learning_rate": 0.00038136574639628635, - "loss": 0.4468, - "step": 97650 - }, - { - "epoch": 23.83, - "learning_rate": 0.00038133520645003665, - "loss": 0.5187, - "step": 97675 - }, - { - "epoch": 23.84, - "learning_rate": 0.00038130466650378696, - "loss": 0.426, - "step": 97700 - }, - { - "epoch": 23.85, - "learning_rate": 0.0003812741265575373, - "loss": 0.486, - "step": 97725 - }, - { - "epoch": 23.85, - "learning_rate": 0.00038124358661128756, - "loss": 0.5055, - "step": 97750 - }, - { - "epoch": 23.86, - "learning_rate": 0.00038121304666503787, - "loss": 0.5072, - "step": 97775 - }, - { - "epoch": 23.87, - "learning_rate": 0.00038118250671878817, - "loss": 0.4402, - "step": 97800 - }, - { - "epoch": 23.87, - "learning_rate": 0.00038115196677253847, - "loss": 0.4967, - "step": 97825 - }, - { - "epoch": 23.88, - "learning_rate": 0.00038112142682628883, - "loss": 0.4496, - "step": 97850 - }, - { - "epoch": 23.88, - "learning_rate": 0.00038109088688003913, - "loss": 0.5174, - "step": 97875 - }, - { - "epoch": 23.89, - "learning_rate": 0.0003810603469337894, - "loss": 0.4629, - "step": 97900 - }, - { - "epoch": 23.9, - "learning_rate": 0.0003810298069875397, - "loss": 0.4647, - "step": 97925 - }, - { - "epoch": 23.9, - "learning_rate": 0.00038099926704129, - "loss": 0.4622, - "step": 97950 - }, - { - "epoch": 23.91, - "learning_rate": 0.00038096872709504035, - "loss": 0.4721, - "step": 97975 - }, - { - "epoch": 23.91, - "learning_rate": 0.00038093818714879065, - "loss": 0.4376, - "step": 98000 - }, - { - "epoch": 23.92, - "learning_rate": 0.00038090764720254095, - "loss": 0.5157, - "step": 98025 - }, - { - "epoch": 23.93, - "learning_rate": 0.0003808771072562912, - "loss": 0.4177, - "step": 98050 - }, - { - "epoch": 23.93, - "learning_rate": 0.0003808465673100415, - "loss": 0.4717, - "step": 98075 - }, - { - "epoch": 23.94, - "learning_rate": 0.00038081602736379186, - "loss": 0.434, - "step": 98100 - }, - { - "epoch": 23.94, - "learning_rate": 0.00038078548741754217, - "loss": 0.4996, - "step": 98125 - }, - { - "epoch": 23.95, - "learning_rate": 0.00038075494747129247, - "loss": 0.4659, - "step": 98150 - }, - { - "epoch": 23.96, - "learning_rate": 0.0003807244075250428, - "loss": 0.5177, - "step": 98175 - }, - { - "epoch": 23.96, - "learning_rate": 0.0003806938675787931, - "loss": 0.4773, - "step": 98200 - }, - { - "epoch": 23.97, - "learning_rate": 0.0003806633276325434, - "loss": 0.5166, - "step": 98225 - }, - { - "epoch": 23.98, - "learning_rate": 0.0003806327876862937, - "loss": 0.4357, - "step": 98250 - }, - { - "epoch": 23.98, - "learning_rate": 0.000380602247740044, - "loss": 0.5099, - "step": 98275 - }, - { - "epoch": 23.99, - "learning_rate": 0.0003805717077937943, - "loss": 0.4399, - "step": 98300 - }, - { - "epoch": 23.99, - "learning_rate": 0.0003805411678475446, - "loss": 0.4911, - "step": 98325 - }, - { - "epoch": 24.0, - "learning_rate": 0.00038051062790129495, - "loss": 0.4196, - "step": 98350 - }, - { - "epoch": 24.01, - "learning_rate": 0.0003804800879550452, - "loss": 0.5231, - "step": 98375 - }, - { - "epoch": 24.01, - "learning_rate": 0.0003804495480087955, - "loss": 0.4501, - "step": 98400 - }, - { - "epoch": 24.02, - "learning_rate": 0.0003804190080625458, - "loss": 0.4743, - "step": 98425 - }, - { - "epoch": 24.02, - "learning_rate": 0.0003803884681162961, - "loss": 0.4069, - "step": 98450 - }, - { - "epoch": 24.03, - "learning_rate": 0.00038035792817004647, - "loss": 0.4805, - "step": 98475 - }, - { - "epoch": 24.04, - "learning_rate": 0.00038032738822379677, - "loss": 0.4623, - "step": 98500 - }, - { - "epoch": 24.04, - "learning_rate": 0.000380296848277547, - "loss": 0.5046, - "step": 98525 - }, - { - "epoch": 24.05, - "learning_rate": 0.0003802663083312973, - "loss": 0.4241, - "step": 98550 - }, - { - "epoch": 24.05, - "learning_rate": 0.0003802357683850476, - "loss": 0.4994, - "step": 98575 - }, - { - "epoch": 24.06, - "learning_rate": 0.00038020522843879793, - "loss": 0.4444, - "step": 98600 - }, - { - "epoch": 24.07, - "learning_rate": 0.0003801746884925483, - "loss": 0.495, - "step": 98625 - }, - { - "epoch": 24.07, - "learning_rate": 0.0003801441485462986, - "loss": 0.4386, - "step": 98650 - }, - { - "epoch": 24.08, - "learning_rate": 0.0003801136086000489, - "loss": 0.4757, - "step": 98675 - }, - { - "epoch": 24.08, - "learning_rate": 0.00038008306865379914, - "loss": 0.4466, - "step": 98700 - }, - { - "epoch": 24.09, - "learning_rate": 0.00038005252870754945, - "loss": 0.4837, - "step": 98725 - }, - { - "epoch": 24.1, - "learning_rate": 0.0003800219887612998, - "loss": 0.4318, - "step": 98750 - }, - { - "epoch": 24.1, - "learning_rate": 0.0003799914488150501, - "loss": 0.4878, - "step": 98775 - }, - { - "epoch": 24.11, - "learning_rate": 0.0003799621304666504, - "loss": 0.4346, - "step": 98800 - }, - { - "epoch": 24.12, - "learning_rate": 0.0003799315905204007, - "loss": 0.5095, - "step": 98825 - }, - { - "epoch": 24.12, - "learning_rate": 0.00037990105057415097, - "loss": 0.4116, - "step": 98850 - }, - { - "epoch": 24.13, - "learning_rate": 0.00037987051062790127, - "loss": 0.4906, - "step": 98875 - }, - { - "epoch": 24.13, - "learning_rate": 0.00037983997068165163, - "loss": 0.4252, - "step": 98900 - }, - { - "epoch": 24.14, - "learning_rate": 0.00037980943073540193, - "loss": 0.5012, - "step": 98925 - }, - { - "epoch": 24.15, - "learning_rate": 0.00037977889078915223, - "loss": 0.4239, - "step": 98950 - }, - { - "epoch": 24.15, - "learning_rate": 0.00037974835084290254, - "loss": 0.4926, - "step": 98975 - }, - { - "epoch": 24.16, - "learning_rate": 0.0003797178108966528, - "loss": 0.3624, - "step": 99000 - }, - { - "epoch": 24.16, - "eval_cer": 0.10784575423754915, - "eval_loss": 0.4347018301486969, - "eval_runtime": 148.8009, - "eval_samples_per_second": 28.179, - "eval_steps_per_second": 7.05, - "eval_wer": 0.4436541598694943, - "step": 99000 - }, - { - "epoch": 24.16, - "learning_rate": 0.00037968727095040314, - "loss": 0.5116, - "step": 99025 - }, - { - "epoch": 24.17, - "learning_rate": 0.00037965673100415345, - "loss": 0.4564, - "step": 99050 - }, - { - "epoch": 24.18, - "learning_rate": 0.00037962619105790375, - "loss": 0.4854, - "step": 99075 - }, - { - "epoch": 24.18, - "learning_rate": 0.00037959565111165405, - "loss": 0.4459, - "step": 99100 - }, - { - "epoch": 24.19, - "learning_rate": 0.00037956511116540436, - "loss": 0.5061, - "step": 99125 - }, - { - "epoch": 24.19, - "learning_rate": 0.0003795345712191547, - "loss": 0.4437, - "step": 99150 - }, - { - "epoch": 24.2, - "learning_rate": 0.00037950403127290496, - "loss": 0.4884, - "step": 99175 - }, - { - "epoch": 24.21, - "learning_rate": 0.00037947349132665527, - "loss": 0.4645, - "step": 99200 - }, - { - "epoch": 24.21, - "learning_rate": 0.00037944295138040557, - "loss": 0.4735, - "step": 99225 - }, - { - "epoch": 24.22, - "learning_rate": 0.0003794124114341559, - "loss": 0.4911, - "step": 99250 - }, - { - "epoch": 24.23, - "learning_rate": 0.0003793818714879062, - "loss": 0.5021, - "step": 99275 - }, - { - "epoch": 24.23, - "learning_rate": 0.00037935133154165654, - "loss": 0.4534, - "step": 99300 - }, - { - "epoch": 24.24, - "learning_rate": 0.0003793207915954068, - "loss": 0.4726, - "step": 99325 - }, - { - "epoch": 24.24, - "learning_rate": 0.0003792902516491571, - "loss": 0.4014, - "step": 99350 - }, - { - "epoch": 24.25, - "learning_rate": 0.0003792597117029074, - "loss": 0.4678, - "step": 99375 - }, - { - "epoch": 24.26, - "learning_rate": 0.0003792291717566577, - "loss": 0.3988, - "step": 99400 - }, - { - "epoch": 24.26, - "learning_rate": 0.00037919863181040805, - "loss": 0.4794, - "step": 99425 - }, - { - "epoch": 24.27, - "learning_rate": 0.00037916809186415836, - "loss": 0.4524, - "step": 99450 - }, - { - "epoch": 24.27, - "learning_rate": 0.0003791375519179086, - "loss": 0.4803, - "step": 99475 - }, - { - "epoch": 24.28, - "learning_rate": 0.0003791070119716589, - "loss": 0.4655, - "step": 99500 - }, - { - "epoch": 24.29, - "learning_rate": 0.0003790764720254092, - "loss": 0.4993, - "step": 99525 - }, - { - "epoch": 24.29, - "learning_rate": 0.00037904593207915957, - "loss": 0.4255, - "step": 99550 - }, - { - "epoch": 24.3, - "learning_rate": 0.00037901539213290987, - "loss": 0.4846, - "step": 99575 - }, - { - "epoch": 24.3, - "learning_rate": 0.0003789848521866602, - "loss": 0.4249, - "step": 99600 - }, - { - "epoch": 24.31, - "learning_rate": 0.0003789543122404104, - "loss": 0.5019, - "step": 99625 - }, - { - "epoch": 24.32, - "learning_rate": 0.00037892377229416073, - "loss": 0.4535, - "step": 99650 - }, - { - "epoch": 24.32, - "learning_rate": 0.0003788932323479111, - "loss": 0.4661, - "step": 99675 - }, - { - "epoch": 24.33, - "learning_rate": 0.0003788626924016614, - "loss": 0.4599, - "step": 99700 - }, - { - "epoch": 24.34, - "learning_rate": 0.0003788321524554117, - "loss": 0.4824, - "step": 99725 - }, - { - "epoch": 24.34, - "learning_rate": 0.000378801612509162, - "loss": 0.4772, - "step": 99750 - }, - { - "epoch": 24.35, - "learning_rate": 0.0003787710725629123, - "loss": 0.5119, - "step": 99775 - }, - { - "epoch": 24.35, - "learning_rate": 0.0003787405326166626, - "loss": 0.4115, - "step": 99800 - }, - { - "epoch": 24.36, - "learning_rate": 0.0003787099926704129, - "loss": 0.4619, - "step": 99825 - }, - { - "epoch": 24.37, - "learning_rate": 0.0003786794527241632, - "loss": 0.4373, - "step": 99850 - }, - { - "epoch": 24.37, - "learning_rate": 0.0003786489127779135, - "loss": 0.473, - "step": 99875 - }, - { - "epoch": 24.38, - "learning_rate": 0.0003786183728316638, - "loss": 0.4698, - "step": 99900 - }, - { - "epoch": 24.38, - "learning_rate": 0.0003785878328854142, - "loss": 0.5249, - "step": 99925 - }, - { - "epoch": 24.39, - "learning_rate": 0.0003785572929391644, - "loss": 0.4278, - "step": 99950 - }, - { - "epoch": 24.4, - "learning_rate": 0.0003785267529929147, - "loss": 0.5147, - "step": 99975 - }, - { - "epoch": 24.4, - "learning_rate": 0.00037849621304666503, - "loss": 0.4447, - "step": 100000 - }, - { - "epoch": 24.41, - "learning_rate": 0.00037846567310041533, - "loss": 0.4606, - "step": 100025 - }, - { - "epoch": 24.41, - "learning_rate": 0.0003784351331541657, - "loss": 0.4419, - "step": 100050 - }, - { - "epoch": 24.42, - "learning_rate": 0.000378404593207916, - "loss": 0.5273, - "step": 100075 - }, - { - "epoch": 24.43, - "learning_rate": 0.00037837405326166624, - "loss": 0.4586, - "step": 100100 - }, - { - "epoch": 24.43, - "learning_rate": 0.00037834351331541655, - "loss": 0.4693, - "step": 100125 - }, - { - "epoch": 24.44, - "learning_rate": 0.00037831297336916685, - "loss": 0.4369, - "step": 100150 - }, - { - "epoch": 24.44, - "learning_rate": 0.0003782824334229172, - "loss": 0.4678, - "step": 100175 - }, - { - "epoch": 24.45, - "learning_rate": 0.0003782518934766675, - "loss": 0.4281, - "step": 100200 - }, - { - "epoch": 24.46, - "learning_rate": 0.0003782213535304178, - "loss": 0.5052, - "step": 100225 - }, - { - "epoch": 24.46, - "learning_rate": 0.0003781908135841681, - "loss": 0.4302, - "step": 100250 - }, - { - "epoch": 24.47, - "learning_rate": 0.00037816027363791837, - "loss": 0.5099, - "step": 100275 - }, - { - "epoch": 24.48, - "learning_rate": 0.0003781297336916687, - "loss": 0.4803, - "step": 100300 - }, - { - "epoch": 24.48, - "learning_rate": 0.000378099193745419, - "loss": 0.465, - "step": 100325 - }, - { - "epoch": 24.49, - "learning_rate": 0.00037806865379916933, - "loss": 0.4174, - "step": 100350 - }, - { - "epoch": 24.49, - "learning_rate": 0.00037803811385291963, - "loss": 0.4863, - "step": 100375 - }, - { - "epoch": 24.5, - "learning_rate": 0.00037800757390666994, - "loss": 0.4603, - "step": 100400 - }, - { - "epoch": 24.51, - "learning_rate": 0.00037797703396042024, - "loss": 0.4693, - "step": 100425 - }, - { - "epoch": 24.51, - "learning_rate": 0.00037794649401417054, - "loss": 0.4687, - "step": 100450 - }, - { - "epoch": 24.52, - "learning_rate": 0.00037791595406792085, - "loss": 0.4858, - "step": 100475 - }, - { - "epoch": 24.52, - "learning_rate": 0.00037788541412167115, - "loss": 0.4145, - "step": 100500 - }, - { - "epoch": 24.53, - "learning_rate": 0.00037785487417542145, - "loss": 0.5032, - "step": 100525 - }, - { - "epoch": 24.54, - "learning_rate": 0.0003778243342291718, - "loss": 0.4617, - "step": 100550 - }, - { - "epoch": 24.54, - "learning_rate": 0.00037779379428292206, - "loss": 0.479, - "step": 100575 - }, - { - "epoch": 24.55, - "learning_rate": 0.00037776325433667236, - "loss": 0.4391, - "step": 100600 - }, - { - "epoch": 24.55, - "learning_rate": 0.00037773271439042267, - "loss": 0.4667, - "step": 100625 - }, - { - "epoch": 24.56, - "learning_rate": 0.00037770217444417297, - "loss": 0.4343, - "step": 100650 - }, - { - "epoch": 24.57, - "learning_rate": 0.0003776716344979233, - "loss": 0.5094, - "step": 100675 - }, - { - "epoch": 24.57, - "learning_rate": 0.00037764109455167363, - "loss": 0.4378, - "step": 100700 - }, - { - "epoch": 24.58, - "learning_rate": 0.00037761055460542393, - "loss": 0.4847, - "step": 100725 - }, - { - "epoch": 24.59, - "learning_rate": 0.0003775800146591742, - "loss": 0.486, - "step": 100750 - }, - { - "epoch": 24.59, - "learning_rate": 0.0003775494747129245, - "loss": 0.4984, - "step": 100775 - }, - { - "epoch": 24.6, - "learning_rate": 0.0003775189347666748, - "loss": 0.4548, - "step": 100800 - }, - { - "epoch": 24.6, - "learning_rate": 0.00037748839482042515, - "loss": 0.4844, - "step": 100825 - }, - { - "epoch": 24.61, - "learning_rate": 0.00037745785487417545, - "loss": 0.4017, - "step": 100850 - }, - { - "epoch": 24.62, - "learning_rate": 0.00037742731492792575, - "loss": 0.5021, - "step": 100875 - }, - { - "epoch": 24.62, - "learning_rate": 0.000377396774981676, - "loss": 0.4189, - "step": 100900 - }, - { - "epoch": 24.63, - "learning_rate": 0.0003773662350354263, - "loss": 0.4647, - "step": 100925 - }, - { - "epoch": 24.63, - "learning_rate": 0.00037733569508917666, - "loss": 0.4269, - "step": 100950 - }, - { - "epoch": 24.64, - "learning_rate": 0.00037730515514292697, - "loss": 0.5024, - "step": 100975 - }, - { - "epoch": 24.65, - "learning_rate": 0.00037727461519667727, - "loss": 0.4887, - "step": 101000 - }, - { - "epoch": 24.65, - "learning_rate": 0.0003772440752504276, - "loss": 0.5028, - "step": 101025 - }, - { - "epoch": 24.66, - "learning_rate": 0.0003772135353041778, - "loss": 0.4119, - "step": 101050 - }, - { - "epoch": 24.66, - "learning_rate": 0.0003771829953579282, - "loss": 0.5086, - "step": 101075 - }, - { - "epoch": 24.67, - "learning_rate": 0.0003771524554116785, - "loss": 0.4606, - "step": 101100 - }, - { - "epoch": 24.68, - "learning_rate": 0.0003771219154654288, - "loss": 0.5296, - "step": 101125 - }, - { - "epoch": 24.68, - "learning_rate": 0.0003770913755191791, - "loss": 0.4198, - "step": 101150 - }, - { - "epoch": 24.69, - "learning_rate": 0.0003770608355729294, - "loss": 0.5104, - "step": 101175 - }, - { - "epoch": 24.69, - "learning_rate": 0.00037703029562667975, - "loss": 0.4763, - "step": 101200 - }, - { - "epoch": 24.7, - "learning_rate": 0.00037699975568043, - "loss": 0.4919, - "step": 101225 - }, - { - "epoch": 24.71, - "learning_rate": 0.0003769692157341803, - "loss": 0.4559, - "step": 101250 - }, - { - "epoch": 24.71, - "learning_rate": 0.0003769386757879306, - "loss": 0.4789, - "step": 101275 - }, - { - "epoch": 24.72, - "learning_rate": 0.0003769081358416809, - "loss": 0.3941, - "step": 101300 - }, - { - "epoch": 24.73, - "learning_rate": 0.00037687759589543127, - "loss": 0.4652, - "step": 101325 - }, - { - "epoch": 24.73, - "learning_rate": 0.00037684705594918157, - "loss": 0.4512, - "step": 101350 - }, - { - "epoch": 24.74, - "learning_rate": 0.0003768165160029318, - "loss": 0.5269, - "step": 101375 - }, - { - "epoch": 24.74, - "learning_rate": 0.0003767859760566821, - "loss": 0.4127, - "step": 101400 - }, - { - "epoch": 24.75, - "learning_rate": 0.00037675543611043243, - "loss": 0.5224, - "step": 101425 - }, - { - "epoch": 24.76, - "learning_rate": 0.0003767248961641828, - "loss": 0.4827, - "step": 101450 - }, - { - "epoch": 24.76, - "learning_rate": 0.0003766943562179331, - "loss": 0.5129, - "step": 101475 - }, - { - "epoch": 24.77, - "learning_rate": 0.0003766638162716834, - "loss": 0.4572, - "step": 101500 - }, - { - "epoch": 24.77, - "learning_rate": 0.00037663327632543364, - "loss": 0.4873, - "step": 101525 - }, - { - "epoch": 24.78, - "learning_rate": 0.00037660273637918395, - "loss": 0.4274, - "step": 101550 - }, - { - "epoch": 24.79, - "learning_rate": 0.0003765721964329343, - "loss": 0.4658, - "step": 101575 - }, - { - "epoch": 24.79, - "learning_rate": 0.0003765416564866846, - "loss": 0.4689, - "step": 101600 - }, - { - "epoch": 24.8, - "learning_rate": 0.0003765111165404349, - "loss": 0.4879, - "step": 101625 - }, - { - "epoch": 24.8, - "learning_rate": 0.0003764805765941852, - "loss": 0.452, - "step": 101650 - }, - { - "epoch": 24.81, - "learning_rate": 0.0003764500366479355, - "loss": 0.5189, - "step": 101675 - }, - { - "epoch": 24.82, - "learning_rate": 0.0003764194967016858, - "loss": 0.4351, - "step": 101700 - }, - { - "epoch": 24.82, - "learning_rate": 0.0003763889567554361, - "loss": 0.5103, - "step": 101725 - }, - { - "epoch": 24.83, - "learning_rate": 0.0003763584168091864, - "loss": 0.4763, - "step": 101750 - }, - { - "epoch": 24.84, - "learning_rate": 0.00037632787686293673, - "loss": 0.4859, - "step": 101775 - }, - { - "epoch": 24.84, - "learning_rate": 0.00037629733691668703, - "loss": 0.4515, - "step": 101800 - }, - { - "epoch": 24.85, - "learning_rate": 0.0003762667969704374, - "loss": 0.5135, - "step": 101825 - }, - { - "epoch": 24.85, - "learning_rate": 0.00037623625702418764, - "loss": 0.4947, - "step": 101850 - }, - { - "epoch": 24.86, - "learning_rate": 0.00037620571707793794, - "loss": 0.5274, - "step": 101875 - }, - { - "epoch": 24.87, - "learning_rate": 0.00037617517713168825, - "loss": 0.4772, - "step": 101900 - }, - { - "epoch": 24.87, - "learning_rate": 0.00037614463718543855, - "loss": 0.4879, - "step": 101925 - }, - { - "epoch": 24.88, - "learning_rate": 0.00037611531883703886, - "loss": 0.3944, - "step": 101950 - }, - { - "epoch": 24.88, - "learning_rate": 0.00037608477889078916, - "loss": 0.4763, - "step": 101975 - }, - { - "epoch": 24.89, - "learning_rate": 0.00037605423894453946, - "loss": 0.4512, - "step": 102000 - }, - { - "epoch": 24.89, - "eval_cer": 0.1102122111228607, - "eval_loss": 0.4270845651626587, - "eval_runtime": 147.9389, - "eval_samples_per_second": 28.343, - "eval_steps_per_second": 7.091, - "eval_wer": 0.4470799347471452, - "step": 102000 - }, - { - "epoch": 24.9, - "learning_rate": 0.00037602369899828977, - "loss": 0.475, - "step": 102025 - }, - { - "epoch": 24.9, - "learning_rate": 0.00037599315905204007, - "loss": 0.4679, - "step": 102050 - }, - { - "epoch": 24.91, - "learning_rate": 0.00037596261910579037, - "loss": 0.4831, - "step": 102075 - }, - { - "epoch": 24.91, - "learning_rate": 0.0003759320791595407, - "loss": 0.4822, - "step": 102100 - }, - { - "epoch": 24.92, - "learning_rate": 0.00037590153921329103, - "loss": 0.4793, - "step": 102125 - }, - { - "epoch": 24.93, - "learning_rate": 0.00037587099926704134, - "loss": 0.4366, - "step": 102150 - }, - { - "epoch": 24.93, - "learning_rate": 0.0003758404593207916, - "loss": 0.4796, - "step": 102175 - }, - { - "epoch": 24.94, - "learning_rate": 0.0003758099193745419, - "loss": 0.4369, - "step": 102200 - }, - { - "epoch": 24.95, - "learning_rate": 0.0003757793794282922, - "loss": 0.4931, - "step": 102225 - }, - { - "epoch": 24.95, - "learning_rate": 0.00037574883948204255, - "loss": 0.446, - "step": 102250 - }, - { - "epoch": 24.96, - "learning_rate": 0.00037571829953579285, - "loss": 0.5142, - "step": 102275 - }, - { - "epoch": 24.96, - "learning_rate": 0.00037568775958954316, - "loss": 0.4343, - "step": 102300 - }, - { - "epoch": 24.97, - "learning_rate": 0.0003756572196432934, - "loss": 0.4518, - "step": 102325 - }, - { - "epoch": 24.98, - "learning_rate": 0.0003756266796970437, - "loss": 0.4916, - "step": 102350 - }, - { - "epoch": 24.98, - "learning_rate": 0.00037559613975079407, - "loss": 0.494, - "step": 102375 - }, - { - "epoch": 24.99, - "learning_rate": 0.00037556559980454437, - "loss": 0.4307, - "step": 102400 - }, - { - "epoch": 24.99, - "learning_rate": 0.0003755350598582947, - "loss": 0.4706, - "step": 102425 - }, - { - "epoch": 25.0, - "learning_rate": 0.000375504519912045, - "loss": 0.4222, - "step": 102450 - }, - { - "epoch": 25.01, - "learning_rate": 0.0003754739799657952, - "loss": 0.4631, - "step": 102475 - }, - { - "epoch": 25.01, - "learning_rate": 0.0003754434400195456, - "loss": 0.4621, - "step": 102500 - }, - { - "epoch": 25.02, - "learning_rate": 0.0003754129000732959, - "loss": 0.4992, - "step": 102525 - }, - { - "epoch": 25.02, - "learning_rate": 0.0003753823601270462, - "loss": 0.3952, - "step": 102550 - }, - { - "epoch": 25.03, - "learning_rate": 0.0003753518201807965, - "loss": 0.4637, - "step": 102575 - }, - { - "epoch": 25.04, - "learning_rate": 0.0003753212802345468, - "loss": 0.4229, - "step": 102600 - }, - { - "epoch": 25.04, - "learning_rate": 0.00037529074028829715, - "loss": 0.4872, - "step": 102625 - }, - { - "epoch": 25.05, - "learning_rate": 0.0003752602003420474, - "loss": 0.4627, - "step": 102650 - }, - { - "epoch": 25.05, - "learning_rate": 0.0003752296603957977, - "loss": 0.4823, - "step": 102675 - }, - { - "epoch": 25.06, - "learning_rate": 0.000375199120449548, - "loss": 0.4422, - "step": 102700 - }, - { - "epoch": 25.07, - "learning_rate": 0.0003751685805032983, - "loss": 0.4868, - "step": 102725 - }, - { - "epoch": 25.07, - "learning_rate": 0.0003751380405570486, - "loss": 0.4075, - "step": 102750 - }, - { - "epoch": 25.08, - "learning_rate": 0.000375107500610799, - "loss": 0.5041, - "step": 102775 - }, - { - "epoch": 25.09, - "learning_rate": 0.0003750769606645492, - "loss": 0.4685, - "step": 102800 - }, - { - "epoch": 25.09, - "learning_rate": 0.00037504642071829953, - "loss": 0.424, - "step": 102825 - }, - { - "epoch": 25.1, - "learning_rate": 0.00037501588077204983, - "loss": 0.4336, - "step": 102850 - }, - { - "epoch": 25.1, - "learning_rate": 0.00037498534082580013, - "loss": 0.4604, - "step": 102875 - }, - { - "epoch": 25.11, - "learning_rate": 0.0003749548008795505, - "loss": 0.4349, - "step": 102900 - }, - { - "epoch": 25.12, - "learning_rate": 0.0003749242609333008, - "loss": 0.4693, - "step": 102925 - }, - { - "epoch": 25.12, - "learning_rate": 0.00037489372098705104, - "loss": 0.4401, - "step": 102950 - }, - { - "epoch": 25.13, - "learning_rate": 0.00037486318104080135, - "loss": 0.4709, - "step": 102975 - }, - { - "epoch": 25.13, - "learning_rate": 0.00037483264109455165, - "loss": 0.4279, - "step": 103000 - }, - { - "epoch": 25.14, - "learning_rate": 0.000374802101148302, - "loss": 0.4952, - "step": 103025 - }, - { - "epoch": 25.15, - "learning_rate": 0.0003747715612020523, - "loss": 0.4015, - "step": 103050 - }, - { - "epoch": 25.15, - "learning_rate": 0.0003747410212558026, - "loss": 0.4887, - "step": 103075 - }, - { - "epoch": 25.16, - "learning_rate": 0.00037471048130955286, - "loss": 0.4545, - "step": 103100 - }, - { - "epoch": 25.16, - "learning_rate": 0.00037467994136330317, - "loss": 0.4596, - "step": 103125 - }, - { - "epoch": 25.17, - "learning_rate": 0.0003746494014170535, - "loss": 0.4146, - "step": 103150 - }, - { - "epoch": 25.18, - "learning_rate": 0.00037461886147080383, - "loss": 0.4797, - "step": 103175 - }, - { - "epoch": 25.18, - "learning_rate": 0.00037458832152455413, - "loss": 0.4724, - "step": 103200 - }, - { - "epoch": 25.19, - "learning_rate": 0.00037455778157830443, - "loss": 0.5207, - "step": 103225 - }, - { - "epoch": 25.2, - "learning_rate": 0.00037452724163205474, - "loss": 0.4235, - "step": 103250 - }, - { - "epoch": 25.2, - "learning_rate": 0.00037449670168580504, - "loss": 0.5035, - "step": 103275 - }, - { - "epoch": 25.21, - "learning_rate": 0.00037446616173955534, - "loss": 0.4209, - "step": 103300 - }, - { - "epoch": 25.21, - "learning_rate": 0.00037443562179330565, - "loss": 0.4922, - "step": 103325 - }, - { - "epoch": 25.22, - "learning_rate": 0.00037440508184705595, - "loss": 0.4448, - "step": 103350 - }, - { - "epoch": 25.23, - "learning_rate": 0.00037437454190080626, - "loss": 0.473, - "step": 103375 - }, - { - "epoch": 25.23, - "learning_rate": 0.0003743440019545566, - "loss": 0.4392, - "step": 103400 - }, - { - "epoch": 25.24, - "learning_rate": 0.00037431346200830686, - "loss": 0.466, - "step": 103425 - }, - { - "epoch": 25.24, - "learning_rate": 0.00037428292206205717, - "loss": 0.4162, - "step": 103450 - }, - { - "epoch": 25.25, - "learning_rate": 0.00037425238211580747, - "loss": 0.472, - "step": 103475 - }, - { - "epoch": 25.26, - "learning_rate": 0.00037422184216955777, - "loss": 0.4314, - "step": 103500 - }, - { - "epoch": 25.26, - "learning_rate": 0.00037419130222330813, - "loss": 0.4779, - "step": 103525 - }, - { - "epoch": 25.27, - "learning_rate": 0.00037416076227705843, - "loss": 0.4327, - "step": 103550 - }, - { - "epoch": 25.27, - "learning_rate": 0.0003741302223308087, - "loss": 0.4718, - "step": 103575 - }, - { - "epoch": 25.28, - "learning_rate": 0.000374099682384559, - "loss": 0.4607, - "step": 103600 - }, - { - "epoch": 25.29, - "learning_rate": 0.0003740691424383093, - "loss": 0.4718, - "step": 103625 - }, - { - "epoch": 25.29, - "learning_rate": 0.00037403860249205965, - "loss": 0.385, - "step": 103650 - }, - { - "epoch": 25.3, - "learning_rate": 0.00037400806254580995, - "loss": 0.448, - "step": 103675 - }, - { - "epoch": 25.31, - "learning_rate": 0.00037397752259956025, - "loss": 0.4499, - "step": 103700 - }, - { - "epoch": 25.31, - "learning_rate": 0.00037394698265331056, - "loss": 0.481, - "step": 103725 - }, - { - "epoch": 25.32, - "learning_rate": 0.0003739164427070608, - "loss": 0.3851, - "step": 103750 - }, - { - "epoch": 25.32, - "learning_rate": 0.00037388590276081116, - "loss": 0.4922, - "step": 103775 - }, - { - "epoch": 25.33, - "learning_rate": 0.0003738565844124114, - "loss": 0.4214, - "step": 103800 - }, - { - "epoch": 25.34, - "learning_rate": 0.00037382604446616177, - "loss": 0.4982, - "step": 103825 - }, - { - "epoch": 25.34, - "learning_rate": 0.0003737955045199121, - "loss": 0.4485, - "step": 103850 - }, - { - "epoch": 25.35, - "learning_rate": 0.0003737649645736624, - "loss": 0.4842, - "step": 103875 - }, - { - "epoch": 25.35, - "learning_rate": 0.00037373442462741263, - "loss": 0.4432, - "step": 103900 - }, - { - "epoch": 25.36, - "learning_rate": 0.00037370388468116293, - "loss": 0.4599, - "step": 103925 - }, - { - "epoch": 25.37, - "learning_rate": 0.0003736733447349133, - "loss": 0.456, - "step": 103950 - }, - { - "epoch": 25.37, - "learning_rate": 0.0003736428047886636, - "loss": 0.4892, - "step": 103975 - }, - { - "epoch": 25.38, - "learning_rate": 0.0003736122648424139, - "loss": 0.428, - "step": 104000 - }, - { - "epoch": 25.38, - "learning_rate": 0.0003735817248961642, - "loss": 0.4879, - "step": 104025 - }, - { - "epoch": 25.39, - "learning_rate": 0.00037355118494991445, - "loss": 0.4605, - "step": 104050 - }, - { - "epoch": 25.4, - "learning_rate": 0.0003735206450036648, - "loss": 0.4768, - "step": 104075 - }, - { - "epoch": 25.4, - "learning_rate": 0.0003734901050574151, - "loss": 0.4498, - "step": 104100 - }, - { - "epoch": 25.41, - "learning_rate": 0.0003734595651111654, - "loss": 0.4897, - "step": 104125 - }, - { - "epoch": 25.41, - "learning_rate": 0.0003734290251649157, - "loss": 0.4544, - "step": 104150 - }, - { - "epoch": 25.42, - "learning_rate": 0.000373398485218666, - "loss": 0.5028, - "step": 104175 - }, - { - "epoch": 25.43, - "learning_rate": 0.0003733679452724164, - "loss": 0.3967, - "step": 104200 - }, - { - "epoch": 25.43, - "learning_rate": 0.0003733374053261666, - "loss": 0.4598, - "step": 104225 - }, - { - "epoch": 25.44, - "learning_rate": 0.00037330686537991693, - "loss": 0.4726, - "step": 104250 - }, - { - "epoch": 25.45, - "learning_rate": 0.00037327632543366723, - "loss": 0.4783, - "step": 104275 - }, - { - "epoch": 25.45, - "learning_rate": 0.00037324578548741754, - "loss": 0.3883, - "step": 104300 - }, - { - "epoch": 25.46, - "learning_rate": 0.0003732152455411679, - "loss": 0.4943, - "step": 104325 - }, - { - "epoch": 25.46, - "learning_rate": 0.0003731847055949182, - "loss": 0.4262, - "step": 104350 - }, - { - "epoch": 25.47, - "learning_rate": 0.00037315416564866845, - "loss": 0.5044, - "step": 104375 - }, - { - "epoch": 25.48, - "learning_rate": 0.00037312362570241875, - "loss": 0.4264, - "step": 104400 - }, - { - "epoch": 25.48, - "learning_rate": 0.00037309308575616905, - "loss": 0.4692, - "step": 104425 - }, - { - "epoch": 25.49, - "learning_rate": 0.0003730625458099194, - "loss": 0.4578, - "step": 104450 - }, - { - "epoch": 25.49, - "learning_rate": 0.0003730320058636697, - "loss": 0.4825, - "step": 104475 - }, - { - "epoch": 25.5, - "learning_rate": 0.00037300146591742, - "loss": 0.472, - "step": 104500 - }, - { - "epoch": 25.51, - "learning_rate": 0.00037297092597117027, - "loss": 0.5078, - "step": 104525 - }, - { - "epoch": 25.51, - "learning_rate": 0.00037294038602492057, - "loss": 0.38, - "step": 104550 - }, - { - "epoch": 25.52, - "learning_rate": 0.0003729098460786709, - "loss": 0.4674, - "step": 104575 - }, - { - "epoch": 25.52, - "learning_rate": 0.00037287930613242123, - "loss": 0.428, - "step": 104600 - }, - { - "epoch": 25.53, - "learning_rate": 0.00037284876618617153, - "loss": 0.47, - "step": 104625 - }, - { - "epoch": 25.54, - "learning_rate": 0.00037281822623992184, - "loss": 0.403, - "step": 104650 - }, - { - "epoch": 25.54, - "learning_rate": 0.00037278768629367214, - "loss": 0.476, - "step": 104675 - }, - { - "epoch": 25.55, - "learning_rate": 0.0003727571463474224, - "loss": 0.433, - "step": 104700 - }, - { - "epoch": 25.56, - "learning_rate": 0.00037272660640117275, - "loss": 0.4434, - "step": 104725 - }, - { - "epoch": 25.56, - "learning_rate": 0.00037269606645492305, - "loss": 0.4667, - "step": 104750 - }, - { - "epoch": 25.57, - "learning_rate": 0.00037266552650867335, - "loss": 0.4814, - "step": 104775 - }, - { - "epoch": 25.57, - "learning_rate": 0.00037263498656242366, - "loss": 0.4665, - "step": 104800 - }, - { - "epoch": 25.58, - "learning_rate": 0.00037260444661617396, - "loss": 0.475, - "step": 104825 - }, - { - "epoch": 25.59, - "learning_rate": 0.00037257390666992426, - "loss": 0.4225, - "step": 104850 - }, - { - "epoch": 25.59, - "learning_rate": 0.00037254336672367457, - "loss": 0.5022, - "step": 104875 - }, - { - "epoch": 25.6, - "learning_rate": 0.00037251282677742487, - "loss": 0.396, - "step": 104900 - }, - { - "epoch": 25.6, - "learning_rate": 0.0003724822868311752, - "loss": 0.4856, - "step": 104925 - }, - { - "epoch": 25.61, - "learning_rate": 0.0003724517468849255, - "loss": 0.4229, - "step": 104950 - }, - { - "epoch": 25.62, - "learning_rate": 0.00037242120693867583, - "loss": 0.4621, - "step": 104975 - }, - { - "epoch": 25.62, - "learning_rate": 0.0003723906669924261, - "loss": 0.4049, - "step": 105000 - }, - { - "epoch": 25.62, - "eval_cer": 0.10712195722924345, - "eval_loss": 0.42072468996047974, - "eval_runtime": 147.7106, - "eval_samples_per_second": 28.387, - "eval_steps_per_second": 7.102, - "eval_wer": 0.43494290375203915, - "step": 105000 - }, - { - "epoch": 25.63, - "learning_rate": 0.0003723601270461764, - "loss": 0.465, - "step": 105025 - }, - { - "epoch": 25.63, - "learning_rate": 0.0003723295870999267, - "loss": 0.4088, - "step": 105050 - }, - { - "epoch": 25.64, - "learning_rate": 0.000372299047153677, - "loss": 0.4739, - "step": 105075 - }, - { - "epoch": 25.65, - "learning_rate": 0.00037226850720742735, - "loss": 0.4535, - "step": 105100 - }, - { - "epoch": 25.65, - "learning_rate": 0.00037223796726117765, - "loss": 0.4836, - "step": 105125 - }, - { - "epoch": 25.66, - "learning_rate": 0.00037220742731492796, - "loss": 0.4339, - "step": 105150 - }, - { - "epoch": 25.66, - "learning_rate": 0.0003721768873686782, - "loss": 0.4807, - "step": 105175 - }, - { - "epoch": 25.67, - "learning_rate": 0.0003721463474224285, - "loss": 0.3848, - "step": 105200 - }, - { - "epoch": 25.68, - "learning_rate": 0.00037211580747617887, - "loss": 0.488, - "step": 105225 - }, - { - "epoch": 25.68, - "learning_rate": 0.00037208526752992917, - "loss": 0.4458, - "step": 105250 - }, - { - "epoch": 25.69, - "learning_rate": 0.0003720547275836795, - "loss": 0.4587, - "step": 105275 - }, - { - "epoch": 25.7, - "learning_rate": 0.0003720241876374298, - "loss": 0.4346, - "step": 105300 - }, - { - "epoch": 25.7, - "learning_rate": 0.00037199364769118003, - "loss": 0.505, - "step": 105325 - }, - { - "epoch": 25.71, - "learning_rate": 0.0003719631077449304, - "loss": 0.4108, - "step": 105350 - }, - { - "epoch": 25.71, - "learning_rate": 0.0003719325677986807, - "loss": 0.4868, - "step": 105375 - }, - { - "epoch": 25.72, - "learning_rate": 0.000371902027852431, - "loss": 0.4004, - "step": 105400 - }, - { - "epoch": 25.73, - "learning_rate": 0.0003718714879061813, - "loss": 0.4812, - "step": 105425 - }, - { - "epoch": 25.73, - "learning_rate": 0.0003718409479599316, - "loss": 0.4186, - "step": 105450 - }, - { - "epoch": 25.74, - "learning_rate": 0.0003718104080136819, - "loss": 0.4643, - "step": 105475 - }, - { - "epoch": 25.74, - "learning_rate": 0.0003717798680674322, - "loss": 0.4142, - "step": 105500 - }, - { - "epoch": 25.75, - "learning_rate": 0.0003717493281211825, - "loss": 0.4678, - "step": 105525 - }, - { - "epoch": 25.76, - "learning_rate": 0.0003717187881749328, - "loss": 0.4754, - "step": 105550 - }, - { - "epoch": 25.76, - "learning_rate": 0.0003716882482286831, - "loss": 0.4888, - "step": 105575 - }, - { - "epoch": 25.77, - "learning_rate": 0.00037165770828243347, - "loss": 0.4401, - "step": 105600 - }, - { - "epoch": 25.77, - "learning_rate": 0.0003716271683361838, - "loss": 0.4438, - "step": 105625 - }, - { - "epoch": 25.78, - "learning_rate": 0.000371596628389934, - "loss": 0.3972, - "step": 105650 - }, - { - "epoch": 25.79, - "learning_rate": 0.00037156608844368433, - "loss": 0.5188, - "step": 105675 - }, - { - "epoch": 25.79, - "learning_rate": 0.00037153554849743463, - "loss": 0.433, - "step": 105700 - }, - { - "epoch": 25.8, - "learning_rate": 0.000371505008551185, - "loss": 0.4854, - "step": 105725 - }, - { - "epoch": 25.81, - "learning_rate": 0.0003714744686049353, - "loss": 0.4058, - "step": 105750 - }, - { - "epoch": 25.81, - "learning_rate": 0.0003714439286586856, - "loss": 0.4883, - "step": 105775 - }, - { - "epoch": 25.82, - "learning_rate": 0.00037141338871243585, - "loss": 0.45, - "step": 105800 - }, - { - "epoch": 25.82, - "learning_rate": 0.00037138284876618615, - "loss": 0.4894, - "step": 105825 - }, - { - "epoch": 25.83, - "learning_rate": 0.0003713523088199365, - "loss": 0.4054, - "step": 105850 - }, - { - "epoch": 25.84, - "learning_rate": 0.0003713217688736868, - "loss": 0.484, - "step": 105875 - }, - { - "epoch": 25.84, - "learning_rate": 0.0003712912289274371, - "loss": 0.4124, - "step": 105900 - }, - { - "epoch": 25.85, - "learning_rate": 0.0003712606889811874, - "loss": 0.446, - "step": 105925 - }, - { - "epoch": 25.85, - "learning_rate": 0.00037123014903493767, - "loss": 0.4206, - "step": 105950 - }, - { - "epoch": 25.86, - "learning_rate": 0.00037119960908868797, - "loss": 0.4667, - "step": 105975 - }, - { - "epoch": 25.87, - "learning_rate": 0.0003711690691424383, - "loss": 0.4795, - "step": 106000 - }, - { - "epoch": 25.87, - "learning_rate": 0.00037113852919618863, - "loss": 0.4763, - "step": 106025 - }, - { - "epoch": 25.88, - "learning_rate": 0.00037110798924993893, - "loss": 0.4272, - "step": 106050 - }, - { - "epoch": 25.88, - "learning_rate": 0.00037107744930368924, - "loss": 0.4659, - "step": 106075 - }, - { - "epoch": 25.89, - "learning_rate": 0.00037104690935743954, - "loss": 0.439, - "step": 106100 - }, - { - "epoch": 25.9, - "learning_rate": 0.00037101636941118984, - "loss": 0.4927, - "step": 106125 - }, - { - "epoch": 25.9, - "learning_rate": 0.00037098582946494015, - "loss": 0.4184, - "step": 106150 - }, - { - "epoch": 25.91, - "learning_rate": 0.00037095528951869045, - "loss": 0.4802, - "step": 106175 - }, - { - "epoch": 25.92, - "learning_rate": 0.00037092474957244075, - "loss": 0.412, - "step": 106200 - }, - { - "epoch": 25.92, - "learning_rate": 0.00037089420962619106, - "loss": 0.5181, - "step": 106225 - }, - { - "epoch": 25.93, - "learning_rate": 0.0003708636696799414, - "loss": 0.4222, - "step": 106250 - }, - { - "epoch": 25.93, - "learning_rate": 0.00037083312973369166, - "loss": 0.4779, - "step": 106275 - }, - { - "epoch": 25.94, - "learning_rate": 0.00037080258978744197, - "loss": 0.4188, - "step": 106300 - }, - { - "epoch": 25.95, - "learning_rate": 0.00037077204984119227, - "loss": 0.4708, - "step": 106325 - }, - { - "epoch": 25.95, - "learning_rate": 0.0003707415098949426, - "loss": 0.4742, - "step": 106350 - }, - { - "epoch": 25.96, - "learning_rate": 0.00037071096994869293, - "loss": 0.4712, - "step": 106375 - }, - { - "epoch": 25.96, - "learning_rate": 0.00037068043000244323, - "loss": 0.4305, - "step": 106400 - }, - { - "epoch": 25.97, - "learning_rate": 0.0003706498900561935, - "loss": 0.4821, - "step": 106425 - }, - { - "epoch": 25.98, - "learning_rate": 0.0003706193501099438, - "loss": 0.4488, - "step": 106450 - }, - { - "epoch": 25.98, - "learning_rate": 0.0003705888101636941, - "loss": 0.4867, - "step": 106475 - }, - { - "epoch": 25.99, - "learning_rate": 0.00037055827021744445, - "loss": 0.3886, - "step": 106500 - }, - { - "epoch": 25.99, - "learning_rate": 0.00037052773027119475, - "loss": 0.4734, - "step": 106525 - }, - { - "epoch": 26.0, - "learning_rate": 0.00037049719032494505, - "loss": 0.4751, - "step": 106550 - }, - { - "epoch": 26.01, - "learning_rate": 0.0003704666503786953, - "loss": 0.4749, - "step": 106575 - }, - { - "epoch": 26.01, - "learning_rate": 0.0003704361104324456, - "loss": 0.4585, - "step": 106600 - }, - { - "epoch": 26.02, - "learning_rate": 0.00037040557048619596, - "loss": 0.4786, - "step": 106625 - }, - { - "epoch": 26.02, - "learning_rate": 0.00037037503053994627, - "loss": 0.4364, - "step": 106650 - }, - { - "epoch": 26.03, - "learning_rate": 0.00037034449059369657, - "loss": 0.4331, - "step": 106675 - }, - { - "epoch": 26.04, - "learning_rate": 0.0003703139506474469, - "loss": 0.4266, - "step": 106700 - }, - { - "epoch": 26.04, - "learning_rate": 0.0003702834107011972, - "loss": 0.4936, - "step": 106725 - }, - { - "epoch": 26.05, - "learning_rate": 0.0003702528707549475, - "loss": 0.3865, - "step": 106750 - }, - { - "epoch": 26.06, - "learning_rate": 0.0003702223308086978, - "loss": 0.4762, - "step": 106775 - }, - { - "epoch": 26.06, - "learning_rate": 0.0003701917908624481, - "loss": 0.4166, - "step": 106800 - }, - { - "epoch": 26.07, - "learning_rate": 0.0003701612509161984, - "loss": 0.4492, - "step": 106825 - }, - { - "epoch": 26.07, - "learning_rate": 0.0003701307109699487, - "loss": 0.4309, - "step": 106850 - }, - { - "epoch": 26.08, - "learning_rate": 0.00037010017102369905, - "loss": 0.4462, - "step": 106875 - }, - { - "epoch": 26.09, - "learning_rate": 0.0003700696310774493, - "loss": 0.4186, - "step": 106900 - }, - { - "epoch": 26.09, - "learning_rate": 0.0003700390911311996, - "loss": 0.4786, - "step": 106925 - }, - { - "epoch": 26.1, - "learning_rate": 0.0003700085511849499, - "loss": 0.4521, - "step": 106950 - }, - { - "epoch": 26.1, - "learning_rate": 0.0003699780112387002, - "loss": 0.466, - "step": 106975 - }, - { - "epoch": 26.11, - "learning_rate": 0.00036994747129245057, - "loss": 0.4263, - "step": 107000 - }, - { - "epoch": 26.12, - "learning_rate": 0.00036991693134620087, - "loss": 0.4895, - "step": 107025 - }, - { - "epoch": 26.12, - "learning_rate": 0.0003698863913999511, - "loss": 0.4347, - "step": 107050 - }, - { - "epoch": 26.13, - "learning_rate": 0.0003698558514537014, - "loss": 0.4321, - "step": 107075 - }, - { - "epoch": 26.13, - "learning_rate": 0.00036982531150745173, - "loss": 0.4198, - "step": 107100 - }, - { - "epoch": 26.14, - "learning_rate": 0.0003697947715612021, - "loss": 0.4793, - "step": 107125 - }, - { - "epoch": 26.15, - "learning_rate": 0.0003697642316149524, - "loss": 0.4299, - "step": 107150 - }, - { - "epoch": 26.15, - "learning_rate": 0.0003697336916687027, - "loss": 0.4252, - "step": 107175 - }, - { - "epoch": 26.16, - "learning_rate": 0.000369703151722453, - "loss": 0.4794, - "step": 107200 - }, - { - "epoch": 26.17, - "learning_rate": 0.00036967261177620324, - "loss": 0.4622, - "step": 107225 - }, - { - "epoch": 26.17, - "learning_rate": 0.00036964207182995355, - "loss": 0.3999, - "step": 107250 - }, - { - "epoch": 26.18, - "learning_rate": 0.0003696115318837039, - "loss": 0.4948, - "step": 107275 - }, - { - "epoch": 26.18, - "learning_rate": 0.0003695809919374542, - "loss": 0.4358, - "step": 107300 - }, - { - "epoch": 26.19, - "learning_rate": 0.0003695504519912045, - "loss": 0.4585, - "step": 107325 - }, - { - "epoch": 26.2, - "learning_rate": 0.0003695199120449548, - "loss": 0.4442, - "step": 107350 - }, - { - "epoch": 26.2, - "learning_rate": 0.00036948937209870506, - "loss": 0.457, - "step": 107375 - }, - { - "epoch": 26.21, - "learning_rate": 0.0003694588321524554, - "loss": 0.4335, - "step": 107400 - }, - { - "epoch": 26.21, - "learning_rate": 0.0003694282922062057, - "loss": 0.4654, - "step": 107425 - }, - { - "epoch": 26.22, - "learning_rate": 0.00036939775225995603, - "loss": 0.4224, - "step": 107450 - }, - { - "epoch": 26.23, - "learning_rate": 0.00036936721231370633, - "loss": 0.4256, - "step": 107475 - }, - { - "epoch": 26.23, - "learning_rate": 0.00036933667236745664, - "loss": 0.4323, - "step": 107500 - }, - { - "epoch": 26.24, - "learning_rate": 0.00036930613242120694, - "loss": 0.485, - "step": 107525 - }, - { - "epoch": 26.24, - "learning_rate": 0.00036927559247495724, - "loss": 0.3872, - "step": 107550 - }, - { - "epoch": 26.25, - "learning_rate": 0.00036924505252870755, - "loss": 0.4637, - "step": 107575 - }, - { - "epoch": 26.26, - "learning_rate": 0.00036921451258245785, - "loss": 0.4406, - "step": 107600 - }, - { - "epoch": 26.26, - "learning_rate": 0.00036918397263620815, - "loss": 0.4668, - "step": 107625 - }, - { - "epoch": 26.27, - "learning_rate": 0.0003691534326899585, - "loss": 0.4599, - "step": 107650 - }, - { - "epoch": 26.28, - "learning_rate": 0.0003691228927437088, - "loss": 0.4629, - "step": 107675 - }, - { - "epoch": 26.28, - "learning_rate": 0.00036909235279745906, - "loss": 0.427, - "step": 107700 - }, - { - "epoch": 26.29, - "learning_rate": 0.00036906181285120937, - "loss": 0.4687, - "step": 107725 - }, - { - "epoch": 26.29, - "learning_rate": 0.00036903127290495967, - "loss": 0.4723, - "step": 107750 - }, - { - "epoch": 26.3, - "learning_rate": 0.00036900073295871, - "loss": 0.4637, - "step": 107775 - }, - { - "epoch": 26.31, - "learning_rate": 0.00036897019301246033, - "loss": 0.3946, - "step": 107800 - }, - { - "epoch": 26.31, - "learning_rate": 0.00036893965306621063, - "loss": 0.5078, - "step": 107825 - }, - { - "epoch": 26.32, - "learning_rate": 0.0003689091131199609, - "loss": 0.4029, - "step": 107850 - }, - { - "epoch": 26.32, - "learning_rate": 0.0003688785731737112, - "loss": 0.4586, - "step": 107875 - }, - { - "epoch": 26.33, - "learning_rate": 0.00036884803322746154, - "loss": 0.4345, - "step": 107900 - }, - { - "epoch": 26.34, - "learning_rate": 0.00036881749328121185, - "loss": 0.4809, - "step": 107925 - }, - { - "epoch": 26.34, - "learning_rate": 0.00036878695333496215, - "loss": 0.4448, - "step": 107950 - }, - { - "epoch": 26.35, - "learning_rate": 0.00036875641338871245, - "loss": 0.4703, - "step": 107975 - }, - { - "epoch": 26.35, - "learning_rate": 0.0003687258734424627, - "loss": 0.4134, - "step": 108000 - }, - { - "epoch": 26.35, - "eval_cer": 0.1060593616213053, - "eval_loss": 0.43024691939353943, - "eval_runtime": 147.9221, - "eval_samples_per_second": 28.346, - "eval_steps_per_second": 7.092, - "eval_wer": 0.43507340946166395, - "step": 108000 - }, - { - "epoch": 26.36, - "learning_rate": 0.00036869533349621306, - "loss": 0.4485, - "step": 108025 - }, - { - "epoch": 26.37, - "learning_rate": 0.00036866479354996336, - "loss": 0.4284, - "step": 108050 - }, - { - "epoch": 26.37, - "learning_rate": 0.00036863425360371367, - "loss": 0.462, - "step": 108075 - }, - { - "epoch": 26.38, - "learning_rate": 0.000368604935255314, - "loss": 0.4297, - "step": 108100 - }, - { - "epoch": 26.38, - "learning_rate": 0.0003685743953090643, - "loss": 0.4739, - "step": 108125 - }, - { - "epoch": 26.39, - "learning_rate": 0.0003685438553628146, - "loss": 0.4459, - "step": 108150 - }, - { - "epoch": 26.4, - "learning_rate": 0.00036851331541656483, - "loss": 0.4728, - "step": 108175 - }, - { - "epoch": 26.4, - "learning_rate": 0.0003684827754703152, - "loss": 0.3765, - "step": 108200 - }, - { - "epoch": 26.41, - "learning_rate": 0.0003684522355240655, - "loss": 0.4611, - "step": 108225 - }, - { - "epoch": 26.42, - "learning_rate": 0.0003684216955778158, - "loss": 0.4038, - "step": 108250 - }, - { - "epoch": 26.42, - "learning_rate": 0.0003683911556315661, - "loss": 0.4677, - "step": 108275 - }, - { - "epoch": 26.43, - "learning_rate": 0.0003683606156853164, - "loss": 0.4224, - "step": 108300 - }, - { - "epoch": 26.43, - "learning_rate": 0.0003683300757390667, - "loss": 0.4738, - "step": 108325 - }, - { - "epoch": 26.44, - "learning_rate": 0.000368299535792817, - "loss": 0.4373, - "step": 108350 - }, - { - "epoch": 26.45, - "learning_rate": 0.0003682689958465673, - "loss": 0.4712, - "step": 108375 - }, - { - "epoch": 26.45, - "learning_rate": 0.0003682384559003176, - "loss": 0.4267, - "step": 108400 - }, - { - "epoch": 26.46, - "learning_rate": 0.0003682079159540679, - "loss": 0.4353, - "step": 108425 - }, - { - "epoch": 26.46, - "learning_rate": 0.0003681773760078183, - "loss": 0.4254, - "step": 108450 - }, - { - "epoch": 26.47, - "learning_rate": 0.0003681468360615685, - "loss": 0.4527, - "step": 108475 - }, - { - "epoch": 26.48, - "learning_rate": 0.0003681162961153188, - "loss": 0.4297, - "step": 108500 - }, - { - "epoch": 26.48, - "learning_rate": 0.00036808575616906913, - "loss": 0.4702, - "step": 108525 - }, - { - "epoch": 26.49, - "learning_rate": 0.00036805521622281943, - "loss": 0.4419, - "step": 108550 - }, - { - "epoch": 26.49, - "learning_rate": 0.0003680246762765698, - "loss": 0.4729, - "step": 108575 - }, - { - "epoch": 26.5, - "learning_rate": 0.0003679941363303201, - "loss": 0.4453, - "step": 108600 - }, - { - "epoch": 26.51, - "learning_rate": 0.0003679635963840704, - "loss": 0.4262, - "step": 108625 - }, - { - "epoch": 26.51, - "learning_rate": 0.00036793305643782065, - "loss": 0.4974, - "step": 108650 - }, - { - "epoch": 26.52, - "learning_rate": 0.00036790251649157095, - "loss": 0.4659, - "step": 108675 - }, - { - "epoch": 26.53, - "learning_rate": 0.0003678719765453213, - "loss": 0.4658, - "step": 108700 - }, - { - "epoch": 26.53, - "learning_rate": 0.0003678414365990716, - "loss": 0.4668, - "step": 108725 - }, - { - "epoch": 26.54, - "learning_rate": 0.0003678108966528219, - "loss": 0.4197, - "step": 108750 - }, - { - "epoch": 26.54, - "learning_rate": 0.0003677803567065722, - "loss": 0.4794, - "step": 108775 - }, - { - "epoch": 26.55, - "learning_rate": 0.00036774981676032247, - "loss": 0.413, - "step": 108800 - }, - { - "epoch": 26.56, - "learning_rate": 0.0003677192768140728, - "loss": 0.4852, - "step": 108825 - }, - { - "epoch": 26.56, - "learning_rate": 0.00036768873686782313, - "loss": 0.4619, - "step": 108850 - }, - { - "epoch": 26.57, - "learning_rate": 0.00036765819692157343, - "loss": 0.4534, - "step": 108875 - }, - { - "epoch": 26.57, - "learning_rate": 0.00036762765697532373, - "loss": 0.4627, - "step": 108900 - }, - { - "epoch": 26.58, - "learning_rate": 0.00036759711702907404, - "loss": 0.4897, - "step": 108925 - }, - { - "epoch": 26.59, - "learning_rate": 0.00036756657708282434, - "loss": 0.3912, - "step": 108950 - }, - { - "epoch": 26.59, - "learning_rate": 0.00036753603713657464, - "loss": 0.4565, - "step": 108975 - }, - { - "epoch": 26.6, - "learning_rate": 0.00036750549719032495, - "loss": 0.3951, - "step": 109000 - }, - { - "epoch": 26.6, - "learning_rate": 0.00036747495724407525, - "loss": 0.4592, - "step": 109025 - }, - { - "epoch": 26.61, - "learning_rate": 0.00036744441729782555, - "loss": 0.4158, - "step": 109050 - }, - { - "epoch": 26.62, - "learning_rate": 0.0003674138773515759, - "loss": 0.4869, - "step": 109075 - }, - { - "epoch": 26.62, - "learning_rate": 0.0003673833374053262, - "loss": 0.4344, - "step": 109100 - }, - { - "epoch": 26.63, - "learning_rate": 0.00036735279745907646, - "loss": 0.477, - "step": 109125 - }, - { - "epoch": 26.63, - "learning_rate": 0.00036732225751282677, - "loss": 0.4105, - "step": 109150 - }, - { - "epoch": 26.64, - "learning_rate": 0.00036729171756657707, - "loss": 0.4881, - "step": 109175 - }, - { - "epoch": 26.65, - "learning_rate": 0.00036726117762032743, - "loss": 0.4537, - "step": 109200 - }, - { - "epoch": 26.65, - "learning_rate": 0.00036723063767407773, - "loss": 0.4819, - "step": 109225 - }, - { - "epoch": 26.66, - "learning_rate": 0.00036720009772782804, - "loss": 0.4284, - "step": 109250 - }, - { - "epoch": 26.67, - "learning_rate": 0.0003671695577815783, - "loss": 0.4793, - "step": 109275 - }, - { - "epoch": 26.67, - "learning_rate": 0.0003671390178353286, - "loss": 0.3908, - "step": 109300 - }, - { - "epoch": 26.68, - "learning_rate": 0.0003671084778890789, - "loss": 0.4925, - "step": 109325 - }, - { - "epoch": 26.68, - "learning_rate": 0.00036707793794282925, - "loss": 0.4475, - "step": 109350 - }, - { - "epoch": 26.69, - "learning_rate": 0.00036704739799657955, - "loss": 0.446, - "step": 109375 - }, - { - "epoch": 26.7, - "learning_rate": 0.00036701685805032986, - "loss": 0.4149, - "step": 109400 - }, - { - "epoch": 26.7, - "learning_rate": 0.0003669863181040801, - "loss": 0.4352, - "step": 109425 - }, - { - "epoch": 26.71, - "learning_rate": 0.0003669557781578304, - "loss": 0.4381, - "step": 109450 - }, - { - "epoch": 26.71, - "learning_rate": 0.00036692523821158077, - "loss": 0.5132, - "step": 109475 - }, - { - "epoch": 26.72, - "learning_rate": 0.00036689469826533107, - "loss": 0.4933, - "step": 109500 - }, - { - "epoch": 26.73, - "learning_rate": 0.00036686415831908137, - "loss": 0.4786, - "step": 109525 - }, - { - "epoch": 26.73, - "learning_rate": 0.0003668336183728317, - "loss": 0.4435, - "step": 109550 - }, - { - "epoch": 26.74, - "learning_rate": 0.000366803078426582, - "loss": 0.4473, - "step": 109575 - }, - { - "epoch": 26.74, - "learning_rate": 0.0003667725384803323, - "loss": 0.433, - "step": 109600 - }, - { - "epoch": 26.75, - "learning_rate": 0.0003667419985340826, - "loss": 0.516, - "step": 109625 - }, - { - "epoch": 26.76, - "learning_rate": 0.0003667114585878329, - "loss": 0.4701, - "step": 109650 - }, - { - "epoch": 26.76, - "learning_rate": 0.0003666809186415832, - "loss": 0.4402, - "step": 109675 - }, - { - "epoch": 26.77, - "learning_rate": 0.0003666503786953335, - "loss": 0.438, - "step": 109700 - }, - { - "epoch": 26.78, - "learning_rate": 0.00036661983874908385, - "loss": 0.4546, - "step": 109725 - }, - { - "epoch": 26.78, - "learning_rate": 0.0003665892988028341, - "loss": 0.4501, - "step": 109750 - }, - { - "epoch": 26.79, - "learning_rate": 0.0003665587588565844, - "loss": 0.4646, - "step": 109775 - }, - { - "epoch": 26.79, - "learning_rate": 0.0003665282189103347, - "loss": 0.4086, - "step": 109800 - }, - { - "epoch": 26.8, - "learning_rate": 0.000366497678964085, - "loss": 0.4808, - "step": 109825 - }, - { - "epoch": 26.81, - "learning_rate": 0.00036646713901783537, - "loss": 0.4235, - "step": 109850 - }, - { - "epoch": 26.81, - "learning_rate": 0.0003664365990715857, - "loss": 0.4595, - "step": 109875 - }, - { - "epoch": 26.82, - "learning_rate": 0.0003664060591253359, - "loss": 0.4173, - "step": 109900 - }, - { - "epoch": 26.82, - "learning_rate": 0.0003663755191790862, - "loss": 0.4892, - "step": 109925 - }, - { - "epoch": 26.83, - "learning_rate": 0.00036634497923283653, - "loss": 0.4327, - "step": 109950 - }, - { - "epoch": 26.84, - "learning_rate": 0.0003663144392865869, - "loss": 0.4168, - "step": 109975 - }, - { - "epoch": 26.84, - "learning_rate": 0.0003662838993403372, - "loss": 0.4306, - "step": 110000 - }, - { - "epoch": 26.85, - "learning_rate": 0.0003662533593940875, - "loss": 0.4481, - "step": 110025 - }, - { - "epoch": 26.85, - "learning_rate": 0.00036622281944783774, - "loss": 0.4577, - "step": 110050 - }, - { - "epoch": 26.86, - "learning_rate": 0.00036619227950158805, - "loss": 0.4434, - "step": 110075 - }, - { - "epoch": 26.87, - "learning_rate": 0.0003661617395553384, - "loss": 0.3799, - "step": 110100 - }, - { - "epoch": 26.87, - "learning_rate": 0.0003661311996090887, - "loss": 0.4699, - "step": 110125 - }, - { - "epoch": 26.88, - "learning_rate": 0.000366100659662839, - "loss": 0.4373, - "step": 110150 - }, - { - "epoch": 26.89, - "learning_rate": 0.0003660701197165893, - "loss": 0.4765, - "step": 110175 - }, - { - "epoch": 26.89, - "learning_rate": 0.0003660395797703396, - "loss": 0.3899, - "step": 110200 - }, - { - "epoch": 26.9, - "learning_rate": 0.0003660090398240899, - "loss": 0.4409, - "step": 110225 - }, - { - "epoch": 26.9, - "learning_rate": 0.0003659784998778402, - "loss": 0.3785, - "step": 110250 - }, - { - "epoch": 26.91, - "learning_rate": 0.0003659479599315905, - "loss": 0.441, - "step": 110275 - }, - { - "epoch": 26.92, - "learning_rate": 0.00036591741998534083, - "loss": 0.4695, - "step": 110300 - }, - { - "epoch": 26.92, - "learning_rate": 0.00036588688003909113, - "loss": 0.4657, - "step": 110325 - }, - { - "epoch": 26.93, - "learning_rate": 0.00036585756169069144, - "loss": 0.4103, - "step": 110350 - }, - { - "epoch": 26.93, - "learning_rate": 0.0003658270217444417, - "loss": 0.4654, - "step": 110375 - }, - { - "epoch": 26.94, - "learning_rate": 0.00036579648179819205, - "loss": 0.4098, - "step": 110400 - }, - { - "epoch": 26.95, - "learning_rate": 0.00036576594185194235, - "loss": 0.4484, - "step": 110425 - }, - { - "epoch": 26.95, - "learning_rate": 0.00036573540190569265, - "loss": 0.4432, - "step": 110450 - }, - { - "epoch": 26.96, - "learning_rate": 0.00036570486195944296, - "loss": 0.4621, - "step": 110475 - }, - { - "epoch": 26.96, - "learning_rate": 0.00036567432201319326, - "loss": 0.4394, - "step": 110500 - }, - { - "epoch": 26.97, - "learning_rate": 0.00036564378206694356, - "loss": 0.4914, - "step": 110525 - }, - { - "epoch": 26.98, - "learning_rate": 0.00036561324212069387, - "loss": 0.4076, - "step": 110550 - }, - { - "epoch": 26.98, - "learning_rate": 0.00036558270217444417, - "loss": 0.4726, - "step": 110575 - }, - { - "epoch": 26.99, - "learning_rate": 0.0003655521622281945, - "loss": 0.4478, - "step": 110600 - }, - { - "epoch": 26.99, - "learning_rate": 0.0003655216222819448, - "loss": 0.4744, - "step": 110625 - }, - { - "epoch": 27.0, - "learning_rate": 0.00036549108233569513, - "loss": 0.4539, - "step": 110650 - }, - { - "epoch": 27.01, - "learning_rate": 0.00036546054238944544, - "loss": 0.4507, - "step": 110675 - }, - { - "epoch": 27.01, - "learning_rate": 0.0003654300024431957, - "loss": 0.3868, - "step": 110700 - }, - { - "epoch": 27.02, - "learning_rate": 0.000365399462496946, - "loss": 0.4459, - "step": 110725 - }, - { - "epoch": 27.03, - "learning_rate": 0.0003653689225506963, - "loss": 0.4198, - "step": 110750 - }, - { - "epoch": 27.03, - "learning_rate": 0.00036533838260444665, - "loss": 0.4551, - "step": 110775 - }, - { - "epoch": 27.04, - "learning_rate": 0.00036530784265819695, - "loss": 0.4359, - "step": 110800 - }, - { - "epoch": 27.04, - "learning_rate": 0.00036527730271194726, - "loss": 0.4391, - "step": 110825 - }, - { - "epoch": 27.05, - "learning_rate": 0.0003652467627656975, - "loss": 0.3863, - "step": 110850 - }, - { - "epoch": 27.06, - "learning_rate": 0.0003652162228194478, - "loss": 0.4541, - "step": 110875 - }, - { - "epoch": 27.06, - "learning_rate": 0.00036518568287319817, - "loss": 0.4366, - "step": 110900 - }, - { - "epoch": 27.07, - "learning_rate": 0.00036515514292694847, - "loss": 0.4762, - "step": 110925 - }, - { - "epoch": 27.07, - "learning_rate": 0.0003651246029806988, - "loss": 0.448, - "step": 110950 - }, - { - "epoch": 27.08, - "learning_rate": 0.0003650940630344491, - "loss": 0.4342, - "step": 110975 - }, - { - "epoch": 27.09, - "learning_rate": 0.0003650635230881993, - "loss": 0.4083, - "step": 111000 - }, - { - "epoch": 27.09, - "eval_cer": 0.10622876092112153, - "eval_loss": 0.45828574895858765, - "eval_runtime": 148.8526, - "eval_samples_per_second": 28.169, - "eval_steps_per_second": 7.047, - "eval_wer": 0.4320065252854812, - "step": 111000 - }, - { - "epoch": 27.09, - "learning_rate": 0.0003650329831419497, - "loss": 0.4351, - "step": 111025 - }, - { - "epoch": 27.1, - "learning_rate": 0.0003650024431957, - "loss": 0.3727, - "step": 111050 - }, - { - "epoch": 27.1, - "learning_rate": 0.0003649719032494503, - "loss": 0.4853, - "step": 111075 - }, - { - "epoch": 27.11, - "learning_rate": 0.0003649413633032006, - "loss": 0.4361, - "step": 111100 - }, - { - "epoch": 27.12, - "learning_rate": 0.0003649108233569509, - "loss": 0.4412, - "step": 111125 - }, - { - "epoch": 27.12, - "learning_rate": 0.00036488028341070126, - "loss": 0.3631, - "step": 111150 - }, - { - "epoch": 27.13, - "learning_rate": 0.0003648497434644515, - "loss": 0.4637, - "step": 111175 - }, - { - "epoch": 27.14, - "learning_rate": 0.0003648192035182018, - "loss": 0.3881, - "step": 111200 - }, - { - "epoch": 27.14, - "learning_rate": 0.0003647886635719521, - "loss": 0.4586, - "step": 111225 - }, - { - "epoch": 27.15, - "learning_rate": 0.0003647581236257024, - "loss": 0.4445, - "step": 111250 - }, - { - "epoch": 27.15, - "learning_rate": 0.00036472758367945277, - "loss": 0.4346, - "step": 111275 - }, - { - "epoch": 27.16, - "learning_rate": 0.0003646970437332031, - "loss": 0.3992, - "step": 111300 - }, - { - "epoch": 27.17, - "learning_rate": 0.0003646665037869533, - "loss": 0.4515, - "step": 111325 - }, - { - "epoch": 27.17, - "learning_rate": 0.00036463596384070363, - "loss": 0.3972, - "step": 111350 - }, - { - "epoch": 27.18, - "learning_rate": 0.00036460542389445393, - "loss": 0.4142, - "step": 111375 - }, - { - "epoch": 27.18, - "learning_rate": 0.00036457488394820423, - "loss": 0.3766, - "step": 111400 - }, - { - "epoch": 27.19, - "learning_rate": 0.0003645443440019546, - "loss": 0.4359, - "step": 111425 - }, - { - "epoch": 27.2, - "learning_rate": 0.0003645138040557049, - "loss": 0.3852, - "step": 111450 - }, - { - "epoch": 27.2, - "learning_rate": 0.00036448326410945514, - "loss": 0.4507, - "step": 111475 - }, - { - "epoch": 27.21, - "learning_rate": 0.00036445272416320545, - "loss": 0.4212, - "step": 111500 - }, - { - "epoch": 27.21, - "learning_rate": 0.00036442218421695575, - "loss": 0.4715, - "step": 111525 - }, - { - "epoch": 27.22, - "learning_rate": 0.0003643916442707061, - "loss": 0.4006, - "step": 111550 - }, - { - "epoch": 27.23, - "learning_rate": 0.0003643611043244564, - "loss": 0.4579, - "step": 111575 - }, - { - "epoch": 27.23, - "learning_rate": 0.0003643305643782067, - "loss": 0.4084, - "step": 111600 - }, - { - "epoch": 27.24, - "learning_rate": 0.000364300024431957, - "loss": 0.4738, - "step": 111625 - }, - { - "epoch": 27.24, - "learning_rate": 0.00036426948448570727, - "loss": 0.472, - "step": 111650 - }, - { - "epoch": 27.25, - "learning_rate": 0.0003642389445394576, - "loss": 0.4421, - "step": 111675 - }, - { - "epoch": 27.26, - "learning_rate": 0.00036420840459320793, - "loss": 0.4112, - "step": 111700 - }, - { - "epoch": 27.26, - "learning_rate": 0.00036417786464695823, - "loss": 0.457, - "step": 111725 - }, - { - "epoch": 27.27, - "learning_rate": 0.00036414732470070854, - "loss": 0.4342, - "step": 111750 - }, - { - "epoch": 27.28, - "learning_rate": 0.00036411678475445884, - "loss": 0.4509, - "step": 111775 - }, - { - "epoch": 27.28, - "learning_rate": 0.00036408624480820914, - "loss": 0.3766, - "step": 111800 - }, - { - "epoch": 27.29, - "learning_rate": 0.00036405570486195945, - "loss": 0.4579, - "step": 111825 - }, - { - "epoch": 27.29, - "learning_rate": 0.00036402638651355975, - "loss": 0.4228, - "step": 111850 - }, - { - "epoch": 27.3, - "learning_rate": 0.00036399584656731006, - "loss": 0.4387, - "step": 111875 - }, - { - "epoch": 27.31, - "learning_rate": 0.00036396530662106036, - "loss": 0.407, - "step": 111900 - }, - { - "epoch": 27.31, - "learning_rate": 0.00036393476667481066, - "loss": 0.4576, - "step": 111925 - }, - { - "epoch": 27.32, - "learning_rate": 0.00036390422672856097, - "loss": 0.3912, - "step": 111950 - }, - { - "epoch": 27.32, - "learning_rate": 0.00036387368678231127, - "loss": 0.4313, - "step": 111975 - }, - { - "epoch": 27.33, - "learning_rate": 0.00036384314683606157, - "loss": 0.4289, - "step": 112000 - }, - { - "epoch": 27.34, - "learning_rate": 0.0003638126068898119, - "loss": 0.4334, - "step": 112025 - }, - { - "epoch": 27.34, - "learning_rate": 0.0003637820669435622, - "loss": 0.4155, - "step": 112050 - }, - { - "epoch": 27.35, - "learning_rate": 0.00036375152699731254, - "loss": 0.4347, - "step": 112075 - }, - { - "epoch": 27.35, - "learning_rate": 0.00036372098705106284, - "loss": 0.4325, - "step": 112100 - }, - { - "epoch": 27.36, - "learning_rate": 0.0003636904471048131, - "loss": 0.4639, - "step": 112125 - }, - { - "epoch": 27.37, - "learning_rate": 0.0003636599071585634, - "loss": 0.4588, - "step": 112150 - }, - { - "epoch": 27.37, - "learning_rate": 0.0003636293672123137, - "loss": 0.4401, - "step": 112175 - }, - { - "epoch": 27.38, - "learning_rate": 0.000363598827266064, - "loss": 0.4654, - "step": 112200 - }, - { - "epoch": 27.39, - "learning_rate": 0.00036356828731981436, - "loss": 0.4443, - "step": 112225 - }, - { - "epoch": 27.39, - "learning_rate": 0.00036353774737356466, - "loss": 0.4255, - "step": 112250 - }, - { - "epoch": 27.4, - "learning_rate": 0.0003635072074273149, - "loss": 0.4641, - "step": 112275 - }, - { - "epoch": 27.4, - "learning_rate": 0.0003634766674810652, - "loss": 0.4369, - "step": 112300 - }, - { - "epoch": 27.41, - "learning_rate": 0.0003634461275348155, - "loss": 0.446, - "step": 112325 - }, - { - "epoch": 27.42, - "learning_rate": 0.0003634155875885659, - "loss": 0.4385, - "step": 112350 - }, - { - "epoch": 27.42, - "learning_rate": 0.0003633850476423162, - "loss": 0.4708, - "step": 112375 - }, - { - "epoch": 27.43, - "learning_rate": 0.0003633545076960665, - "loss": 0.4086, - "step": 112400 - }, - { - "epoch": 27.43, - "learning_rate": 0.00036332396774981673, - "loss": 0.4416, - "step": 112425 - }, - { - "epoch": 27.44, - "learning_rate": 0.00036329342780356703, - "loss": 0.4096, - "step": 112450 - }, - { - "epoch": 27.45, - "learning_rate": 0.0003632628878573174, - "loss": 0.4395, - "step": 112475 - }, - { - "epoch": 27.45, - "learning_rate": 0.0003632323479110677, - "loss": 0.4392, - "step": 112500 - }, - { - "epoch": 27.46, - "learning_rate": 0.000363201807964818, - "loss": 0.4743, - "step": 112525 - }, - { - "epoch": 27.46, - "learning_rate": 0.0003631712680185683, - "loss": 0.4474, - "step": 112550 - }, - { - "epoch": 27.47, - "learning_rate": 0.0003631407280723186, - "loss": 0.4738, - "step": 112575 - }, - { - "epoch": 27.48, - "learning_rate": 0.0003631101881260689, - "loss": 0.3719, - "step": 112600 - }, - { - "epoch": 27.48, - "learning_rate": 0.0003630796481798192, - "loss": 0.4503, - "step": 112625 - }, - { - "epoch": 27.49, - "learning_rate": 0.0003630491082335695, - "loss": 0.4223, - "step": 112650 - }, - { - "epoch": 27.5, - "learning_rate": 0.0003630185682873198, - "loss": 0.4613, - "step": 112675 - }, - { - "epoch": 27.5, - "learning_rate": 0.0003629880283410701, - "loss": 0.4107, - "step": 112700 - }, - { - "epoch": 27.51, - "learning_rate": 0.0003629574883948205, - "loss": 0.4359, - "step": 112725 - }, - { - "epoch": 27.51, - "learning_rate": 0.0003629269484485707, - "loss": 0.3979, - "step": 112750 - }, - { - "epoch": 27.52, - "learning_rate": 0.00036289640850232103, - "loss": 0.481, - "step": 112775 - }, - { - "epoch": 27.53, - "learning_rate": 0.00036286586855607133, - "loss": 0.4453, - "step": 112800 - }, - { - "epoch": 27.53, - "learning_rate": 0.00036283532860982164, - "loss": 0.4792, - "step": 112825 - }, - { - "epoch": 27.54, - "learning_rate": 0.000362804788663572, - "loss": 0.4001, - "step": 112850 - }, - { - "epoch": 27.54, - "learning_rate": 0.0003627742487173223, - "loss": 0.43, - "step": 112875 - }, - { - "epoch": 27.55, - "learning_rate": 0.00036274370877107255, - "loss": 0.3869, - "step": 112900 - }, - { - "epoch": 27.56, - "learning_rate": 0.00036271316882482285, - "loss": 0.4596, - "step": 112925 - }, - { - "epoch": 27.56, - "learning_rate": 0.00036268262887857315, - "loss": 0.4507, - "step": 112950 - }, - { - "epoch": 27.57, - "learning_rate": 0.0003626520889323235, - "loss": 0.4765, - "step": 112975 - }, - { - "epoch": 27.57, - "learning_rate": 0.0003626215489860738, - "loss": 0.4441, - "step": 113000 - }, - { - "epoch": 27.58, - "learning_rate": 0.0003625910090398241, - "loss": 0.4576, - "step": 113025 - }, - { - "epoch": 27.59, - "learning_rate": 0.0003625604690935744, - "loss": 0.4279, - "step": 113050 - }, - { - "epoch": 27.59, - "learning_rate": 0.00036252992914732467, - "loss": 0.4251, - "step": 113075 - }, - { - "epoch": 27.6, - "learning_rate": 0.00036249938920107503, - "loss": 0.4277, - "step": 113100 - }, - { - "epoch": 27.6, - "learning_rate": 0.00036246884925482533, - "loss": 0.4642, - "step": 113125 - }, - { - "epoch": 27.61, - "learning_rate": 0.00036243830930857563, - "loss": 0.3901, - "step": 113150 - }, - { - "epoch": 27.62, - "learning_rate": 0.00036240776936232594, - "loss": 0.4645, - "step": 113175 - }, - { - "epoch": 27.62, - "learning_rate": 0.00036237722941607624, - "loss": 0.4778, - "step": 113200 - }, - { - "epoch": 27.63, - "learning_rate": 0.00036234668946982654, - "loss": 0.4684, - "step": 113225 - }, - { - "epoch": 27.64, - "learning_rate": 0.00036231614952357685, - "loss": 0.4339, - "step": 113250 - }, - { - "epoch": 27.64, - "learning_rate": 0.00036228560957732715, - "loss": 0.4372, - "step": 113275 - }, - { - "epoch": 27.65, - "learning_rate": 0.00036225506963107745, - "loss": 0.4579, - "step": 113300 - }, - { - "epoch": 27.65, - "learning_rate": 0.00036222452968482776, - "loss": 0.4499, - "step": 113325 - }, - { - "epoch": 27.66, - "learning_rate": 0.0003621939897385781, - "loss": 0.4247, - "step": 113350 - }, - { - "epoch": 27.67, - "learning_rate": 0.00036216344979232836, - "loss": 0.4518, - "step": 113375 - }, - { - "epoch": 27.67, - "learning_rate": 0.00036213290984607867, - "loss": 0.4446, - "step": 113400 - }, - { - "epoch": 27.68, - "learning_rate": 0.00036210236989982897, - "loss": 0.4472, - "step": 113425 - }, - { - "epoch": 27.68, - "learning_rate": 0.0003620718299535793, - "loss": 0.3938, - "step": 113450 - }, - { - "epoch": 27.69, - "learning_rate": 0.0003620412900073296, - "loss": 0.4338, - "step": 113475 - }, - { - "epoch": 27.7, - "learning_rate": 0.00036201075006107994, - "loss": 0.3876, - "step": 113500 - }, - { - "epoch": 27.7, - "learning_rate": 0.00036198021011483024, - "loss": 0.4739, - "step": 113525 - }, - { - "epoch": 27.71, - "learning_rate": 0.0003619496701685805, - "loss": 0.4749, - "step": 113550 - }, - { - "epoch": 27.71, - "learning_rate": 0.0003619191302223308, - "loss": 0.4201, - "step": 113575 - }, - { - "epoch": 27.72, - "learning_rate": 0.0003618885902760811, - "loss": 0.4033, - "step": 113600 - }, - { - "epoch": 27.73, - "learning_rate": 0.00036185805032983145, - "loss": 0.4496, - "step": 113625 - }, - { - "epoch": 27.73, - "learning_rate": 0.00036182751038358176, - "loss": 0.4209, - "step": 113650 - }, - { - "epoch": 27.74, - "learning_rate": 0.00036179697043733206, - "loss": 0.4398, - "step": 113675 - }, - { - "epoch": 27.75, - "learning_rate": 0.0003617664304910823, - "loss": 0.4328, - "step": 113700 - }, - { - "epoch": 27.75, - "learning_rate": 0.0003617358905448326, - "loss": 0.4169, - "step": 113725 - }, - { - "epoch": 27.76, - "learning_rate": 0.00036170535059858297, - "loss": 0.4463, - "step": 113750 - }, - { - "epoch": 27.76, - "learning_rate": 0.00036167481065233327, - "loss": 0.4666, - "step": 113775 - }, - { - "epoch": 27.77, - "learning_rate": 0.0003616442707060836, - "loss": 0.4087, - "step": 113800 - }, - { - "epoch": 27.78, - "learning_rate": 0.0003616137307598339, - "loss": 0.4208, - "step": 113825 - }, - { - "epoch": 27.78, - "learning_rate": 0.00036158319081358413, - "loss": 0.4215, - "step": 113850 - }, - { - "epoch": 27.79, - "learning_rate": 0.0003615526508673345, - "loss": 0.4414, - "step": 113875 - }, - { - "epoch": 27.79, - "learning_rate": 0.0003615221109210848, - "loss": 0.4207, - "step": 113900 - }, - { - "epoch": 27.8, - "learning_rate": 0.0003614915709748351, - "loss": 0.4305, - "step": 113925 - }, - { - "epoch": 27.81, - "learning_rate": 0.0003614610310285854, - "loss": 0.3685, - "step": 113950 - }, - { - "epoch": 27.81, - "learning_rate": 0.0003614304910823357, - "loss": 0.4715, - "step": 113975 - }, - { - "epoch": 27.82, - "learning_rate": 0.000361399951136086, - "loss": 0.4618, - "step": 114000 - }, - { - "epoch": 27.82, - "eval_cer": 0.10462203422892519, - "eval_loss": 0.42293429374694824, - "eval_runtime": 148.9045, - "eval_samples_per_second": 28.159, - "eval_steps_per_second": 7.045, - "eval_wer": 0.42812398042414357, - "step": 114000 - }, - { - "epoch": 27.82, - "learning_rate": 0.0003613694111898363, - "loss": 0.4892, - "step": 114025 - }, - { - "epoch": 27.83, - "learning_rate": 0.0003613388712435866, - "loss": 0.4525, - "step": 114050 - }, - { - "epoch": 27.84, - "learning_rate": 0.0003613083312973369, - "loss": 0.443, - "step": 114075 - }, - { - "epoch": 27.84, - "learning_rate": 0.0003612777913510872, - "loss": 0.4399, - "step": 114100 - }, - { - "epoch": 27.85, - "learning_rate": 0.0003612472514048376, - "loss": 0.4276, - "step": 114125 - }, - { - "epoch": 27.86, - "learning_rate": 0.0003612167114585879, - "loss": 0.3892, - "step": 114150 - }, - { - "epoch": 27.86, - "learning_rate": 0.0003611861715123381, - "loss": 0.4562, - "step": 114175 - }, - { - "epoch": 27.87, - "learning_rate": 0.00036115563156608843, - "loss": 0.4128, - "step": 114200 - }, - { - "epoch": 27.87, - "learning_rate": 0.00036112509161983873, - "loss": 0.4409, - "step": 114225 - }, - { - "epoch": 27.88, - "learning_rate": 0.0003610945516735891, - "loss": 0.4134, - "step": 114250 - }, - { - "epoch": 27.89, - "learning_rate": 0.0003610640117273394, - "loss": 0.4426, - "step": 114275 - }, - { - "epoch": 27.89, - "learning_rate": 0.0003610334717810897, - "loss": 0.4581, - "step": 114300 - }, - { - "epoch": 27.9, - "learning_rate": 0.00036100293183483995, - "loss": 0.445, - "step": 114325 - }, - { - "epoch": 27.9, - "learning_rate": 0.00036097239188859025, - "loss": 0.4231, - "step": 114350 - }, - { - "epoch": 27.91, - "learning_rate": 0.0003609418519423406, - "loss": 0.4608, - "step": 114375 - }, - { - "epoch": 27.92, - "learning_rate": 0.0003609113119960909, - "loss": 0.4112, - "step": 114400 - }, - { - "epoch": 27.92, - "learning_rate": 0.0003608807720498412, - "loss": 0.4675, - "step": 114425 - }, - { - "epoch": 27.93, - "learning_rate": 0.0003608502321035915, - "loss": 0.4105, - "step": 114450 - }, - { - "epoch": 27.93, - "learning_rate": 0.00036081969215734177, - "loss": 0.4548, - "step": 114475 - }, - { - "epoch": 27.94, - "learning_rate": 0.0003607891522110921, - "loss": 0.471, - "step": 114500 - }, - { - "epoch": 27.95, - "learning_rate": 0.0003607586122648424, - "loss": 0.4264, - "step": 114525 - }, - { - "epoch": 27.95, - "learning_rate": 0.00036072807231859273, - "loss": 0.418, - "step": 114550 - }, - { - "epoch": 27.96, - "learning_rate": 0.00036069753237234303, - "loss": 0.4569, - "step": 114575 - }, - { - "epoch": 27.96, - "learning_rate": 0.00036066699242609334, - "loss": 0.4326, - "step": 114600 - }, - { - "epoch": 27.97, - "learning_rate": 0.0003606364524798437, - "loss": 0.4641, - "step": 114625 - }, - { - "epoch": 27.98, - "learning_rate": 0.00036060591253359394, - "loss": 0.4108, - "step": 114650 - }, - { - "epoch": 27.98, - "learning_rate": 0.00036057537258734425, - "loss": 0.4225, - "step": 114675 - }, - { - "epoch": 27.99, - "learning_rate": 0.00036054483264109455, - "loss": 0.45, - "step": 114700 - }, - { - "epoch": 28.0, - "learning_rate": 0.00036051429269484485, - "loss": 0.4469, - "step": 114725 - }, - { - "epoch": 28.0, - "learning_rate": 0.00036048375274859516, - "loss": 0.3933, - "step": 114750 - }, - { - "epoch": 28.01, - "learning_rate": 0.0003604532128023455, - "loss": 0.4146, - "step": 114775 - }, - { - "epoch": 28.01, - "learning_rate": 0.00036042267285609576, - "loss": 0.4307, - "step": 114800 - }, - { - "epoch": 28.02, - "learning_rate": 0.00036039213290984607, - "loss": 0.4348, - "step": 114825 - }, - { - "epoch": 28.03, - "learning_rate": 0.00036036159296359637, - "loss": 0.499, - "step": 114850 - }, - { - "epoch": 28.03, - "learning_rate": 0.0003603310530173467, - "loss": 0.441, - "step": 114875 - }, - { - "epoch": 28.04, - "learning_rate": 0.00036030051307109703, - "loss": 0.4065, - "step": 114900 - }, - { - "epoch": 28.04, - "learning_rate": 0.00036026997312484733, - "loss": 0.4322, - "step": 114925 - }, - { - "epoch": 28.05, - "learning_rate": 0.0003602394331785976, - "loss": 0.4002, - "step": 114950 - }, - { - "epoch": 28.06, - "learning_rate": 0.0003602088932323479, - "loss": 0.4478, - "step": 114975 - }, - { - "epoch": 28.06, - "learning_rate": 0.0003601783532860982, - "loss": 0.3767, - "step": 115000 - }, - { - "epoch": 28.07, - "learning_rate": 0.00036014781333984855, - "loss": 0.4317, - "step": 115025 - }, - { - "epoch": 28.07, - "learning_rate": 0.00036011727339359885, - "loss": 0.451, - "step": 115050 - }, - { - "epoch": 28.08, - "learning_rate": 0.00036008673344734915, - "loss": 0.4586, - "step": 115075 - }, - { - "epoch": 28.09, - "learning_rate": 0.00036005619350109946, - "loss": 0.4371, - "step": 115100 - }, - { - "epoch": 28.09, - "learning_rate": 0.0003600256535548497, - "loss": 0.4382, - "step": 115125 - }, - { - "epoch": 28.1, - "learning_rate": 0.00035999511360860006, - "loss": 0.3706, - "step": 115150 - }, - { - "epoch": 28.11, - "learning_rate": 0.00035996457366235037, - "loss": 0.4424, - "step": 115175 - }, - { - "epoch": 28.11, - "learning_rate": 0.00035993403371610067, - "loss": 0.4072, - "step": 115200 - }, - { - "epoch": 28.12, - "learning_rate": 0.000359903493769851, - "loss": 0.4112, - "step": 115225 - }, - { - "epoch": 28.12, - "learning_rate": 0.0003598729538236013, - "loss": 0.3865, - "step": 115250 - }, - { - "epoch": 28.13, - "learning_rate": 0.0003598424138773516, - "loss": 0.4749, - "step": 115275 - }, - { - "epoch": 28.14, - "learning_rate": 0.0003598118739311019, - "loss": 0.416, - "step": 115300 - }, - { - "epoch": 28.14, - "learning_rate": 0.0003597813339848522, - "loss": 0.4019, - "step": 115325 - }, - { - "epoch": 28.15, - "learning_rate": 0.0003597507940386025, - "loss": 0.4413, - "step": 115350 - }, - { - "epoch": 28.15, - "learning_rate": 0.0003597202540923528, - "loss": 0.427, - "step": 115375 - }, - { - "epoch": 28.16, - "learning_rate": 0.00035968971414610315, - "loss": 0.3767, - "step": 115400 - }, - { - "epoch": 28.17, - "learning_rate": 0.0003596591741998534, - "loss": 0.4356, - "step": 115425 - }, - { - "epoch": 28.17, - "learning_rate": 0.0003596286342536037, - "loss": 0.4551, - "step": 115450 - }, - { - "epoch": 28.18, - "learning_rate": 0.000359598094307354, - "loss": 0.446, - "step": 115475 - }, - { - "epoch": 28.18, - "learning_rate": 0.0003595675543611043, - "loss": 0.4216, - "step": 115500 - }, - { - "epoch": 28.19, - "learning_rate": 0.00035953701441485467, - "loss": 0.4307, - "step": 115525 - }, - { - "epoch": 28.2, - "learning_rate": 0.00035950647446860497, - "loss": 0.4476, - "step": 115550 - }, - { - "epoch": 28.2, - "learning_rate": 0.0003594759345223553, - "loss": 0.4522, - "step": 115575 - }, - { - "epoch": 28.21, - "learning_rate": 0.0003594453945761055, - "loss": 0.398, - "step": 115600 - }, - { - "epoch": 28.21, - "learning_rate": 0.00035941485462985583, - "loss": 0.4434, - "step": 115625 - }, - { - "epoch": 28.22, - "learning_rate": 0.0003593843146836062, - "loss": 0.4161, - "step": 115650 - }, - { - "epoch": 28.23, - "learning_rate": 0.0003593537747373565, - "loss": 0.4172, - "step": 115675 - }, - { - "epoch": 28.23, - "learning_rate": 0.0003593232347911068, - "loss": 0.4633, - "step": 115700 - }, - { - "epoch": 28.24, - "learning_rate": 0.0003592926948448571, - "loss": 0.4339, - "step": 115725 - }, - { - "epoch": 28.25, - "learning_rate": 0.00035926215489860735, - "loss": 0.4266, - "step": 115750 - }, - { - "epoch": 28.25, - "learning_rate": 0.0003592316149523577, - "loss": 0.4322, - "step": 115775 - }, - { - "epoch": 28.26, - "learning_rate": 0.000359201075006108, - "loss": 0.4352, - "step": 115800 - }, - { - "epoch": 28.26, - "learning_rate": 0.0003591705350598583, - "loss": 0.4283, - "step": 115825 - }, - { - "epoch": 28.27, - "learning_rate": 0.0003591399951136086, - "loss": 0.4588, - "step": 115850 - }, - { - "epoch": 28.28, - "learning_rate": 0.0003591094551673589, - "loss": 0.4461, - "step": 115875 - }, - { - "epoch": 28.28, - "learning_rate": 0.0003590789152211092, - "loss": 0.3807, - "step": 115900 - }, - { - "epoch": 28.29, - "learning_rate": 0.0003590483752748595, - "loss": 0.4291, - "step": 115925 - }, - { - "epoch": 28.29, - "learning_rate": 0.0003590178353286098, - "loss": 0.4416, - "step": 115950 - }, - { - "epoch": 28.3, - "learning_rate": 0.00035898729538236013, - "loss": 0.4219, - "step": 115975 - }, - { - "epoch": 28.31, - "learning_rate": 0.00035895675543611043, - "loss": 0.4263, - "step": 116000 - }, - { - "epoch": 28.31, - "learning_rate": 0.0003589262154898608, - "loss": 0.4394, - "step": 116025 - }, - { - "epoch": 28.32, - "learning_rate": 0.0003588956755436111, - "loss": 0.4312, - "step": 116050 - }, - { - "epoch": 28.32, - "learning_rate": 0.00035886513559736134, - "loss": 0.4249, - "step": 116075 - }, - { - "epoch": 28.33, - "learning_rate": 0.00035883459565111165, - "loss": 0.4145, - "step": 116100 - }, - { - "epoch": 28.34, - "learning_rate": 0.00035880405570486195, - "loss": 0.4173, - "step": 116125 - }, - { - "epoch": 28.34, - "learning_rate": 0.00035877351575861225, - "loss": 0.4505, - "step": 116150 - }, - { - "epoch": 28.35, - "learning_rate": 0.0003587429758123626, - "loss": 0.4273, - "step": 116175 - }, - { - "epoch": 28.36, - "learning_rate": 0.0003587124358661129, - "loss": 0.3887, - "step": 116200 - }, - { - "epoch": 28.36, - "learning_rate": 0.00035868189591986316, - "loss": 0.416, - "step": 116225 - }, - { - "epoch": 28.37, - "learning_rate": 0.00035865135597361347, - "loss": 0.4085, - "step": 116250 - }, - { - "epoch": 28.37, - "learning_rate": 0.00035862081602736377, - "loss": 0.4551, - "step": 116275 - }, - { - "epoch": 28.38, - "learning_rate": 0.0003585914976789641, - "loss": 0.42, - "step": 116300 - }, - { - "epoch": 28.39, - "learning_rate": 0.00035856095773271443, - "loss": 0.4185, - "step": 116325 - }, - { - "epoch": 28.39, - "learning_rate": 0.00035853041778646474, - "loss": 0.4174, - "step": 116350 - }, - { - "epoch": 28.4, - "learning_rate": 0.000358499877840215, - "loss": 0.4303, - "step": 116375 - }, - { - "epoch": 28.4, - "learning_rate": 0.0003584693378939653, - "loss": 0.4787, - "step": 116400 - }, - { - "epoch": 28.41, - "learning_rate": 0.0003584387979477156, - "loss": 0.4276, - "step": 116425 - }, - { - "epoch": 28.42, - "learning_rate": 0.00035840825800146595, - "loss": 0.4364, - "step": 116450 - }, - { - "epoch": 28.42, - "learning_rate": 0.00035837771805521625, - "loss": 0.4598, - "step": 116475 - }, - { - "epoch": 28.43, - "learning_rate": 0.00035834717810896656, - "loss": 0.4465, - "step": 116500 - }, - { - "epoch": 28.43, - "learning_rate": 0.00035831663816271686, - "loss": 0.4561, - "step": 116525 - }, - { - "epoch": 28.44, - "learning_rate": 0.0003582860982164671, - "loss": 0.3765, - "step": 116550 - }, - { - "epoch": 28.45, - "learning_rate": 0.00035825555827021747, - "loss": 0.3965, - "step": 116575 - }, - { - "epoch": 28.45, - "learning_rate": 0.00035822501832396777, - "loss": 0.4291, - "step": 116600 - }, - { - "epoch": 28.46, - "learning_rate": 0.0003581944783777181, - "loss": 0.4005, - "step": 116625 - }, - { - "epoch": 28.47, - "learning_rate": 0.0003581639384314684, - "loss": 0.4187, - "step": 116650 - }, - { - "epoch": 28.47, - "learning_rate": 0.0003581333984852187, - "loss": 0.4803, - "step": 116675 - }, - { - "epoch": 28.48, - "learning_rate": 0.00035810285853896893, - "loss": 0.4358, - "step": 116700 - }, - { - "epoch": 28.48, - "learning_rate": 0.0003580723185927193, - "loss": 0.4248, - "step": 116725 - }, - { - "epoch": 28.49, - "learning_rate": 0.0003580417786464696, - "loss": 0.4353, - "step": 116750 - }, - { - "epoch": 28.5, - "learning_rate": 0.0003580112387002199, - "loss": 0.4402, - "step": 116775 - }, - { - "epoch": 28.5, - "learning_rate": 0.0003579806987539702, - "loss": 0.4198, - "step": 116800 - }, - { - "epoch": 28.51, - "learning_rate": 0.0003579501588077205, - "loss": 0.4321, - "step": 116825 - }, - { - "epoch": 28.51, - "learning_rate": 0.0003579196188614708, - "loss": 0.4073, - "step": 116850 - }, - { - "epoch": 28.52, - "learning_rate": 0.0003578890789152211, - "loss": 0.4597, - "step": 116875 - }, - { - "epoch": 28.53, - "learning_rate": 0.0003578585389689714, - "loss": 0.43, - "step": 116900 - }, - { - "epoch": 28.53, - "learning_rate": 0.0003578279990227217, - "loss": 0.454, - "step": 116925 - }, - { - "epoch": 28.54, - "learning_rate": 0.000357797459076472, - "loss": 0.3605, - "step": 116950 - }, - { - "epoch": 28.54, - "learning_rate": 0.0003577669191302224, - "loss": 0.4225, - "step": 116975 - }, - { - "epoch": 28.55, - "learning_rate": 0.0003577363791839727, - "loss": 0.4538, - "step": 117000 - }, - { - "epoch": 28.55, - "eval_cer": 0.10224531071938237, - "eval_loss": 0.4060422480106354, - "eval_runtime": 148.9547, - "eval_samples_per_second": 28.149, - "eval_steps_per_second": 7.042, - "eval_wer": 0.42, - "step": 117000 - }, - { - "epoch": 28.56, - "learning_rate": 0.00035770583923772293, - "loss": 0.4308, - "step": 117025 - }, - { - "epoch": 28.56, - "learning_rate": 0.00035767529929147323, - "loss": 0.4009, - "step": 117050 - }, - { - "epoch": 28.57, - "learning_rate": 0.00035764475934522353, - "loss": 0.4436, - "step": 117075 - }, - { - "epoch": 28.57, - "learning_rate": 0.0003576142193989739, - "loss": 0.383, - "step": 117100 - }, - { - "epoch": 28.58, - "learning_rate": 0.0003575836794527242, - "loss": 0.4641, - "step": 117125 - }, - { - "epoch": 28.59, - "learning_rate": 0.0003575531395064745, - "loss": 0.4427, - "step": 117150 - }, - { - "epoch": 28.59, - "learning_rate": 0.00035752259956022475, - "loss": 0.4591, - "step": 117175 - }, - { - "epoch": 28.6, - "learning_rate": 0.00035749205961397505, - "loss": 0.4661, - "step": 117200 - }, - { - "epoch": 28.61, - "learning_rate": 0.0003574615196677254, - "loss": 0.5024, - "step": 117225 - }, - { - "epoch": 28.61, - "learning_rate": 0.0003574309797214757, - "loss": 0.457, - "step": 117250 - }, - { - "epoch": 28.62, - "learning_rate": 0.000357400439775226, - "loss": 0.4456, - "step": 117275 - }, - { - "epoch": 28.62, - "learning_rate": 0.0003573698998289763, - "loss": 0.4282, - "step": 117300 - }, - { - "epoch": 28.63, - "learning_rate": 0.00035733935988272657, - "loss": 0.457, - "step": 117325 - }, - { - "epoch": 28.64, - "learning_rate": 0.0003573088199364769, - "loss": 0.3939, - "step": 117350 - }, - { - "epoch": 28.64, - "learning_rate": 0.00035727827999022723, - "loss": 0.4394, - "step": 117375 - }, - { - "epoch": 28.65, - "learning_rate": 0.00035724774004397753, - "loss": 0.4435, - "step": 117400 - }, - { - "epoch": 28.65, - "learning_rate": 0.00035721720009772783, - "loss": 0.4603, - "step": 117425 - }, - { - "epoch": 28.66, - "learning_rate": 0.00035718666015147814, - "loss": 0.4088, - "step": 117450 - }, - { - "epoch": 28.67, - "learning_rate": 0.00035715612020522844, - "loss": 0.4357, - "step": 117475 - }, - { - "epoch": 28.67, - "learning_rate": 0.00035712558025897874, - "loss": 0.3844, - "step": 117500 - }, - { - "epoch": 28.68, - "learning_rate": 0.00035709504031272905, - "loss": 0.4333, - "step": 117525 - }, - { - "epoch": 28.68, - "learning_rate": 0.00035706450036647935, - "loss": 0.4354, - "step": 117550 - }, - { - "epoch": 28.69, - "learning_rate": 0.00035703396042022965, - "loss": 0.4478, - "step": 117575 - }, - { - "epoch": 28.7, - "learning_rate": 0.00035700342047398, - "loss": 0.44, - "step": 117600 - }, - { - "epoch": 28.7, - "learning_rate": 0.0003569728805277303, - "loss": 0.4312, - "step": 117625 - }, - { - "epoch": 28.71, - "learning_rate": 0.00035694234058148056, - "loss": 0.3937, - "step": 117650 - }, - { - "epoch": 28.72, - "learning_rate": 0.00035691180063523087, - "loss": 0.4529, - "step": 117675 - }, - { - "epoch": 28.72, - "learning_rate": 0.00035688126068898117, - "loss": 0.4707, - "step": 117700 - }, - { - "epoch": 28.73, - "learning_rate": 0.00035685072074273153, - "loss": 0.4158, - "step": 117725 - }, - { - "epoch": 28.73, - "learning_rate": 0.00035682018079648183, - "loss": 0.4417, - "step": 117750 - }, - { - "epoch": 28.74, - "learning_rate": 0.00035678964085023214, - "loss": 0.4441, - "step": 117775 - }, - { - "epoch": 28.75, - "learning_rate": 0.0003567591009039824, - "loss": 0.4552, - "step": 117800 - }, - { - "epoch": 28.75, - "learning_rate": 0.0003567285609577327, - "loss": 0.4226, - "step": 117825 - }, - { - "epoch": 28.76, - "learning_rate": 0.00035669802101148305, - "loss": 0.4139, - "step": 117850 - }, - { - "epoch": 28.76, - "learning_rate": 0.00035666748106523335, - "loss": 0.4315, - "step": 117875 - }, - { - "epoch": 28.77, - "learning_rate": 0.00035663694111898365, - "loss": 0.4402, - "step": 117900 - }, - { - "epoch": 28.78, - "learning_rate": 0.00035660640117273396, - "loss": 0.4528, - "step": 117925 - }, - { - "epoch": 28.78, - "learning_rate": 0.0003565758612264842, - "loss": 0.3793, - "step": 117950 - }, - { - "epoch": 28.79, - "learning_rate": 0.00035654532128023456, - "loss": 0.424, - "step": 117975 - }, - { - "epoch": 28.79, - "learning_rate": 0.00035651478133398487, - "loss": 0.4328, - "step": 118000 - }, - { - "epoch": 28.8, - "learning_rate": 0.00035648424138773517, - "loss": 0.4264, - "step": 118025 - }, - { - "epoch": 28.81, - "learning_rate": 0.00035645370144148547, - "loss": 0.4129, - "step": 118050 - }, - { - "epoch": 28.81, - "learning_rate": 0.0003564231614952358, - "loss": 0.4328, - "step": 118075 - }, - { - "epoch": 28.82, - "learning_rate": 0.00035639262154898613, - "loss": 0.3993, - "step": 118100 - }, - { - "epoch": 28.83, - "learning_rate": 0.0003563620816027364, - "loss": 0.4388, - "step": 118125 - }, - { - "epoch": 28.83, - "learning_rate": 0.0003563315416564867, - "loss": 0.4482, - "step": 118150 - }, - { - "epoch": 28.84, - "learning_rate": 0.000356301001710237, - "loss": 0.4477, - "step": 118175 - }, - { - "epoch": 28.84, - "learning_rate": 0.0003562704617639873, - "loss": 0.3916, - "step": 118200 - }, - { - "epoch": 28.85, - "learning_rate": 0.0003562399218177376, - "loss": 0.4721, - "step": 118225 - }, - { - "epoch": 28.86, - "learning_rate": 0.00035620938187148795, - "loss": 0.3895, - "step": 118250 - }, - { - "epoch": 28.86, - "learning_rate": 0.0003561788419252382, - "loss": 0.4329, - "step": 118275 - }, - { - "epoch": 28.87, - "learning_rate": 0.0003561483019789885, - "loss": 0.4063, - "step": 118300 - }, - { - "epoch": 28.87, - "learning_rate": 0.0003561177620327388, - "loss": 0.4025, - "step": 118325 - }, - { - "epoch": 28.88, - "learning_rate": 0.0003560872220864891, - "loss": 0.4194, - "step": 118350 - }, - { - "epoch": 28.89, - "learning_rate": 0.00035605668214023947, - "loss": 0.4511, - "step": 118375 - }, - { - "epoch": 28.89, - "learning_rate": 0.0003560261421939898, - "loss": 0.3908, - "step": 118400 - }, - { - "epoch": 28.9, - "learning_rate": 0.00035599560224774, - "loss": 0.449, - "step": 118425 - }, - { - "epoch": 28.9, - "learning_rate": 0.0003559650623014903, - "loss": 0.391, - "step": 118450 - }, - { - "epoch": 28.91, - "learning_rate": 0.00035593452235524063, - "loss": 0.4691, - "step": 118475 - }, - { - "epoch": 28.92, - "learning_rate": 0.000355903982408991, - "loss": 0.4369, - "step": 118500 - }, - { - "epoch": 28.92, - "learning_rate": 0.0003558734424627413, - "loss": 0.4306, - "step": 118525 - }, - { - "epoch": 28.93, - "learning_rate": 0.0003558429025164916, - "loss": 0.4192, - "step": 118550 - }, - { - "epoch": 28.93, - "learning_rate": 0.0003558123625702419, - "loss": 0.4288, - "step": 118575 - }, - { - "epoch": 28.94, - "learning_rate": 0.00035578182262399215, - "loss": 0.4263, - "step": 118600 - }, - { - "epoch": 28.95, - "learning_rate": 0.0003557512826777425, - "loss": 0.4425, - "step": 118625 - }, - { - "epoch": 28.95, - "learning_rate": 0.0003557207427314928, - "loss": 0.425, - "step": 118650 - }, - { - "epoch": 28.96, - "learning_rate": 0.0003556902027852431, - "loss": 0.4438, - "step": 118675 - }, - { - "epoch": 28.97, - "learning_rate": 0.0003556608844368434, - "loss": 0.4005, - "step": 118700 - }, - { - "epoch": 28.97, - "learning_rate": 0.0003556303444905937, - "loss": 0.4537, - "step": 118725 - }, - { - "epoch": 28.98, - "learning_rate": 0.00035559980454434397, - "loss": 0.4252, - "step": 118750 - }, - { - "epoch": 28.98, - "learning_rate": 0.00035556926459809427, - "loss": 0.4506, - "step": 118775 - }, - { - "epoch": 28.99, - "learning_rate": 0.00035553872465184463, - "loss": 0.403, - "step": 118800 - }, - { - "epoch": 29.0, - "learning_rate": 0.00035550818470559493, - "loss": 0.4524, - "step": 118825 - }, - { - "epoch": 29.0, - "learning_rate": 0.00035547886635719524, - "loss": 0.4421, - "step": 118850 - }, - { - "epoch": 29.01, - "learning_rate": 0.00035544832641094554, - "loss": 0.4191, - "step": 118875 - }, - { - "epoch": 29.01, - "learning_rate": 0.0003554177864646958, - "loss": 0.3572, - "step": 118900 - }, - { - "epoch": 29.02, - "learning_rate": 0.0003553872465184461, - "loss": 0.4421, - "step": 118925 - }, - { - "epoch": 29.03, - "learning_rate": 0.00035535670657219645, - "loss": 0.4118, - "step": 118950 - }, - { - "epoch": 29.03, - "learning_rate": 0.00035532616662594676, - "loss": 0.4155, - "step": 118975 - }, - { - "epoch": 29.04, - "learning_rate": 0.00035529562667969706, - "loss": 0.3973, - "step": 119000 - }, - { - "epoch": 29.04, - "learning_rate": 0.00035526508673344736, - "loss": 0.3976, - "step": 119025 - }, - { - "epoch": 29.05, - "learning_rate": 0.00035523454678719767, - "loss": 0.401, - "step": 119050 - }, - { - "epoch": 29.06, - "learning_rate": 0.00035520400684094797, - "loss": 0.4373, - "step": 119075 - }, - { - "epoch": 29.06, - "learning_rate": 0.0003551734668946983, - "loss": 0.4238, - "step": 119100 - }, - { - "epoch": 29.07, - "learning_rate": 0.0003551429269484486, - "loss": 0.4185, - "step": 119125 - }, - { - "epoch": 29.08, - "learning_rate": 0.0003551123870021989, - "loss": 0.4378, - "step": 119150 - }, - { - "epoch": 29.08, - "learning_rate": 0.0003550818470559492, - "loss": 0.4117, - "step": 119175 - }, - { - "epoch": 29.09, - "learning_rate": 0.00035505130710969954, - "loss": 0.3991, - "step": 119200 - }, - { - "epoch": 29.09, - "learning_rate": 0.0003550207671634498, - "loss": 0.4033, - "step": 119225 - }, - { - "epoch": 29.1, - "learning_rate": 0.0003549902272172001, - "loss": 0.4718, - "step": 119250 - }, - { - "epoch": 29.11, - "learning_rate": 0.0003549596872709504, - "loss": 0.4167, - "step": 119275 - }, - { - "epoch": 29.11, - "learning_rate": 0.0003549291473247007, - "loss": 0.3826, - "step": 119300 - }, - { - "epoch": 29.12, - "learning_rate": 0.00035489860737845106, - "loss": 0.396, - "step": 119325 - }, - { - "epoch": 29.12, - "learning_rate": 0.00035486806743220136, - "loss": 0.4078, - "step": 119350 - }, - { - "epoch": 29.13, - "learning_rate": 0.0003548375274859516, - "loss": 0.4355, - "step": 119375 - }, - { - "epoch": 29.14, - "learning_rate": 0.0003548069875397019, - "loss": 0.4185, - "step": 119400 - }, - { - "epoch": 29.14, - "learning_rate": 0.0003547764475934522, - "loss": 0.4028, - "step": 119425 - }, - { - "epoch": 29.15, - "learning_rate": 0.0003547459076472026, - "loss": 0.4133, - "step": 119450 - }, - { - "epoch": 29.15, - "learning_rate": 0.0003547153677009529, - "loss": 0.4119, - "step": 119475 - }, - { - "epoch": 29.16, - "learning_rate": 0.0003546848277547032, - "loss": 0.4123, - "step": 119500 - }, - { - "epoch": 29.17, - "learning_rate": 0.0003546542878084535, - "loss": 0.4062, - "step": 119525 - }, - { - "epoch": 29.17, - "learning_rate": 0.00035462374786220373, - "loss": 0.3728, - "step": 119550 - }, - { - "epoch": 29.18, - "learning_rate": 0.00035459320791595404, - "loss": 0.4246, - "step": 119575 - }, - { - "epoch": 29.18, - "learning_rate": 0.0003545626679697044, - "loss": 0.4404, - "step": 119600 - }, - { - "epoch": 29.19, - "learning_rate": 0.0003545321280234547, - "loss": 0.3943, - "step": 119625 - }, - { - "epoch": 29.2, - "learning_rate": 0.000354501588077205, - "loss": 0.3738, - "step": 119650 - }, - { - "epoch": 29.2, - "learning_rate": 0.0003544710481309553, - "loss": 0.4253, - "step": 119675 - }, - { - "epoch": 29.21, - "learning_rate": 0.00035444050818470555, - "loss": 0.395, - "step": 119700 - }, - { - "epoch": 29.22, - "learning_rate": 0.0003544099682384559, - "loss": 0.4025, - "step": 119725 - }, - { - "epoch": 29.22, - "learning_rate": 0.0003543794282922062, - "loss": 0.3931, - "step": 119750 - }, - { - "epoch": 29.23, - "learning_rate": 0.0003543488883459565, - "loss": 0.4414, - "step": 119775 - }, - { - "epoch": 29.23, - "learning_rate": 0.0003543183483997068, - "loss": 0.4295, - "step": 119800 - }, - { - "epoch": 29.24, - "learning_rate": 0.0003542878084534571, - "loss": 0.4193, - "step": 119825 - }, - { - "epoch": 29.25, - "learning_rate": 0.00035425726850720743, - "loss": 0.43, - "step": 119850 - }, - { - "epoch": 29.25, - "learning_rate": 0.00035422672856095773, - "loss": 0.4229, - "step": 119875 - }, - { - "epoch": 29.26, - "learning_rate": 0.00035419618861470803, - "loss": 0.4609, - "step": 119900 - }, - { - "epoch": 29.26, - "learning_rate": 0.00035416564866845834, - "loss": 0.4193, - "step": 119925 - }, - { - "epoch": 29.27, - "learning_rate": 0.00035413510872220864, - "loss": 0.3949, - "step": 119950 - }, - { - "epoch": 29.28, - "learning_rate": 0.000354104568775959, - "loss": 0.441, - "step": 119975 - }, - { - "epoch": 29.28, - "learning_rate": 0.0003540740288297093, - "loss": 0.4378, - "step": 120000 - }, - { - "epoch": 29.28, - "eval_cer": 0.10296397441557241, - "eval_loss": 0.4238515794277191, - "eval_runtime": 148.9169, - "eval_samples_per_second": 28.157, - "eval_steps_per_second": 7.044, - "eval_wer": 0.4160522022838499, - "step": 120000 - }, - { - "epoch": 29.29, - "learning_rate": 0.00035404348888345955, - "loss": 0.4231, - "step": 120025 - }, - { - "epoch": 29.29, - "learning_rate": 0.00035401294893720985, - "loss": 0.4101, - "step": 120050 - }, - { - "epoch": 29.3, - "learning_rate": 0.00035398240899096016, - "loss": 0.4088, - "step": 120075 - }, - { - "epoch": 29.31, - "learning_rate": 0.0003539518690447105, - "loss": 0.3619, - "step": 120100 - }, - { - "epoch": 29.31, - "learning_rate": 0.0003539213290984608, - "loss": 0.4457, - "step": 120125 - }, - { - "epoch": 29.32, - "learning_rate": 0.0003538907891522111, - "loss": 0.3938, - "step": 120150 - }, - { - "epoch": 29.33, - "learning_rate": 0.00035386024920596137, - "loss": 0.4105, - "step": 120175 - }, - { - "epoch": 29.33, - "learning_rate": 0.0003538297092597117, - "loss": 0.371, - "step": 120200 - }, - { - "epoch": 29.34, - "learning_rate": 0.00035379916931346203, - "loss": 0.4368, - "step": 120225 - }, - { - "epoch": 29.34, - "learning_rate": 0.00035376862936721234, - "loss": 0.3776, - "step": 120250 - }, - { - "epoch": 29.35, - "learning_rate": 0.00035373808942096264, - "loss": 0.43, - "step": 120275 - }, - { - "epoch": 29.36, - "learning_rate": 0.00035370754947471294, - "loss": 0.3932, - "step": 120300 - }, - { - "epoch": 29.36, - "learning_rate": 0.0003536770095284632, - "loss": 0.4435, - "step": 120325 - }, - { - "epoch": 29.37, - "learning_rate": 0.00035364646958221355, - "loss": 0.3809, - "step": 120350 - }, - { - "epoch": 29.37, - "learning_rate": 0.00035361592963596385, - "loss": 0.4235, - "step": 120375 - }, - { - "epoch": 29.38, - "learning_rate": 0.00035358538968971416, - "loss": 0.4317, - "step": 120400 - }, - { - "epoch": 29.39, - "learning_rate": 0.00035355484974346446, - "loss": 0.4346, - "step": 120425 - }, - { - "epoch": 29.39, - "learning_rate": 0.00035352430979721476, - "loss": 0.4661, - "step": 120450 - }, - { - "epoch": 29.4, - "learning_rate": 0.0003534937698509651, - "loss": 0.4154, - "step": 120475 - }, - { - "epoch": 29.4, - "learning_rate": 0.00035346322990471537, - "loss": 0.4087, - "step": 120500 - }, - { - "epoch": 29.41, - "learning_rate": 0.00035343268995846567, - "loss": 0.4124, - "step": 120525 - }, - { - "epoch": 29.42, - "learning_rate": 0.000353402150012216, - "loss": 0.3801, - "step": 120550 - }, - { - "epoch": 29.42, - "learning_rate": 0.0003533716100659663, - "loss": 0.4197, - "step": 120575 - }, - { - "epoch": 29.43, - "learning_rate": 0.00035334107011971664, - "loss": 0.4203, - "step": 120600 - }, - { - "epoch": 29.44, - "learning_rate": 0.00035331053017346694, - "loss": 0.4267, - "step": 120625 - }, - { - "epoch": 29.44, - "learning_rate": 0.0003532799902272172, - "loss": 0.4088, - "step": 120650 - }, - { - "epoch": 29.45, - "learning_rate": 0.0003532494502809675, - "loss": 0.4504, - "step": 120675 - }, - { - "epoch": 29.45, - "learning_rate": 0.0003532189103347178, - "loss": 0.3981, - "step": 120700 - }, - { - "epoch": 29.46, - "learning_rate": 0.00035318837038846815, - "loss": 0.4532, - "step": 120725 - }, - { - "epoch": 29.47, - "learning_rate": 0.00035315783044221846, - "loss": 0.4276, - "step": 120750 - }, - { - "epoch": 29.47, - "learning_rate": 0.00035312729049596876, - "loss": 0.4059, - "step": 120775 - }, - { - "epoch": 29.48, - "learning_rate": 0.000353096750549719, - "loss": 0.376, - "step": 120800 - }, - { - "epoch": 29.48, - "learning_rate": 0.0003530662106034693, - "loss": 0.3947, - "step": 120825 - }, - { - "epoch": 29.49, - "learning_rate": 0.0003530356706572196, - "loss": 0.4219, - "step": 120850 - }, - { - "epoch": 29.5, - "learning_rate": 0.00035300513071097, - "loss": 0.3965, - "step": 120875 - }, - { - "epoch": 29.5, - "learning_rate": 0.0003529745907647203, - "loss": 0.426, - "step": 120900 - }, - { - "epoch": 29.51, - "learning_rate": 0.0003529440508184706, - "loss": 0.3877, - "step": 120925 - }, - { - "epoch": 29.51, - "learning_rate": 0.0003529135108722209, - "loss": 0.4478, - "step": 120950 - }, - { - "epoch": 29.52, - "learning_rate": 0.00035288297092597113, - "loss": 0.3986, - "step": 120975 - }, - { - "epoch": 29.53, - "learning_rate": 0.0003528524309797215, - "loss": 0.3896, - "step": 121000 - }, - { - "epoch": 29.53, - "learning_rate": 0.0003528218910334718, - "loss": 0.4218, - "step": 121025 - }, - { - "epoch": 29.54, - "learning_rate": 0.0003527913510872221, - "loss": 0.4153, - "step": 121050 - }, - { - "epoch": 29.54, - "learning_rate": 0.0003527608111409724, - "loss": 0.4367, - "step": 121075 - }, - { - "epoch": 29.55, - "learning_rate": 0.0003527302711947227, - "loss": 0.3787, - "step": 121100 - }, - { - "epoch": 29.56, - "learning_rate": 0.000352699731248473, - "loss": 0.4276, - "step": 121125 - }, - { - "epoch": 29.56, - "learning_rate": 0.0003526691913022233, - "loss": 0.4234, - "step": 121150 - }, - { - "epoch": 29.57, - "learning_rate": 0.0003526386513559736, - "loss": 0.4023, - "step": 121175 - }, - { - "epoch": 29.58, - "learning_rate": 0.0003526081114097239, - "loss": 0.4466, - "step": 121200 - }, - { - "epoch": 29.58, - "learning_rate": 0.0003525775714634742, - "loss": 0.421, - "step": 121225 - }, - { - "epoch": 29.59, - "learning_rate": 0.0003525470315172246, - "loss": 0.3944, - "step": 121250 - }, - { - "epoch": 29.59, - "learning_rate": 0.00035251649157097483, - "loss": 0.4337, - "step": 121275 - }, - { - "epoch": 29.6, - "learning_rate": 0.00035248595162472513, - "loss": 0.4379, - "step": 121300 - }, - { - "epoch": 29.61, - "learning_rate": 0.00035245541167847543, - "loss": 0.4306, - "step": 121325 - }, - { - "epoch": 29.61, - "learning_rate": 0.00035242487173222574, - "loss": 0.4094, - "step": 121350 - }, - { - "epoch": 29.62, - "learning_rate": 0.0003523943317859761, - "loss": 0.4306, - "step": 121375 - }, - { - "epoch": 29.62, - "learning_rate": 0.0003523637918397264, - "loss": 0.4026, - "step": 121400 - }, - { - "epoch": 29.63, - "learning_rate": 0.00035233325189347665, - "loss": 0.3812, - "step": 121425 - }, - { - "epoch": 29.64, - "learning_rate": 0.00035230271194722695, - "loss": 0.4086, - "step": 121450 - }, - { - "epoch": 29.64, - "learning_rate": 0.00035227217200097725, - "loss": 0.4389, - "step": 121475 - }, - { - "epoch": 29.65, - "learning_rate": 0.0003522416320547276, - "loss": 0.436, - "step": 121500 - }, - { - "epoch": 29.65, - "learning_rate": 0.0003522110921084779, - "loss": 0.4004, - "step": 121525 - }, - { - "epoch": 29.66, - "learning_rate": 0.0003521805521622282, - "loss": 0.4273, - "step": 121550 - }, - { - "epoch": 29.67, - "learning_rate": 0.0003521500122159785, - "loss": 0.3943, - "step": 121575 - }, - { - "epoch": 29.67, - "learning_rate": 0.00035211947226972877, - "loss": 0.4429, - "step": 121600 - }, - { - "epoch": 29.68, - "learning_rate": 0.00035208893232347913, - "loss": 0.424, - "step": 121625 - }, - { - "epoch": 29.69, - "learning_rate": 0.00035205839237722943, - "loss": 0.3805, - "step": 121650 - }, - { - "epoch": 29.69, - "learning_rate": 0.00035202785243097974, - "loss": 0.439, - "step": 121675 - }, - { - "epoch": 29.7, - "learning_rate": 0.00035199731248473004, - "loss": 0.4186, - "step": 121700 - }, - { - "epoch": 29.7, - "learning_rate": 0.00035196677253848034, - "loss": 0.4109, - "step": 121725 - }, - { - "epoch": 29.71, - "learning_rate": 0.00035193623259223065, - "loss": 0.4328, - "step": 121750 - }, - { - "epoch": 29.72, - "learning_rate": 0.00035190569264598095, - "loss": 0.4071, - "step": 121775 - }, - { - "epoch": 29.72, - "learning_rate": 0.00035187515269973125, - "loss": 0.4389, - "step": 121800 - }, - { - "epoch": 29.73, - "learning_rate": 0.00035184461275348156, - "loss": 0.418, - "step": 121825 - }, - { - "epoch": 29.73, - "learning_rate": 0.00035181407280723186, - "loss": 0.4152, - "step": 121850 - }, - { - "epoch": 29.74, - "learning_rate": 0.0003517835328609822, - "loss": 0.4223, - "step": 121875 - }, - { - "epoch": 29.75, - "learning_rate": 0.00035175299291473247, - "loss": 0.3847, - "step": 121900 - }, - { - "epoch": 29.75, - "learning_rate": 0.00035172245296848277, - "loss": 0.4277, - "step": 121925 - }, - { - "epoch": 29.76, - "learning_rate": 0.00035169191302223307, - "loss": 0.4348, - "step": 121950 - }, - { - "epoch": 29.76, - "learning_rate": 0.0003516613730759834, - "loss": 0.4434, - "step": 121975 - }, - { - "epoch": 29.77, - "learning_rate": 0.00035163083312973373, - "loss": 0.3893, - "step": 122000 - }, - { - "epoch": 29.78, - "learning_rate": 0.00035160029318348404, - "loss": 0.4229, - "step": 122025 - }, - { - "epoch": 29.78, - "learning_rate": 0.00035156975323723434, - "loss": 0.4222, - "step": 122050 - }, - { - "epoch": 29.79, - "learning_rate": 0.0003515392132909846, - "loss": 0.4246, - "step": 122075 - }, - { - "epoch": 29.8, - "learning_rate": 0.0003515086733447349, - "loss": 0.4318, - "step": 122100 - }, - { - "epoch": 29.8, - "learning_rate": 0.00035147813339848525, - "loss": 0.4136, - "step": 122125 - }, - { - "epoch": 29.81, - "learning_rate": 0.00035144759345223555, - "loss": 0.438, - "step": 122150 - }, - { - "epoch": 29.81, - "learning_rate": 0.00035141705350598586, - "loss": 0.4111, - "step": 122175 - }, - { - "epoch": 29.82, - "learning_rate": 0.00035138651355973616, - "loss": 0.449, - "step": 122200 - }, - { - "epoch": 29.83, - "learning_rate": 0.0003513559736134864, - "loss": 0.4086, - "step": 122225 - }, - { - "epoch": 29.83, - "learning_rate": 0.0003513254336672367, - "loss": 0.4543, - "step": 122250 - }, - { - "epoch": 29.84, - "learning_rate": 0.00035129489372098707, - "loss": 0.4528, - "step": 122275 - }, - { - "epoch": 29.84, - "learning_rate": 0.00035126435377473737, - "loss": 0.4258, - "step": 122300 - }, - { - "epoch": 29.85, - "learning_rate": 0.0003512338138284877, - "loss": 0.4424, - "step": 122325 - }, - { - "epoch": 29.86, - "learning_rate": 0.000351203273882238, - "loss": 0.4306, - "step": 122350 - }, - { - "epoch": 29.86, - "learning_rate": 0.00035117273393598823, - "loss": 0.4086, - "step": 122375 - }, - { - "epoch": 29.87, - "learning_rate": 0.0003511421939897386, - "loss": 0.4361, - "step": 122400 - }, - { - "epoch": 29.87, - "learning_rate": 0.0003511116540434889, - "loss": 0.4252, - "step": 122425 - }, - { - "epoch": 29.88, - "learning_rate": 0.0003510811140972392, - "loss": 0.4612, - "step": 122450 - }, - { - "epoch": 29.89, - "learning_rate": 0.0003510505741509895, - "loss": 0.4051, - "step": 122475 - }, - { - "epoch": 29.89, - "learning_rate": 0.0003510200342047398, - "loss": 0.4299, - "step": 122500 - }, - { - "epoch": 29.9, - "learning_rate": 0.00035098949425849016, - "loss": 0.4407, - "step": 122525 - }, - { - "epoch": 29.9, - "learning_rate": 0.0003509589543122404, - "loss": 0.3986, - "step": 122550 - }, - { - "epoch": 29.91, - "learning_rate": 0.0003509284143659907, - "loss": 0.4274, - "step": 122575 - }, - { - "epoch": 29.92, - "learning_rate": 0.000350897874419741, - "loss": 0.4169, - "step": 122600 - }, - { - "epoch": 29.92, - "learning_rate": 0.0003508673344734913, - "loss": 0.4529, - "step": 122625 - }, - { - "epoch": 29.93, - "learning_rate": 0.0003508367945272417, - "loss": 0.3713, - "step": 122650 - }, - { - "epoch": 29.94, - "learning_rate": 0.000350806254580992, - "loss": 0.4434, - "step": 122675 - }, - { - "epoch": 29.94, - "learning_rate": 0.0003507757146347422, - "loss": 0.4097, - "step": 122700 - }, - { - "epoch": 29.95, - "learning_rate": 0.00035074517468849253, - "loss": 0.4375, - "step": 122725 - }, - { - "epoch": 29.95, - "learning_rate": 0.00035071463474224283, - "loss": 0.4445, - "step": 122750 - }, - { - "epoch": 29.96, - "learning_rate": 0.0003506840947959932, - "loss": 0.4342, - "step": 122775 - }, - { - "epoch": 29.97, - "learning_rate": 0.0003506535548497435, - "loss": 0.3904, - "step": 122800 - }, - { - "epoch": 29.97, - "learning_rate": 0.0003506230149034938, - "loss": 0.409, - "step": 122825 - }, - { - "epoch": 29.98, - "learning_rate": 0.00035059247495724405, - "loss": 0.4287, - "step": 122850 - }, - { - "epoch": 29.98, - "learning_rate": 0.00035056193501099435, - "loss": 0.4229, - "step": 122875 - }, - { - "epoch": 29.99, - "learning_rate": 0.0003505313950647447, - "loss": 0.3857, - "step": 122900 - }, - { - "epoch": 30.0, - "learning_rate": 0.000350500855118495, - "loss": 0.4666, - "step": 122925 - }, - { - "epoch": 30.0, - "learning_rate": 0.0003504703151722453, - "loss": 0.4071, - "step": 122950 - }, - { - "epoch": 30.01, - "learning_rate": 0.0003504397752259956, - "loss": 0.4184, - "step": 122975 - }, - { - "epoch": 30.01, - "learning_rate": 0.0003504104568775959, - "loss": 0.4062, - "step": 123000 - }, - { - "epoch": 30.01, - "eval_cer": 0.10116218186298163, - "eval_loss": 0.41296249628067017, - "eval_runtime": 148.9733, - "eval_samples_per_second": 28.146, - "eval_steps_per_second": 7.042, - "eval_wer": 0.41706362153344206, - "step": 123000 - }, - { - "epoch": 30.02, - "learning_rate": 0.0003503799169313462, - "loss": 0.4304, - "step": 123025 - }, - { - "epoch": 30.03, - "learning_rate": 0.0003503493769850965, - "loss": 0.4434, - "step": 123050 - }, - { - "epoch": 30.03, - "learning_rate": 0.00035031883703884683, - "loss": 0.408, - "step": 123075 - }, - { - "epoch": 30.04, - "learning_rate": 0.00035028951869044714, - "loss": 0.4147, - "step": 123100 - }, - { - "epoch": 30.05, - "learning_rate": 0.00035025897874419744, - "loss": 0.3929, - "step": 123125 - }, - { - "epoch": 30.05, - "learning_rate": 0.00035022843879794775, - "loss": 0.4164, - "step": 123150 - }, - { - "epoch": 30.06, - "learning_rate": 0.000350197898851698, - "loss": 0.4251, - "step": 123175 - }, - { - "epoch": 30.06, - "learning_rate": 0.0003501673589054483, - "loss": 0.3855, - "step": 123200 - }, - { - "epoch": 30.07, - "learning_rate": 0.00035013681895919866, - "loss": 0.4134, - "step": 123225 - }, - { - "epoch": 30.08, - "learning_rate": 0.00035010627901294896, - "loss": 0.4397, - "step": 123250 - }, - { - "epoch": 30.08, - "learning_rate": 0.00035007573906669926, - "loss": 0.4235, - "step": 123275 - }, - { - "epoch": 30.09, - "learning_rate": 0.00035004519912044957, - "loss": 0.3841, - "step": 123300 - }, - { - "epoch": 30.09, - "learning_rate": 0.0003500146591741998, - "loss": 0.402, - "step": 123325 - }, - { - "epoch": 30.1, - "learning_rate": 0.0003499841192279502, - "loss": 0.4278, - "step": 123350 - }, - { - "epoch": 30.11, - "learning_rate": 0.0003499535792817005, - "loss": 0.4193, - "step": 123375 - }, - { - "epoch": 30.11, - "learning_rate": 0.0003499230393354508, - "loss": 0.3789, - "step": 123400 - }, - { - "epoch": 30.12, - "learning_rate": 0.0003498924993892011, - "loss": 0.4279, - "step": 123425 - }, - { - "epoch": 30.12, - "learning_rate": 0.0003498619594429514, - "loss": 0.3855, - "step": 123450 - }, - { - "epoch": 30.13, - "learning_rate": 0.00034983141949670174, - "loss": 0.4093, - "step": 123475 - }, - { - "epoch": 30.14, - "learning_rate": 0.000349800879550452, - "loss": 0.3989, - "step": 123500 - }, - { - "epoch": 30.14, - "learning_rate": 0.0003497703396042023, - "loss": 0.412, - "step": 123525 - }, - { - "epoch": 30.15, - "learning_rate": 0.0003497397996579526, - "loss": 0.4134, - "step": 123550 - }, - { - "epoch": 30.15, - "learning_rate": 0.0003497092597117029, - "loss": 0.4041, - "step": 123575 - }, - { - "epoch": 30.16, - "learning_rate": 0.00034967871976545326, - "loss": 0.4094, - "step": 123600 - }, - { - "epoch": 30.17, - "learning_rate": 0.00034964817981920356, - "loss": 0.4239, - "step": 123625 - }, - { - "epoch": 30.17, - "learning_rate": 0.0003496176398729538, - "loss": 0.3698, - "step": 123650 - }, - { - "epoch": 30.18, - "learning_rate": 0.0003495870999267041, - "loss": 0.3939, - "step": 123675 - }, - { - "epoch": 30.19, - "learning_rate": 0.0003495565599804544, - "loss": 0.4228, - "step": 123700 - }, - { - "epoch": 30.19, - "learning_rate": 0.0003495260200342047, - "loss": 0.4043, - "step": 123725 - }, - { - "epoch": 30.2, - "learning_rate": 0.0003494954800879551, - "loss": 0.401, - "step": 123750 - }, - { - "epoch": 30.2, - "learning_rate": 0.0003494649401417054, - "loss": 0.3792, - "step": 123775 - }, - { - "epoch": 30.21, - "learning_rate": 0.00034943440019545563, - "loss": 0.3988, - "step": 123800 - }, - { - "epoch": 30.22, - "learning_rate": 0.00034940386024920594, - "loss": 0.432, - "step": 123825 - }, - { - "epoch": 30.22, - "learning_rate": 0.00034937332030295624, - "loss": 0.4485, - "step": 123850 - }, - { - "epoch": 30.23, - "learning_rate": 0.0003493427803567066, - "loss": 0.4091, - "step": 123875 - }, - { - "epoch": 30.23, - "learning_rate": 0.0003493122404104569, - "loss": 0.3819, - "step": 123900 - }, - { - "epoch": 30.24, - "learning_rate": 0.0003492817004642072, - "loss": 0.4148, - "step": 123925 - }, - { - "epoch": 30.25, - "learning_rate": 0.0003492511605179575, - "loss": 0.4096, - "step": 123950 - }, - { - "epoch": 30.25, - "learning_rate": 0.00034922062057170776, - "loss": 0.3938, - "step": 123975 - }, - { - "epoch": 30.26, - "learning_rate": 0.0003491900806254581, - "loss": 0.4216, - "step": 124000 - }, - { - "epoch": 30.26, - "learning_rate": 0.0003491595406792084, - "loss": 0.4014, - "step": 124025 - }, - { - "epoch": 30.27, - "learning_rate": 0.0003491290007329587, - "loss": 0.4154, - "step": 124050 - }, - { - "epoch": 30.28, - "learning_rate": 0.000349098460786709, - "loss": 0.426, - "step": 124075 - }, - { - "epoch": 30.28, - "learning_rate": 0.00034906792084045933, - "loss": 0.4188, - "step": 124100 - }, - { - "epoch": 30.29, - "learning_rate": 0.00034903738089420963, - "loss": 0.3845, - "step": 124125 - }, - { - "epoch": 30.3, - "learning_rate": 0.00034900684094795993, - "loss": 0.4222, - "step": 124150 - }, - { - "epoch": 30.3, - "learning_rate": 0.00034897630100171024, - "loss": 0.411, - "step": 124175 - }, - { - "epoch": 30.31, - "learning_rate": 0.00034894576105546054, - "loss": 0.4288, - "step": 124200 - }, - { - "epoch": 30.31, - "learning_rate": 0.00034891522110921085, - "loss": 0.4252, - "step": 124225 - }, - { - "epoch": 30.32, - "learning_rate": 0.0003488846811629612, - "loss": 0.4216, - "step": 124250 - }, - { - "epoch": 30.33, - "learning_rate": 0.00034885414121671145, - "loss": 0.4033, - "step": 124275 - }, - { - "epoch": 30.33, - "learning_rate": 0.00034882360127046176, - "loss": 0.4382, - "step": 124300 - }, - { - "epoch": 30.34, - "learning_rate": 0.00034879306132421206, - "loss": 0.4194, - "step": 124325 - }, - { - "epoch": 30.34, - "learning_rate": 0.00034876252137796236, - "loss": 0.3948, - "step": 124350 - }, - { - "epoch": 30.35, - "learning_rate": 0.0003487319814317127, - "loss": 0.4072, - "step": 124375 - }, - { - "epoch": 30.36, - "learning_rate": 0.000348701441485463, - "loss": 0.3921, - "step": 124400 - }, - { - "epoch": 30.36, - "learning_rate": 0.0003486709015392133, - "loss": 0.3927, - "step": 124425 - }, - { - "epoch": 30.37, - "learning_rate": 0.0003486403615929636, - "loss": 0.3803, - "step": 124450 - }, - { - "epoch": 30.37, - "learning_rate": 0.0003486098216467139, - "loss": 0.4021, - "step": 124475 - }, - { - "epoch": 30.38, - "learning_rate": 0.00034857928170046424, - "loss": 0.4273, - "step": 124500 - }, - { - "epoch": 30.39, - "learning_rate": 0.00034854874175421454, - "loss": 0.421, - "step": 124525 - }, - { - "epoch": 30.39, - "learning_rate": 0.00034851820180796484, - "loss": 0.4059, - "step": 124550 - }, - { - "epoch": 30.4, - "learning_rate": 0.00034848766186171515, - "loss": 0.4006, - "step": 124575 - }, - { - "epoch": 30.41, - "learning_rate": 0.0003484571219154654, - "loss": 0.4126, - "step": 124600 - }, - { - "epoch": 30.41, - "learning_rate": 0.00034842658196921575, - "loss": 0.4117, - "step": 124625 - }, - { - "epoch": 30.42, - "learning_rate": 0.00034839604202296606, - "loss": 0.4357, - "step": 124650 - }, - { - "epoch": 30.42, - "learning_rate": 0.00034836550207671636, - "loss": 0.3873, - "step": 124675 - }, - { - "epoch": 30.43, - "learning_rate": 0.00034833496213046666, - "loss": 0.383, - "step": 124700 - }, - { - "epoch": 30.44, - "learning_rate": 0.00034830442218421697, - "loss": 0.3809, - "step": 124725 - }, - { - "epoch": 30.44, - "learning_rate": 0.00034827388223796727, - "loss": 0.3976, - "step": 124750 - }, - { - "epoch": 30.45, - "learning_rate": 0.00034824334229171757, - "loss": 0.3906, - "step": 124775 - }, - { - "epoch": 30.45, - "learning_rate": 0.0003482128023454679, - "loss": 0.3888, - "step": 124800 - }, - { - "epoch": 30.46, - "learning_rate": 0.0003481822623992182, - "loss": 0.4004, - "step": 124825 - }, - { - "epoch": 30.47, - "learning_rate": 0.0003481517224529685, - "loss": 0.4036, - "step": 124850 - }, - { - "epoch": 30.47, - "learning_rate": 0.00034812118250671884, - "loss": 0.4037, - "step": 124875 - }, - { - "epoch": 30.48, - "learning_rate": 0.00034809064256046914, - "loss": 0.396, - "step": 124900 - }, - { - "epoch": 30.48, - "learning_rate": 0.0003480601026142194, - "loss": 0.4076, - "step": 124925 - }, - { - "epoch": 30.49, - "learning_rate": 0.0003480295626679697, - "loss": 0.4193, - "step": 124950 - }, - { - "epoch": 30.5, - "learning_rate": 0.00034799902272172, - "loss": 0.4146, - "step": 124975 - }, - { - "epoch": 30.5, - "learning_rate": 0.0003479684827754703, - "loss": 0.4226, - "step": 125000 - }, - { - "epoch": 30.51, - "learning_rate": 0.00034793794282922066, - "loss": 0.3734, - "step": 125025 - }, - { - "epoch": 30.51, - "learning_rate": 0.00034790740288297096, - "loss": 0.3793, - "step": 125050 - }, - { - "epoch": 30.52, - "learning_rate": 0.0003478768629367212, - "loss": 0.4013, - "step": 125075 - }, - { - "epoch": 30.53, - "learning_rate": 0.0003478463229904715, - "loss": 0.4157, - "step": 125100 - }, - { - "epoch": 30.53, - "learning_rate": 0.0003478157830442218, - "loss": 0.4507, - "step": 125125 - }, - { - "epoch": 30.54, - "learning_rate": 0.0003477852430979722, - "loss": 0.4108, - "step": 125150 - }, - { - "epoch": 30.55, - "learning_rate": 0.0003477547031517225, - "loss": 0.4143, - "step": 125175 - }, - { - "epoch": 30.55, - "learning_rate": 0.0003477241632054728, - "loss": 0.4348, - "step": 125200 - }, - { - "epoch": 30.56, - "learning_rate": 0.00034769362325922303, - "loss": 0.4, - "step": 125225 - }, - { - "epoch": 30.56, - "learning_rate": 0.00034766308331297334, - "loss": 0.4353, - "step": 125250 - }, - { - "epoch": 30.57, - "learning_rate": 0.0003476325433667237, - "loss": 0.4229, - "step": 125275 - }, - { - "epoch": 30.58, - "learning_rate": 0.000347602003420474, - "loss": 0.3911, - "step": 125300 - }, - { - "epoch": 30.58, - "learning_rate": 0.0003475714634742243, - "loss": 0.3888, - "step": 125325 - }, - { - "epoch": 30.59, - "learning_rate": 0.0003475409235279746, - "loss": 0.4081, - "step": 125350 - }, - { - "epoch": 30.59, - "learning_rate": 0.00034751038358172485, - "loss": 0.3961, - "step": 125375 - }, - { - "epoch": 30.6, - "learning_rate": 0.0003474798436354752, - "loss": 0.3993, - "step": 125400 - }, - { - "epoch": 30.61, - "learning_rate": 0.0003474493036892255, - "loss": 0.3694, - "step": 125425 - }, - { - "epoch": 30.61, - "learning_rate": 0.0003474187637429758, - "loss": 0.4185, - "step": 125450 - }, - { - "epoch": 30.62, - "learning_rate": 0.0003473882237967261, - "loss": 0.3864, - "step": 125475 - }, - { - "epoch": 30.62, - "learning_rate": 0.0003473576838504764, - "loss": 0.408, - "step": 125500 - }, - { - "epoch": 30.63, - "learning_rate": 0.0003473271439042268, - "loss": 0.4256, - "step": 125525 - }, - { - "epoch": 30.64, - "learning_rate": 0.00034729660395797703, - "loss": 0.4471, - "step": 125550 - }, - { - "epoch": 30.64, - "learning_rate": 0.00034726606401172733, - "loss": 0.422, - "step": 125575 - }, - { - "epoch": 30.65, - "learning_rate": 0.00034723552406547764, - "loss": 0.4016, - "step": 125600 - }, - { - "epoch": 30.66, - "learning_rate": 0.00034720498411922794, - "loss": 0.3924, - "step": 125625 - }, - { - "epoch": 30.66, - "learning_rate": 0.0003471744441729783, - "loss": 0.3669, - "step": 125650 - }, - { - "epoch": 30.67, - "learning_rate": 0.0003471439042267286, - "loss": 0.4027, - "step": 125675 - }, - { - "epoch": 30.67, - "learning_rate": 0.00034711336428047885, - "loss": 0.4206, - "step": 125700 - }, - { - "epoch": 30.68, - "learning_rate": 0.00034708282433422915, - "loss": 0.4272, - "step": 125725 - }, - { - "epoch": 30.69, - "learning_rate": 0.00034705228438797946, - "loss": 0.3985, - "step": 125750 - }, - { - "epoch": 30.69, - "learning_rate": 0.0003470217444417298, - "loss": 0.4368, - "step": 125775 - }, - { - "epoch": 30.7, - "learning_rate": 0.0003469912044954801, - "loss": 0.4344, - "step": 125800 - }, - { - "epoch": 30.7, - "learning_rate": 0.0003469606645492304, - "loss": 0.399, - "step": 125825 - }, - { - "epoch": 30.71, - "learning_rate": 0.00034693012460298067, - "loss": 0.3887, - "step": 125850 - }, - { - "epoch": 30.72, - "learning_rate": 0.000346899584656731, - "loss": 0.4529, - "step": 125875 - }, - { - "epoch": 30.72, - "learning_rate": 0.00034686904471048133, - "loss": 0.4415, - "step": 125900 - }, - { - "epoch": 30.73, - "learning_rate": 0.00034683850476423164, - "loss": 0.4205, - "step": 125925 - }, - { - "epoch": 30.73, - "learning_rate": 0.00034680796481798194, - "loss": 0.4042, - "step": 125950 - }, - { - "epoch": 30.74, - "learning_rate": 0.00034677742487173224, - "loss": 0.4339, - "step": 125975 - }, - { - "epoch": 30.75, - "learning_rate": 0.00034674688492548255, - "loss": 0.3903, - "step": 126000 - }, - { - "epoch": 30.75, - "eval_cer": 0.10059751753026087, - "eval_loss": 0.41336575150489807, - "eval_runtime": 149.0037, - "eval_samples_per_second": 28.14, - "eval_steps_per_second": 7.04, - "eval_wer": 0.4123654159869494, - "step": 126000 - }, - { - "epoch": 30.75, - "learning_rate": 0.00034671634497923285, - "loss": 0.4048, - "step": 126025 - }, - { - "epoch": 30.76, - "learning_rate": 0.00034668580503298315, - "loss": 0.4314, - "step": 126050 - }, - { - "epoch": 30.77, - "learning_rate": 0.00034665526508673346, - "loss": 0.4407, - "step": 126075 - }, - { - "epoch": 30.77, - "learning_rate": 0.00034662472514048376, - "loss": 0.4225, - "step": 126100 - }, - { - "epoch": 30.78, - "learning_rate": 0.00034659418519423406, - "loss": 0.4267, - "step": 126125 - }, - { - "epoch": 30.78, - "learning_rate": 0.0003465636452479844, - "loss": 0.3801, - "step": 126150 - }, - { - "epoch": 30.79, - "learning_rate": 0.00034653310530173467, - "loss": 0.4037, - "step": 126175 - }, - { - "epoch": 30.8, - "learning_rate": 0.00034650256535548497, - "loss": 0.4098, - "step": 126200 - }, - { - "epoch": 30.8, - "learning_rate": 0.0003464720254092353, - "loss": 0.3993, - "step": 126225 - }, - { - "epoch": 30.81, - "learning_rate": 0.0003464414854629856, - "loss": 0.4666, - "step": 126250 - }, - { - "epoch": 30.81, - "learning_rate": 0.00034641094551673594, - "loss": 0.4039, - "step": 126275 - }, - { - "epoch": 30.82, - "learning_rate": 0.00034638040557048624, - "loss": 0.4366, - "step": 126300 - }, - { - "epoch": 30.83, - "learning_rate": 0.0003463498656242365, - "loss": 0.3941, - "step": 126325 - }, - { - "epoch": 30.83, - "learning_rate": 0.0003463193256779868, - "loss": 0.3714, - "step": 126350 - }, - { - "epoch": 30.84, - "learning_rate": 0.0003462887857317371, - "loss": 0.437, - "step": 126375 - }, - { - "epoch": 30.84, - "learning_rate": 0.0003462582457854874, - "loss": 0.4148, - "step": 126400 - }, - { - "epoch": 30.85, - "learning_rate": 0.00034622770583923776, - "loss": 0.4434, - "step": 126425 - }, - { - "epoch": 30.86, - "learning_rate": 0.00034619716589298806, - "loss": 0.4539, - "step": 126450 - }, - { - "epoch": 30.86, - "learning_rate": 0.00034616662594673836, - "loss": 0.4064, - "step": 126475 - }, - { - "epoch": 30.87, - "learning_rate": 0.0003461360860004886, - "loss": 0.4261, - "step": 126500 - }, - { - "epoch": 30.87, - "learning_rate": 0.0003461055460542389, - "loss": 0.4017, - "step": 126525 - }, - { - "epoch": 30.88, - "learning_rate": 0.0003460750061079893, - "loss": 0.4168, - "step": 126550 - }, - { - "epoch": 30.89, - "learning_rate": 0.0003460444661617396, - "loss": 0.4056, - "step": 126575 - }, - { - "epoch": 30.89, - "learning_rate": 0.0003460139262154899, - "loss": 0.3872, - "step": 126600 - }, - { - "epoch": 30.9, - "learning_rate": 0.0003459833862692402, - "loss": 0.4327, - "step": 126625 - }, - { - "epoch": 30.91, - "learning_rate": 0.00034595284632299043, - "loss": 0.4261, - "step": 126650 - }, - { - "epoch": 30.91, - "learning_rate": 0.0003459223063767408, - "loss": 0.3929, - "step": 126675 - }, - { - "epoch": 30.92, - "learning_rate": 0.0003458917664304911, - "loss": 0.3899, - "step": 126700 - }, - { - "epoch": 30.92, - "learning_rate": 0.0003458612264842414, - "loss": 0.4076, - "step": 126725 - }, - { - "epoch": 30.93, - "learning_rate": 0.0003458306865379917, - "loss": 0.3944, - "step": 126750 - }, - { - "epoch": 30.94, - "learning_rate": 0.000345800146591742, - "loss": 0.4055, - "step": 126775 - }, - { - "epoch": 30.94, - "learning_rate": 0.0003457696066454923, - "loss": 0.4143, - "step": 126800 - }, - { - "epoch": 30.95, - "learning_rate": 0.0003457390666992426, - "loss": 0.4015, - "step": 126825 - }, - { - "epoch": 30.95, - "learning_rate": 0.0003457085267529929, - "loss": 0.4083, - "step": 126850 - }, - { - "epoch": 30.96, - "learning_rate": 0.0003456779868067432, - "loss": 0.4116, - "step": 126875 - }, - { - "epoch": 30.97, - "learning_rate": 0.0003456474468604935, - "loss": 0.4026, - "step": 126900 - }, - { - "epoch": 30.97, - "learning_rate": 0.0003456169069142439, - "loss": 0.3899, - "step": 126925 - }, - { - "epoch": 30.98, - "learning_rate": 0.0003455863669679942, - "loss": 0.427, - "step": 126950 - }, - { - "epoch": 30.98, - "learning_rate": 0.00034555582702174443, - "loss": 0.4051, - "step": 126975 - }, - { - "epoch": 30.99, - "learning_rate": 0.00034552528707549473, - "loss": 0.444, - "step": 127000 - }, - { - "epoch": 31.0, - "learning_rate": 0.00034549474712924504, - "loss": 0.3934, - "step": 127025 - }, - { - "epoch": 31.0, - "learning_rate": 0.0003454642071829954, - "loss": 0.394, - "step": 127050 - }, - { - "epoch": 31.01, - "learning_rate": 0.0003454336672367457, - "loss": 0.3947, - "step": 127075 - }, - { - "epoch": 31.02, - "learning_rate": 0.000345403127290496, - "loss": 0.4078, - "step": 127100 - }, - { - "epoch": 31.02, - "learning_rate": 0.00034537258734424625, - "loss": 0.4122, - "step": 127125 - }, - { - "epoch": 31.03, - "learning_rate": 0.00034534204739799655, - "loss": 0.424, - "step": 127150 - }, - { - "epoch": 31.03, - "learning_rate": 0.0003453115074517469, - "loss": 0.3971, - "step": 127175 - }, - { - "epoch": 31.04, - "learning_rate": 0.0003452809675054972, - "loss": 0.3677, - "step": 127200 - }, - { - "epoch": 31.05, - "learning_rate": 0.0003452504275592475, - "loss": 0.3823, - "step": 127225 - }, - { - "epoch": 31.05, - "learning_rate": 0.0003452198876129978, - "loss": 0.389, - "step": 127250 - }, - { - "epoch": 31.06, - "learning_rate": 0.00034518934766674807, - "loss": 0.4075, - "step": 127275 - }, - { - "epoch": 31.06, - "learning_rate": 0.00034515880772049843, - "loss": 0.4156, - "step": 127300 - }, - { - "epoch": 31.07, - "learning_rate": 0.00034512826777424873, - "loss": 0.402, - "step": 127325 - }, - { - "epoch": 31.08, - "learning_rate": 0.00034509772782799903, - "loss": 0.4084, - "step": 127350 - }, - { - "epoch": 31.08, - "learning_rate": 0.00034506718788174934, - "loss": 0.3867, - "step": 127375 - }, - { - "epoch": 31.09, - "learning_rate": 0.00034503664793549964, - "loss": 0.4277, - "step": 127400 - }, - { - "epoch": 31.09, - "learning_rate": 0.00034500610798925, - "loss": 0.372, - "step": 127425 - }, - { - "epoch": 31.1, - "learning_rate": 0.00034497556804300025, - "loss": 0.4244, - "step": 127450 - }, - { - "epoch": 31.11, - "learning_rate": 0.00034494502809675055, - "loss": 0.3852, - "step": 127475 - }, - { - "epoch": 31.11, - "learning_rate": 0.00034491448815050085, - "loss": 0.4092, - "step": 127500 - }, - { - "epoch": 31.12, - "learning_rate": 0.00034488394820425116, - "loss": 0.3903, - "step": 127525 - }, - { - "epoch": 31.12, - "learning_rate": 0.0003448534082580015, - "loss": 0.4273, - "step": 127550 - }, - { - "epoch": 31.13, - "learning_rate": 0.0003448228683117518, - "loss": 0.3588, - "step": 127575 - }, - { - "epoch": 31.14, - "learning_rate": 0.00034479232836550207, - "loss": 0.416, - "step": 127600 - }, - { - "epoch": 31.14, - "learning_rate": 0.00034476178841925237, - "loss": 0.4172, - "step": 127625 - }, - { - "epoch": 31.15, - "learning_rate": 0.0003447312484730027, - "loss": 0.424, - "step": 127650 - }, - { - "epoch": 31.16, - "learning_rate": 0.000344700708526753, - "loss": 0.3827, - "step": 127675 - }, - { - "epoch": 31.16, - "learning_rate": 0.00034467016858050334, - "loss": 0.4112, - "step": 127700 - }, - { - "epoch": 31.17, - "learning_rate": 0.00034463962863425364, - "loss": 0.3899, - "step": 127725 - }, - { - "epoch": 31.17, - "learning_rate": 0.0003446090886880039, - "loss": 0.4096, - "step": 127750 - }, - { - "epoch": 31.18, - "learning_rate": 0.0003445785487417542, - "loss": 0.3704, - "step": 127775 - }, - { - "epoch": 31.19, - "learning_rate": 0.0003445480087955045, - "loss": 0.3892, - "step": 127800 - }, - { - "epoch": 31.19, - "learning_rate": 0.00034451746884925485, - "loss": 0.4285, - "step": 127825 - }, - { - "epoch": 31.2, - "learning_rate": 0.00034448692890300516, - "loss": 0.3989, - "step": 127850 - }, - { - "epoch": 31.2, - "learning_rate": 0.00034445638895675546, - "loss": 0.3909, - "step": 127875 - }, - { - "epoch": 31.21, - "learning_rate": 0.00034442584901050576, - "loss": 0.3992, - "step": 127900 - }, - { - "epoch": 31.22, - "learning_rate": 0.000344395309064256, - "loss": 0.4138, - "step": 127925 - }, - { - "epoch": 31.22, - "learning_rate": 0.00034436476911800637, - "loss": 0.396, - "step": 127950 - }, - { - "epoch": 31.23, - "learning_rate": 0.00034433422917175667, - "loss": 0.3903, - "step": 127975 - }, - { - "epoch": 31.23, - "learning_rate": 0.000344303689225507, - "loss": 0.424, - "step": 128000 - }, - { - "epoch": 31.24, - "learning_rate": 0.0003442731492792573, - "loss": 0.415, - "step": 128025 - }, - { - "epoch": 31.25, - "learning_rate": 0.0003442426093330076, - "loss": 0.3974, - "step": 128050 - }, - { - "epoch": 31.25, - "learning_rate": 0.0003442120693867579, - "loss": 0.3778, - "step": 128075 - }, - { - "epoch": 31.26, - "learning_rate": 0.0003441815294405082, - "loss": 0.3974, - "step": 128100 - }, - { - "epoch": 31.27, - "learning_rate": 0.0003441509894942585, - "loss": 0.3574, - "step": 128125 - }, - { - "epoch": 31.27, - "learning_rate": 0.0003441204495480088, - "loss": 0.3975, - "step": 128150 - }, - { - "epoch": 31.28, - "learning_rate": 0.0003440899096017591, - "loss": 0.4121, - "step": 128175 - }, - { - "epoch": 31.28, - "learning_rate": 0.00034405936965550946, - "loss": 0.3711, - "step": 128200 - }, - { - "epoch": 31.29, - "learning_rate": 0.0003440288297092597, - "loss": 0.3926, - "step": 128225 - }, - { - "epoch": 31.3, - "learning_rate": 0.00034399828976301, - "loss": 0.3966, - "step": 128250 - }, - { - "epoch": 31.3, - "learning_rate": 0.0003439677498167603, - "loss": 0.3844, - "step": 128275 - }, - { - "epoch": 31.31, - "learning_rate": 0.0003439372098705106, - "loss": 0.4343, - "step": 128300 - }, - { - "epoch": 31.31, - "learning_rate": 0.000343906669924261, - "loss": 0.3874, - "step": 128325 - }, - { - "epoch": 31.32, - "learning_rate": 0.0003438761299780113, - "loss": 0.4114, - "step": 128350 - }, - { - "epoch": 31.33, - "learning_rate": 0.0003438455900317615, - "loss": 0.3896, - "step": 128375 - }, - { - "epoch": 31.33, - "learning_rate": 0.00034381505008551183, - "loss": 0.4045, - "step": 128400 - }, - { - "epoch": 31.34, - "learning_rate": 0.00034378451013926213, - "loss": 0.3992, - "step": 128425 - }, - { - "epoch": 31.34, - "learning_rate": 0.0003437539701930125, - "loss": 0.3824, - "step": 128450 - }, - { - "epoch": 31.35, - "learning_rate": 0.0003437234302467628, - "loss": 0.3524, - "step": 128475 - }, - { - "epoch": 31.36, - "learning_rate": 0.0003436928903005131, - "loss": 0.4461, - "step": 128500 - }, - { - "epoch": 31.36, - "learning_rate": 0.0003436623503542634, - "loss": 0.394, - "step": 128525 - }, - { - "epoch": 31.37, - "learning_rate": 0.00034363181040801365, - "loss": 0.4214, - "step": 128550 - }, - { - "epoch": 31.38, - "learning_rate": 0.000343601270461764, - "loss": 0.392, - "step": 128575 - }, - { - "epoch": 31.38, - "learning_rate": 0.0003435707305155143, - "loss": 0.4457, - "step": 128600 - }, - { - "epoch": 31.39, - "learning_rate": 0.0003435401905692646, - "loss": 0.3787, - "step": 128625 - }, - { - "epoch": 31.39, - "learning_rate": 0.0003435096506230149, - "loss": 0.3963, - "step": 128650 - }, - { - "epoch": 31.4, - "learning_rate": 0.0003434791106767652, - "loss": 0.4293, - "step": 128675 - }, - { - "epoch": 31.41, - "learning_rate": 0.00034344979232836547, - "loss": 0.4412, - "step": 128700 - }, - { - "epoch": 31.41, - "learning_rate": 0.0003434192523821158, - "loss": 0.4166, - "step": 128725 - }, - { - "epoch": 31.42, - "learning_rate": 0.00034338871243586613, - "loss": 0.3929, - "step": 128750 - }, - { - "epoch": 31.42, - "learning_rate": 0.00034335817248961644, - "loss": 0.3735, - "step": 128775 - }, - { - "epoch": 31.43, - "learning_rate": 0.00034332763254336674, - "loss": 0.3691, - "step": 128800 - }, - { - "epoch": 31.44, - "learning_rate": 0.00034329709259711704, - "loss": 0.4261, - "step": 128825 - }, - { - "epoch": 31.44, - "learning_rate": 0.0003432665526508673, - "loss": 0.398, - "step": 128850 - }, - { - "epoch": 31.45, - "learning_rate": 0.00034323601270461765, - "loss": 0.4245, - "step": 128875 - }, - { - "epoch": 31.45, - "learning_rate": 0.00034320547275836795, - "loss": 0.3894, - "step": 128900 - }, - { - "epoch": 31.46, - "learning_rate": 0.00034317493281211826, - "loss": 0.3963, - "step": 128925 - }, - { - "epoch": 31.47, - "learning_rate": 0.00034314439286586856, - "loss": 0.4036, - "step": 128950 - }, - { - "epoch": 31.47, - "learning_rate": 0.00034311385291961886, - "loss": 0.3902, - "step": 128975 - }, - { - "epoch": 31.48, - "learning_rate": 0.0003430833129733692, - "loss": 0.369, - "step": 129000 - }, - { - "epoch": 31.48, - "eval_cer": 0.09760479656684086, - "eval_loss": 0.41631850600242615, - "eval_runtime": 148.2037, - "eval_samples_per_second": 28.292, - "eval_steps_per_second": 7.078, - "eval_wer": 0.400652528548124, - "step": 129000 - }, - { - "epoch": 31.48, - "learning_rate": 0.00034305277302711947, - "loss": 0.3934, - "step": 129025 - }, - { - "epoch": 31.49, - "learning_rate": 0.0003430222330808698, - "loss": 0.4278, - "step": 129050 - }, - { - "epoch": 31.5, - "learning_rate": 0.0003429916931346201, - "loss": 0.3735, - "step": 129075 - }, - { - "epoch": 31.5, - "learning_rate": 0.0003429611531883704, - "loss": 0.4241, - "step": 129100 - }, - { - "epoch": 31.51, - "learning_rate": 0.00034293061324212074, - "loss": 0.3702, - "step": 129125 - }, - { - "epoch": 31.52, - "learning_rate": 0.00034290007329587104, - "loss": 0.4194, - "step": 129150 - }, - { - "epoch": 31.52, - "learning_rate": 0.0003428695333496213, - "loss": 0.3937, - "step": 129175 - }, - { - "epoch": 31.53, - "learning_rate": 0.0003428389934033716, - "loss": 0.4219, - "step": 129200 - }, - { - "epoch": 31.53, - "learning_rate": 0.0003428084534571219, - "loss": 0.407, - "step": 129225 - }, - { - "epoch": 31.54, - "learning_rate": 0.00034277791351087225, - "loss": 0.4078, - "step": 129250 - }, - { - "epoch": 31.55, - "learning_rate": 0.00034274737356462256, - "loss": 0.383, - "step": 129275 - }, - { - "epoch": 31.55, - "learning_rate": 0.00034271683361837286, - "loss": 0.3647, - "step": 129300 - }, - { - "epoch": 31.56, - "learning_rate": 0.0003426862936721231, - "loss": 0.4133, - "step": 129325 - }, - { - "epoch": 31.56, - "learning_rate": 0.0003426557537258734, - "loss": 0.4432, - "step": 129350 - }, - { - "epoch": 31.57, - "learning_rate": 0.00034262521377962377, - "loss": 0.3944, - "step": 129375 - }, - { - "epoch": 31.58, - "learning_rate": 0.0003425946738333741, - "loss": 0.4371, - "step": 129400 - }, - { - "epoch": 31.58, - "learning_rate": 0.0003425641338871244, - "loss": 0.3852, - "step": 129425 - }, - { - "epoch": 31.59, - "learning_rate": 0.0003425335939408747, - "loss": 0.4615, - "step": 129450 - }, - { - "epoch": 31.59, - "learning_rate": 0.000342503053994625, - "loss": 0.3881, - "step": 129475 - }, - { - "epoch": 31.6, - "learning_rate": 0.0003424725140483753, - "loss": 0.3749, - "step": 129500 - }, - { - "epoch": 31.61, - "learning_rate": 0.0003424419741021256, - "loss": 0.3825, - "step": 129525 - }, - { - "epoch": 31.61, - "learning_rate": 0.0003424114341558759, - "loss": 0.3886, - "step": 129550 - }, - { - "epoch": 31.62, - "learning_rate": 0.0003423808942096262, - "loss": 0.3683, - "step": 129575 - }, - { - "epoch": 31.63, - "learning_rate": 0.0003423503542633765, - "loss": 0.3867, - "step": 129600 - }, - { - "epoch": 31.63, - "learning_rate": 0.00034231981431712686, - "loss": 0.347, - "step": 129625 - }, - { - "epoch": 31.64, - "learning_rate": 0.0003422892743708771, - "loss": 0.4264, - "step": 129650 - }, - { - "epoch": 31.64, - "learning_rate": 0.0003422587344246274, - "loss": 0.3993, - "step": 129675 - }, - { - "epoch": 31.65, - "learning_rate": 0.0003422281944783777, - "loss": 0.402, - "step": 129700 - }, - { - "epoch": 31.66, - "learning_rate": 0.000342197654532128, - "loss": 0.3996, - "step": 129725 - }, - { - "epoch": 31.66, - "learning_rate": 0.0003421671145858783, - "loss": 0.3943, - "step": 129750 - }, - { - "epoch": 31.67, - "learning_rate": 0.0003421365746396287, - "loss": 0.3863, - "step": 129775 - }, - { - "epoch": 31.67, - "learning_rate": 0.00034210603469337893, - "loss": 0.3994, - "step": 129800 - }, - { - "epoch": 31.68, - "learning_rate": 0.00034207549474712923, - "loss": 0.4143, - "step": 129825 - }, - { - "epoch": 31.69, - "learning_rate": 0.00034204495480087953, - "loss": 0.3848, - "step": 129850 - }, - { - "epoch": 31.69, - "learning_rate": 0.00034201441485462984, - "loss": 0.3981, - "step": 129875 - }, - { - "epoch": 31.7, - "learning_rate": 0.0003419838749083802, - "loss": 0.421, - "step": 129900 - }, - { - "epoch": 31.7, - "learning_rate": 0.0003419533349621305, - "loss": 0.4067, - "step": 129925 - }, - { - "epoch": 31.71, - "learning_rate": 0.0003419227950158808, - "loss": 0.4321, - "step": 129950 - }, - { - "epoch": 31.72, - "learning_rate": 0.00034189225506963105, - "loss": 0.4127, - "step": 129975 - }, - { - "epoch": 31.72, - "learning_rate": 0.00034186171512338135, - "loss": 0.3806, - "step": 130000 - }, - { - "epoch": 31.73, - "learning_rate": 0.0003418311751771317, - "loss": 0.3789, - "step": 130025 - }, - { - "epoch": 31.73, - "learning_rate": 0.000341800635230882, - "loss": 0.4416, - "step": 130050 - }, - { - "epoch": 31.74, - "learning_rate": 0.0003417700952846323, - "loss": 0.407, - "step": 130075 - }, - { - "epoch": 31.75, - "learning_rate": 0.0003417395553383826, - "loss": 0.3916, - "step": 130100 - }, - { - "epoch": 31.75, - "learning_rate": 0.00034170901539213287, - "loss": 0.3883, - "step": 130125 - }, - { - "epoch": 31.76, - "learning_rate": 0.00034167847544588323, - "loss": 0.4128, - "step": 130150 - }, - { - "epoch": 31.77, - "learning_rate": 0.00034164793549963353, - "loss": 0.354, - "step": 130175 - }, - { - "epoch": 31.77, - "learning_rate": 0.00034161739555338384, - "loss": 0.4558, - "step": 130200 - }, - { - "epoch": 31.78, - "learning_rate": 0.00034158685560713414, - "loss": 0.3599, - "step": 130225 - }, - { - "epoch": 31.78, - "learning_rate": 0.00034155631566088444, - "loss": 0.429, - "step": 130250 - }, - { - "epoch": 31.79, - "learning_rate": 0.00034152577571463475, - "loss": 0.4128, - "step": 130275 - }, - { - "epoch": 31.8, - "learning_rate": 0.00034149523576838505, - "loss": 0.3966, - "step": 130300 - }, - { - "epoch": 31.8, - "learning_rate": 0.00034146469582213535, - "loss": 0.4003, - "step": 130325 - }, - { - "epoch": 31.81, - "learning_rate": 0.00034143415587588566, - "loss": 0.4447, - "step": 130350 - }, - { - "epoch": 31.81, - "learning_rate": 0.00034140361592963596, - "loss": 0.415, - "step": 130375 - }, - { - "epoch": 31.82, - "learning_rate": 0.0003413730759833863, - "loss": 0.4079, - "step": 130400 - }, - { - "epoch": 31.83, - "learning_rate": 0.0003413425360371366, - "loss": 0.4208, - "step": 130425 - }, - { - "epoch": 31.83, - "learning_rate": 0.00034131199609088687, - "loss": 0.4153, - "step": 130450 - }, - { - "epoch": 31.84, - "learning_rate": 0.00034128145614463717, - "loss": 0.3969, - "step": 130475 - }, - { - "epoch": 31.84, - "learning_rate": 0.0003412509161983875, - "loss": 0.4011, - "step": 130500 - }, - { - "epoch": 31.85, - "learning_rate": 0.00034122037625213783, - "loss": 0.3993, - "step": 130525 - }, - { - "epoch": 31.86, - "learning_rate": 0.00034118983630588814, - "loss": 0.444, - "step": 130550 - }, - { - "epoch": 31.86, - "learning_rate": 0.00034115929635963844, - "loss": 0.3871, - "step": 130575 - }, - { - "epoch": 31.87, - "learning_rate": 0.0003411287564133887, - "loss": 0.4001, - "step": 130600 - }, - { - "epoch": 31.88, - "learning_rate": 0.000341098216467139, - "loss": 0.4194, - "step": 130625 - }, - { - "epoch": 31.88, - "learning_rate": 0.00034106767652088935, - "loss": 0.4222, - "step": 130650 - }, - { - "epoch": 31.89, - "learning_rate": 0.00034103713657463965, - "loss": 0.3895, - "step": 130675 - }, - { - "epoch": 31.89, - "learning_rate": 0.00034100659662838996, - "loss": 0.3912, - "step": 130700 - }, - { - "epoch": 31.9, - "learning_rate": 0.00034097605668214026, - "loss": 0.4115, - "step": 130725 - }, - { - "epoch": 31.91, - "learning_rate": 0.0003409455167358905, - "loss": 0.4227, - "step": 130750 - }, - { - "epoch": 31.91, - "learning_rate": 0.00034091497678964087, - "loss": 0.3779, - "step": 130775 - }, - { - "epoch": 31.92, - "learning_rate": 0.00034088443684339117, - "loss": 0.4378, - "step": 130800 - }, - { - "epoch": 31.92, - "learning_rate": 0.0003408538968971415, - "loss": 0.3913, - "step": 130825 - }, - { - "epoch": 31.93, - "learning_rate": 0.0003408233569508918, - "loss": 0.4057, - "step": 130850 - }, - { - "epoch": 31.94, - "learning_rate": 0.0003407928170046421, - "loss": 0.4101, - "step": 130875 - }, - { - "epoch": 31.94, - "learning_rate": 0.00034076227705839244, - "loss": 0.4316, - "step": 130900 - }, - { - "epoch": 31.95, - "learning_rate": 0.0003407317371121427, - "loss": 0.4223, - "step": 130925 - }, - { - "epoch": 31.95, - "learning_rate": 0.000340701197165893, - "loss": 0.4274, - "step": 130950 - }, - { - "epoch": 31.96, - "learning_rate": 0.0003406706572196433, - "loss": 0.3901, - "step": 130975 - }, - { - "epoch": 31.97, - "learning_rate": 0.0003406401172733936, - "loss": 0.4463, - "step": 131000 - }, - { - "epoch": 31.97, - "learning_rate": 0.0003406095773271439, - "loss": 0.4061, - "step": 131025 - }, - { - "epoch": 31.98, - "learning_rate": 0.00034057903738089426, - "loss": 0.4125, - "step": 131050 - }, - { - "epoch": 31.99, - "learning_rate": 0.0003405484974346445, - "loss": 0.3804, - "step": 131075 - }, - { - "epoch": 31.99, - "learning_rate": 0.0003405179574883948, - "loss": 0.4336, - "step": 131100 - }, - { - "epoch": 32.0, - "learning_rate": 0.0003404874175421451, - "loss": 0.3988, - "step": 131125 - }, - { - "epoch": 32.0, - "learning_rate": 0.0003404568775958954, - "loss": 0.4117, - "step": 131150 - }, - { - "epoch": 32.01, - "learning_rate": 0.0003404263376496458, - "loss": 0.3902, - "step": 131175 - }, - { - "epoch": 32.02, - "learning_rate": 0.0003403957977033961, - "loss": 0.4209, - "step": 131200 - }, - { - "epoch": 32.02, - "learning_rate": 0.0003403652577571463, - "loss": 0.3716, - "step": 131225 - }, - { - "epoch": 32.03, - "learning_rate": 0.00034033471781089663, - "loss": 0.3839, - "step": 131250 - }, - { - "epoch": 32.03, - "learning_rate": 0.00034030417786464693, - "loss": 0.3534, - "step": 131275 - }, - { - "epoch": 32.04, - "learning_rate": 0.0003402736379183973, - "loss": 0.4128, - "step": 131300 - }, - { - "epoch": 32.05, - "learning_rate": 0.0003402430979721476, - "loss": 0.384, - "step": 131325 - }, - { - "epoch": 32.05, - "learning_rate": 0.0003402125580258979, - "loss": 0.4055, - "step": 131350 - }, - { - "epoch": 32.06, - "learning_rate": 0.0003401820180796482, - "loss": 0.3563, - "step": 131375 - }, - { - "epoch": 32.06, - "learning_rate": 0.00034015147813339845, - "loss": 0.3818, - "step": 131400 - }, - { - "epoch": 32.07, - "learning_rate": 0.0003401209381871488, - "loss": 0.4055, - "step": 131425 - }, - { - "epoch": 32.08, - "learning_rate": 0.0003400903982408991, - "loss": 0.3967, - "step": 131450 - }, - { - "epoch": 32.08, - "learning_rate": 0.0003400598582946494, - "loss": 0.4005, - "step": 131475 - }, - { - "epoch": 32.09, - "learning_rate": 0.0003400293183483997, - "loss": 0.37, - "step": 131500 - }, - { - "epoch": 32.09, - "learning_rate": 0.00033999877840215, - "loss": 0.3949, - "step": 131525 - }, - { - "epoch": 32.1, - "learning_rate": 0.0003399682384559003, - "loss": 0.3711, - "step": 131550 - }, - { - "epoch": 32.11, - "learning_rate": 0.00033993769850965063, - "loss": 0.3992, - "step": 131575 - }, - { - "epoch": 32.11, - "learning_rate": 0.00033990715856340093, - "loss": 0.3856, - "step": 131600 - }, - { - "epoch": 32.12, - "learning_rate": 0.00033987661861715123, - "loss": 0.3252, - "step": 131625 - }, - { - "epoch": 32.13, - "learning_rate": 0.00033984607867090154, - "loss": 0.3804, - "step": 131650 - }, - { - "epoch": 32.13, - "learning_rate": 0.0003398155387246519, - "loss": 0.3609, - "step": 131675 - }, - { - "epoch": 32.14, - "learning_rate": 0.00033978499877840214, - "loss": 0.4174, - "step": 131700 - }, - { - "epoch": 32.14, - "learning_rate": 0.00033975445883215245, - "loss": 0.3768, - "step": 131725 - }, - { - "epoch": 32.15, - "learning_rate": 0.00033972391888590275, - "loss": 0.3697, - "step": 131750 - }, - { - "epoch": 32.16, - "learning_rate": 0.00033969337893965305, - "loss": 0.3717, - "step": 131775 - }, - { - "epoch": 32.16, - "learning_rate": 0.0003396628389934034, - "loss": 0.4154, - "step": 131800 - }, - { - "epoch": 32.17, - "learning_rate": 0.0003396322990471537, - "loss": 0.3912, - "step": 131825 - }, - { - "epoch": 32.17, - "learning_rate": 0.00033960175910090396, - "loss": 0.4041, - "step": 131850 - }, - { - "epoch": 32.18, - "learning_rate": 0.00033957121915465427, - "loss": 0.3556, - "step": 131875 - }, - { - "epoch": 32.19, - "learning_rate": 0.00033954067920840457, - "loss": 0.3875, - "step": 131900 - }, - { - "epoch": 32.19, - "learning_rate": 0.00033951013926215493, - "loss": 0.3835, - "step": 131925 - }, - { - "epoch": 32.2, - "learning_rate": 0.00033947959931590523, - "loss": 0.4374, - "step": 131950 - }, - { - "epoch": 32.2, - "learning_rate": 0.00033944905936965554, - "loss": 0.3955, - "step": 131975 - }, - { - "epoch": 32.21, - "learning_rate": 0.00033941851942340584, - "loss": 0.3896, - "step": 132000 - }, - { - "epoch": 32.21, - "eval_cer": 0.09856472593246615, - "eval_loss": 0.3984539806842804, - "eval_runtime": 149.0532, - "eval_samples_per_second": 28.131, - "eval_steps_per_second": 7.038, - "eval_wer": 0.40153344208809133, - "step": 132000 - }, - { - "epoch": 32.22, - "learning_rate": 0.0003393879794771561, - "loss": 0.3759, - "step": 132025 - }, - { - "epoch": 32.22, - "learning_rate": 0.00033935743953090645, - "loss": 0.4199, - "step": 132050 - }, - { - "epoch": 32.23, - "learning_rate": 0.00033932689958465675, - "loss": 0.3597, - "step": 132075 - }, - { - "epoch": 32.24, - "learning_rate": 0.00033929635963840705, - "loss": 0.3833, - "step": 132100 - }, - { - "epoch": 32.24, - "learning_rate": 0.00033926581969215736, - "loss": 0.3782, - "step": 132125 - }, - { - "epoch": 32.25, - "learning_rate": 0.00033923527974590766, - "loss": 0.386, - "step": 132150 - }, - { - "epoch": 32.25, - "learning_rate": 0.0003392047397996579, - "loss": 0.3654, - "step": 132175 - }, - { - "epoch": 32.26, - "learning_rate": 0.00033917419985340827, - "loss": 0.3989, - "step": 132200 - }, - { - "epoch": 32.27, - "learning_rate": 0.00033914365990715857, - "loss": 0.3849, - "step": 132225 - }, - { - "epoch": 32.27, - "learning_rate": 0.00033911311996090887, - "loss": 0.3937, - "step": 132250 - }, - { - "epoch": 32.28, - "learning_rate": 0.0003390825800146592, - "loss": 0.3615, - "step": 132275 - }, - { - "epoch": 32.28, - "learning_rate": 0.0003390520400684095, - "loss": 0.3982, - "step": 132300 - }, - { - "epoch": 32.29, - "learning_rate": 0.0003390215001221598, - "loss": 0.3963, - "step": 132325 - }, - { - "epoch": 32.3, - "learning_rate": 0.0003389909601759101, - "loss": 0.4259, - "step": 132350 - }, - { - "epoch": 32.3, - "learning_rate": 0.0003389604202296604, - "loss": 0.3623, - "step": 132375 - }, - { - "epoch": 32.31, - "learning_rate": 0.0003389298802834107, - "loss": 0.3697, - "step": 132400 - }, - { - "epoch": 32.31, - "learning_rate": 0.000338899340337161, - "loss": 0.4037, - "step": 132425 - }, - { - "epoch": 32.32, - "learning_rate": 0.00033886880039091135, - "loss": 0.408, - "step": 132450 - }, - { - "epoch": 32.33, - "learning_rate": 0.00033883826044466166, - "loss": 0.4025, - "step": 132475 - }, - { - "epoch": 32.33, - "learning_rate": 0.0003388077204984119, - "loss": 0.3843, - "step": 132500 - }, - { - "epoch": 32.34, - "learning_rate": 0.0003387771805521622, - "loss": 0.4237, - "step": 132525 - }, - { - "epoch": 32.35, - "learning_rate": 0.0003387466406059125, - "loss": 0.3798, - "step": 132550 - }, - { - "epoch": 32.35, - "learning_rate": 0.0003387173222575128, - "loss": 0.3831, - "step": 132575 - }, - { - "epoch": 32.36, - "learning_rate": 0.0003386867823112632, - "loss": 0.4441, - "step": 132600 - }, - { - "epoch": 32.36, - "learning_rate": 0.0003386562423650135, - "loss": 0.3923, - "step": 132625 - }, - { - "epoch": 32.37, - "learning_rate": 0.00033862570241876373, - "loss": 0.4167, - "step": 132650 - }, - { - "epoch": 32.38, - "learning_rate": 0.00033859516247251403, - "loss": 0.3875, - "step": 132675 - }, - { - "epoch": 32.38, - "learning_rate": 0.00033856462252626434, - "loss": 0.4144, - "step": 132700 - }, - { - "epoch": 32.39, - "learning_rate": 0.0003385340825800147, - "loss": 0.4159, - "step": 132725 - }, - { - "epoch": 32.39, - "learning_rate": 0.000338503542633765, - "loss": 0.3833, - "step": 132750 - }, - { - "epoch": 32.4, - "learning_rate": 0.0003384730026875153, - "loss": 0.4222, - "step": 132775 - }, - { - "epoch": 32.41, - "learning_rate": 0.00033844246274126555, - "loss": 0.3666, - "step": 132800 - }, - { - "epoch": 32.41, - "learning_rate": 0.00033841192279501585, - "loss": 0.3791, - "step": 132825 - }, - { - "epoch": 32.42, - "learning_rate": 0.0003383813828487662, - "loss": 0.3982, - "step": 132850 - }, - { - "epoch": 32.42, - "learning_rate": 0.0003383508429025165, - "loss": 0.3673, - "step": 132875 - }, - { - "epoch": 32.43, - "learning_rate": 0.0003383203029562668, - "loss": 0.3804, - "step": 132900 - }, - { - "epoch": 32.44, - "learning_rate": 0.0003382897630100171, - "loss": 0.3506, - "step": 132925 - }, - { - "epoch": 32.44, - "learning_rate": 0.0003382592230637674, - "loss": 0.4107, - "step": 132950 - }, - { - "epoch": 32.45, - "learning_rate": 0.00033822868311751767, - "loss": 0.3897, - "step": 132975 - }, - { - "epoch": 32.45, - "learning_rate": 0.00033819814317126803, - "loss": 0.3825, - "step": 133000 - }, - { - "epoch": 32.46, - "learning_rate": 0.00033816760322501833, - "loss": 0.408, - "step": 133025 - }, - { - "epoch": 32.47, - "learning_rate": 0.00033813706327876864, - "loss": 0.4054, - "step": 133050 - }, - { - "epoch": 32.47, - "learning_rate": 0.00033810652333251894, - "loss": 0.3952, - "step": 133075 - }, - { - "epoch": 32.48, - "learning_rate": 0.00033807598338626924, - "loss": 0.4028, - "step": 133100 - }, - { - "epoch": 32.49, - "learning_rate": 0.00033804544344001955, - "loss": 0.3898, - "step": 133125 - }, - { - "epoch": 32.49, - "learning_rate": 0.00033801490349376985, - "loss": 0.4198, - "step": 133150 - }, - { - "epoch": 32.5, - "learning_rate": 0.00033798436354752015, - "loss": 0.3762, - "step": 133175 - }, - { - "epoch": 32.5, - "learning_rate": 0.00033795382360127046, - "loss": 0.4403, - "step": 133200 - }, - { - "epoch": 32.51, - "learning_rate": 0.00033792328365502076, - "loss": 0.3825, - "step": 133225 - }, - { - "epoch": 32.52, - "learning_rate": 0.0003378927437087711, - "loss": 0.404, - "step": 133250 - }, - { - "epoch": 32.52, - "learning_rate": 0.00033786220376252137, - "loss": 0.3803, - "step": 133275 - }, - { - "epoch": 32.53, - "learning_rate": 0.00033783166381627167, - "loss": 0.4274, - "step": 133300 - }, - { - "epoch": 32.53, - "learning_rate": 0.000337801123870022, - "loss": 0.3633, - "step": 133325 - }, - { - "epoch": 32.54, - "learning_rate": 0.0003377705839237723, - "loss": 0.4178, - "step": 133350 - }, - { - "epoch": 32.55, - "learning_rate": 0.00033774004397752263, - "loss": 0.386, - "step": 133375 - }, - { - "epoch": 32.55, - "learning_rate": 0.00033770950403127294, - "loss": 0.3567, - "step": 133400 - }, - { - "epoch": 32.56, - "learning_rate": 0.00033767896408502324, - "loss": 0.3817, - "step": 133425 - }, - { - "epoch": 32.56, - "learning_rate": 0.0003376484241387735, - "loss": 0.4123, - "step": 133450 - }, - { - "epoch": 32.57, - "learning_rate": 0.0003376178841925238, - "loss": 0.3853, - "step": 133475 - }, - { - "epoch": 32.58, - "learning_rate": 0.00033758734424627415, - "loss": 0.3949, - "step": 133500 - }, - { - "epoch": 32.58, - "learning_rate": 0.00033755680430002445, - "loss": 0.3601, - "step": 133525 - }, - { - "epoch": 32.59, - "learning_rate": 0.00033752626435377476, - "loss": 0.3768, - "step": 133550 - }, - { - "epoch": 32.6, - "learning_rate": 0.00033749572440752506, - "loss": 0.3772, - "step": 133575 - }, - { - "epoch": 32.6, - "learning_rate": 0.0003374651844612753, - "loss": 0.4496, - "step": 133600 - }, - { - "epoch": 32.61, - "learning_rate": 0.00033743464451502567, - "loss": 0.3942, - "step": 133625 - }, - { - "epoch": 32.61, - "learning_rate": 0.00033740410456877597, - "loss": 0.3922, - "step": 133650 - }, - { - "epoch": 32.62, - "learning_rate": 0.0003373735646225263, - "loss": 0.4161, - "step": 133675 - }, - { - "epoch": 32.63, - "learning_rate": 0.0003373430246762766, - "loss": 0.416, - "step": 133700 - }, - { - "epoch": 32.63, - "learning_rate": 0.0003373124847300269, - "loss": 0.3627, - "step": 133725 - }, - { - "epoch": 32.64, - "learning_rate": 0.0003372819447837772, - "loss": 0.3978, - "step": 133750 - }, - { - "epoch": 32.64, - "learning_rate": 0.0003372514048375275, - "loss": 0.352, - "step": 133775 - }, - { - "epoch": 32.65, - "learning_rate": 0.0003372208648912778, - "loss": 0.3799, - "step": 133800 - }, - { - "epoch": 32.66, - "learning_rate": 0.0003371903249450281, - "loss": 0.3868, - "step": 133825 - }, - { - "epoch": 32.66, - "learning_rate": 0.0003371597849987784, - "loss": 0.4069, - "step": 133850 - }, - { - "epoch": 32.67, - "learning_rate": 0.00033712924505252876, - "loss": 0.358, - "step": 133875 - }, - { - "epoch": 32.67, - "learning_rate": 0.00033709870510627906, - "loss": 0.4397, - "step": 133900 - }, - { - "epoch": 32.68, - "learning_rate": 0.0003370681651600293, - "loss": 0.4316, - "step": 133925 - }, - { - "epoch": 32.69, - "learning_rate": 0.0003370376252137796, - "loss": 0.3767, - "step": 133950 - }, - { - "epoch": 32.69, - "learning_rate": 0.0003370070852675299, - "loss": 0.4035, - "step": 133975 - }, - { - "epoch": 32.7, - "learning_rate": 0.00033697654532128027, - "loss": 0.4051, - "step": 134000 - }, - { - "epoch": 32.7, - "learning_rate": 0.0003369460053750306, - "loss": 0.4183, - "step": 134025 - }, - { - "epoch": 32.71, - "learning_rate": 0.0003369154654287809, - "loss": 0.4046, - "step": 134050 - }, - { - "epoch": 32.72, - "learning_rate": 0.00033688492548253113, - "loss": 0.388, - "step": 134075 - }, - { - "epoch": 32.72, - "learning_rate": 0.00033685438553628143, - "loss": 0.3803, - "step": 134100 - }, - { - "epoch": 32.73, - "learning_rate": 0.0003368238455900318, - "loss": 0.3721, - "step": 134125 - }, - { - "epoch": 32.74, - "learning_rate": 0.0003367933056437821, - "loss": 0.422, - "step": 134150 - }, - { - "epoch": 32.74, - "learning_rate": 0.0003367627656975324, - "loss": 0.3928, - "step": 134175 - }, - { - "epoch": 32.75, - "learning_rate": 0.0003367322257512827, - "loss": 0.4004, - "step": 134200 - }, - { - "epoch": 32.75, - "learning_rate": 0.00033670168580503295, - "loss": 0.3687, - "step": 134225 - }, - { - "epoch": 32.76, - "learning_rate": 0.00033667114585878325, - "loss": 0.3852, - "step": 134250 - }, - { - "epoch": 32.77, - "learning_rate": 0.0003366406059125336, - "loss": 0.3816, - "step": 134275 - }, - { - "epoch": 32.77, - "learning_rate": 0.0003366100659662839, - "loss": 0.4021, - "step": 134300 - }, - { - "epoch": 32.78, - "learning_rate": 0.0003365795260200342, - "loss": 0.3976, - "step": 134325 - }, - { - "epoch": 32.78, - "learning_rate": 0.0003365489860737845, - "loss": 0.4478, - "step": 134350 - }, - { - "epoch": 32.79, - "learning_rate": 0.0003365184461275348, - "loss": 0.3553, - "step": 134375 - }, - { - "epoch": 32.8, - "learning_rate": 0.0003364879061812851, - "loss": 0.4167, - "step": 134400 - }, - { - "epoch": 32.8, - "learning_rate": 0.00033645736623503543, - "loss": 0.3895, - "step": 134425 - }, - { - "epoch": 32.81, - "learning_rate": 0.00033642682628878573, - "loss": 0.3975, - "step": 134450 - }, - { - "epoch": 32.81, - "learning_rate": 0.00033639628634253604, - "loss": 0.3731, - "step": 134475 - }, - { - "epoch": 32.82, - "learning_rate": 0.00033636574639628634, - "loss": 0.4234, - "step": 134500 - }, - { - "epoch": 32.83, - "learning_rate": 0.0003363352064500367, - "loss": 0.3793, - "step": 134525 - }, - { - "epoch": 32.83, - "learning_rate": 0.00033630466650378695, - "loss": 0.4039, - "step": 134550 - }, - { - "epoch": 32.84, - "learning_rate": 0.00033627412655753725, - "loss": 0.3617, - "step": 134575 - }, - { - "epoch": 32.85, - "learning_rate": 0.00033624358661128755, - "loss": 0.4011, - "step": 134600 - }, - { - "epoch": 32.85, - "learning_rate": 0.00033621304666503786, - "loss": 0.3912, - "step": 134625 - }, - { - "epoch": 32.86, - "learning_rate": 0.0003361825067187882, - "loss": 0.3734, - "step": 134650 - }, - { - "epoch": 32.86, - "learning_rate": 0.0003361519667725385, - "loss": 0.3806, - "step": 134675 - }, - { - "epoch": 32.87, - "learning_rate": 0.00033612142682628877, - "loss": 0.3725, - "step": 134700 - }, - { - "epoch": 32.88, - "learning_rate": 0.00033609088688003907, - "loss": 0.4062, - "step": 134725 - }, - { - "epoch": 32.88, - "learning_rate": 0.00033606034693378937, - "loss": 0.4138, - "step": 134750 - }, - { - "epoch": 32.89, - "learning_rate": 0.00033602980698753973, - "loss": 0.3759, - "step": 134775 - }, - { - "epoch": 32.89, - "learning_rate": 0.00033599926704129003, - "loss": 0.3783, - "step": 134800 - }, - { - "epoch": 32.9, - "learning_rate": 0.00033596872709504034, - "loss": 0.367, - "step": 134825 - }, - { - "epoch": 32.91, - "learning_rate": 0.00033593818714879064, - "loss": 0.3837, - "step": 134850 - }, - { - "epoch": 32.91, - "learning_rate": 0.0003359076472025409, - "loss": 0.3679, - "step": 134875 - }, - { - "epoch": 32.92, - "learning_rate": 0.00033587710725629125, - "loss": 0.3842, - "step": 134900 - }, - { - "epoch": 32.92, - "learning_rate": 0.00033584656731004155, - "loss": 0.395, - "step": 134925 - }, - { - "epoch": 32.93, - "learning_rate": 0.00033581602736379185, - "loss": 0.3838, - "step": 134950 - }, - { - "epoch": 32.94, - "learning_rate": 0.00033578548741754216, - "loss": 0.3935, - "step": 134975 - }, - { - "epoch": 32.94, - "learning_rate": 0.00033575494747129246, - "loss": 0.3912, - "step": 135000 - }, - { - "epoch": 32.94, - "eval_cer": 0.09640360153178033, - "eval_loss": 0.41029471158981323, - "eval_runtime": 149.2123, - "eval_samples_per_second": 28.101, - "eval_steps_per_second": 7.03, - "eval_wer": 0.39477977161500816, - "step": 135000 - }, - { - "epoch": 32.95, - "learning_rate": 0.00033572440752504276, - "loss": 0.378, - "step": 135025 - }, - { - "epoch": 32.96, - "learning_rate": 0.00033569386757879307, - "loss": 0.4405, - "step": 135050 - }, - { - "epoch": 32.96, - "learning_rate": 0.00033566332763254337, - "loss": 0.3973, - "step": 135075 - }, - { - "epoch": 32.97, - "learning_rate": 0.0003356327876862937, - "loss": 0.4042, - "step": 135100 - }, - { - "epoch": 32.97, - "learning_rate": 0.000335602247740044, - "loss": 0.3579, - "step": 135125 - }, - { - "epoch": 32.98, - "learning_rate": 0.00033557170779379433, - "loss": 0.3996, - "step": 135150 - }, - { - "epoch": 32.99, - "learning_rate": 0.0003355411678475446, - "loss": 0.3573, - "step": 135175 - }, - { - "epoch": 32.99, - "learning_rate": 0.0003355106279012949, - "loss": 0.4172, - "step": 135200 - }, - { - "epoch": 33.0, - "learning_rate": 0.0003354800879550452, - "loss": 0.3616, - "step": 135225 - }, - { - "epoch": 33.0, - "learning_rate": 0.0003354495480087955, - "loss": 0.3836, - "step": 135250 - }, - { - "epoch": 33.01, - "learning_rate": 0.00033541900806254585, - "loss": 0.3581, - "step": 135275 - }, - { - "epoch": 33.02, - "learning_rate": 0.00033538846811629615, - "loss": 0.3902, - "step": 135300 - }, - { - "epoch": 33.02, - "learning_rate": 0.0003353579281700464, - "loss": 0.3405, - "step": 135325 - }, - { - "epoch": 33.03, - "learning_rate": 0.0003353273882237967, - "loss": 0.368, - "step": 135350 - }, - { - "epoch": 33.03, - "learning_rate": 0.000335296848277547, - "loss": 0.3399, - "step": 135375 - }, - { - "epoch": 33.04, - "learning_rate": 0.00033526630833129737, - "loss": 0.3927, - "step": 135400 - }, - { - "epoch": 33.05, - "learning_rate": 0.00033523576838504767, - "loss": 0.3737, - "step": 135425 - }, - { - "epoch": 33.05, - "learning_rate": 0.000335206450036648, - "loss": 0.3907, - "step": 135450 - }, - { - "epoch": 33.06, - "learning_rate": 0.0003351759100903983, - "loss": 0.3661, - "step": 135475 - }, - { - "epoch": 33.06, - "learning_rate": 0.00033514537014414853, - "loss": 0.3812, - "step": 135500 - }, - { - "epoch": 33.07, - "learning_rate": 0.00033511483019789883, - "loss": 0.3496, - "step": 135525 - }, - { - "epoch": 33.08, - "learning_rate": 0.00033508429025164914, - "loss": 0.3888, - "step": 135550 - }, - { - "epoch": 33.08, - "learning_rate": 0.0003350537503053995, - "loss": 0.3772, - "step": 135575 - }, - { - "epoch": 33.09, - "learning_rate": 0.0003350232103591498, - "loss": 0.4225, - "step": 135600 - }, - { - "epoch": 33.1, - "learning_rate": 0.0003349926704129001, - "loss": 0.3996, - "step": 135625 - }, - { - "epoch": 33.1, - "learning_rate": 0.00033496213046665035, - "loss": 0.3857, - "step": 135650 - }, - { - "epoch": 33.11, - "learning_rate": 0.00033493159052040065, - "loss": 0.3734, - "step": 135675 - }, - { - "epoch": 33.11, - "learning_rate": 0.000334901050574151, - "loss": 0.3788, - "step": 135700 - }, - { - "epoch": 33.12, - "learning_rate": 0.0003348705106279013, - "loss": 0.352, - "step": 135725 - }, - { - "epoch": 33.13, - "learning_rate": 0.0003348399706816516, - "loss": 0.356, - "step": 135750 - }, - { - "epoch": 33.13, - "learning_rate": 0.0003348094307354019, - "loss": 0.355, - "step": 135775 - }, - { - "epoch": 33.14, - "learning_rate": 0.00033477889078915217, - "loss": 0.4078, - "step": 135800 - }, - { - "epoch": 33.14, - "learning_rate": 0.00033474835084290253, - "loss": 0.3636, - "step": 135825 - }, - { - "epoch": 33.15, - "learning_rate": 0.00033471781089665283, - "loss": 0.3836, - "step": 135850 - }, - { - "epoch": 33.16, - "learning_rate": 0.00033468727095040313, - "loss": 0.3747, - "step": 135875 - }, - { - "epoch": 33.16, - "learning_rate": 0.00033465673100415344, - "loss": 0.3978, - "step": 135900 - }, - { - "epoch": 33.17, - "learning_rate": 0.00033462619105790374, - "loss": 0.3753, - "step": 135925 - }, - { - "epoch": 33.17, - "learning_rate": 0.0003345956511116541, - "loss": 0.3733, - "step": 135950 - }, - { - "epoch": 33.18, - "learning_rate": 0.00033456511116540435, - "loss": 0.3348, - "step": 135975 - }, - { - "epoch": 33.19, - "learning_rate": 0.00033453457121915465, - "loss": 0.3901, - "step": 136000 - }, - { - "epoch": 33.19, - "learning_rate": 0.00033450403127290495, - "loss": 0.3628, - "step": 136025 - }, - { - "epoch": 33.2, - "learning_rate": 0.00033447349132665526, - "loss": 0.398, - "step": 136050 - }, - { - "epoch": 33.21, - "learning_rate": 0.0003344429513804056, - "loss": 0.3426, - "step": 136075 - }, - { - "epoch": 33.21, - "learning_rate": 0.0003344124114341559, - "loss": 0.3727, - "step": 136100 - }, - { - "epoch": 33.22, - "learning_rate": 0.00033438187148790617, - "loss": 0.3642, - "step": 136125 - }, - { - "epoch": 33.22, - "learning_rate": 0.00033435133154165647, - "loss": 0.3884, - "step": 136150 - }, - { - "epoch": 33.23, - "learning_rate": 0.0003343220131932568, - "loss": 0.3307, - "step": 136175 - }, - { - "epoch": 33.24, - "learning_rate": 0.0003342914732470071, - "loss": 0.3864, - "step": 136200 - }, - { - "epoch": 33.24, - "learning_rate": 0.0003342609333007574, - "loss": 0.3317, - "step": 136225 - }, - { - "epoch": 33.25, - "learning_rate": 0.00033423039335450774, - "loss": 0.3878, - "step": 136250 - }, - { - "epoch": 33.25, - "learning_rate": 0.000334199853408258, - "loss": 0.3866, - "step": 136275 - }, - { - "epoch": 33.26, - "learning_rate": 0.0003341693134620083, - "loss": 0.3796, - "step": 136300 - }, - { - "epoch": 33.27, - "learning_rate": 0.0003341387735157586, - "loss": 0.336, - "step": 136325 - }, - { - "epoch": 33.27, - "learning_rate": 0.0003341082335695089, - "loss": 0.3943, - "step": 136350 - }, - { - "epoch": 33.28, - "learning_rate": 0.00033407769362325926, - "loss": 0.3875, - "step": 136375 - }, - { - "epoch": 33.28, - "learning_rate": 0.00033404715367700956, - "loss": 0.3827, - "step": 136400 - }, - { - "epoch": 33.29, - "learning_rate": 0.00033401661373075987, - "loss": 0.3293, - "step": 136425 - }, - { - "epoch": 33.3, - "learning_rate": 0.0003339860737845101, - "loss": 0.4467, - "step": 136450 - }, - { - "epoch": 33.3, - "learning_rate": 0.0003339555338382604, - "loss": 0.395, - "step": 136475 - }, - { - "epoch": 33.31, - "learning_rate": 0.0003339249938920108, - "loss": 0.4032, - "step": 136500 - }, - { - "epoch": 33.32, - "learning_rate": 0.0003338944539457611, - "loss": 0.353, - "step": 136525 - }, - { - "epoch": 33.32, - "learning_rate": 0.0003338639139995114, - "loss": 0.401, - "step": 136550 - }, - { - "epoch": 33.33, - "learning_rate": 0.0003338333740532617, - "loss": 0.3823, - "step": 136575 - }, - { - "epoch": 33.33, - "learning_rate": 0.00033380283410701193, - "loss": 0.3959, - "step": 136600 - }, - { - "epoch": 33.34, - "learning_rate": 0.0003337722941607623, - "loss": 0.3629, - "step": 136625 - }, - { - "epoch": 33.35, - "learning_rate": 0.0003337417542145126, - "loss": 0.4072, - "step": 136650 - }, - { - "epoch": 33.35, - "learning_rate": 0.0003337112142682629, - "loss": 0.3992, - "step": 136675 - }, - { - "epoch": 33.36, - "learning_rate": 0.0003336806743220132, - "loss": 0.4557, - "step": 136700 - }, - { - "epoch": 33.36, - "learning_rate": 0.0003336501343757635, - "loss": 0.349, - "step": 136725 - }, - { - "epoch": 33.37, - "learning_rate": 0.0003336195944295138, - "loss": 0.3946, - "step": 136750 - }, - { - "epoch": 33.38, - "learning_rate": 0.0003335890544832641, - "loss": 0.3782, - "step": 136775 - }, - { - "epoch": 33.38, - "learning_rate": 0.0003335585145370144, - "loss": 0.4219, - "step": 136800 - }, - { - "epoch": 33.39, - "learning_rate": 0.0003335279745907647, - "loss": 0.3675, - "step": 136825 - }, - { - "epoch": 33.39, - "learning_rate": 0.000333497434644515, - "loss": 0.3896, - "step": 136850 - }, - { - "epoch": 33.4, - "learning_rate": 0.0003334668946982654, - "loss": 0.3443, - "step": 136875 - }, - { - "epoch": 33.41, - "learning_rate": 0.0003334363547520157, - "loss": 0.3815, - "step": 136900 - }, - { - "epoch": 33.41, - "learning_rate": 0.00033340581480576593, - "loss": 0.4201, - "step": 136925 - }, - { - "epoch": 33.42, - "learning_rate": 0.00033337527485951624, - "loss": 0.3761, - "step": 136950 - }, - { - "epoch": 33.42, - "learning_rate": 0.00033334473491326654, - "loss": 0.3522, - "step": 136975 - }, - { - "epoch": 33.43, - "learning_rate": 0.0003333141949670169, - "loss": 0.424, - "step": 137000 - }, - { - "epoch": 33.44, - "learning_rate": 0.0003332836550207672, - "loss": 0.3266, - "step": 137025 - }, - { - "epoch": 33.44, - "learning_rate": 0.0003332531150745175, - "loss": 0.3849, - "step": 137050 - }, - { - "epoch": 33.45, - "learning_rate": 0.00033322257512826775, - "loss": 0.3785, - "step": 137075 - }, - { - "epoch": 33.46, - "learning_rate": 0.00033319203518201806, - "loss": 0.3789, - "step": 137100 - }, - { - "epoch": 33.46, - "learning_rate": 0.00033316149523576836, - "loss": 0.3665, - "step": 137125 - }, - { - "epoch": 33.47, - "learning_rate": 0.0003331309552895187, - "loss": 0.4229, - "step": 137150 - }, - { - "epoch": 33.47, - "learning_rate": 0.000333100415343269, - "loss": 0.3616, - "step": 137175 - }, - { - "epoch": 33.48, - "learning_rate": 0.0003330698753970193, - "loss": 0.3846, - "step": 137200 - }, - { - "epoch": 33.49, - "learning_rate": 0.00033303933545076957, - "loss": 0.3729, - "step": 137225 - }, - { - "epoch": 33.49, - "learning_rate": 0.0003330087955045199, - "loss": 0.4188, - "step": 137250 - }, - { - "epoch": 33.5, - "learning_rate": 0.00033297825555827023, - "loss": 0.3823, - "step": 137275 - }, - { - "epoch": 33.5, - "learning_rate": 0.00033294771561202054, - "loss": 0.4614, - "step": 137300 - }, - { - "epoch": 33.51, - "learning_rate": 0.00033291717566577084, - "loss": 0.3309, - "step": 137325 - }, - { - "epoch": 33.52, - "learning_rate": 0.00033288663571952114, - "loss": 0.3966, - "step": 137350 - }, - { - "epoch": 33.52, - "learning_rate": 0.00033285609577327145, - "loss": 0.3856, - "step": 137375 - }, - { - "epoch": 33.53, - "learning_rate": 0.00033282555582702175, - "loss": 0.4269, - "step": 137400 - }, - { - "epoch": 33.53, - "learning_rate": 0.00033279501588077205, - "loss": 0.3844, - "step": 137425 - }, - { - "epoch": 33.54, - "learning_rate": 0.00033276447593452236, - "loss": 0.4249, - "step": 137450 - }, - { - "epoch": 33.55, - "learning_rate": 0.00033273393598827266, - "loss": 0.3647, - "step": 137475 - }, - { - "epoch": 33.55, - "learning_rate": 0.00033270339604202296, - "loss": 0.414, - "step": 137500 - }, - { - "epoch": 33.56, - "learning_rate": 0.0003326728560957733, - "loss": 0.389, - "step": 137525 - }, - { - "epoch": 33.57, - "learning_rate": 0.00033264231614952357, - "loss": 0.4292, - "step": 137550 - }, - { - "epoch": 33.57, - "learning_rate": 0.0003326117762032739, - "loss": 0.3596, - "step": 137575 - }, - { - "epoch": 33.58, - "learning_rate": 0.0003325812362570242, - "loss": 0.3767, - "step": 137600 - }, - { - "epoch": 33.58, - "learning_rate": 0.0003325506963107745, - "loss": 0.4002, - "step": 137625 - }, - { - "epoch": 33.59, - "learning_rate": 0.00033252015636452484, - "loss": 0.4151, - "step": 137650 - }, - { - "epoch": 33.6, - "learning_rate": 0.00033248961641827514, - "loss": 0.3565, - "step": 137675 - }, - { - "epoch": 33.6, - "learning_rate": 0.0003324590764720254, - "loss": 0.448, - "step": 137700 - }, - { - "epoch": 33.61, - "learning_rate": 0.0003324285365257757, - "loss": 0.3663, - "step": 137725 - }, - { - "epoch": 33.61, - "learning_rate": 0.000332397996579526, - "loss": 0.4024, - "step": 137750 - }, - { - "epoch": 33.62, - "learning_rate": 0.00033236745663327635, - "loss": 0.3953, - "step": 137775 - }, - { - "epoch": 33.63, - "learning_rate": 0.00033233691668702666, - "loss": 0.4102, - "step": 137800 - }, - { - "epoch": 33.63, - "learning_rate": 0.00033230637674077696, - "loss": 0.3611, - "step": 137825 - }, - { - "epoch": 33.64, - "learning_rate": 0.00033227583679452726, - "loss": 0.4133, - "step": 137850 - }, - { - "epoch": 33.64, - "learning_rate": 0.0003322452968482775, - "loss": 0.4016, - "step": 137875 - }, - { - "epoch": 33.65, - "learning_rate": 0.00033221475690202787, - "loss": 0.4489, - "step": 137900 - }, - { - "epoch": 33.66, - "learning_rate": 0.0003321842169557782, - "loss": 0.4036, - "step": 137925 - }, - { - "epoch": 33.66, - "learning_rate": 0.0003321536770095285, - "loss": 0.4298, - "step": 137950 - }, - { - "epoch": 33.67, - "learning_rate": 0.0003321231370632788, - "loss": 0.3659, - "step": 137975 - }, - { - "epoch": 33.67, - "learning_rate": 0.0003320925971170291, - "loss": 0.3995, - "step": 138000 - }, - { - "epoch": 33.67, - "eval_cer": 0.09747646376394978, - "eval_loss": 0.39622190594673157, - "eval_runtime": 149.4561, - "eval_samples_per_second": 28.055, - "eval_steps_per_second": 7.019, - "eval_wer": 0.4024143556280587, - "step": 138000 - }, - { - "epoch": 33.68, - "learning_rate": 0.0003320620571707794, - "loss": 0.3921, - "step": 138025 - }, - { - "epoch": 33.69, - "learning_rate": 0.0003320315172245297, - "loss": 0.4156, - "step": 138050 - }, - { - "epoch": 33.69, - "learning_rate": 0.00033200097727828, - "loss": 0.3502, - "step": 138075 - }, - { - "epoch": 33.7, - "learning_rate": 0.0003319704373320303, - "loss": 0.3947, - "step": 138100 - }, - { - "epoch": 33.71, - "learning_rate": 0.0003319398973857806, - "loss": 0.3597, - "step": 138125 - }, - { - "epoch": 33.71, - "learning_rate": 0.00033190935743953096, - "loss": 0.3832, - "step": 138150 - }, - { - "epoch": 33.72, - "learning_rate": 0.0003318788174932812, - "loss": 0.3484, - "step": 138175 - }, - { - "epoch": 33.72, - "learning_rate": 0.0003318482775470315, - "loss": 0.3769, - "step": 138200 - }, - { - "epoch": 33.73, - "learning_rate": 0.0003318177376007818, - "loss": 0.3096, - "step": 138225 - }, - { - "epoch": 33.74, - "learning_rate": 0.0003317871976545321, - "loss": 0.3672, - "step": 138250 - }, - { - "epoch": 33.74, - "learning_rate": 0.0003317566577082825, - "loss": 0.3853, - "step": 138275 - }, - { - "epoch": 33.75, - "learning_rate": 0.0003317261177620328, - "loss": 0.3725, - "step": 138300 - }, - { - "epoch": 33.75, - "learning_rate": 0.0003316955778157831, - "loss": 0.3425, - "step": 138325 - }, - { - "epoch": 33.76, - "learning_rate": 0.00033166503786953333, - "loss": 0.3924, - "step": 138350 - }, - { - "epoch": 33.77, - "learning_rate": 0.00033163449792328364, - "loss": 0.3541, - "step": 138375 - }, - { - "epoch": 33.77, - "learning_rate": 0.00033160395797703394, - "loss": 0.4236, - "step": 138400 - }, - { - "epoch": 33.78, - "learning_rate": 0.0003315734180307843, - "loss": 0.3396, - "step": 138425 - }, - { - "epoch": 33.78, - "learning_rate": 0.0003315428780845346, - "loss": 0.4243, - "step": 138450 - }, - { - "epoch": 33.79, - "learning_rate": 0.0003315123381382849, - "loss": 0.3928, - "step": 138475 - }, - { - "epoch": 33.8, - "learning_rate": 0.00033148179819203515, - "loss": 0.4071, - "step": 138500 - }, - { - "epoch": 33.8, - "learning_rate": 0.00033145125824578546, - "loss": 0.3414, - "step": 138525 - }, - { - "epoch": 33.81, - "learning_rate": 0.0003314207182995358, - "loss": 0.4381, - "step": 138550 - }, - { - "epoch": 33.82, - "learning_rate": 0.0003313901783532861, - "loss": 0.3973, - "step": 138575 - }, - { - "epoch": 33.82, - "learning_rate": 0.0003313596384070364, - "loss": 0.361, - "step": 138600 - }, - { - "epoch": 33.83, - "learning_rate": 0.0003313290984607867, - "loss": 0.3328, - "step": 138625 - }, - { - "epoch": 33.83, - "learning_rate": 0.00033129855851453697, - "loss": 0.4502, - "step": 138650 - }, - { - "epoch": 33.84, - "learning_rate": 0.00033126801856828733, - "loss": 0.3692, - "step": 138675 - }, - { - "epoch": 33.85, - "learning_rate": 0.00033123747862203763, - "loss": 0.4154, - "step": 138700 - }, - { - "epoch": 33.85, - "learning_rate": 0.00033120693867578794, - "loss": 0.3633, - "step": 138725 - }, - { - "epoch": 33.86, - "learning_rate": 0.00033117639872953824, - "loss": 0.3845, - "step": 138750 - }, - { - "epoch": 33.86, - "learning_rate": 0.00033114585878328854, - "loss": 0.3683, - "step": 138775 - }, - { - "epoch": 33.87, - "learning_rate": 0.0003311153188370389, - "loss": 0.408, - "step": 138800 - }, - { - "epoch": 33.88, - "learning_rate": 0.00033108477889078915, - "loss": 0.3941, - "step": 138825 - }, - { - "epoch": 33.88, - "learning_rate": 0.00033105423894453945, - "loss": 0.4312, - "step": 138850 - }, - { - "epoch": 33.89, - "learning_rate": 0.00033102369899828976, - "loss": 0.3557, - "step": 138875 - }, - { - "epoch": 33.89, - "learning_rate": 0.00033099315905204006, - "loss": 0.3747, - "step": 138900 - }, - { - "epoch": 33.9, - "learning_rate": 0.0003309626191057904, - "loss": 0.3835, - "step": 138925 - }, - { - "epoch": 33.91, - "learning_rate": 0.0003309320791595407, - "loss": 0.3986, - "step": 138950 - }, - { - "epoch": 33.91, - "learning_rate": 0.00033090153921329097, - "loss": 0.398, - "step": 138975 - }, - { - "epoch": 33.92, - "learning_rate": 0.0003308709992670413, - "loss": 0.4076, - "step": 139000 - }, - { - "epoch": 33.93, - "learning_rate": 0.0003308404593207916, - "loss": 0.3694, - "step": 139025 - }, - { - "epoch": 33.93, - "learning_rate": 0.00033080991937454193, - "loss": 0.3785, - "step": 139050 - }, - { - "epoch": 33.94, - "learning_rate": 0.00033077937942829224, - "loss": 0.3693, - "step": 139075 - }, - { - "epoch": 33.94, - "learning_rate": 0.00033074883948204254, - "loss": 0.4153, - "step": 139100 - }, - { - "epoch": 33.95, - "learning_rate": 0.0003307182995357928, - "loss": 0.3817, - "step": 139125 - }, - { - "epoch": 33.96, - "learning_rate": 0.0003306877595895431, - "loss": 0.3992, - "step": 139150 - }, - { - "epoch": 33.96, - "learning_rate": 0.00033065721964329345, - "loss": 0.3649, - "step": 139175 - }, - { - "epoch": 33.97, - "learning_rate": 0.00033062667969704375, - "loss": 0.3947, - "step": 139200 - }, - { - "epoch": 33.97, - "learning_rate": 0.00033059613975079406, - "loss": 0.3397, - "step": 139225 - }, - { - "epoch": 33.98, - "learning_rate": 0.00033056559980454436, - "loss": 0.4038, - "step": 139250 - }, - { - "epoch": 33.99, - "learning_rate": 0.0003305350598582946, - "loss": 0.373, - "step": 139275 - }, - { - "epoch": 33.99, - "learning_rate": 0.00033050451991204497, - "loss": 0.4479, - "step": 139300 - }, - { - "epoch": 34.0, - "learning_rate": 0.00033047397996579527, - "loss": 0.3613, - "step": 139325 - }, - { - "epoch": 34.0, - "learning_rate": 0.0003304434400195456, - "loss": 0.3761, - "step": 139350 - }, - { - "epoch": 34.01, - "learning_rate": 0.0003304141216711459, - "loss": 0.3521, - "step": 139375 - }, - { - "epoch": 34.02, - "learning_rate": 0.0003303835817248962, - "loss": 0.4, - "step": 139400 - }, - { - "epoch": 34.02, - "learning_rate": 0.0003303530417786465, - "loss": 0.3164, - "step": 139425 - }, - { - "epoch": 34.03, - "learning_rate": 0.00033032250183239674, - "loss": 0.41, - "step": 139450 - }, - { - "epoch": 34.03, - "learning_rate": 0.0003302919618861471, - "loss": 0.3421, - "step": 139475 - }, - { - "epoch": 34.04, - "learning_rate": 0.0003302614219398974, - "loss": 0.3995, - "step": 139500 - }, - { - "epoch": 34.05, - "learning_rate": 0.0003302308819936477, - "loss": 0.3304, - "step": 139525 - }, - { - "epoch": 34.05, - "learning_rate": 0.000330200342047398, - "loss": 0.4101, - "step": 139550 - }, - { - "epoch": 34.06, - "learning_rate": 0.0003301698021011483, - "loss": 0.359, - "step": 139575 - }, - { - "epoch": 34.07, - "learning_rate": 0.0003301392621548986, - "loss": 0.3792, - "step": 139600 - }, - { - "epoch": 34.07, - "learning_rate": 0.0003301087222086489, - "loss": 0.3731, - "step": 139625 - }, - { - "epoch": 34.08, - "learning_rate": 0.0003300781822623992, - "loss": 0.4143, - "step": 139650 - }, - { - "epoch": 34.08, - "learning_rate": 0.0003300476423161495, - "loss": 0.3613, - "step": 139675 - }, - { - "epoch": 34.09, - "learning_rate": 0.0003300171023698998, - "loss": 0.3947, - "step": 139700 - }, - { - "epoch": 34.1, - "learning_rate": 0.0003299865624236502, - "loss": 0.3607, - "step": 139725 - }, - { - "epoch": 34.1, - "learning_rate": 0.00032995602247740043, - "loss": 0.3652, - "step": 139750 - }, - { - "epoch": 34.11, - "learning_rate": 0.00032992548253115073, - "loss": 0.3911, - "step": 139775 - }, - { - "epoch": 34.11, - "learning_rate": 0.00032989494258490104, - "loss": 0.4495, - "step": 139800 - }, - { - "epoch": 34.12, - "learning_rate": 0.00032986440263865134, - "loss": 0.3491, - "step": 139825 - }, - { - "epoch": 34.13, - "learning_rate": 0.0003298338626924017, - "loss": 0.3611, - "step": 139850 - }, - { - "epoch": 34.13, - "learning_rate": 0.000329803322746152, - "loss": 0.3669, - "step": 139875 - }, - { - "epoch": 34.14, - "learning_rate": 0.0003297727827999023, - "loss": 0.3968, - "step": 139900 - }, - { - "epoch": 34.14, - "learning_rate": 0.00032974224285365255, - "loss": 0.341, - "step": 139925 - }, - { - "epoch": 34.15, - "learning_rate": 0.00032971170290740286, - "loss": 0.3937, - "step": 139950 - }, - { - "epoch": 34.16, - "learning_rate": 0.0003296811629611532, - "loss": 0.3728, - "step": 139975 - }, - { - "epoch": 34.16, - "learning_rate": 0.0003296506230149035, - "loss": 0.3908, - "step": 140000 - }, - { - "epoch": 34.17, - "learning_rate": 0.0003296200830686538, - "loss": 0.3814, - "step": 140025 - }, - { - "epoch": 34.18, - "learning_rate": 0.0003295895431224041, - "loss": 0.3616, - "step": 140050 - }, - { - "epoch": 34.18, - "learning_rate": 0.0003295590031761544, - "loss": 0.3442, - "step": 140075 - }, - { - "epoch": 34.19, - "learning_rate": 0.00032952846322990473, - "loss": 0.3822, - "step": 140100 - }, - { - "epoch": 34.19, - "learning_rate": 0.00032949792328365504, - "loss": 0.3766, - "step": 140125 - }, - { - "epoch": 34.2, - "learning_rate": 0.00032946738333740534, - "loss": 0.4176, - "step": 140150 - }, - { - "epoch": 34.21, - "learning_rate": 0.00032943684339115564, - "loss": 0.3375, - "step": 140175 - }, - { - "epoch": 34.21, - "learning_rate": 0.00032940630344490595, - "loss": 0.3641, - "step": 140200 - }, - { - "epoch": 34.22, - "learning_rate": 0.00032937576349865625, - "loss": 0.3556, - "step": 140225 - }, - { - "epoch": 34.22, - "learning_rate": 0.00032934522355240655, - "loss": 0.3915, - "step": 140250 - }, - { - "epoch": 34.23, - "learning_rate": 0.00032931468360615686, - "loss": 0.348, - "step": 140275 - }, - { - "epoch": 34.24, - "learning_rate": 0.00032928414365990716, - "loss": 0.4115, - "step": 140300 - }, - { - "epoch": 34.24, - "learning_rate": 0.00032925360371365746, - "loss": 0.3459, - "step": 140325 - }, - { - "epoch": 34.25, - "learning_rate": 0.0003292230637674078, - "loss": 0.3965, - "step": 140350 - }, - { - "epoch": 34.25, - "learning_rate": 0.0003291925238211581, - "loss": 0.3507, - "step": 140375 - }, - { - "epoch": 34.26, - "learning_rate": 0.00032916198387490837, - "loss": 0.3652, - "step": 140400 - }, - { - "epoch": 34.27, - "learning_rate": 0.0003291314439286587, - "loss": 0.3429, - "step": 140425 - }, - { - "epoch": 34.27, - "learning_rate": 0.000329100903982409, - "loss": 0.3728, - "step": 140450 - }, - { - "epoch": 34.28, - "learning_rate": 0.0003290703640361593, - "loss": 0.3313, - "step": 140475 - }, - { - "epoch": 34.29, - "learning_rate": 0.00032903982408990964, - "loss": 0.4086, - "step": 140500 - }, - { - "epoch": 34.29, - "learning_rate": 0.00032900928414365994, - "loss": 0.3098, - "step": 140525 - }, - { - "epoch": 34.3, - "learning_rate": 0.0003289787441974102, - "loss": 0.3866, - "step": 140550 - }, - { - "epoch": 34.3, - "learning_rate": 0.0003289482042511605, - "loss": 0.3918, - "step": 140575 - }, - { - "epoch": 34.31, - "learning_rate": 0.0003289176643049108, - "loss": 0.3939, - "step": 140600 - }, - { - "epoch": 34.32, - "learning_rate": 0.00032888712435866116, - "loss": 0.3689, - "step": 140625 - }, - { - "epoch": 34.32, - "learning_rate": 0.00032885658441241146, - "loss": 0.4102, - "step": 140650 - }, - { - "epoch": 34.33, - "learning_rate": 0.00032882604446616176, - "loss": 0.4044, - "step": 140675 - }, - { - "epoch": 34.33, - "learning_rate": 0.000328795504519912, - "loss": 0.3637, - "step": 140700 - }, - { - "epoch": 34.34, - "learning_rate": 0.0003287649645736623, - "loss": 0.3501, - "step": 140725 - }, - { - "epoch": 34.35, - "learning_rate": 0.0003287344246274127, - "loss": 0.376, - "step": 140750 - }, - { - "epoch": 34.35, - "learning_rate": 0.000328703884681163, - "loss": 0.3654, - "step": 140775 - }, - { - "epoch": 34.36, - "learning_rate": 0.0003286733447349133, - "loss": 0.3961, - "step": 140800 - }, - { - "epoch": 34.36, - "learning_rate": 0.0003286428047886636, - "loss": 0.3486, - "step": 140825 - }, - { - "epoch": 34.37, - "learning_rate": 0.0003286122648424139, - "loss": 0.4076, - "step": 140850 - }, - { - "epoch": 34.38, - "learning_rate": 0.0003285817248961642, - "loss": 0.3979, - "step": 140875 - }, - { - "epoch": 34.38, - "learning_rate": 0.0003285511849499145, - "loss": 0.3874, - "step": 140900 - }, - { - "epoch": 34.39, - "learning_rate": 0.0003285206450036648, - "loss": 0.3311, - "step": 140925 - }, - { - "epoch": 34.39, - "learning_rate": 0.0003284901050574151, - "loss": 0.3656, - "step": 140950 - }, - { - "epoch": 34.4, - "learning_rate": 0.0003284595651111654, - "loss": 0.3687, - "step": 140975 - }, - { - "epoch": 34.41, - "learning_rate": 0.00032842902516491576, - "loss": 0.4042, - "step": 141000 - }, - { - "epoch": 34.41, - "eval_cer": 0.09400634477377494, - "eval_loss": 0.4195997714996338, - "eval_runtime": 149.5055, - "eval_samples_per_second": 28.046, - "eval_steps_per_second": 7.016, - "eval_wer": 0.39468189233278955, - "step": 141000 - }, - { - "epoch": 34.41, - "learning_rate": 0.000328398485218666, - "loss": 0.3471, - "step": 141025 - }, - { - "epoch": 34.42, - "learning_rate": 0.0003283679452724163, - "loss": 0.3915, - "step": 141050 - }, - { - "epoch": 34.43, - "learning_rate": 0.0003283374053261666, - "loss": 0.3888, - "step": 141075 - }, - { - "epoch": 34.43, - "learning_rate": 0.0003283068653799169, - "loss": 0.4085, - "step": 141100 - }, - { - "epoch": 34.44, - "learning_rate": 0.0003282763254336673, - "loss": 0.3797, - "step": 141125 - }, - { - "epoch": 34.44, - "learning_rate": 0.0003282457854874176, - "loss": 0.4164, - "step": 141150 - }, - { - "epoch": 34.45, - "learning_rate": 0.00032821524554116783, - "loss": 0.3819, - "step": 141175 - }, - { - "epoch": 34.46, - "learning_rate": 0.00032818470559491813, - "loss": 0.39, - "step": 141200 - }, - { - "epoch": 34.46, - "learning_rate": 0.00032815416564866844, - "loss": 0.3658, - "step": 141225 - }, - { - "epoch": 34.47, - "learning_rate": 0.0003281236257024188, - "loss": 0.3993, - "step": 141250 - }, - { - "epoch": 34.47, - "learning_rate": 0.0003280930857561691, - "loss": 0.3643, - "step": 141275 - }, - { - "epoch": 34.48, - "learning_rate": 0.0003280625458099194, - "loss": 0.3629, - "step": 141300 - }, - { - "epoch": 34.49, - "learning_rate": 0.0003280320058636697, - "loss": 0.3807, - "step": 141325 - }, - { - "epoch": 34.49, - "learning_rate": 0.00032800146591741995, - "loss": 0.4153, - "step": 141350 - }, - { - "epoch": 34.5, - "learning_rate": 0.0003279709259711703, - "loss": 0.4157, - "step": 141375 - }, - { - "epoch": 34.5, - "learning_rate": 0.0003279403860249206, - "loss": 0.343, - "step": 141400 - }, - { - "epoch": 34.51, - "learning_rate": 0.0003279098460786709, - "loss": 0.3603, - "step": 141425 - }, - { - "epoch": 34.52, - "learning_rate": 0.0003278793061324212, - "loss": 0.4158, - "step": 141450 - }, - { - "epoch": 34.52, - "learning_rate": 0.0003278487661861715, - "loss": 0.3832, - "step": 141475 - }, - { - "epoch": 34.53, - "learning_rate": 0.00032781822623992183, - "loss": 0.4119, - "step": 141500 - }, - { - "epoch": 34.54, - "learning_rate": 0.00032778768629367213, - "loss": 0.3631, - "step": 141525 - }, - { - "epoch": 34.54, - "learning_rate": 0.00032775714634742243, - "loss": 0.4149, - "step": 141550 - }, - { - "epoch": 34.55, - "learning_rate": 0.00032772660640117274, - "loss": 0.3623, - "step": 141575 - }, - { - "epoch": 34.55, - "learning_rate": 0.00032769606645492304, - "loss": 0.3814, - "step": 141600 - }, - { - "epoch": 34.56, - "learning_rate": 0.0003276655265086734, - "loss": 0.355, - "step": 141625 - }, - { - "epoch": 34.57, - "learning_rate": 0.00032763498656242365, - "loss": 0.4258, - "step": 141650 - }, - { - "epoch": 34.57, - "learning_rate": 0.00032760444661617395, - "loss": 0.3596, - "step": 141675 - }, - { - "epoch": 34.58, - "learning_rate": 0.00032757390666992425, - "loss": 0.3762, - "step": 141700 - }, - { - "epoch": 34.58, - "learning_rate": 0.00032754336672367456, - "loss": 0.3774, - "step": 141725 - }, - { - "epoch": 34.59, - "learning_rate": 0.0003275128267774249, - "loss": 0.433, - "step": 141750 - }, - { - "epoch": 34.6, - "learning_rate": 0.0003274822868311752, - "loss": 0.3318, - "step": 141775 - }, - { - "epoch": 34.6, - "learning_rate": 0.0003274517468849255, - "loss": 0.3979, - "step": 141800 - }, - { - "epoch": 34.61, - "learning_rate": 0.00032742120693867577, - "loss": 0.3382, - "step": 141825 - }, - { - "epoch": 34.61, - "learning_rate": 0.0003273906669924261, - "loss": 0.3676, - "step": 141850 - }, - { - "epoch": 34.62, - "learning_rate": 0.0003273601270461764, - "loss": 0.368, - "step": 141875 - }, - { - "epoch": 34.63, - "learning_rate": 0.00032732958709992674, - "loss": 0.4084, - "step": 141900 - }, - { - "epoch": 34.63, - "learning_rate": 0.00032729904715367704, - "loss": 0.3796, - "step": 141925 - }, - { - "epoch": 34.64, - "learning_rate": 0.00032726850720742734, - "loss": 0.3774, - "step": 141950 - }, - { - "epoch": 34.64, - "learning_rate": 0.0003272379672611776, - "loss": 0.348, - "step": 141975 - }, - { - "epoch": 34.65, - "learning_rate": 0.0003272074273149279, - "loss": 0.3722, - "step": 142000 - }, - { - "epoch": 34.66, - "learning_rate": 0.00032717688736867825, - "loss": 0.378, - "step": 142025 - }, - { - "epoch": 34.66, - "learning_rate": 0.00032714634742242856, - "loss": 0.3905, - "step": 142050 - }, - { - "epoch": 34.67, - "learning_rate": 0.00032711580747617886, - "loss": 0.3589, - "step": 142075 - }, - { - "epoch": 34.68, - "learning_rate": 0.00032708526752992916, - "loss": 0.3792, - "step": 142100 - }, - { - "epoch": 34.68, - "learning_rate": 0.0003270547275836794, - "loss": 0.3419, - "step": 142125 - }, - { - "epoch": 34.69, - "learning_rate": 0.00032702418763742977, - "loss": 0.3986, - "step": 142150 - }, - { - "epoch": 34.69, - "learning_rate": 0.00032699364769118007, - "loss": 0.3673, - "step": 142175 - }, - { - "epoch": 34.7, - "learning_rate": 0.0003269631077449304, - "loss": 0.3795, - "step": 142200 - }, - { - "epoch": 34.71, - "learning_rate": 0.0003269325677986807, - "loss": 0.3767, - "step": 142225 - }, - { - "epoch": 34.71, - "learning_rate": 0.000326902027852431, - "loss": 0.3885, - "step": 142250 - }, - { - "epoch": 34.72, - "learning_rate": 0.00032687148790618134, - "loss": 0.3423, - "step": 142275 - }, - { - "epoch": 34.72, - "learning_rate": 0.0003268409479599316, - "loss": 0.3885, - "step": 142300 - }, - { - "epoch": 34.73, - "learning_rate": 0.0003268104080136819, - "loss": 0.358, - "step": 142325 - }, - { - "epoch": 34.74, - "learning_rate": 0.0003267798680674322, - "loss": 0.4137, - "step": 142350 - }, - { - "epoch": 34.74, - "learning_rate": 0.0003267493281211825, - "loss": 0.3775, - "step": 142375 - }, - { - "epoch": 34.75, - "learning_rate": 0.00032671878817493286, - "loss": 0.4135, - "step": 142400 - }, - { - "epoch": 34.75, - "learning_rate": 0.00032668824822868316, - "loss": 0.3023, - "step": 142425 - }, - { - "epoch": 34.76, - "learning_rate": 0.0003266577082824334, - "loss": 0.4136, - "step": 142450 - }, - { - "epoch": 34.77, - "learning_rate": 0.0003266271683361837, - "loss": 0.3392, - "step": 142475 - }, - { - "epoch": 34.77, - "learning_rate": 0.000326596628389934, - "loss": 0.3892, - "step": 142500 - }, - { - "epoch": 34.78, - "learning_rate": 0.0003265660884436844, - "loss": 0.3577, - "step": 142525 - }, - { - "epoch": 34.79, - "learning_rate": 0.0003265355484974347, - "loss": 0.3798, - "step": 142550 - }, - { - "epoch": 34.79, - "learning_rate": 0.000326505008551185, - "loss": 0.3573, - "step": 142575 - }, - { - "epoch": 34.8, - "learning_rate": 0.00032647446860493523, - "loss": 0.3979, - "step": 142600 - }, - { - "epoch": 34.8, - "learning_rate": 0.00032644392865868553, - "loss": 0.3441, - "step": 142625 - }, - { - "epoch": 34.81, - "learning_rate": 0.0003264133887124359, - "loss": 0.3925, - "step": 142650 - }, - { - "epoch": 34.82, - "learning_rate": 0.0003263828487661862, - "loss": 0.3467, - "step": 142675 - }, - { - "epoch": 34.82, - "learning_rate": 0.0003263523088199365, - "loss": 0.3999, - "step": 142700 - }, - { - "epoch": 34.83, - "learning_rate": 0.0003263217688736868, - "loss": 0.3628, - "step": 142725 - }, - { - "epoch": 34.83, - "learning_rate": 0.00032629122892743705, - "loss": 0.4295, - "step": 142750 - }, - { - "epoch": 34.84, - "learning_rate": 0.0003262606889811874, - "loss": 0.3707, - "step": 142775 - }, - { - "epoch": 34.85, - "learning_rate": 0.0003262301490349377, - "loss": 0.4188, - "step": 142800 - }, - { - "epoch": 34.85, - "learning_rate": 0.000326199609088688, - "loss": 0.4034, - "step": 142825 - }, - { - "epoch": 34.86, - "learning_rate": 0.0003261690691424383, - "loss": 0.3764, - "step": 142850 - }, - { - "epoch": 34.86, - "learning_rate": 0.0003261385291961886, - "loss": 0.3556, - "step": 142875 - }, - { - "epoch": 34.87, - "learning_rate": 0.000326107989249939, - "loss": 0.3941, - "step": 142900 - }, - { - "epoch": 34.88, - "learning_rate": 0.0003260774493036892, - "loss": 0.3578, - "step": 142925 - }, - { - "epoch": 34.88, - "learning_rate": 0.00032604690935743953, - "loss": 0.3759, - "step": 142950 - }, - { - "epoch": 34.89, - "learning_rate": 0.00032601636941118983, - "loss": 0.3667, - "step": 142975 - }, - { - "epoch": 34.9, - "learning_rate": 0.00032598582946494014, - "loss": 0.3712, - "step": 143000 - }, - { - "epoch": 34.9, - "learning_rate": 0.0003259552895186905, - "loss": 0.3266, - "step": 143025 - }, - { - "epoch": 34.91, - "learning_rate": 0.0003259247495724408, - "loss": 0.4101, - "step": 143050 - }, - { - "epoch": 34.91, - "learning_rate": 0.00032589420962619105, - "loss": 0.3533, - "step": 143075 - }, - { - "epoch": 34.92, - "learning_rate": 0.00032586366967994135, - "loss": 0.4007, - "step": 143100 - }, - { - "epoch": 34.93, - "learning_rate": 0.00032583312973369165, - "loss": 0.3463, - "step": 143125 - }, - { - "epoch": 34.93, - "learning_rate": 0.00032580258978744196, - "loss": 0.4053, - "step": 143150 - }, - { - "epoch": 34.94, - "learning_rate": 0.0003257720498411923, - "loss": 0.3764, - "step": 143175 - }, - { - "epoch": 34.94, - "learning_rate": 0.0003257415098949426, - "loss": 0.3746, - "step": 143200 - }, - { - "epoch": 34.95, - "learning_rate": 0.00032571096994869287, - "loss": 0.3566, - "step": 143225 - }, - { - "epoch": 34.96, - "learning_rate": 0.00032568043000244317, - "loss": 0.3725, - "step": 143250 - }, - { - "epoch": 34.96, - "learning_rate": 0.0003256498900561935, - "loss": 0.3446, - "step": 143275 - }, - { - "epoch": 34.97, - "learning_rate": 0.00032561935010994383, - "loss": 0.395, - "step": 143300 - }, - { - "epoch": 34.97, - "learning_rate": 0.00032558881016369413, - "loss": 0.3806, - "step": 143325 - }, - { - "epoch": 34.98, - "learning_rate": 0.00032555827021744444, - "loss": 0.4025, - "step": 143350 - }, - { - "epoch": 34.99, - "learning_rate": 0.00032552773027119474, - "loss": 0.3337, - "step": 143375 - }, - { - "epoch": 34.99, - "learning_rate": 0.000325497190324945, - "loss": 0.3959, - "step": 143400 - }, - { - "epoch": 35.0, - "learning_rate": 0.00032546665037869535, - "loss": 0.3356, - "step": 143425 - }, - { - "epoch": 35.0, - "learning_rate": 0.00032543611043244565, - "loss": 0.3593, - "step": 143450 - }, - { - "epoch": 35.01, - "learning_rate": 0.00032540557048619595, - "loss": 0.3414, - "step": 143475 - }, - { - "epoch": 35.02, - "learning_rate": 0.00032537503053994626, - "loss": 0.3893, - "step": 143500 - }, - { - "epoch": 35.02, - "learning_rate": 0.00032534449059369656, - "loss": 0.3779, - "step": 143525 - }, - { - "epoch": 35.03, - "learning_rate": 0.00032531395064744686, - "loss": 0.3826, - "step": 143550 - }, - { - "epoch": 35.04, - "learning_rate": 0.00032528341070119717, - "loss": 0.3229, - "step": 143575 - }, - { - "epoch": 35.04, - "learning_rate": 0.00032525287075494747, - "loss": 0.3747, - "step": 143600 - }, - { - "epoch": 35.05, - "learning_rate": 0.0003252223308086978, - "loss": 0.3863, - "step": 143625 - }, - { - "epoch": 35.05, - "learning_rate": 0.0003251917908624481, - "loss": 0.3804, - "step": 143650 - }, - { - "epoch": 35.06, - "learning_rate": 0.00032516125091619844, - "loss": 0.3068, - "step": 143675 - }, - { - "epoch": 35.07, - "learning_rate": 0.0003251307109699487, - "loss": 0.3687, - "step": 143700 - }, - { - "epoch": 35.07, - "learning_rate": 0.000325100171023699, - "loss": 0.3628, - "step": 143725 - }, - { - "epoch": 35.08, - "learning_rate": 0.0003250696310774493, - "loss": 0.3683, - "step": 143750 - }, - { - "epoch": 35.08, - "learning_rate": 0.0003250390911311996, - "loss": 0.3492, - "step": 143775 - }, - { - "epoch": 35.09, - "learning_rate": 0.00032500855118494995, - "loss": 0.3791, - "step": 143800 - }, - { - "epoch": 35.1, - "learning_rate": 0.00032497801123870026, - "loss": 0.3718, - "step": 143825 - }, - { - "epoch": 35.1, - "learning_rate": 0.00032494747129245056, - "loss": 0.4213, - "step": 143850 - }, - { - "epoch": 35.11, - "learning_rate": 0.0003249169313462008, - "loss": 0.3575, - "step": 143875 - }, - { - "epoch": 35.11, - "learning_rate": 0.0003248863913999511, - "loss": 0.3555, - "step": 143900 - }, - { - "epoch": 35.12, - "learning_rate": 0.00032485585145370147, - "loss": 0.3463, - "step": 143925 - }, - { - "epoch": 35.13, - "learning_rate": 0.00032482531150745177, - "loss": 0.3952, - "step": 143950 - }, - { - "epoch": 35.13, - "learning_rate": 0.0003247947715612021, - "loss": 0.3151, - "step": 143975 - }, - { - "epoch": 35.14, - "learning_rate": 0.0003247642316149524, - "loss": 0.4055, - "step": 144000 - }, - { - "epoch": 35.14, - "eval_cer": 0.09494574089093766, - "eval_loss": 0.39560216665267944, - "eval_runtime": 149.4692, - "eval_samples_per_second": 28.053, - "eval_steps_per_second": 7.018, - "eval_wer": 0.38818923327895594, - "step": 144000 - }, - { - "epoch": 35.15, - "learning_rate": 0.00032473369166870263, - "loss": 0.3437, - "step": 144025 - }, - { - "epoch": 35.15, - "learning_rate": 0.000324703151722453, - "loss": 0.3985, - "step": 144050 - }, - { - "epoch": 35.16, - "learning_rate": 0.0003246726117762033, - "loss": 0.338, - "step": 144075 - }, - { - "epoch": 35.16, - "learning_rate": 0.0003246420718299536, - "loss": 0.4219, - "step": 144100 - }, - { - "epoch": 35.17, - "learning_rate": 0.0003246115318837039, - "loss": 0.3662, - "step": 144125 - }, - { - "epoch": 35.18, - "learning_rate": 0.0003245809919374542, - "loss": 0.3914, - "step": 144150 - }, - { - "epoch": 35.18, - "learning_rate": 0.0003245504519912045, - "loss": 0.3389, - "step": 144175 - }, - { - "epoch": 35.19, - "learning_rate": 0.0003245199120449548, - "loss": 0.3745, - "step": 144200 - }, - { - "epoch": 35.19, - "learning_rate": 0.0003244893720987051, - "loss": 0.3361, - "step": 144225 - }, - { - "epoch": 35.2, - "learning_rate": 0.0003244588321524554, - "loss": 0.4224, - "step": 144250 - }, - { - "epoch": 35.21, - "learning_rate": 0.0003244295138040557, - "loss": 0.3588, - "step": 144275 - }, - { - "epoch": 35.21, - "learning_rate": 0.000324398973857806, - "loss": 0.3742, - "step": 144300 - }, - { - "epoch": 35.22, - "learning_rate": 0.0003243684339115563, - "loss": 0.3108, - "step": 144325 - }, - { - "epoch": 35.22, - "learning_rate": 0.00032433789396530663, - "loss": 0.3738, - "step": 144350 - }, - { - "epoch": 35.23, - "learning_rate": 0.00032430735401905693, - "loss": 0.3379, - "step": 144375 - }, - { - "epoch": 35.24, - "learning_rate": 0.00032427681407280724, - "loss": 0.3941, - "step": 144400 - }, - { - "epoch": 35.24, - "learning_rate": 0.00032424627412655754, - "loss": 0.3378, - "step": 144425 - }, - { - "epoch": 35.25, - "learning_rate": 0.00032421573418030784, - "loss": 0.4398, - "step": 144450 - }, - { - "epoch": 35.26, - "learning_rate": 0.0003241851942340582, - "loss": 0.3265, - "step": 144475 - }, - { - "epoch": 35.26, - "learning_rate": 0.00032415465428780845, - "loss": 0.402, - "step": 144500 - }, - { - "epoch": 35.27, - "learning_rate": 0.00032412411434155875, - "loss": 0.3512, - "step": 144525 - }, - { - "epoch": 35.27, - "learning_rate": 0.00032409357439530906, - "loss": 0.434, - "step": 144550 - }, - { - "epoch": 35.28, - "learning_rate": 0.00032406303444905936, - "loss": 0.3559, - "step": 144575 - }, - { - "epoch": 35.29, - "learning_rate": 0.0003240324945028097, - "loss": 0.3925, - "step": 144600 - }, - { - "epoch": 35.29, - "learning_rate": 0.00032400195455656, - "loss": 0.3415, - "step": 144625 - }, - { - "epoch": 35.3, - "learning_rate": 0.00032397141461031027, - "loss": 0.4035, - "step": 144650 - }, - { - "epoch": 35.3, - "learning_rate": 0.00032394087466406057, - "loss": 0.3086, - "step": 144675 - }, - { - "epoch": 35.31, - "learning_rate": 0.0003239103347178109, - "loss": 0.3642, - "step": 144700 - }, - { - "epoch": 35.32, - "learning_rate": 0.00032387979477156123, - "loss": 0.3991, - "step": 144725 - }, - { - "epoch": 35.32, - "learning_rate": 0.00032384925482531154, - "loss": 0.4157, - "step": 144750 - }, - { - "epoch": 35.33, - "learning_rate": 0.00032381871487906184, - "loss": 0.3541, - "step": 144775 - }, - { - "epoch": 35.33, - "learning_rate": 0.00032378817493281214, - "loss": 0.3786, - "step": 144800 - }, - { - "epoch": 35.34, - "learning_rate": 0.0003237576349865624, - "loss": 0.327, - "step": 144825 - }, - { - "epoch": 35.35, - "learning_rate": 0.00032372709504031275, - "loss": 0.3758, - "step": 144850 - }, - { - "epoch": 35.35, - "learning_rate": 0.00032369655509406305, - "loss": 0.3576, - "step": 144875 - }, - { - "epoch": 35.36, - "learning_rate": 0.00032366601514781336, - "loss": 0.3495, - "step": 144900 - }, - { - "epoch": 35.36, - "learning_rate": 0.00032363547520156366, - "loss": 0.3452, - "step": 144925 - }, - { - "epoch": 35.37, - "learning_rate": 0.00032360493525531396, - "loss": 0.3905, - "step": 144950 - }, - { - "epoch": 35.38, - "learning_rate": 0.00032357439530906427, - "loss": 0.3453, - "step": 144975 - }, - { - "epoch": 35.38, - "learning_rate": 0.00032354385536281457, - "loss": 0.3825, - "step": 145000 - }, - { - "epoch": 35.39, - "learning_rate": 0.0003235133154165649, - "loss": 0.3431, - "step": 145025 - }, - { - "epoch": 35.4, - "learning_rate": 0.0003234827754703152, - "loss": 0.3646, - "step": 145050 - }, - { - "epoch": 35.4, - "learning_rate": 0.0003234522355240655, - "loss": 0.3521, - "step": 145075 - }, - { - "epoch": 35.41, - "learning_rate": 0.00032342169557781584, - "loss": 0.3978, - "step": 145100 - }, - { - "epoch": 35.41, - "learning_rate": 0.0003233911556315661, - "loss": 0.3244, - "step": 145125 - }, - { - "epoch": 35.42, - "learning_rate": 0.0003233606156853164, - "loss": 0.3913, - "step": 145150 - }, - { - "epoch": 35.43, - "learning_rate": 0.0003233300757390667, - "loss": 0.3628, - "step": 145175 - }, - { - "epoch": 35.43, - "learning_rate": 0.000323299535792817, - "loss": 0.3918, - "step": 145200 - }, - { - "epoch": 35.44, - "learning_rate": 0.0003232689958465673, - "loss": 0.3509, - "step": 145225 - }, - { - "epoch": 35.44, - "learning_rate": 0.00032323845590031766, - "loss": 0.3958, - "step": 145250 - }, - { - "epoch": 35.45, - "learning_rate": 0.00032320791595406796, - "loss": 0.3478, - "step": 145275 - }, - { - "epoch": 35.46, - "learning_rate": 0.0003231773760078182, - "loss": 0.4068, - "step": 145300 - }, - { - "epoch": 35.46, - "learning_rate": 0.0003231468360615685, - "loss": 0.3665, - "step": 145325 - }, - { - "epoch": 35.47, - "learning_rate": 0.0003231162961153188, - "loss": 0.4198, - "step": 145350 - }, - { - "epoch": 35.47, - "learning_rate": 0.0003230857561690692, - "loss": 0.3439, - "step": 145375 - }, - { - "epoch": 35.48, - "learning_rate": 0.0003230552162228195, - "loss": 0.377, - "step": 145400 - }, - { - "epoch": 35.49, - "learning_rate": 0.0003230246762765698, - "loss": 0.362, - "step": 145425 - }, - { - "epoch": 35.49, - "learning_rate": 0.00032299413633032003, - "loss": 0.415, - "step": 145450 - }, - { - "epoch": 35.5, - "learning_rate": 0.00032296359638407033, - "loss": 0.3535, - "step": 145475 - }, - { - "epoch": 35.51, - "learning_rate": 0.0003229330564378207, - "loss": 0.4043, - "step": 145500 - }, - { - "epoch": 35.51, - "learning_rate": 0.000322902516491571, - "loss": 0.326, - "step": 145525 - }, - { - "epoch": 35.52, - "learning_rate": 0.0003228719765453213, - "loss": 0.385, - "step": 145550 - }, - { - "epoch": 35.52, - "learning_rate": 0.0003228414365990716, - "loss": 0.3811, - "step": 145575 - }, - { - "epoch": 35.53, - "learning_rate": 0.00032281089665282185, - "loss": 0.3609, - "step": 145600 - }, - { - "epoch": 35.54, - "learning_rate": 0.0003227803567065722, - "loss": 0.357, - "step": 145625 - }, - { - "epoch": 35.54, - "learning_rate": 0.0003227498167603225, - "loss": 0.3908, - "step": 145650 - }, - { - "epoch": 35.55, - "learning_rate": 0.0003227192768140728, - "loss": 0.3159, - "step": 145675 - }, - { - "epoch": 35.55, - "learning_rate": 0.0003226887368678231, - "loss": 0.3898, - "step": 145700 - }, - { - "epoch": 35.56, - "learning_rate": 0.0003226581969215734, - "loss": 0.3226, - "step": 145725 - }, - { - "epoch": 35.57, - "learning_rate": 0.0003226276569753238, - "loss": 0.3833, - "step": 145750 - }, - { - "epoch": 35.57, - "learning_rate": 0.00032259711702907403, - "loss": 0.3699, - "step": 145775 - }, - { - "epoch": 35.58, - "learning_rate": 0.00032256657708282433, - "loss": 0.3777, - "step": 145800 - }, - { - "epoch": 35.58, - "learning_rate": 0.00032253603713657463, - "loss": 0.3697, - "step": 145825 - }, - { - "epoch": 35.59, - "learning_rate": 0.00032250549719032494, - "loss": 0.3952, - "step": 145850 - }, - { - "epoch": 35.6, - "learning_rate": 0.0003224749572440753, - "loss": 0.323, - "step": 145875 - }, - { - "epoch": 35.6, - "learning_rate": 0.0003224444172978256, - "loss": 0.3817, - "step": 145900 - }, - { - "epoch": 35.61, - "learning_rate": 0.00032241387735157585, - "loss": 0.3693, - "step": 145925 - }, - { - "epoch": 35.61, - "learning_rate": 0.00032238333740532615, - "loss": 0.3745, - "step": 145950 - }, - { - "epoch": 35.62, - "learning_rate": 0.00032235279745907645, - "loss": 0.3209, - "step": 145975 - }, - { - "epoch": 35.63, - "learning_rate": 0.00032232347911067676, - "loss": 0.3896, - "step": 146000 - }, - { - "epoch": 35.63, - "learning_rate": 0.00032229293916442706, - "loss": 0.3541, - "step": 146025 - }, - { - "epoch": 35.64, - "learning_rate": 0.0003222623992181774, - "loss": 0.3982, - "step": 146050 - }, - { - "epoch": 35.65, - "learning_rate": 0.00032223185927192767, - "loss": 0.3498, - "step": 146075 - }, - { - "epoch": 35.65, - "learning_rate": 0.000322201319325678, - "loss": 0.405, - "step": 146100 - }, - { - "epoch": 35.66, - "learning_rate": 0.0003221707793794283, - "loss": 0.3542, - "step": 146125 - }, - { - "epoch": 35.66, - "learning_rate": 0.0003221402394331786, - "loss": 0.4302, - "step": 146150 - }, - { - "epoch": 35.67, - "learning_rate": 0.00032210969948692894, - "loss": 0.3272, - "step": 146175 - }, - { - "epoch": 35.68, - "learning_rate": 0.00032207915954067924, - "loss": 0.3888, - "step": 146200 - }, - { - "epoch": 35.68, - "learning_rate": 0.00032204861959442955, - "loss": 0.394, - "step": 146225 - }, - { - "epoch": 35.69, - "learning_rate": 0.0003220180796481798, - "loss": 0.3891, - "step": 146250 - }, - { - "epoch": 35.69, - "learning_rate": 0.0003219875397019301, - "loss": 0.3566, - "step": 146275 - }, - { - "epoch": 35.7, - "learning_rate": 0.00032195699975568046, - "loss": 0.3858, - "step": 146300 - }, - { - "epoch": 35.71, - "learning_rate": 0.00032192645980943076, - "loss": 0.3621, - "step": 146325 - }, - { - "epoch": 35.71, - "learning_rate": 0.00032189591986318106, - "loss": 0.4315, - "step": 146350 - }, - { - "epoch": 35.72, - "learning_rate": 0.00032186537991693137, - "loss": 0.3582, - "step": 146375 - }, - { - "epoch": 35.72, - "learning_rate": 0.0003218348399706816, - "loss": 0.4036, - "step": 146400 - }, - { - "epoch": 35.73, - "learning_rate": 0.00032180430002443197, - "loss": 0.3515, - "step": 146425 - }, - { - "epoch": 35.74, - "learning_rate": 0.0003217737600781823, - "loss": 0.4004, - "step": 146450 - }, - { - "epoch": 35.74, - "learning_rate": 0.0003217432201319326, - "loss": 0.3602, - "step": 146475 - }, - { - "epoch": 35.75, - "learning_rate": 0.0003217126801856829, - "loss": 0.3917, - "step": 146500 - }, - { - "epoch": 35.76, - "learning_rate": 0.0003216821402394332, - "loss": 0.3357, - "step": 146525 - }, - { - "epoch": 35.76, - "learning_rate": 0.0003216516002931835, - "loss": 0.4125, - "step": 146550 - }, - { - "epoch": 35.77, - "learning_rate": 0.0003216210603469338, - "loss": 0.3342, - "step": 146575 - }, - { - "epoch": 35.77, - "learning_rate": 0.0003215905204006841, - "loss": 0.367, - "step": 146600 - }, - { - "epoch": 35.78, - "learning_rate": 0.0003215599804544344, - "loss": 0.3721, - "step": 146625 - }, - { - "epoch": 35.79, - "learning_rate": 0.0003215294405081847, - "loss": 0.387, - "step": 146650 - }, - { - "epoch": 35.79, - "learning_rate": 0.00032149890056193506, - "loss": 0.3573, - "step": 146675 - }, - { - "epoch": 35.8, - "learning_rate": 0.0003214683606156853, - "loss": 0.373, - "step": 146700 - }, - { - "epoch": 35.8, - "learning_rate": 0.0003214378206694356, - "loss": 0.3215, - "step": 146725 - }, - { - "epoch": 35.81, - "learning_rate": 0.0003214072807231859, - "loss": 0.3953, - "step": 146750 - }, - { - "epoch": 35.82, - "learning_rate": 0.0003213767407769362, - "loss": 0.3182, - "step": 146775 - }, - { - "epoch": 35.82, - "learning_rate": 0.0003213462008306866, - "loss": 0.4039, - "step": 146800 - }, - { - "epoch": 35.83, - "learning_rate": 0.0003213156608844369, - "loss": 0.3126, - "step": 146825 - }, - { - "epoch": 35.83, - "learning_rate": 0.0003212851209381872, - "loss": 0.3938, - "step": 146850 - }, - { - "epoch": 35.84, - "learning_rate": 0.00032125458099193743, - "loss": 0.3636, - "step": 146875 - }, - { - "epoch": 35.85, - "learning_rate": 0.00032122404104568774, - "loss": 0.3621, - "step": 146900 - }, - { - "epoch": 35.85, - "learning_rate": 0.0003211935010994381, - "loss": 0.3415, - "step": 146925 - }, - { - "epoch": 35.86, - "learning_rate": 0.0003211629611531884, - "loss": 0.4049, - "step": 146950 - }, - { - "epoch": 35.87, - "learning_rate": 0.0003211324212069387, - "loss": 0.2868, - "step": 146975 - }, - { - "epoch": 35.87, - "learning_rate": 0.000321101881260689, - "loss": 0.3831, - "step": 147000 - }, - { - "epoch": 35.87, - "eval_cer": 0.09333901419874131, - "eval_loss": 0.3962480425834656, - "eval_runtime": 148.6843, - "eval_samples_per_second": 28.201, - "eval_steps_per_second": 7.055, - "eval_wer": 0.3842414355628059, - "step": 147000 - }, - { - "epoch": 35.88, - "learning_rate": 0.00032107134131443925, - "loss": 0.3714, - "step": 147025 - }, - { - "epoch": 35.88, - "learning_rate": 0.0003210408013681896, - "loss": 0.4221, - "step": 147050 - }, - { - "epoch": 35.89, - "learning_rate": 0.0003210102614219399, - "loss": 0.3564, - "step": 147075 - }, - { - "epoch": 35.9, - "learning_rate": 0.0003209797214756902, - "loss": 0.398, - "step": 147100 - }, - { - "epoch": 35.9, - "learning_rate": 0.0003209491815294405, - "loss": 0.3744, - "step": 147125 - }, - { - "epoch": 35.91, - "learning_rate": 0.0003209186415831908, - "loss": 0.3761, - "step": 147150 - }, - { - "epoch": 35.91, - "learning_rate": 0.00032088810163694107, - "loss": 0.3845, - "step": 147175 - }, - { - "epoch": 35.92, - "learning_rate": 0.00032085756169069143, - "loss": 0.4164, - "step": 147200 - }, - { - "epoch": 35.93, - "learning_rate": 0.00032082702174444173, - "loss": 0.3672, - "step": 147225 - }, - { - "epoch": 35.93, - "learning_rate": 0.00032079648179819204, - "loss": 0.3552, - "step": 147250 - }, - { - "epoch": 35.94, - "learning_rate": 0.00032076594185194234, - "loss": 0.3435, - "step": 147275 - }, - { - "epoch": 35.94, - "learning_rate": 0.00032073540190569264, - "loss": 0.3759, - "step": 147300 - }, - { - "epoch": 35.95, - "learning_rate": 0.000320704861959443, - "loss": 0.3765, - "step": 147325 - }, - { - "epoch": 35.96, - "learning_rate": 0.00032067432201319325, - "loss": 0.3909, - "step": 147350 - }, - { - "epoch": 35.96, - "learning_rate": 0.00032064378206694355, - "loss": 0.3515, - "step": 147375 - }, - { - "epoch": 35.97, - "learning_rate": 0.00032061324212069386, - "loss": 0.3989, - "step": 147400 - }, - { - "epoch": 35.97, - "learning_rate": 0.00032058270217444416, - "loss": 0.3365, - "step": 147425 - }, - { - "epoch": 35.98, - "learning_rate": 0.0003205521622281945, - "loss": 0.3786, - "step": 147450 - }, - { - "epoch": 35.99, - "learning_rate": 0.0003205216222819448, - "loss": 0.3397, - "step": 147475 - }, - { - "epoch": 35.99, - "learning_rate": 0.00032049108233569507, - "loss": 0.3643, - "step": 147500 - }, - { - "epoch": 36.0, - "learning_rate": 0.0003204605423894454, - "loss": 0.4007, - "step": 147525 - }, - { - "epoch": 36.01, - "learning_rate": 0.0003204300024431957, - "loss": 0.3823, - "step": 147550 - }, - { - "epoch": 36.01, - "learning_rate": 0.00032039946249694603, - "loss": 0.329, - "step": 147575 - }, - { - "epoch": 36.02, - "learning_rate": 0.00032036892255069634, - "loss": 0.383, - "step": 147600 - }, - { - "epoch": 36.02, - "learning_rate": 0.00032033838260444664, - "loss": 0.3285, - "step": 147625 - }, - { - "epoch": 36.03, - "learning_rate": 0.0003203078426581969, - "loss": 0.3687, - "step": 147650 - }, - { - "epoch": 36.04, - "learning_rate": 0.0003202773027119472, - "loss": 0.3371, - "step": 147675 - }, - { - "epoch": 36.04, - "learning_rate": 0.00032024676276569755, - "loss": 0.3651, - "step": 147700 - }, - { - "epoch": 36.05, - "learning_rate": 0.00032021622281944785, - "loss": 0.3373, - "step": 147725 - }, - { - "epoch": 36.05, - "learning_rate": 0.00032018568287319816, - "loss": 0.3969, - "step": 147750 - }, - { - "epoch": 36.06, - "learning_rate": 0.00032015514292694846, - "loss": 0.3296, - "step": 147775 - }, - { - "epoch": 36.07, - "learning_rate": 0.00032012460298069876, - "loss": 0.378, - "step": 147800 - }, - { - "epoch": 36.07, - "learning_rate": 0.00032009406303444907, - "loss": 0.3491, - "step": 147825 - }, - { - "epoch": 36.08, - "learning_rate": 0.00032006352308819937, - "loss": 0.3889, - "step": 147850 - }, - { - "epoch": 36.08, - "learning_rate": 0.0003200329831419497, - "loss": 0.3165, - "step": 147875 - }, - { - "epoch": 36.09, - "learning_rate": 0.0003200024431957, - "loss": 0.3961, - "step": 147900 - }, - { - "epoch": 36.1, - "learning_rate": 0.0003199719032494503, - "loss": 0.3166, - "step": 147925 - }, - { - "epoch": 36.1, - "learning_rate": 0.00031994136330320064, - "loss": 0.3755, - "step": 147950 - }, - { - "epoch": 36.11, - "learning_rate": 0.0003199108233569509, - "loss": 0.3135, - "step": 147975 - }, - { - "epoch": 36.12, - "learning_rate": 0.0003198802834107012, - "loss": 0.3744, - "step": 148000 - }, - { - "epoch": 36.12, - "learning_rate": 0.0003198497434644515, - "loss": 0.3229, - "step": 148025 - }, - { - "epoch": 36.13, - "learning_rate": 0.0003198192035182018, - "loss": 0.3819, - "step": 148050 - }, - { - "epoch": 36.13, - "learning_rate": 0.00031978866357195216, - "loss": 0.3388, - "step": 148075 - }, - { - "epoch": 36.14, - "learning_rate": 0.00031975812362570246, - "loss": 0.3758, - "step": 148100 - }, - { - "epoch": 36.15, - "learning_rate": 0.0003197275836794527, - "loss": 0.3504, - "step": 148125 - }, - { - "epoch": 36.15, - "learning_rate": 0.000319697043733203, - "loss": 0.3758, - "step": 148150 - }, - { - "epoch": 36.16, - "learning_rate": 0.0003196665037869533, - "loss": 0.3839, - "step": 148175 - }, - { - "epoch": 36.16, - "learning_rate": 0.00031963596384070367, - "loss": 0.3664, - "step": 148200 - }, - { - "epoch": 36.17, - "learning_rate": 0.000319605423894454, - "loss": 0.3364, - "step": 148225 - }, - { - "epoch": 36.18, - "learning_rate": 0.0003195748839482043, - "loss": 0.3849, - "step": 148250 - }, - { - "epoch": 36.18, - "learning_rate": 0.0003195443440019546, - "loss": 0.3492, - "step": 148275 - }, - { - "epoch": 36.19, - "learning_rate": 0.00031951380405570483, - "loss": 0.3773, - "step": 148300 - }, - { - "epoch": 36.19, - "learning_rate": 0.0003194832641094552, - "loss": 0.3099, - "step": 148325 - }, - { - "epoch": 36.2, - "learning_rate": 0.0003194527241632055, - "loss": 0.3811, - "step": 148350 - }, - { - "epoch": 36.21, - "learning_rate": 0.0003194221842169558, - "loss": 0.3234, - "step": 148375 - }, - { - "epoch": 36.21, - "learning_rate": 0.0003193916442707061, - "loss": 0.4036, - "step": 148400 - }, - { - "epoch": 36.22, - "learning_rate": 0.0003193611043244564, - "loss": 0.2925, - "step": 148425 - }, - { - "epoch": 36.22, - "learning_rate": 0.00031933056437820665, - "loss": 0.3937, - "step": 148450 - }, - { - "epoch": 36.23, - "learning_rate": 0.000319300024431957, - "loss": 0.3269, - "step": 148475 - }, - { - "epoch": 36.24, - "learning_rate": 0.0003192694844857073, - "loss": 0.3872, - "step": 148500 - }, - { - "epoch": 36.24, - "learning_rate": 0.0003192389445394576, - "loss": 0.3289, - "step": 148525 - }, - { - "epoch": 36.25, - "learning_rate": 0.0003192084045932079, - "loss": 0.3613, - "step": 148550 - }, - { - "epoch": 36.26, - "learning_rate": 0.0003191778646469582, - "loss": 0.3232, - "step": 148575 - }, - { - "epoch": 36.26, - "learning_rate": 0.0003191473247007085, - "loss": 0.3684, - "step": 148600 - }, - { - "epoch": 36.27, - "learning_rate": 0.00031911678475445883, - "loss": 0.3468, - "step": 148625 - }, - { - "epoch": 36.27, - "learning_rate": 0.00031908624480820913, - "loss": 0.385, - "step": 148650 - }, - { - "epoch": 36.28, - "learning_rate": 0.00031905570486195944, - "loss": 0.3279, - "step": 148675 - }, - { - "epoch": 36.29, - "learning_rate": 0.00031902516491570974, - "loss": 0.3795, - "step": 148700 - }, - { - "epoch": 36.29, - "learning_rate": 0.0003189946249694601, - "loss": 0.3429, - "step": 148725 - }, - { - "epoch": 36.3, - "learning_rate": 0.0003189640850232104, - "loss": 0.3697, - "step": 148750 - }, - { - "epoch": 36.3, - "learning_rate": 0.00031893354507696065, - "loss": 0.3696, - "step": 148775 - }, - { - "epoch": 36.31, - "learning_rate": 0.00031890300513071095, - "loss": 0.3479, - "step": 148800 - }, - { - "epoch": 36.32, - "learning_rate": 0.00031887246518446126, - "loss": 0.3308, - "step": 148825 - }, - { - "epoch": 36.32, - "learning_rate": 0.0003188419252382116, - "loss": 0.3699, - "step": 148850 - }, - { - "epoch": 36.33, - "learning_rate": 0.0003188113852919619, - "loss": 0.3258, - "step": 148875 - }, - { - "epoch": 36.33, - "learning_rate": 0.0003187808453457122, - "loss": 0.3816, - "step": 148900 - }, - { - "epoch": 36.34, - "learning_rate": 0.00031875030539946247, - "loss": 0.3045, - "step": 148925 - }, - { - "epoch": 36.35, - "learning_rate": 0.00031871976545321277, - "loss": 0.3856, - "step": 148950 - }, - { - "epoch": 36.35, - "learning_rate": 0.00031868922550696313, - "loss": 0.3719, - "step": 148975 - }, - { - "epoch": 36.36, - "learning_rate": 0.00031865868556071343, - "loss": 0.3844, - "step": 149000 - }, - { - "epoch": 36.37, - "learning_rate": 0.00031862814561446374, - "loss": 0.3496, - "step": 149025 - }, - { - "epoch": 36.37, - "learning_rate": 0.00031859760566821404, - "loss": 0.379, - "step": 149050 - }, - { - "epoch": 36.38, - "learning_rate": 0.0003185670657219643, - "loss": 0.3435, - "step": 149075 - }, - { - "epoch": 36.38, - "learning_rate": 0.00031853652577571465, - "loss": 0.3707, - "step": 149100 - }, - { - "epoch": 36.39, - "learning_rate": 0.00031850598582946495, - "loss": 0.3272, - "step": 149125 - }, - { - "epoch": 36.4, - "learning_rate": 0.00031847544588321525, - "loss": 0.3826, - "step": 149150 - }, - { - "epoch": 36.4, - "learning_rate": 0.00031844490593696556, - "loss": 0.3228, - "step": 149175 - }, - { - "epoch": 36.41, - "learning_rate": 0.00031841436599071586, - "loss": 0.3787, - "step": 149200 - }, - { - "epoch": 36.41, - "learning_rate": 0.0003183838260444662, - "loss": 0.3101, - "step": 149225 - }, - { - "epoch": 36.42, - "learning_rate": 0.00031835328609821647, - "loss": 0.3894, - "step": 149250 - }, - { - "epoch": 36.43, - "learning_rate": 0.00031832274615196677, - "loss": 0.3226, - "step": 149275 - }, - { - "epoch": 36.43, - "learning_rate": 0.0003182922062057171, - "loss": 0.3965, - "step": 149300 - }, - { - "epoch": 36.44, - "learning_rate": 0.0003182616662594674, - "loss": 0.3584, - "step": 149325 - }, - { - "epoch": 36.44, - "learning_rate": 0.00031823112631321773, - "loss": 0.402, - "step": 149350 - }, - { - "epoch": 36.45, - "learning_rate": 0.00031820058636696804, - "loss": 0.3279, - "step": 149375 - }, - { - "epoch": 36.46, - "learning_rate": 0.0003181700464207183, - "loss": 0.3963, - "step": 149400 - }, - { - "epoch": 36.46, - "learning_rate": 0.0003181395064744686, - "loss": 0.3839, - "step": 149425 - }, - { - "epoch": 36.47, - "learning_rate": 0.0003181089665282189, - "loss": 0.3805, - "step": 149450 - }, - { - "epoch": 36.48, - "learning_rate": 0.00031807842658196925, - "loss": 0.3281, - "step": 149475 - }, - { - "epoch": 36.48, - "learning_rate": 0.00031804788663571955, - "loss": 0.4039, - "step": 149500 - }, - { - "epoch": 36.49, - "learning_rate": 0.00031801734668946986, - "loss": 0.3571, - "step": 149525 - }, - { - "epoch": 36.49, - "learning_rate": 0.0003179868067432201, - "loss": 0.3404, - "step": 149550 - }, - { - "epoch": 36.5, - "learning_rate": 0.0003179562667969704, - "loss": 0.3561, - "step": 149575 - }, - { - "epoch": 36.51, - "learning_rate": 0.00031792572685072077, - "loss": 0.3672, - "step": 149600 - }, - { - "epoch": 36.51, - "learning_rate": 0.00031789518690447107, - "loss": 0.3173, - "step": 149625 - }, - { - "epoch": 36.52, - "learning_rate": 0.0003178646469582214, - "loss": 0.4015, - "step": 149650 - }, - { - "epoch": 36.52, - "learning_rate": 0.0003178341070119717, - "loss": 0.3559, - "step": 149675 - }, - { - "epoch": 36.53, - "learning_rate": 0.00031780356706572193, - "loss": 0.3795, - "step": 149700 - }, - { - "epoch": 36.54, - "learning_rate": 0.00031777302711947223, - "loss": 0.3588, - "step": 149725 - }, - { - "epoch": 36.54, - "learning_rate": 0.0003177424871732226, - "loss": 0.4294, - "step": 149750 - }, - { - "epoch": 36.55, - "learning_rate": 0.0003177119472269729, - "loss": 0.3245, - "step": 149775 - }, - { - "epoch": 36.55, - "learning_rate": 0.0003176814072807232, - "loss": 0.3661, - "step": 149800 - }, - { - "epoch": 36.56, - "learning_rate": 0.0003176508673344735, - "loss": 0.3169, - "step": 149825 - }, - { - "epoch": 36.57, - "learning_rate": 0.0003176203273882238, - "loss": 0.3811, - "step": 149850 - }, - { - "epoch": 36.57, - "learning_rate": 0.0003175897874419741, - "loss": 0.377, - "step": 149875 - }, - { - "epoch": 36.58, - "learning_rate": 0.0003175592474957244, - "loss": 0.3724, - "step": 149900 - }, - { - "epoch": 36.58, - "learning_rate": 0.0003175287075494747, - "loss": 0.3341, - "step": 149925 - }, - { - "epoch": 36.59, - "learning_rate": 0.000317498167603225, - "loss": 0.3699, - "step": 149950 - }, - { - "epoch": 36.6, - "learning_rate": 0.0003174676276569753, - "loss": 0.3583, - "step": 149975 - }, - { - "epoch": 36.6, - "learning_rate": 0.0003174370877107257, - "loss": 0.408, - "step": 150000 - }, - { - "epoch": 36.6, - "eval_cer": 0.09135242240998737, - "eval_loss": 0.4018867313861847, - "eval_runtime": 149.0214, - "eval_samples_per_second": 28.137, - "eval_steps_per_second": 7.039, - "eval_wer": 0.3780750407830343, - "step": 150000 - }, - { - "epoch": 36.61, - "learning_rate": 0.0003174065477644759, - "loss": 0.3359, - "step": 150025 - }, - { - "epoch": 36.62, - "learning_rate": 0.00031737600781822623, - "loss": 0.3467, - "step": 150050 - }, - { - "epoch": 36.62, - "learning_rate": 0.00031734546787197653, - "loss": 0.3999, - "step": 150075 - }, - { - "epoch": 36.63, - "learning_rate": 0.00031731492792572684, - "loss": 0.3519, - "step": 150100 - }, - { - "epoch": 36.63, - "learning_rate": 0.0003172843879794772, - "loss": 0.3624, - "step": 150125 - }, - { - "epoch": 36.64, - "learning_rate": 0.0003172538480332275, - "loss": 0.4109, - "step": 150150 - }, - { - "epoch": 36.65, - "learning_rate": 0.00031722330808697775, - "loss": 0.3374, - "step": 150175 - }, - { - "epoch": 36.65, - "learning_rate": 0.00031719398973857805, - "loss": 0.4039, - "step": 150200 - }, - { - "epoch": 36.66, - "learning_rate": 0.00031716344979232835, - "loss": 0.3698, - "step": 150225 - }, - { - "epoch": 36.66, - "learning_rate": 0.00031713290984607866, - "loss": 0.3895, - "step": 150250 - }, - { - "epoch": 36.67, - "learning_rate": 0.000317102369899829, - "loss": 0.3492, - "step": 150275 - }, - { - "epoch": 36.68, - "learning_rate": 0.0003170718299535793, - "loss": 0.3893, - "step": 150300 - }, - { - "epoch": 36.68, - "learning_rate": 0.0003170412900073296, - "loss": 0.3069, - "step": 150325 - }, - { - "epoch": 36.69, - "learning_rate": 0.00031701075006107987, - "loss": 0.3858, - "step": 150350 - }, - { - "epoch": 36.69, - "learning_rate": 0.0003169802101148302, - "loss": 0.3083, - "step": 150375 - }, - { - "epoch": 36.7, - "learning_rate": 0.00031694967016858053, - "loss": 0.3714, - "step": 150400 - }, - { - "epoch": 36.71, - "learning_rate": 0.00031691913022233084, - "loss": 0.3288, - "step": 150425 - }, - { - "epoch": 36.71, - "learning_rate": 0.00031688859027608114, - "loss": 0.4096, - "step": 150450 - }, - { - "epoch": 36.72, - "learning_rate": 0.00031685805032983144, - "loss": 0.3209, - "step": 150475 - }, - { - "epoch": 36.73, - "learning_rate": 0.0003168275103835817, - "loss": 0.3546, - "step": 150500 - }, - { - "epoch": 36.73, - "learning_rate": 0.000316796970437332, - "loss": 0.3455, - "step": 150525 - }, - { - "epoch": 36.74, - "learning_rate": 0.00031676643049108235, - "loss": 0.3994, - "step": 150550 - }, - { - "epoch": 36.74, - "learning_rate": 0.00031673589054483266, - "loss": 0.3656, - "step": 150575 - }, - { - "epoch": 36.75, - "learning_rate": 0.00031670535059858296, - "loss": 0.3779, - "step": 150600 - }, - { - "epoch": 36.76, - "learning_rate": 0.00031667481065233326, - "loss": 0.3492, - "step": 150625 - }, - { - "epoch": 36.76, - "learning_rate": 0.0003166442707060835, - "loss": 0.3824, - "step": 150650 - }, - { - "epoch": 36.77, - "learning_rate": 0.00031661373075983387, - "loss": 0.3349, - "step": 150675 - }, - { - "epoch": 36.77, - "learning_rate": 0.00031658319081358417, - "loss": 0.3545, - "step": 150700 - }, - { - "epoch": 36.78, - "learning_rate": 0.0003165526508673345, - "loss": 0.3335, - "step": 150725 - }, - { - "epoch": 36.79, - "learning_rate": 0.0003165221109210848, - "loss": 0.3794, - "step": 150750 - }, - { - "epoch": 36.79, - "learning_rate": 0.0003164915709748351, - "loss": 0.3286, - "step": 150775 - }, - { - "epoch": 36.8, - "learning_rate": 0.00031646103102858544, - "loss": 0.4115, - "step": 150800 - }, - { - "epoch": 36.8, - "learning_rate": 0.0003164304910823357, - "loss": 0.3495, - "step": 150825 - }, - { - "epoch": 36.81, - "learning_rate": 0.000316399951136086, - "loss": 0.3778, - "step": 150850 - }, - { - "epoch": 36.82, - "learning_rate": 0.0003163694111898363, - "loss": 0.3178, - "step": 150875 - }, - { - "epoch": 36.82, - "learning_rate": 0.0003163388712435866, - "loss": 0.3725, - "step": 150900 - }, - { - "epoch": 36.83, - "learning_rate": 0.00031630833129733696, - "loss": 0.324, - "step": 150925 - }, - { - "epoch": 36.84, - "learning_rate": 0.00031627779135108726, - "loss": 0.3948, - "step": 150950 - }, - { - "epoch": 36.84, - "learning_rate": 0.0003162472514048375, - "loss": 0.3707, - "step": 150975 - }, - { - "epoch": 36.85, - "learning_rate": 0.0003162167114585878, - "loss": 0.3868, - "step": 151000 - }, - { - "epoch": 36.85, - "learning_rate": 0.0003161861715123381, - "loss": 0.3439, - "step": 151025 - }, - { - "epoch": 36.86, - "learning_rate": 0.0003161556315660885, - "loss": 0.3855, - "step": 151050 - }, - { - "epoch": 36.87, - "learning_rate": 0.0003161250916198388, - "loss": 0.3445, - "step": 151075 - }, - { - "epoch": 36.87, - "learning_rate": 0.0003160945516735891, - "loss": 0.3752, - "step": 151100 - }, - { - "epoch": 36.88, - "learning_rate": 0.00031606401172733933, - "loss": 0.3755, - "step": 151125 - }, - { - "epoch": 36.88, - "learning_rate": 0.00031603347178108963, - "loss": 0.4136, - "step": 151150 - }, - { - "epoch": 36.89, - "learning_rate": 0.00031600293183484, - "loss": 0.3776, - "step": 151175 - }, - { - "epoch": 36.9, - "learning_rate": 0.0003159723918885903, - "loss": 0.3947, - "step": 151200 - }, - { - "epoch": 36.9, - "learning_rate": 0.0003159418519423406, - "loss": 0.3663, - "step": 151225 - }, - { - "epoch": 36.91, - "learning_rate": 0.0003159113119960909, - "loss": 0.3671, - "step": 151250 - }, - { - "epoch": 36.91, - "learning_rate": 0.0003158807720498412, - "loss": 0.3609, - "step": 151275 - }, - { - "epoch": 36.92, - "learning_rate": 0.0003158502321035915, - "loss": 0.3713, - "step": 151300 - }, - { - "epoch": 36.93, - "learning_rate": 0.0003158196921573418, - "loss": 0.3369, - "step": 151325 - }, - { - "epoch": 36.93, - "learning_rate": 0.0003157891522110921, - "loss": 0.3894, - "step": 151350 - }, - { - "epoch": 36.94, - "learning_rate": 0.0003157586122648424, - "loss": 0.3614, - "step": 151375 - }, - { - "epoch": 36.94, - "learning_rate": 0.0003157280723185927, - "loss": 0.3813, - "step": 151400 - }, - { - "epoch": 36.95, - "learning_rate": 0.0003156975323723431, - "loss": 0.3522, - "step": 151425 - }, - { - "epoch": 36.96, - "learning_rate": 0.00031566699242609333, - "loss": 0.3855, - "step": 151450 - }, - { - "epoch": 36.96, - "learning_rate": 0.00031563645247984363, - "loss": 0.3148, - "step": 151475 - }, - { - "epoch": 36.97, - "learning_rate": 0.00031560591253359393, - "loss": 0.4214, - "step": 151500 - }, - { - "epoch": 36.98, - "learning_rate": 0.00031557537258734424, - "loss": 0.3241, - "step": 151525 - }, - { - "epoch": 36.98, - "learning_rate": 0.0003155448326410946, - "loss": 0.412, - "step": 151550 - }, - { - "epoch": 36.99, - "learning_rate": 0.0003155142926948449, - "loss": 0.397, - "step": 151575 - }, - { - "epoch": 36.99, - "learning_rate": 0.00031548375274859515, - "loss": 0.3947, - "step": 151600 - }, - { - "epoch": 37.0, - "learning_rate": 0.00031545321280234545, - "loss": 0.295, - "step": 151625 - }, - { - "epoch": 37.01, - "learning_rate": 0.00031542267285609575, - "loss": 0.4214, - "step": 151650 - }, - { - "epoch": 37.01, - "learning_rate": 0.0003153921329098461, - "loss": 0.3445, - "step": 151675 - }, - { - "epoch": 37.02, - "learning_rate": 0.0003153615929635964, - "loss": 0.371, - "step": 151700 - }, - { - "epoch": 37.02, - "learning_rate": 0.0003153310530173467, - "loss": 0.3183, - "step": 151725 - }, - { - "epoch": 37.03, - "learning_rate": 0.000315300513071097, - "loss": 0.3857, - "step": 151750 - }, - { - "epoch": 37.04, - "learning_rate": 0.00031526997312484727, - "loss": 0.3127, - "step": 151775 - }, - { - "epoch": 37.04, - "learning_rate": 0.0003152394331785976, - "loss": 0.3762, - "step": 151800 - }, - { - "epoch": 37.05, - "learning_rate": 0.00031520889323234793, - "loss": 0.3028, - "step": 151825 - }, - { - "epoch": 37.05, - "learning_rate": 0.00031517835328609824, - "loss": 0.3879, - "step": 151850 - }, - { - "epoch": 37.06, - "learning_rate": 0.00031514781333984854, - "loss": 0.3842, - "step": 151875 - }, - { - "epoch": 37.07, - "learning_rate": 0.00031511727339359884, - "loss": 0.3761, - "step": 151900 - }, - { - "epoch": 37.07, - "learning_rate": 0.0003150867334473491, - "loss": 0.346, - "step": 151925 - }, - { - "epoch": 37.08, - "learning_rate": 0.00031505619350109945, - "loss": 0.3817, - "step": 151950 - }, - { - "epoch": 37.09, - "learning_rate": 0.00031502565355484975, - "loss": 0.3488, - "step": 151975 - }, - { - "epoch": 37.09, - "learning_rate": 0.00031499511360860006, - "loss": 0.3675, - "step": 152000 - }, - { - "epoch": 37.1, - "learning_rate": 0.00031496457366235036, - "loss": 0.3434, - "step": 152025 - }, - { - "epoch": 37.1, - "learning_rate": 0.00031493403371610066, - "loss": 0.3962, - "step": 152050 - }, - { - "epoch": 37.11, - "learning_rate": 0.00031490349376985097, - "loss": 0.3325, - "step": 152075 - }, - { - "epoch": 37.12, - "learning_rate": 0.00031487295382360127, - "loss": 0.3673, - "step": 152100 - }, - { - "epoch": 37.12, - "learning_rate": 0.00031484241387735157, - "loss": 0.3133, - "step": 152125 - }, - { - "epoch": 37.13, - "learning_rate": 0.0003148118739311019, - "loss": 0.3723, - "step": 152150 - }, - { - "epoch": 37.13, - "learning_rate": 0.0003147813339848522, - "loss": 0.366, - "step": 152175 - }, - { - "epoch": 37.14, - "learning_rate": 0.00031475079403860254, - "loss": 0.3774, - "step": 152200 - }, - { - "epoch": 37.15, - "learning_rate": 0.00031472025409235284, - "loss": 0.3535, - "step": 152225 - }, - { - "epoch": 37.15, - "learning_rate": 0.0003146897141461031, - "loss": 0.3537, - "step": 152250 - }, - { - "epoch": 37.16, - "learning_rate": 0.0003146603957977034, - "loss": 0.309, - "step": 152275 - }, - { - "epoch": 37.16, - "learning_rate": 0.0003146298558514537, - "loss": 0.3716, - "step": 152300 - }, - { - "epoch": 37.17, - "learning_rate": 0.000314599315905204, - "loss": 0.3139, - "step": 152325 - }, - { - "epoch": 37.18, - "learning_rate": 0.00031456877595895436, - "loss": 0.3545, - "step": 152350 - }, - { - "epoch": 37.18, - "learning_rate": 0.00031453823601270466, - "loss": 0.3189, - "step": 152375 - }, - { - "epoch": 37.19, - "learning_rate": 0.0003145076960664549, - "loss": 0.375, - "step": 152400 - }, - { - "epoch": 37.19, - "learning_rate": 0.0003144771561202052, - "loss": 0.366, - "step": 152425 - }, - { - "epoch": 37.2, - "learning_rate": 0.0003144466161739555, - "loss": 0.3618, - "step": 152450 - }, - { - "epoch": 37.21, - "learning_rate": 0.0003144160762277059, - "loss": 0.3243, - "step": 152475 - }, - { - "epoch": 37.21, - "learning_rate": 0.0003143855362814562, - "loss": 0.3805, - "step": 152500 - }, - { - "epoch": 37.22, - "learning_rate": 0.0003143549963352065, - "loss": 0.3194, - "step": 152525 - }, - { - "epoch": 37.23, - "learning_rate": 0.00031432445638895673, - "loss": 0.3671, - "step": 152550 - }, - { - "epoch": 37.23, - "learning_rate": 0.00031429391644270704, - "loss": 0.3048, - "step": 152575 - }, - { - "epoch": 37.24, - "learning_rate": 0.00031426337649645734, - "loss": 0.3994, - "step": 152600 - }, - { - "epoch": 37.24, - "learning_rate": 0.0003142328365502077, - "loss": 0.3395, - "step": 152625 - }, - { - "epoch": 37.25, - "learning_rate": 0.000314202296603958, - "loss": 0.3874, - "step": 152650 - }, - { - "epoch": 37.26, - "learning_rate": 0.0003141717566577083, - "loss": 0.3063, - "step": 152675 - }, - { - "epoch": 37.26, - "learning_rate": 0.0003141412167114586, - "loss": 0.3598, - "step": 152700 - }, - { - "epoch": 37.27, - "learning_rate": 0.00031411067676520886, - "loss": 0.3066, - "step": 152725 - }, - { - "epoch": 37.27, - "learning_rate": 0.0003140801368189592, - "loss": 0.3716, - "step": 152750 - }, - { - "epoch": 37.28, - "learning_rate": 0.0003140495968727095, - "loss": 0.3447, - "step": 152775 - }, - { - "epoch": 37.29, - "learning_rate": 0.0003140190569264598, - "loss": 0.394, - "step": 152800 - }, - { - "epoch": 37.29, - "learning_rate": 0.0003139885169802101, - "loss": 0.3836, - "step": 152825 - }, - { - "epoch": 37.3, - "learning_rate": 0.0003139579770339604, - "loss": 0.3557, - "step": 152850 - }, - { - "epoch": 37.3, - "learning_rate": 0.00031392743708771073, - "loss": 0.3331, - "step": 152875 - }, - { - "epoch": 37.31, - "learning_rate": 0.00031389689714146103, - "loss": 0.379, - "step": 152900 - }, - { - "epoch": 37.32, - "learning_rate": 0.00031386635719521134, - "loss": 0.3065, - "step": 152925 - }, - { - "epoch": 37.32, - "learning_rate": 0.00031383581724896164, - "loss": 0.3761, - "step": 152950 - }, - { - "epoch": 37.33, - "learning_rate": 0.00031380527730271194, - "loss": 0.3338, - "step": 152975 - }, - { - "epoch": 37.34, - "learning_rate": 0.0003137747373564623, - "loss": 0.3632, - "step": 153000 - }, - { - "epoch": 37.34, - "eval_cer": 0.09168095438538854, - "eval_loss": 0.40829116106033325, - "eval_runtime": 148.4618, - "eval_samples_per_second": 28.243, - "eval_steps_per_second": 7.066, - "eval_wer": 0.38140293637846656, - "step": 153000 - }, - { - "epoch": 37.34, - "learning_rate": 0.00031374419741021255, - "loss": 0.3374, - "step": 153025 - }, - { - "epoch": 37.35, - "learning_rate": 0.00031371365746396285, - "loss": 0.383, - "step": 153050 - }, - { - "epoch": 37.35, - "learning_rate": 0.00031368311751771316, - "loss": 0.3429, - "step": 153075 - }, - { - "epoch": 37.36, - "learning_rate": 0.00031365257757146346, - "loss": 0.3699, - "step": 153100 - }, - { - "epoch": 37.37, - "learning_rate": 0.0003136220376252138, - "loss": 0.3116, - "step": 153125 - }, - { - "epoch": 37.37, - "learning_rate": 0.0003135914976789641, - "loss": 0.3865, - "step": 153150 - }, - { - "epoch": 37.38, - "learning_rate": 0.0003135609577327144, - "loss": 0.3409, - "step": 153175 - }, - { - "epoch": 37.38, - "learning_rate": 0.0003135304177864647, - "loss": 0.372, - "step": 153200 - }, - { - "epoch": 37.39, - "learning_rate": 0.000313499877840215, - "loss": 0.3812, - "step": 153225 - }, - { - "epoch": 37.4, - "learning_rate": 0.00031346933789396533, - "loss": 0.373, - "step": 153250 - }, - { - "epoch": 37.4, - "learning_rate": 0.00031343879794771564, - "loss": 0.3142, - "step": 153275 - }, - { - "epoch": 37.41, - "learning_rate": 0.00031340825800146594, - "loss": 0.3495, - "step": 153300 - }, - { - "epoch": 37.41, - "learning_rate": 0.00031337771805521624, - "loss": 0.3527, - "step": 153325 - }, - { - "epoch": 37.42, - "learning_rate": 0.0003133471781089665, - "loss": 0.3969, - "step": 153350 - }, - { - "epoch": 37.43, - "learning_rate": 0.00031331663816271685, - "loss": 0.3238, - "step": 153375 - }, - { - "epoch": 37.43, - "learning_rate": 0.00031328609821646715, - "loss": 0.3597, - "step": 153400 - }, - { - "epoch": 37.44, - "learning_rate": 0.00031325555827021746, - "loss": 0.3015, - "step": 153425 - }, - { - "epoch": 37.45, - "learning_rate": 0.00031322501832396776, - "loss": 0.3801, - "step": 153450 - }, - { - "epoch": 37.45, - "learning_rate": 0.00031319447837771806, - "loss": 0.3414, - "step": 153475 - }, - { - "epoch": 37.46, - "learning_rate": 0.00031316393843146837, - "loss": 0.3881, - "step": 153500 - }, - { - "epoch": 37.46, - "learning_rate": 0.00031313339848521867, - "loss": 0.3183, - "step": 153525 - }, - { - "epoch": 37.47, - "learning_rate": 0.000313102858538969, - "loss": 0.3875, - "step": 153550 - }, - { - "epoch": 37.48, - "learning_rate": 0.0003130723185927193, - "loss": 0.3188, - "step": 153575 - }, - { - "epoch": 37.48, - "learning_rate": 0.0003130417786464696, - "loss": 0.3813, - "step": 153600 - }, - { - "epoch": 37.49, - "learning_rate": 0.00031301123870021994, - "loss": 0.3453, - "step": 153625 - }, - { - "epoch": 37.49, - "learning_rate": 0.0003129806987539702, - "loss": 0.3438, - "step": 153650 - }, - { - "epoch": 37.5, - "learning_rate": 0.0003129501588077205, - "loss": 0.3138, - "step": 153675 - }, - { - "epoch": 37.51, - "learning_rate": 0.0003129196188614708, - "loss": 0.3745, - "step": 153700 - }, - { - "epoch": 37.51, - "learning_rate": 0.0003128890789152211, - "loss": 0.3121, - "step": 153725 - }, - { - "epoch": 37.52, - "learning_rate": 0.00031285853896897145, - "loss": 0.3774, - "step": 153750 - }, - { - "epoch": 37.52, - "learning_rate": 0.00031282799902272176, - "loss": 0.3335, - "step": 153775 - }, - { - "epoch": 37.53, - "learning_rate": 0.00031279745907647206, - "loss": 0.3647, - "step": 153800 - }, - { - "epoch": 37.54, - "learning_rate": 0.0003127669191302223, - "loss": 0.3647, - "step": 153825 - }, - { - "epoch": 37.54, - "learning_rate": 0.0003127363791839726, - "loss": 0.3418, - "step": 153850 - }, - { - "epoch": 37.55, - "learning_rate": 0.0003127058392377229, - "loss": 0.3247, - "step": 153875 - }, - { - "epoch": 37.55, - "learning_rate": 0.0003126752992914733, - "loss": 0.3909, - "step": 153900 - }, - { - "epoch": 37.56, - "learning_rate": 0.0003126447593452236, - "loss": 0.334, - "step": 153925 - }, - { - "epoch": 37.57, - "learning_rate": 0.0003126142193989739, - "loss": 0.3984, - "step": 153950 - }, - { - "epoch": 37.57, - "learning_rate": 0.00031258367945272413, - "loss": 0.3609, - "step": 153975 - }, - { - "epoch": 37.58, - "learning_rate": 0.00031255313950647443, - "loss": 0.3759, - "step": 154000 - }, - { - "epoch": 37.59, - "learning_rate": 0.0003125225995602248, - "loss": 0.3416, - "step": 154025 - }, - { - "epoch": 37.59, - "learning_rate": 0.0003124920596139751, - "loss": 0.4028, - "step": 154050 - }, - { - "epoch": 37.6, - "learning_rate": 0.0003124615196677254, - "loss": 0.341, - "step": 154075 - }, - { - "epoch": 37.6, - "learning_rate": 0.0003124309797214757, - "loss": 0.3857, - "step": 154100 - }, - { - "epoch": 37.61, - "learning_rate": 0.00031240043977522595, - "loss": 0.3042, - "step": 154125 - }, - { - "epoch": 37.62, - "learning_rate": 0.0003123698998289763, - "loss": 0.3616, - "step": 154150 - }, - { - "epoch": 37.62, - "learning_rate": 0.0003123393598827266, - "loss": 0.3524, - "step": 154175 - }, - { - "epoch": 37.63, - "learning_rate": 0.0003123088199364769, - "loss": 0.3803, - "step": 154200 - }, - { - "epoch": 37.63, - "learning_rate": 0.0003122782799902272, - "loss": 0.2806, - "step": 154225 - }, - { - "epoch": 37.64, - "learning_rate": 0.0003122477400439775, - "loss": 0.3637, - "step": 154250 - }, - { - "epoch": 37.65, - "learning_rate": 0.0003122172000977279, - "loss": 0.337, - "step": 154275 - }, - { - "epoch": 37.65, - "learning_rate": 0.00031218666015147813, - "loss": 0.3736, - "step": 154300 - }, - { - "epoch": 37.66, - "learning_rate": 0.00031215612020522843, - "loss": 0.3206, - "step": 154325 - }, - { - "epoch": 37.66, - "learning_rate": 0.00031212558025897874, - "loss": 0.346, - "step": 154350 - }, - { - "epoch": 37.67, - "learning_rate": 0.00031209504031272904, - "loss": 0.3539, - "step": 154375 - }, - { - "epoch": 37.68, - "learning_rate": 0.0003120645003664794, - "loss": 0.376, - "step": 154400 - }, - { - "epoch": 37.68, - "learning_rate": 0.0003120339604202297, - "loss": 0.3605, - "step": 154425 - }, - { - "epoch": 37.69, - "learning_rate": 0.00031200342047397995, - "loss": 0.3651, - "step": 154450 - }, - { - "epoch": 37.7, - "learning_rate": 0.00031197288052773025, - "loss": 0.3858, - "step": 154475 - }, - { - "epoch": 37.7, - "learning_rate": 0.00031194234058148056, - "loss": 0.3746, - "step": 154500 - }, - { - "epoch": 37.71, - "learning_rate": 0.0003119118006352309, - "loss": 0.3329, - "step": 154525 - }, - { - "epoch": 37.71, - "learning_rate": 0.0003118812606889812, - "loss": 0.3976, - "step": 154550 - }, - { - "epoch": 37.72, - "learning_rate": 0.0003118507207427315, - "loss": 0.3131, - "step": 154575 - }, - { - "epoch": 37.73, - "learning_rate": 0.00031182018079648177, - "loss": 0.3685, - "step": 154600 - }, - { - "epoch": 37.73, - "learning_rate": 0.00031178964085023207, - "loss": 0.3311, - "step": 154625 - }, - { - "epoch": 37.74, - "learning_rate": 0.00031175910090398243, - "loss": 0.3813, - "step": 154650 - }, - { - "epoch": 37.74, - "learning_rate": 0.00031172856095773273, - "loss": 0.3179, - "step": 154675 - }, - { - "epoch": 37.75, - "learning_rate": 0.00031169802101148304, - "loss": 0.38, - "step": 154700 - }, - { - "epoch": 37.76, - "learning_rate": 0.00031166748106523334, - "loss": 0.2989, - "step": 154725 - }, - { - "epoch": 37.76, - "learning_rate": 0.00031163694111898364, - "loss": 0.3676, - "step": 154750 - }, - { - "epoch": 37.77, - "learning_rate": 0.00031160640117273395, - "loss": 0.3427, - "step": 154775 - }, - { - "epoch": 37.77, - "learning_rate": 0.00031157586122648425, - "loss": 0.3874, - "step": 154800 - }, - { - "epoch": 37.78, - "learning_rate": 0.00031154532128023455, - "loss": 0.3477, - "step": 154825 - }, - { - "epoch": 37.79, - "learning_rate": 0.00031151478133398486, - "loss": 0.344, - "step": 154850 - }, - { - "epoch": 37.79, - "learning_rate": 0.00031148424138773516, - "loss": 0.3357, - "step": 154875 - }, - { - "epoch": 37.8, - "learning_rate": 0.0003114537014414855, - "loss": 0.3821, - "step": 154900 - }, - { - "epoch": 37.81, - "learning_rate": 0.00031142316149523577, - "loss": 0.3115, - "step": 154925 - }, - { - "epoch": 37.81, - "learning_rate": 0.00031139262154898607, - "loss": 0.3384, - "step": 154950 - }, - { - "epoch": 37.82, - "learning_rate": 0.0003113620816027364, - "loss": 0.3625, - "step": 154975 - }, - { - "epoch": 37.82, - "learning_rate": 0.0003113315416564867, - "loss": 0.383, - "step": 155000 - }, - { - "epoch": 37.83, - "learning_rate": 0.00031130100171023703, - "loss": 0.3745, - "step": 155025 - }, - { - "epoch": 37.84, - "learning_rate": 0.00031127046176398734, - "loss": 0.3998, - "step": 155050 - }, - { - "epoch": 37.84, - "learning_rate": 0.0003112399218177376, - "loss": 0.3262, - "step": 155075 - }, - { - "epoch": 37.85, - "learning_rate": 0.0003112093818714879, - "loss": 0.3842, - "step": 155100 - }, - { - "epoch": 37.85, - "learning_rate": 0.0003111800635230882, - "loss": 0.3746, - "step": 155125 - }, - { - "epoch": 37.86, - "learning_rate": 0.0003111495235768385, - "loss": 0.37, - "step": 155150 - }, - { - "epoch": 37.87, - "learning_rate": 0.0003111189836305888, - "loss": 0.3215, - "step": 155175 - }, - { - "epoch": 37.87, - "learning_rate": 0.00031108844368433916, - "loss": 0.3761, - "step": 155200 - }, - { - "epoch": 37.88, - "learning_rate": 0.00031105790373808946, - "loss": 0.3683, - "step": 155225 - }, - { - "epoch": 37.88, - "learning_rate": 0.0003110273637918397, - "loss": 0.3582, - "step": 155250 - }, - { - "epoch": 37.89, - "learning_rate": 0.00031099682384559, - "loss": 0.3242, - "step": 155275 - }, - { - "epoch": 37.9, - "learning_rate": 0.0003109662838993403, - "loss": 0.3859, - "step": 155300 - }, - { - "epoch": 37.9, - "learning_rate": 0.0003109357439530907, - "loss": 0.3175, - "step": 155325 - }, - { - "epoch": 37.91, - "learning_rate": 0.000310905204006841, - "loss": 0.3666, - "step": 155350 - }, - { - "epoch": 37.91, - "learning_rate": 0.0003108746640605913, - "loss": 0.3116, - "step": 155375 - }, - { - "epoch": 37.92, - "learning_rate": 0.00031084412411434153, - "loss": 0.3966, - "step": 155400 - }, - { - "epoch": 37.93, - "learning_rate": 0.00031081358416809184, - "loss": 0.3215, - "step": 155425 - }, - { - "epoch": 37.93, - "learning_rate": 0.0003107830442218422, - "loss": 0.3751, - "step": 155450 - }, - { - "epoch": 37.94, - "learning_rate": 0.0003107525042755925, - "loss": 0.3868, - "step": 155475 - }, - { - "epoch": 37.95, - "learning_rate": 0.0003107219643293428, - "loss": 0.3995, - "step": 155500 - }, - { - "epoch": 37.95, - "learning_rate": 0.0003106914243830931, - "loss": 0.3341, - "step": 155525 - }, - { - "epoch": 37.96, - "learning_rate": 0.00031066088443684335, - "loss": 0.3976, - "step": 155550 - }, - { - "epoch": 37.96, - "learning_rate": 0.0003106303444905937, - "loss": 0.3575, - "step": 155575 - }, - { - "epoch": 37.97, - "learning_rate": 0.000310599804544344, - "loss": 0.3953, - "step": 155600 - }, - { - "epoch": 37.98, - "learning_rate": 0.0003105692645980943, - "loss": 0.3328, - "step": 155625 - }, - { - "epoch": 37.98, - "learning_rate": 0.0003105387246518446, - "loss": 0.383, - "step": 155650 - }, - { - "epoch": 37.99, - "learning_rate": 0.0003105081847055949, - "loss": 0.3547, - "step": 155675 - }, - { - "epoch": 37.99, - "learning_rate": 0.0003104776447593453, - "loss": 0.3654, - "step": 155700 - }, - { - "epoch": 38.0, - "learning_rate": 0.00031044710481309553, - "loss": 0.3441, - "step": 155725 - }, - { - "epoch": 38.01, - "learning_rate": 0.00031041656486684583, - "loss": 0.3477, - "step": 155750 - }, - { - "epoch": 38.01, - "learning_rate": 0.00031038602492059614, - "loss": 0.339, - "step": 155775 - }, - { - "epoch": 38.02, - "learning_rate": 0.00031035548497434644, - "loss": 0.4182, - "step": 155800 - }, - { - "epoch": 38.02, - "learning_rate": 0.0003103249450280968, - "loss": 0.3457, - "step": 155825 - }, - { - "epoch": 38.03, - "learning_rate": 0.0003102944050818471, - "loss": 0.3448, - "step": 155850 - }, - { - "epoch": 38.04, - "learning_rate": 0.00031026386513559735, - "loss": 0.3479, - "step": 155875 - }, - { - "epoch": 38.04, - "learning_rate": 0.00031023332518934765, - "loss": 0.3582, - "step": 155900 - }, - { - "epoch": 38.05, - "learning_rate": 0.00031020278524309796, - "loss": 0.338, - "step": 155925 - }, - { - "epoch": 38.06, - "learning_rate": 0.00031017224529684826, - "loss": 0.3746, - "step": 155950 - }, - { - "epoch": 38.06, - "learning_rate": 0.0003101417053505986, - "loss": 0.2483, - "step": 155975 - }, - { - "epoch": 38.07, - "learning_rate": 0.0003101111654043489, - "loss": 0.381, - "step": 156000 - }, - { - "epoch": 38.07, - "eval_cer": 0.09138835559479687, - "eval_loss": 0.4063064157962799, - "eval_runtime": 149.0731, - "eval_samples_per_second": 28.127, - "eval_steps_per_second": 7.037, - "eval_wer": 0.373768352365416, - "step": 156000 - }, - { - "epoch": 38.07, - "learning_rate": 0.00031008062545809917, - "loss": 0.3356, - "step": 156025 - }, - { - "epoch": 38.08, - "learning_rate": 0.0003100500855118495, - "loss": 0.3456, - "step": 156050 - }, - { - "epoch": 38.09, - "learning_rate": 0.0003100195455655998, - "loss": 0.3717, - "step": 156075 - }, - { - "epoch": 38.09, - "learning_rate": 0.00030998900561935014, - "loss": 0.3781, - "step": 156100 - }, - { - "epoch": 38.1, - "learning_rate": 0.00030995846567310044, - "loss": 0.2897, - "step": 156125 - }, - { - "epoch": 38.1, - "learning_rate": 0.00030992792572685074, - "loss": 0.3618, - "step": 156150 - }, - { - "epoch": 38.11, - "learning_rate": 0.00030989738578060105, - "loss": 0.3098, - "step": 156175 - }, - { - "epoch": 38.12, - "learning_rate": 0.0003098668458343513, - "loss": 0.3536, - "step": 156200 - }, - { - "epoch": 38.12, - "learning_rate": 0.00030983630588810165, - "loss": 0.3248, - "step": 156225 - }, - { - "epoch": 38.13, - "learning_rate": 0.00030980576594185196, - "loss": 0.3859, - "step": 156250 - }, - { - "epoch": 38.13, - "learning_rate": 0.00030977522599560226, - "loss": 0.3119, - "step": 156275 - }, - { - "epoch": 38.14, - "learning_rate": 0.00030974468604935256, - "loss": 0.3489, - "step": 156300 - }, - { - "epoch": 38.15, - "learning_rate": 0.00030971414610310287, - "loss": 0.3205, - "step": 156325 - }, - { - "epoch": 38.15, - "learning_rate": 0.00030968360615685317, - "loss": 0.3643, - "step": 156350 - }, - { - "epoch": 38.16, - "learning_rate": 0.00030965306621060347, - "loss": 0.3497, - "step": 156375 - }, - { - "epoch": 38.16, - "learning_rate": 0.0003096225262643538, - "loss": 0.3789, - "step": 156400 - }, - { - "epoch": 38.17, - "learning_rate": 0.0003095919863181041, - "loss": 0.3531, - "step": 156425 - }, - { - "epoch": 38.18, - "learning_rate": 0.0003095614463718544, - "loss": 0.3614, - "step": 156450 - }, - { - "epoch": 38.18, - "learning_rate": 0.00030953090642560474, - "loss": 0.3456, - "step": 156475 - }, - { - "epoch": 38.19, - "learning_rate": 0.000309500366479355, - "loss": 0.3613, - "step": 156500 - }, - { - "epoch": 38.2, - "learning_rate": 0.0003094698265331053, - "loss": 0.2974, - "step": 156525 - }, - { - "epoch": 38.2, - "learning_rate": 0.0003094392865868556, - "loss": 0.3759, - "step": 156550 - }, - { - "epoch": 38.21, - "learning_rate": 0.0003094087466406059, - "loss": 0.3586, - "step": 156575 - }, - { - "epoch": 38.21, - "learning_rate": 0.00030937820669435626, - "loss": 0.3498, - "step": 156600 - }, - { - "epoch": 38.22, - "learning_rate": 0.00030934766674810656, - "loss": 0.3484, - "step": 156625 - }, - { - "epoch": 38.23, - "learning_rate": 0.0003093171268018568, - "loss": 0.3656, - "step": 156650 - }, - { - "epoch": 38.23, - "learning_rate": 0.0003092865868556071, - "loss": 0.3113, - "step": 156675 - }, - { - "epoch": 38.24, - "learning_rate": 0.0003092560469093574, - "loss": 0.3757, - "step": 156700 - }, - { - "epoch": 38.24, - "learning_rate": 0.0003092255069631078, - "loss": 0.3385, - "step": 156725 - }, - { - "epoch": 38.25, - "learning_rate": 0.0003091949670168581, - "loss": 0.3611, - "step": 156750 - }, - { - "epoch": 38.26, - "learning_rate": 0.0003091644270706084, - "loss": 0.3193, - "step": 156775 - }, - { - "epoch": 38.26, - "learning_rate": 0.0003091338871243587, - "loss": 0.3628, - "step": 156800 - }, - { - "epoch": 38.27, - "learning_rate": 0.00030910334717810893, - "loss": 0.3189, - "step": 156825 - }, - { - "epoch": 38.27, - "learning_rate": 0.0003090728072318593, - "loss": 0.3541, - "step": 156850 - }, - { - "epoch": 38.28, - "learning_rate": 0.0003090422672856096, - "loss": 0.2861, - "step": 156875 - }, - { - "epoch": 38.29, - "learning_rate": 0.0003090117273393599, - "loss": 0.366, - "step": 156900 - }, - { - "epoch": 38.29, - "learning_rate": 0.0003089811873931102, - "loss": 0.3202, - "step": 156925 - }, - { - "epoch": 38.3, - "learning_rate": 0.0003089506474468605, - "loss": 0.3439, - "step": 156950 - }, - { - "epoch": 38.31, - "learning_rate": 0.0003089201075006108, - "loss": 0.3096, - "step": 156975 - }, - { - "epoch": 38.31, - "learning_rate": 0.0003088895675543611, - "loss": 0.3748, - "step": 157000 - }, - { - "epoch": 38.32, - "learning_rate": 0.0003088590276081114, - "loss": 0.3443, - "step": 157025 - }, - { - "epoch": 38.32, - "learning_rate": 0.0003088284876618617, - "loss": 0.3491, - "step": 157050 - }, - { - "epoch": 38.33, - "learning_rate": 0.000308797947715612, - "loss": 0.3376, - "step": 157075 - }, - { - "epoch": 38.34, - "learning_rate": 0.0003087674077693624, - "loss": 0.3932, - "step": 157100 - }, - { - "epoch": 38.34, - "learning_rate": 0.0003087368678231126, - "loss": 0.3509, - "step": 157125 - }, - { - "epoch": 38.35, - "learning_rate": 0.00030870754947471293, - "loss": 0.37, - "step": 157150 - }, - { - "epoch": 38.35, - "learning_rate": 0.00030867700952846324, - "loss": 0.3191, - "step": 157175 - }, - { - "epoch": 38.36, - "learning_rate": 0.00030864646958221354, - "loss": 0.3615, - "step": 157200 - }, - { - "epoch": 38.37, - "learning_rate": 0.00030861592963596384, - "loss": 0.3703, - "step": 157225 - }, - { - "epoch": 38.37, - "learning_rate": 0.00030858538968971415, - "loss": 0.3829, - "step": 157250 - }, - { - "epoch": 38.38, - "learning_rate": 0.0003085548497434645, - "loss": 0.3682, - "step": 157275 - }, - { - "epoch": 38.38, - "learning_rate": 0.00030852430979721475, - "loss": 0.3631, - "step": 157300 - }, - { - "epoch": 38.39, - "learning_rate": 0.00030849376985096506, - "loss": 0.3219, - "step": 157325 - }, - { - "epoch": 38.4, - "learning_rate": 0.00030846322990471536, - "loss": 0.3675, - "step": 157350 - }, - { - "epoch": 38.4, - "learning_rate": 0.00030843268995846566, - "loss": 0.3204, - "step": 157375 - }, - { - "epoch": 38.41, - "learning_rate": 0.000308402150012216, - "loss": 0.3539, - "step": 157400 - }, - { - "epoch": 38.42, - "learning_rate": 0.0003083716100659663, - "loss": 0.3556, - "step": 157425 - }, - { - "epoch": 38.42, - "learning_rate": 0.0003083410701197166, - "loss": 0.3787, - "step": 157450 - }, - { - "epoch": 38.43, - "learning_rate": 0.0003083105301734669, - "loss": 0.3152, - "step": 157475 - }, - { - "epoch": 38.43, - "learning_rate": 0.0003082799902272172, - "loss": 0.3738, - "step": 157500 - }, - { - "epoch": 38.44, - "learning_rate": 0.00030824945028096754, - "loss": 0.3171, - "step": 157525 - }, - { - "epoch": 38.45, - "learning_rate": 0.00030821891033471784, - "loss": 0.3718, - "step": 157550 - }, - { - "epoch": 38.45, - "learning_rate": 0.00030818837038846814, - "loss": 0.3166, - "step": 157575 - }, - { - "epoch": 38.46, - "learning_rate": 0.0003081578304422184, - "loss": 0.385, - "step": 157600 - }, - { - "epoch": 38.46, - "learning_rate": 0.0003081272904959687, - "loss": 0.3285, - "step": 157625 - }, - { - "epoch": 38.47, - "learning_rate": 0.00030809675054971905, - "loss": 0.3749, - "step": 157650 - }, - { - "epoch": 38.48, - "learning_rate": 0.00030806621060346936, - "loss": 0.3479, - "step": 157675 - }, - { - "epoch": 38.48, - "learning_rate": 0.00030803567065721966, - "loss": 0.3662, - "step": 157700 - }, - { - "epoch": 38.49, - "learning_rate": 0.00030800513071096996, - "loss": 0.2701, - "step": 157725 - }, - { - "epoch": 38.49, - "learning_rate": 0.00030797459076472027, - "loss": 0.3413, - "step": 157750 - }, - { - "epoch": 38.5, - "learning_rate": 0.00030794405081847057, - "loss": 0.3228, - "step": 157775 - }, - { - "epoch": 38.51, - "learning_rate": 0.0003079135108722209, - "loss": 0.3578, - "step": 157800 - }, - { - "epoch": 38.51, - "learning_rate": 0.0003078829709259712, - "loss": 0.3163, - "step": 157825 - }, - { - "epoch": 38.52, - "learning_rate": 0.0003078524309797215, - "loss": 0.4182, - "step": 157850 - }, - { - "epoch": 38.52, - "learning_rate": 0.0003078218910334718, - "loss": 0.3249, - "step": 157875 - }, - { - "epoch": 38.53, - "learning_rate": 0.00030779135108722214, - "loss": 0.3338, - "step": 157900 - }, - { - "epoch": 38.54, - "learning_rate": 0.0003077608111409724, - "loss": 0.3573, - "step": 157925 - }, - { - "epoch": 38.54, - "learning_rate": 0.0003077302711947227, - "loss": 0.3489, - "step": 157950 - }, - { - "epoch": 38.55, - "learning_rate": 0.000307699731248473, - "loss": 0.3266, - "step": 157975 - }, - { - "epoch": 38.56, - "learning_rate": 0.0003076691913022233, - "loss": 0.3913, - "step": 158000 - }, - { - "epoch": 38.56, - "learning_rate": 0.0003076386513559736, - "loss": 0.3552, - "step": 158025 - }, - { - "epoch": 38.57, - "learning_rate": 0.00030760811140972396, - "loss": 0.3592, - "step": 158050 - }, - { - "epoch": 38.57, - "learning_rate": 0.0003075775714634742, - "loss": 0.3313, - "step": 158075 - }, - { - "epoch": 38.58, - "learning_rate": 0.0003075470315172245, - "loss": 0.3816, - "step": 158100 - }, - { - "epoch": 38.59, - "learning_rate": 0.0003075164915709748, - "loss": 0.2628, - "step": 158125 - }, - { - "epoch": 38.59, - "learning_rate": 0.0003074859516247251, - "loss": 0.3693, - "step": 158150 - }, - { - "epoch": 38.6, - "learning_rate": 0.0003074554116784755, - "loss": 0.3403, - "step": 158175 - }, - { - "epoch": 38.6, - "learning_rate": 0.0003074248717322258, - "loss": 0.3769, - "step": 158200 - }, - { - "epoch": 38.61, - "learning_rate": 0.0003073943317859761, - "loss": 0.3627, - "step": 158225 - }, - { - "epoch": 38.62, - "learning_rate": 0.00030736379183972633, - "loss": 0.3698, - "step": 158250 - }, - { - "epoch": 38.62, - "learning_rate": 0.00030733325189347664, - "loss": 0.3424, - "step": 158275 - }, - { - "epoch": 38.63, - "learning_rate": 0.000307302711947227, - "loss": 0.3883, - "step": 158300 - }, - { - "epoch": 38.63, - "learning_rate": 0.0003072721720009773, - "loss": 0.3199, - "step": 158325 - }, - { - "epoch": 38.64, - "learning_rate": 0.0003072416320547276, - "loss": 0.3781, - "step": 158350 - }, - { - "epoch": 38.65, - "learning_rate": 0.0003072110921084779, - "loss": 0.3001, - "step": 158375 - }, - { - "epoch": 38.65, - "learning_rate": 0.00030718055216222815, - "loss": 0.3562, - "step": 158400 - }, - { - "epoch": 38.66, - "learning_rate": 0.0003071500122159785, - "loss": 0.317, - "step": 158425 - }, - { - "epoch": 38.67, - "learning_rate": 0.0003071194722697288, - "loss": 0.3913, - "step": 158450 - }, - { - "epoch": 38.67, - "learning_rate": 0.0003070889323234791, - "loss": 0.3584, - "step": 158475 - }, - { - "epoch": 38.68, - "learning_rate": 0.0003070583923772294, - "loss": 0.3619, - "step": 158500 - }, - { - "epoch": 38.68, - "learning_rate": 0.0003070278524309797, - "loss": 0.347, - "step": 158525 - }, - { - "epoch": 38.69, - "learning_rate": 0.00030699731248473003, - "loss": 0.3808, - "step": 158550 - }, - { - "epoch": 38.7, - "learning_rate": 0.00030696677253848033, - "loss": 0.3607, - "step": 158575 - }, - { - "epoch": 38.7, - "learning_rate": 0.00030693623259223064, - "loss": 0.3674, - "step": 158600 - }, - { - "epoch": 38.71, - "learning_rate": 0.00030690569264598094, - "loss": 0.3131, - "step": 158625 - }, - { - "epoch": 38.71, - "learning_rate": 0.00030687515269973124, - "loss": 0.3722, - "step": 158650 - }, - { - "epoch": 38.72, - "learning_rate": 0.0003068446127534816, - "loss": 0.346, - "step": 158675 - }, - { - "epoch": 38.73, - "learning_rate": 0.0003068140728072319, - "loss": 0.3828, - "step": 158700 - }, - { - "epoch": 38.73, - "learning_rate": 0.00030678353286098215, - "loss": 0.3791, - "step": 158725 - }, - { - "epoch": 38.74, - "learning_rate": 0.00030675299291473246, - "loss": 0.3738, - "step": 158750 - }, - { - "epoch": 38.74, - "learning_rate": 0.00030672245296848276, - "loss": 0.3576, - "step": 158775 - }, - { - "epoch": 38.75, - "learning_rate": 0.0003066919130222331, - "loss": 0.3791, - "step": 158800 - }, - { - "epoch": 38.76, - "learning_rate": 0.0003066613730759834, - "loss": 0.2818, - "step": 158825 - }, - { - "epoch": 38.76, - "learning_rate": 0.0003066308331297337, - "loss": 0.3524, - "step": 158850 - }, - { - "epoch": 38.77, - "learning_rate": 0.00030660029318348397, - "loss": 0.3395, - "step": 158875 - }, - { - "epoch": 38.78, - "learning_rate": 0.0003065697532372343, - "loss": 0.3586, - "step": 158900 - }, - { - "epoch": 38.78, - "learning_rate": 0.00030653921329098463, - "loss": 0.3633, - "step": 158925 - }, - { - "epoch": 38.79, - "learning_rate": 0.00030650867334473494, - "loss": 0.3851, - "step": 158950 - }, - { - "epoch": 38.79, - "learning_rate": 0.00030647813339848524, - "loss": 0.3311, - "step": 158975 - }, - { - "epoch": 38.8, - "learning_rate": 0.00030644759345223554, - "loss": 0.3891, - "step": 159000 - }, - { - "epoch": 38.8, - "eval_cer": 0.09004342782049835, - "eval_loss": 0.4059583842754364, - "eval_runtime": 152.7166, - "eval_samples_per_second": 27.456, - "eval_steps_per_second": 6.869, - "eval_wer": 0.3733768352365416, - "step": 159000 - }, - { - "epoch": 38.81, - "learning_rate": 0.0003064170535059858, - "loss": 0.3558, - "step": 159025 - }, - { - "epoch": 38.81, - "learning_rate": 0.00030638651355973615, - "loss": 0.3752, - "step": 159050 - }, - { - "epoch": 38.82, - "learning_rate": 0.00030635597361348645, - "loss": 0.2948, - "step": 159075 - }, - { - "epoch": 38.82, - "learning_rate": 0.00030632543366723676, - "loss": 0.3565, - "step": 159100 - }, - { - "epoch": 38.83, - "learning_rate": 0.00030629489372098706, - "loss": 0.3322, - "step": 159125 - }, - { - "epoch": 38.84, - "learning_rate": 0.00030626435377473736, - "loss": 0.3378, - "step": 159150 - }, - { - "epoch": 38.84, - "learning_rate": 0.0003062338138284877, - "loss": 0.3024, - "step": 159175 - }, - { - "epoch": 38.85, - "learning_rate": 0.00030620327388223797, - "loss": 0.3415, - "step": 159200 - }, - { - "epoch": 38.85, - "learning_rate": 0.0003061727339359883, - "loss": 0.303, - "step": 159225 - }, - { - "epoch": 38.86, - "learning_rate": 0.0003061421939897386, - "loss": 0.3643, - "step": 159250 - }, - { - "epoch": 38.87, - "learning_rate": 0.0003061128756413389, - "loss": 0.3538, - "step": 159275 - }, - { - "epoch": 38.87, - "learning_rate": 0.0003060823356950892, - "loss": 0.3531, - "step": 159300 - }, - { - "epoch": 38.88, - "learning_rate": 0.0003060517957488395, - "loss": 0.2936, - "step": 159325 - }, - { - "epoch": 38.88, - "learning_rate": 0.0003060212558025898, - "loss": 0.3812, - "step": 159350 - }, - { - "epoch": 38.89, - "learning_rate": 0.0003059907158563401, - "loss": 0.2826, - "step": 159375 - }, - { - "epoch": 38.9, - "learning_rate": 0.0003059601759100904, - "loss": 0.3285, - "step": 159400 - }, - { - "epoch": 38.9, - "learning_rate": 0.0003059296359638407, - "loss": 0.3135, - "step": 159425 - }, - { - "epoch": 38.91, - "learning_rate": 0.000305899096017591, - "loss": 0.3443, - "step": 159450 - }, - { - "epoch": 38.92, - "learning_rate": 0.00030586855607134136, - "loss": 0.3174, - "step": 159475 - }, - { - "epoch": 38.92, - "learning_rate": 0.0003058380161250916, - "loss": 0.3853, - "step": 159500 - }, - { - "epoch": 38.93, - "learning_rate": 0.0003058074761788419, - "loss": 0.3711, - "step": 159525 - }, - { - "epoch": 38.93, - "learning_rate": 0.0003057769362325922, - "loss": 0.3791, - "step": 159550 - }, - { - "epoch": 38.94, - "learning_rate": 0.0003057463962863425, - "loss": 0.3156, - "step": 159575 - }, - { - "epoch": 38.95, - "learning_rate": 0.0003057158563400929, - "loss": 0.355, - "step": 159600 - }, - { - "epoch": 38.95, - "learning_rate": 0.0003056853163938432, - "loss": 0.3496, - "step": 159625 - }, - { - "epoch": 38.96, - "learning_rate": 0.0003056547764475935, - "loss": 0.3647, - "step": 159650 - }, - { - "epoch": 38.96, - "learning_rate": 0.00030562423650134374, - "loss": 0.3236, - "step": 159675 - }, - { - "epoch": 38.97, - "learning_rate": 0.00030559369655509404, - "loss": 0.3881, - "step": 159700 - }, - { - "epoch": 38.98, - "learning_rate": 0.0003055631566088444, - "loss": 0.3831, - "step": 159725 - }, - { - "epoch": 38.98, - "learning_rate": 0.0003055326166625947, - "loss": 0.3445, - "step": 159750 - }, - { - "epoch": 38.99, - "learning_rate": 0.000305502076716345, - "loss": 0.346, - "step": 159775 - }, - { - "epoch": 38.99, - "learning_rate": 0.0003054715367700953, - "loss": 0.358, - "step": 159800 - }, - { - "epoch": 39.0, - "learning_rate": 0.00030544099682384556, - "loss": 0.3103, - "step": 159825 - }, - { - "epoch": 39.01, - "learning_rate": 0.0003054104568775959, - "loss": 0.3739, - "step": 159850 - }, - { - "epoch": 39.01, - "learning_rate": 0.0003053799169313462, - "loss": 0.2863, - "step": 159875 - }, - { - "epoch": 39.02, - "learning_rate": 0.0003053493769850965, - "loss": 0.3753, - "step": 159900 - }, - { - "epoch": 39.03, - "learning_rate": 0.0003053188370388468, - "loss": 0.3675, - "step": 159925 - }, - { - "epoch": 39.03, - "learning_rate": 0.00030528829709259713, - "loss": 0.3794, - "step": 159950 - }, - { - "epoch": 39.04, - "learning_rate": 0.0003052577571463474, - "loss": 0.358, - "step": 159975 - }, - { - "epoch": 39.04, - "learning_rate": 0.00030522721720009773, - "loss": 0.3563, - "step": 160000 - }, - { - "epoch": 39.05, - "learning_rate": 0.00030519667725384804, - "loss": 0.3202, - "step": 160025 - }, - { - "epoch": 39.06, - "learning_rate": 0.00030516613730759834, - "loss": 0.3827, - "step": 160050 - }, - { - "epoch": 39.06, - "learning_rate": 0.00030513559736134864, - "loss": 0.2992, - "step": 160075 - }, - { - "epoch": 39.07, - "learning_rate": 0.00030510505741509895, - "loss": 0.3799, - "step": 160100 - }, - { - "epoch": 39.07, - "learning_rate": 0.0003050745174688493, - "loss": 0.3517, - "step": 160125 - }, - { - "epoch": 39.08, - "learning_rate": 0.00030504397752259955, - "loss": 0.3921, - "step": 160150 - }, - { - "epoch": 39.09, - "learning_rate": 0.00030501343757634986, - "loss": 0.3031, - "step": 160175 - }, - { - "epoch": 39.09, - "learning_rate": 0.00030498289763010016, - "loss": 0.3653, - "step": 160200 - }, - { - "epoch": 39.1, - "learning_rate": 0.00030495235768385046, - "loss": 0.379, - "step": 160225 - }, - { - "epoch": 39.1, - "learning_rate": 0.0003049218177376008, - "loss": 0.3623, - "step": 160250 - }, - { - "epoch": 39.11, - "learning_rate": 0.0003048912777913511, - "loss": 0.337, - "step": 160275 - }, - { - "epoch": 39.12, - "learning_rate": 0.0003048607378451014, - "loss": 0.345, - "step": 160300 - }, - { - "epoch": 39.12, - "learning_rate": 0.0003048301978988517, - "loss": 0.3205, - "step": 160325 - }, - { - "epoch": 39.13, - "learning_rate": 0.000304799657952602, - "loss": 0.3479, - "step": 160350 - }, - { - "epoch": 39.13, - "learning_rate": 0.00030476911800635234, - "loss": 0.3246, - "step": 160375 - }, - { - "epoch": 39.14, - "learning_rate": 0.00030473857806010264, - "loss": 0.3478, - "step": 160400 - }, - { - "epoch": 39.15, - "learning_rate": 0.00030470803811385295, - "loss": 0.295, - "step": 160425 - }, - { - "epoch": 39.15, - "learning_rate": 0.0003046774981676032, - "loss": 0.3245, - "step": 160450 - }, - { - "epoch": 39.16, - "learning_rate": 0.0003046469582213535, - "loss": 0.3547, - "step": 160475 - }, - { - "epoch": 39.17, - "learning_rate": 0.00030461641827510386, - "loss": 0.3722, - "step": 160500 - }, - { - "epoch": 39.17, - "learning_rate": 0.00030458587832885416, - "loss": 0.3288, - "step": 160525 - }, - { - "epoch": 39.18, - "learning_rate": 0.00030455533838260446, - "loss": 0.4058, - "step": 160550 - }, - { - "epoch": 39.18, - "learning_rate": 0.00030452479843635477, - "loss": 0.2893, - "step": 160575 - }, - { - "epoch": 39.19, - "learning_rate": 0.000304494258490105, - "loss": 0.3485, - "step": 160600 - }, - { - "epoch": 39.2, - "learning_rate": 0.00030446371854385537, - "loss": 0.3285, - "step": 160625 - }, - { - "epoch": 39.2, - "learning_rate": 0.0003044331785976057, - "loss": 0.3315, - "step": 160650 - }, - { - "epoch": 39.21, - "learning_rate": 0.000304402638651356, - "loss": 0.32, - "step": 160675 - }, - { - "epoch": 39.21, - "learning_rate": 0.0003043720987051063, - "loss": 0.3428, - "step": 160700 - }, - { - "epoch": 39.22, - "learning_rate": 0.0003043415587588566, - "loss": 0.297, - "step": 160725 - }, - { - "epoch": 39.23, - "learning_rate": 0.00030431101881260694, - "loss": 0.3625, - "step": 160750 - }, - { - "epoch": 39.23, - "learning_rate": 0.0003042804788663572, - "loss": 0.3106, - "step": 160775 - }, - { - "epoch": 39.24, - "learning_rate": 0.0003042499389201075, - "loss": 0.3413, - "step": 160800 - }, - { - "epoch": 39.24, - "learning_rate": 0.0003042193989738578, - "loss": 0.2959, - "step": 160825 - }, - { - "epoch": 39.25, - "learning_rate": 0.0003041888590276081, - "loss": 0.3455, - "step": 160850 - }, - { - "epoch": 39.26, - "learning_rate": 0.00030415831908135846, - "loss": 0.3409, - "step": 160875 - }, - { - "epoch": 39.26, - "learning_rate": 0.00030412777913510876, - "loss": 0.3663, - "step": 160900 - }, - { - "epoch": 39.27, - "learning_rate": 0.000304097239188859, - "loss": 0.3359, - "step": 160925 - }, - { - "epoch": 39.28, - "learning_rate": 0.0003040666992426093, - "loss": 0.375, - "step": 160950 - }, - { - "epoch": 39.28, - "learning_rate": 0.0003040361592963596, - "loss": 0.3297, - "step": 160975 - }, - { - "epoch": 39.29, - "learning_rate": 0.00030400561935011, - "loss": 0.3621, - "step": 161000 - }, - { - "epoch": 39.29, - "learning_rate": 0.0003039750794038603, - "loss": 0.3113, - "step": 161025 - }, - { - "epoch": 39.3, - "learning_rate": 0.0003039445394576106, - "loss": 0.3815, - "step": 161050 - }, - { - "epoch": 39.31, - "learning_rate": 0.00030391399951136083, - "loss": 0.2934, - "step": 161075 - }, - { - "epoch": 39.31, - "learning_rate": 0.00030388345956511114, - "loss": 0.3274, - "step": 161100 - }, - { - "epoch": 39.32, - "learning_rate": 0.0003038529196188615, - "loss": 0.3138, - "step": 161125 - }, - { - "epoch": 39.32, - "learning_rate": 0.0003038223796726118, - "loss": 0.3716, - "step": 161150 - }, - { - "epoch": 39.33, - "learning_rate": 0.0003037918397263621, - "loss": 0.3124, - "step": 161175 - }, - { - "epoch": 39.34, - "learning_rate": 0.0003037612997801124, - "loss": 0.3633, - "step": 161200 - }, - { - "epoch": 39.34, - "learning_rate": 0.0003037307598338627, - "loss": 0.327, - "step": 161225 - }, - { - "epoch": 39.35, - "learning_rate": 0.000303700219887613, - "loss": 0.3636, - "step": 161250 - }, - { - "epoch": 39.35, - "learning_rate": 0.0003036696799413633, - "loss": 0.3756, - "step": 161275 - }, - { - "epoch": 39.36, - "learning_rate": 0.0003036391399951136, - "loss": 0.3734, - "step": 161300 - }, - { - "epoch": 39.37, - "learning_rate": 0.0003036086000488639, - "loss": 0.3191, - "step": 161325 - }, - { - "epoch": 39.37, - "learning_rate": 0.0003035780601026142, - "loss": 0.3649, - "step": 161350 - }, - { - "epoch": 39.38, - "learning_rate": 0.0003035475201563646, - "loss": 0.3288, - "step": 161375 - }, - { - "epoch": 39.39, - "learning_rate": 0.00030351698021011483, - "loss": 0.3663, - "step": 161400 - }, - { - "epoch": 39.39, - "learning_rate": 0.00030348644026386513, - "loss": 0.3615, - "step": 161425 - }, - { - "epoch": 39.4, - "learning_rate": 0.00030345590031761544, - "loss": 0.3597, - "step": 161450 - }, - { - "epoch": 39.4, - "learning_rate": 0.00030342536037136574, - "loss": 0.3365, - "step": 161475 - }, - { - "epoch": 39.41, - "learning_rate": 0.00030339482042511604, - "loss": 0.3327, - "step": 161500 - }, - { - "epoch": 39.42, - "learning_rate": 0.0003033642804788664, - "loss": 0.3703, - "step": 161525 - }, - { - "epoch": 39.42, - "learning_rate": 0.00030333374053261665, - "loss": 0.3808, - "step": 161550 - }, - { - "epoch": 39.43, - "learning_rate": 0.00030330320058636695, - "loss": 0.3423, - "step": 161575 - }, - { - "epoch": 39.43, - "learning_rate": 0.00030327266064011726, - "loss": 0.3588, - "step": 161600 - }, - { - "epoch": 39.44, - "learning_rate": 0.00030324212069386756, - "loss": 0.3462, - "step": 161625 - }, - { - "epoch": 39.45, - "learning_rate": 0.0003032115807476179, - "loss": 0.3527, - "step": 161650 - }, - { - "epoch": 39.45, - "learning_rate": 0.0003031810408013682, - "loss": 0.341, - "step": 161675 - }, - { - "epoch": 39.46, - "learning_rate": 0.0003031505008551185, - "loss": 0.3785, - "step": 161700 - }, - { - "epoch": 39.46, - "learning_rate": 0.0003031199609088688, - "loss": 0.2958, - "step": 161725 - }, - { - "epoch": 39.47, - "learning_rate": 0.0003030894209626191, - "loss": 0.402, - "step": 161750 - }, - { - "epoch": 39.48, - "learning_rate": 0.00030305888101636943, - "loss": 0.3029, - "step": 161775 - }, - { - "epoch": 39.48, - "learning_rate": 0.00030302834107011974, - "loss": 0.373, - "step": 161800 - }, - { - "epoch": 39.49, - "learning_rate": 0.00030299780112387004, - "loss": 0.3279, - "step": 161825 - }, - { - "epoch": 39.49, - "learning_rate": 0.00030296726117762034, - "loss": 0.3434, - "step": 161850 - }, - { - "epoch": 39.5, - "learning_rate": 0.0003029367212313706, - "loss": 0.3362, - "step": 161875 - }, - { - "epoch": 39.51, - "learning_rate": 0.00030290618128512095, - "loss": 0.3598, - "step": 161900 - }, - { - "epoch": 39.51, - "learning_rate": 0.00030287686293672126, - "loss": 0.3523, - "step": 161925 - }, - { - "epoch": 39.52, - "learning_rate": 0.00030284632299047156, - "loss": 0.354, - "step": 161950 - }, - { - "epoch": 39.53, - "learning_rate": 0.00030281578304422186, - "loss": 0.3426, - "step": 161975 - }, - { - "epoch": 39.53, - "learning_rate": 0.00030278524309797217, - "loss": 0.3668, - "step": 162000 - }, - { - "epoch": 39.53, - "eval_cer": 0.08933503074853957, - "eval_loss": 0.4087386727333069, - "eval_runtime": 152.8656, - "eval_samples_per_second": 27.429, - "eval_steps_per_second": 6.862, - "eval_wer": 0.3700815660685155, - "step": 162000 - }, - { - "epoch": 39.54, - "learning_rate": 0.0003027547031517224, - "loss": 0.3361, - "step": 162025 - }, - { - "epoch": 39.54, - "learning_rate": 0.0003027241632054727, - "loss": 0.3544, - "step": 162050 - }, - { - "epoch": 39.55, - "learning_rate": 0.0003026936232592231, - "loss": 0.3459, - "step": 162075 - }, - { - "epoch": 39.56, - "learning_rate": 0.0003026630833129734, - "loss": 0.3486, - "step": 162100 - }, - { - "epoch": 39.56, - "learning_rate": 0.0003026325433667237, - "loss": 0.3441, - "step": 162125 - }, - { - "epoch": 39.57, - "learning_rate": 0.000302602003420474, - "loss": 0.3544, - "step": 162150 - }, - { - "epoch": 39.57, - "learning_rate": 0.0003025714634742243, - "loss": 0.3274, - "step": 162175 - }, - { - "epoch": 39.58, - "learning_rate": 0.0003025409235279746, - "loss": 0.3809, - "step": 162200 - }, - { - "epoch": 39.59, - "learning_rate": 0.0003025103835817249, - "loss": 0.293, - "step": 162225 - }, - { - "epoch": 39.59, - "learning_rate": 0.0003024798436354752, - "loss": 0.3687, - "step": 162250 - }, - { - "epoch": 39.6, - "learning_rate": 0.0003024493036892255, - "loss": 0.2723, - "step": 162275 - }, - { - "epoch": 39.6, - "learning_rate": 0.0003024187637429758, - "loss": 0.3782, - "step": 162300 - }, - { - "epoch": 39.61, - "learning_rate": 0.00030238822379672617, - "loss": 0.3465, - "step": 162325 - }, - { - "epoch": 39.62, - "learning_rate": 0.0003023576838504764, - "loss": 0.3483, - "step": 162350 - }, - { - "epoch": 39.62, - "learning_rate": 0.0003023271439042267, - "loss": 0.314, - "step": 162375 - }, - { - "epoch": 39.63, - "learning_rate": 0.000302296603957977, - "loss": 0.376, - "step": 162400 - }, - { - "epoch": 39.64, - "learning_rate": 0.0003022660640117273, - "loss": 0.3641, - "step": 162425 - }, - { - "epoch": 39.64, - "learning_rate": 0.0003022355240654777, - "loss": 0.3611, - "step": 162450 - }, - { - "epoch": 39.65, - "learning_rate": 0.000302204984119228, - "loss": 0.2945, - "step": 162475 - }, - { - "epoch": 39.65, - "learning_rate": 0.00030217444417297823, - "loss": 0.3313, - "step": 162500 - }, - { - "epoch": 39.66, - "learning_rate": 0.00030214390422672854, - "loss": 0.3319, - "step": 162525 - }, - { - "epoch": 39.67, - "learning_rate": 0.00030211336428047884, - "loss": 0.3411, - "step": 162550 - }, - { - "epoch": 39.67, - "learning_rate": 0.0003020828243342292, - "loss": 0.2996, - "step": 162575 - }, - { - "epoch": 39.68, - "learning_rate": 0.0003020522843879795, - "loss": 0.3635, - "step": 162600 - }, - { - "epoch": 39.68, - "learning_rate": 0.0003020217444417298, - "loss": 0.3447, - "step": 162625 - }, - { - "epoch": 39.69, - "learning_rate": 0.0003019912044954801, - "loss": 0.3559, - "step": 162650 - }, - { - "epoch": 39.7, - "learning_rate": 0.00030196066454923036, - "loss": 0.3664, - "step": 162675 - }, - { - "epoch": 39.7, - "learning_rate": 0.0003019301246029807, - "loss": 0.3482, - "step": 162700 - }, - { - "epoch": 39.71, - "learning_rate": 0.000301899584656731, - "loss": 0.3171, - "step": 162725 - }, - { - "epoch": 39.71, - "learning_rate": 0.0003018690447104813, - "loss": 0.367, - "step": 162750 - }, - { - "epoch": 39.72, - "learning_rate": 0.0003018385047642316, - "loss": 0.3359, - "step": 162775 - }, - { - "epoch": 39.73, - "learning_rate": 0.00030180796481798193, - "loss": 0.3473, - "step": 162800 - }, - { - "epoch": 39.73, - "learning_rate": 0.00030177742487173223, - "loss": 0.3301, - "step": 162825 - }, - { - "epoch": 39.74, - "learning_rate": 0.00030174688492548254, - "loss": 0.3561, - "step": 162850 - }, - { - "epoch": 39.74, - "learning_rate": 0.00030171634497923284, - "loss": 0.3127, - "step": 162875 - }, - { - "epoch": 39.75, - "learning_rate": 0.00030168580503298314, - "loss": 0.3439, - "step": 162900 - }, - { - "epoch": 39.76, - "learning_rate": 0.00030165526508673345, - "loss": 0.2874, - "step": 162925 - }, - { - "epoch": 39.76, - "learning_rate": 0.0003016247251404838, - "loss": 0.3598, - "step": 162950 - }, - { - "epoch": 39.77, - "learning_rate": 0.00030159418519423405, - "loss": 0.2957, - "step": 162975 - }, - { - "epoch": 39.78, - "learning_rate": 0.00030156364524798436, - "loss": 0.3637, - "step": 163000 - }, - { - "epoch": 39.78, - "learning_rate": 0.00030153310530173466, - "loss": 0.3313, - "step": 163025 - }, - { - "epoch": 39.79, - "learning_rate": 0.00030150256535548496, - "loss": 0.3765, - "step": 163050 - }, - { - "epoch": 39.79, - "learning_rate": 0.0003014720254092353, - "loss": 0.3241, - "step": 163075 - }, - { - "epoch": 39.8, - "learning_rate": 0.0003014414854629856, - "loss": 0.351, - "step": 163100 - }, - { - "epoch": 39.81, - "learning_rate": 0.0003014109455167359, - "loss": 0.3051, - "step": 163125 - }, - { - "epoch": 39.81, - "learning_rate": 0.0003013804055704862, - "loss": 0.3359, - "step": 163150 - }, - { - "epoch": 39.82, - "learning_rate": 0.0003013498656242365, - "loss": 0.3172, - "step": 163175 - }, - { - "epoch": 39.82, - "learning_rate": 0.00030131932567798684, - "loss": 0.3753, - "step": 163200 - }, - { - "epoch": 39.83, - "learning_rate": 0.00030128878573173714, - "loss": 0.3561, - "step": 163225 - }, - { - "epoch": 39.84, - "learning_rate": 0.00030125824578548744, - "loss": 0.3807, - "step": 163250 - }, - { - "epoch": 39.84, - "learning_rate": 0.00030122770583923775, - "loss": 0.2925, - "step": 163275 - }, - { - "epoch": 39.85, - "learning_rate": 0.000301197165892988, - "loss": 0.3456, - "step": 163300 - }, - { - "epoch": 39.85, - "learning_rate": 0.0003011666259467383, - "loss": 0.3528, - "step": 163325 - }, - { - "epoch": 39.86, - "learning_rate": 0.00030113608600048866, - "loss": 0.3625, - "step": 163350 - }, - { - "epoch": 39.87, - "learning_rate": 0.00030110554605423896, - "loss": 0.3056, - "step": 163375 - }, - { - "epoch": 39.87, - "learning_rate": 0.00030107500610798926, - "loss": 0.3511, - "step": 163400 - }, - { - "epoch": 39.88, - "learning_rate": 0.00030104446616173957, - "loss": 0.3334, - "step": 163425 - }, - { - "epoch": 39.89, - "learning_rate": 0.0003010139262154898, - "loss": 0.348, - "step": 163450 - }, - { - "epoch": 39.89, - "learning_rate": 0.0003009833862692402, - "loss": 0.3457, - "step": 163475 - }, - { - "epoch": 39.9, - "learning_rate": 0.0003009528463229905, - "loss": 0.3472, - "step": 163500 - }, - { - "epoch": 39.9, - "learning_rate": 0.0003009223063767408, - "loss": 0.3753, - "step": 163525 - }, - { - "epoch": 39.91, - "learning_rate": 0.0003008917664304911, - "loss": 0.3817, - "step": 163550 - }, - { - "epoch": 39.92, - "learning_rate": 0.0003008612264842414, - "loss": 0.3385, - "step": 163575 - }, - { - "epoch": 39.92, - "learning_rate": 0.00030083068653799174, - "loss": 0.3407, - "step": 163600 - }, - { - "epoch": 39.93, - "learning_rate": 0.000300800146591742, - "loss": 0.274, - "step": 163625 - }, - { - "epoch": 39.93, - "learning_rate": 0.0003007696066454923, - "loss": 0.3358, - "step": 163650 - }, - { - "epoch": 39.94, - "learning_rate": 0.0003007390666992426, - "loss": 0.2925, - "step": 163675 - }, - { - "epoch": 39.95, - "learning_rate": 0.0003007085267529929, - "loss": 0.3619, - "step": 163700 - }, - { - "epoch": 39.95, - "learning_rate": 0.00030067798680674326, - "loss": 0.3223, - "step": 163725 - }, - { - "epoch": 39.96, - "learning_rate": 0.00030064744686049356, - "loss": 0.3764, - "step": 163750 - }, - { - "epoch": 39.96, - "learning_rate": 0.0003006169069142438, - "loss": 0.2987, - "step": 163775 - }, - { - "epoch": 39.97, - "learning_rate": 0.0003005863669679941, - "loss": 0.3724, - "step": 163800 - }, - { - "epoch": 39.98, - "learning_rate": 0.0003005558270217444, - "loss": 0.3446, - "step": 163825 - }, - { - "epoch": 39.98, - "learning_rate": 0.0003005252870754948, - "loss": 0.3664, - "step": 163850 - }, - { - "epoch": 39.99, - "learning_rate": 0.0003004947471292451, - "loss": 0.3606, - "step": 163875 - }, - { - "epoch": 40.0, - "learning_rate": 0.0003004642071829954, - "loss": 0.3275, - "step": 163900 - }, - { - "epoch": 40.0, - "learning_rate": 0.00030043366723674563, - "loss": 0.3197, - "step": 163925 - }, - { - "epoch": 40.01, - "learning_rate": 0.00030040312729049594, - "loss": 0.3236, - "step": 163950 - }, - { - "epoch": 40.01, - "learning_rate": 0.0003003725873442463, - "loss": 0.3119, - "step": 163975 - }, - { - "epoch": 40.02, - "learning_rate": 0.0003003420473979966, - "loss": 0.3327, - "step": 164000 - }, - { - "epoch": 132.6, - "learning_rate": 0.00013210073820669788, - "loss": 0.3925, - "step": 164025 - }, - { - "epoch": 132.62, - "learning_rate": 0.00013204447245228666, - "loss": 0.3782, - "step": 164050 - }, - { - "epoch": 132.64, - "learning_rate": 0.0001319882066978754, - "loss": 0.3837, - "step": 164075 - }, - { - "epoch": 132.66, - "learning_rate": 0.00013193194094346416, - "loss": 0.4232, - "step": 164100 - }, - { - "epoch": 132.68, - "learning_rate": 0.00013187567518905294, - "loss": 0.3438, - "step": 164125 - }, - { - "epoch": 132.7, - "learning_rate": 0.00013181940943464171, - "loss": 0.3733, - "step": 164150 - }, - { - "epoch": 132.72, - "learning_rate": 0.00013176314368023047, - "loss": 0.3464, - "step": 164175 - }, - { - "epoch": 132.74, - "learning_rate": 0.00013170687792581922, - "loss": 0.3868, - "step": 164200 - }, - { - "epoch": 132.76, - "learning_rate": 0.000131650612171408, - "loss": 0.3679, - "step": 164225 - }, - { - "epoch": 132.78, - "learning_rate": 0.00013159434641699677, - "loss": 0.3511, - "step": 164250 - }, - { - "epoch": 132.8, - "learning_rate": 0.00013153808066258552, - "loss": 0.3603, - "step": 164275 - }, - { - "epoch": 132.82, - "learning_rate": 0.0001314818149081743, - "loss": 0.3171, - "step": 164300 - }, - { - "epoch": 132.84, - "learning_rate": 0.00013142554915376305, - "loss": 0.3233, - "step": 164325 - }, - { - "epoch": 132.86, - "learning_rate": 0.0001313692833993518, - "loss": 0.3759, - "step": 164350 - }, - { - "epoch": 132.88, - "learning_rate": 0.00013131301764494058, - "loss": 0.3586, - "step": 164375 - }, - { - "epoch": 132.9, - "learning_rate": 0.00013125675189052936, - "loss": 0.3792, - "step": 164400 - }, - { - "epoch": 132.92, - "learning_rate": 0.00013120048613611811, - "loss": 0.3269, - "step": 164425 - }, - { - "epoch": 132.94, - "learning_rate": 0.00013114422038170686, - "loss": 0.383, - "step": 164450 - }, - { - "epoch": 132.96, - "learning_rate": 0.00013108795462729564, - "loss": 0.3353, - "step": 164475 - }, - { - "epoch": 132.98, - "learning_rate": 0.00013103168887288442, - "loss": 0.3276, - "step": 164500 - }, - { - "epoch": 133.0, - "learning_rate": 0.00013097542311847317, - "loss": 0.3406, - "step": 164525 - }, - { - "epoch": 133.02, - "learning_rate": 0.00013091915736406192, - "loss": 0.3269, - "step": 164550 - }, - { - "epoch": 133.04, - "learning_rate": 0.0001308628916096507, - "loss": 0.3718, - "step": 164575 - }, - { - "epoch": 133.06, - "learning_rate": 0.00013080662585523948, - "loss": 0.3165, - "step": 164600 - }, - { - "epoch": 133.08, - "learning_rate": 0.00013075036010082826, - "loss": 0.341, - "step": 164625 - }, - { - "epoch": 133.1, - "learning_rate": 0.00013069409434641698, - "loss": 0.3919, - "step": 164650 - }, - { - "epoch": 133.12, - "learning_rate": 0.00013063782859200576, - "loss": 0.3463, - "step": 164675 - }, - { - "epoch": 133.14, - "learning_rate": 0.00013058156283759454, - "loss": 0.3437, - "step": 164700 - }, - { - "epoch": 133.16, - "learning_rate": 0.0001305252970831833, - "loss": 0.3789, - "step": 164725 - }, - { - "epoch": 133.19, - "learning_rate": 0.00013046903132877204, - "loss": 0.3604, - "step": 164750 - }, - { - "epoch": 133.21, - "learning_rate": 0.00013041276557436082, - "loss": 0.3047, - "step": 164775 - }, - { - "epoch": 133.23, - "learning_rate": 0.0001303564998199496, - "loss": 0.3157, - "step": 164800 - }, - { - "epoch": 133.25, - "learning_rate": 0.00013030023406553835, - "loss": 0.3391, - "step": 164825 - }, - { - "epoch": 133.27, - "learning_rate": 0.0001302439683111271, - "loss": 0.3064, - "step": 164850 - }, - { - "epoch": 133.29, - "learning_rate": 0.00013018770255671588, - "loss": 0.316, - "step": 164875 - }, - { - "epoch": 133.31, - "learning_rate": 0.00013013143680230466, - "loss": 0.3451, - "step": 164900 - }, - { - "epoch": 133.33, - "learning_rate": 0.0001300751710478934, - "loss": 0.3783, - "step": 164925 - }, - { - "epoch": 133.35, - "learning_rate": 0.0001300189052934822, - "loss": 0.3264, - "step": 164950 - }, - { - "epoch": 133.37, - "learning_rate": 0.00012996263953907094, - "loss": 0.3266, - "step": 164975 - }, - { - "epoch": 133.39, - "learning_rate": 0.00012990637378465972, - "loss": 0.3243, - "step": 165000 - }, - { - "epoch": 133.39, - "eval_cer": 0.082004661047401, - "eval_loss": 0.38078561425209045, - "eval_runtime": 149.725, - "eval_samples_per_second": 28.005, - "eval_steps_per_second": 7.006, - "eval_wer": 0.3460032626427406, - "step": 165000 - }, - { - "epoch": 133.41, - "learning_rate": 0.00012985235866042492, - "loss": 0.3781, - "step": 165025 - }, - { - "epoch": 133.43, - "learning_rate": 0.0001297960929060137, - "loss": 0.3568, - "step": 165050 - }, - { - "epoch": 133.45, - "learning_rate": 0.00012973982715160245, - "loss": 0.3452, - "step": 165075 - }, - { - "epoch": 133.47, - "learning_rate": 0.00012968356139719122, - "loss": 0.3334, - "step": 165100 - }, - { - "epoch": 133.49, - "learning_rate": 0.00012962729564277998, - "loss": 0.3706, - "step": 165125 - }, - { - "epoch": 133.51, - "learning_rate": 0.00012957102988836875, - "loss": 0.3022, - "step": 165150 - }, - { - "epoch": 133.53, - "learning_rate": 0.0001295147641339575, - "loss": 0.3669, - "step": 165175 - }, - { - "epoch": 133.55, - "learning_rate": 0.00012945849837954626, - "loss": 0.3328, - "step": 165200 - }, - { - "epoch": 133.57, - "learning_rate": 0.00012940223262513503, - "loss": 0.3602, - "step": 165225 - }, - { - "epoch": 133.59, - "learning_rate": 0.0001293459668707238, - "loss": 0.3087, - "step": 165250 - }, - { - "epoch": 133.61, - "learning_rate": 0.0001292897011163126, - "loss": 0.3497, - "step": 165275 - }, - { - "epoch": 133.63, - "learning_rate": 0.00012923343536190132, - "loss": 0.3157, - "step": 165300 - }, - { - "epoch": 133.65, - "learning_rate": 0.0001291771696074901, - "loss": 0.3685, - "step": 165325 - }, - { - "epoch": 133.67, - "learning_rate": 0.00012912090385307887, - "loss": 0.3191, - "step": 165350 - }, - { - "epoch": 133.69, - "learning_rate": 0.00012906463809866765, - "loss": 0.3419, - "step": 165375 - }, - { - "epoch": 133.71, - "learning_rate": 0.00012900837234425637, - "loss": 0.3458, - "step": 165400 - }, - { - "epoch": 133.73, - "learning_rate": 0.00012895210658984515, - "loss": 0.3708, - "step": 165425 - }, - { - "epoch": 133.75, - "learning_rate": 0.00012889584083543393, - "loss": 0.3363, - "step": 165450 - }, - { - "epoch": 133.77, - "learning_rate": 0.00012883957508102268, - "loss": 0.3356, - "step": 165475 - }, - { - "epoch": 133.79, - "learning_rate": 0.00012878330932661143, - "loss": 0.3318, - "step": 165500 - }, - { - "epoch": 133.81, - "learning_rate": 0.0001287270435722002, - "loss": 0.3353, - "step": 165525 - }, - { - "epoch": 133.83, - "learning_rate": 0.000128670777817789, - "loss": 0.3232, - "step": 165550 - }, - { - "epoch": 133.85, - "learning_rate": 0.00012861451206337774, - "loss": 0.3464, - "step": 165575 - }, - { - "epoch": 133.87, - "learning_rate": 0.00012855824630896652, - "loss": 0.318, - "step": 165600 - }, - { - "epoch": 133.89, - "learning_rate": 0.00012850198055455527, - "loss": 0.3313, - "step": 165625 - }, - { - "epoch": 133.91, - "learning_rate": 0.00012844571480014405, - "loss": 0.3521, - "step": 165650 - }, - { - "epoch": 133.93, - "learning_rate": 0.0001283894490457328, - "loss": 0.3293, - "step": 165675 - }, - { - "epoch": 133.95, - "learning_rate": 0.00012833318329132158, - "loss": 0.3308, - "step": 165700 - }, - { - "epoch": 133.97, - "learning_rate": 0.00012827691753691033, - "loss": 0.3869, - "step": 165725 - }, - { - "epoch": 133.99, - "learning_rate": 0.0001282206517824991, - "loss": 0.3079, - "step": 165750 - }, - { - "epoch": 134.01, - "learning_rate": 0.00012816438602808786, - "loss": 0.3746, - "step": 165775 - }, - { - "epoch": 134.03, - "learning_rate": 0.00012810812027367664, - "loss": 0.3151, - "step": 165800 - }, - { - "epoch": 134.05, - "learning_rate": 0.00012805185451926542, - "loss": 0.3134, - "step": 165825 - }, - { - "epoch": 134.07, - "learning_rate": 0.00012799558876485414, - "loss": 0.3314, - "step": 165850 - }, - { - "epoch": 134.09, - "learning_rate": 0.00012793932301044292, - "loss": 0.3433, - "step": 165875 - }, - { - "epoch": 134.11, - "learning_rate": 0.0001278830572560317, - "loss": 0.3068, - "step": 165900 - }, - { - "epoch": 134.14, - "learning_rate": 0.00012782679150162048, - "loss": 0.3531, - "step": 165925 - }, - { - "epoch": 134.16, - "learning_rate": 0.0001277705257472092, - "loss": 0.2854, - "step": 165950 - }, - { - "epoch": 134.18, - "learning_rate": 0.00012771425999279798, - "loss": 0.3131, - "step": 165975 - }, - { - "epoch": 134.2, - "learning_rate": 0.00012765799423838676, - "loss": 0.3166, - "step": 166000 - }, - { - "epoch": 134.22, - "learning_rate": 0.00012760172848397554, - "loss": 0.3593, - "step": 166025 - }, - { - "epoch": 134.24, - "learning_rate": 0.00012754546272956426, - "loss": 0.2937, - "step": 166050 - }, - { - "epoch": 134.26, - "learning_rate": 0.00012748919697515304, - "loss": 0.3275, - "step": 166075 - }, - { - "epoch": 134.28, - "learning_rate": 0.00012743293122074182, - "loss": 0.31, - "step": 166100 - }, - { - "epoch": 134.3, - "learning_rate": 0.0001273766654663306, - "loss": 0.3444, - "step": 166125 - }, - { - "epoch": 134.32, - "learning_rate": 0.00012732039971191932, - "loss": 0.3116, - "step": 166150 - }, - { - "epoch": 134.34, - "learning_rate": 0.0001272641339575081, - "loss": 0.3177, - "step": 166175 - }, - { - "epoch": 134.36, - "learning_rate": 0.00012720786820309688, - "loss": 0.3111, - "step": 166200 - }, - { - "epoch": 134.38, - "learning_rate": 0.00012715160244868563, - "loss": 0.3299, - "step": 166225 - }, - { - "epoch": 134.4, - "learning_rate": 0.0001270953366942744, - "loss": 0.3308, - "step": 166250 - }, - { - "epoch": 134.42, - "learning_rate": 0.00012703907093986316, - "loss": 0.3252, - "step": 166275 - }, - { - "epoch": 134.44, - "learning_rate": 0.00012698280518545193, - "loss": 0.3124, - "step": 166300 - }, - { - "epoch": 134.46, - "learning_rate": 0.00012692653943104069, - "loss": 0.332, - "step": 166325 - }, - { - "epoch": 134.48, - "learning_rate": 0.00012687027367662946, - "loss": 0.3465, - "step": 166350 - }, - { - "epoch": 134.5, - "learning_rate": 0.00012681400792221822, - "loss": 0.3512, - "step": 166375 - }, - { - "epoch": 134.52, - "learning_rate": 0.000126757742167807, - "loss": 0.2847, - "step": 166400 - }, - { - "epoch": 134.54, - "learning_rate": 0.00012670147641339575, - "loss": 0.3292, - "step": 166425 - }, - { - "epoch": 134.56, - "learning_rate": 0.00012664521065898452, - "loss": 0.3211, - "step": 166450 - }, - { - "epoch": 134.58, - "learning_rate": 0.0001265889449045733, - "loss": 0.3182, - "step": 166475 - }, - { - "epoch": 134.6, - "learning_rate": 0.00012653267915016205, - "loss": 0.3041, - "step": 166500 - }, - { - "epoch": 134.62, - "learning_rate": 0.0001264764133957508, - "loss": 0.3265, - "step": 166525 - }, - { - "epoch": 134.64, - "learning_rate": 0.00012642014764133958, - "loss": 0.3068, - "step": 166550 - }, - { - "epoch": 134.66, - "learning_rate": 0.00012636388188692836, - "loss": 0.3571, - "step": 166575 - }, - { - "epoch": 134.68, - "learning_rate": 0.00012630761613251709, - "loss": 0.2864, - "step": 166600 - }, - { - "epoch": 134.7, - "learning_rate": 0.00012625135037810586, - "loss": 0.3247, - "step": 166625 - }, - { - "epoch": 134.72, - "learning_rate": 0.00012619508462369464, - "loss": 0.3179, - "step": 166650 - }, - { - "epoch": 134.74, - "learning_rate": 0.00012613881886928342, - "loss": 0.383, - "step": 166675 - }, - { - "epoch": 134.76, - "learning_rate": 0.00012608255311487214, - "loss": 0.3227, - "step": 166700 - }, - { - "epoch": 134.78, - "learning_rate": 0.00012602628736046092, - "loss": 0.3244, - "step": 166725 - }, - { - "epoch": 134.8, - "learning_rate": 0.0001259700216060497, - "loss": 0.3133, - "step": 166750 - }, - { - "epoch": 134.82, - "learning_rate": 0.00012591375585163848, - "loss": 0.3224, - "step": 166775 - }, - { - "epoch": 134.84, - "learning_rate": 0.00012585749009722723, - "loss": 0.3206, - "step": 166800 - }, - { - "epoch": 134.86, - "learning_rate": 0.00012580122434281598, - "loss": 0.368, - "step": 166825 - }, - { - "epoch": 134.88, - "learning_rate": 0.00012574495858840476, - "loss": 0.3022, - "step": 166850 - }, - { - "epoch": 134.9, - "learning_rate": 0.00012568869283399354, - "loss": 0.3127, - "step": 166875 - }, - { - "epoch": 134.92, - "learning_rate": 0.0001256324270795823, - "loss": 0.332, - "step": 166900 - }, - { - "epoch": 134.94, - "learning_rate": 0.00012557616132517104, - "loss": 0.3249, - "step": 166925 - }, - { - "epoch": 134.96, - "learning_rate": 0.00012551989557075982, - "loss": 0.3103, - "step": 166950 - }, - { - "epoch": 134.98, - "learning_rate": 0.00012546362981634857, - "loss": 0.3777, - "step": 166975 - }, - { - "epoch": 135.0, - "learning_rate": 0.00012540736406193735, - "loss": 0.3212, - "step": 167000 - }, - { - "epoch": 135.02, - "learning_rate": 0.0001253510983075261, - "loss": 0.3258, - "step": 167025 - }, - { - "epoch": 135.04, - "learning_rate": 0.00012529483255311488, - "loss": 0.3189, - "step": 167050 - }, - { - "epoch": 135.06, - "learning_rate": 0.00012523856679870363, - "loss": 0.2856, - "step": 167075 - }, - { - "epoch": 135.08, - "learning_rate": 0.0001251823010442924, - "loss": 0.3336, - "step": 167100 - }, - { - "epoch": 135.11, - "learning_rate": 0.0001251260352898812, - "loss": 0.3283, - "step": 167125 - }, - { - "epoch": 135.13, - "learning_rate": 0.00012506976953546994, - "loss": 0.2868, - "step": 167150 - }, - { - "epoch": 135.15, - "learning_rate": 0.0001250135037810587, - "loss": 0.2945, - "step": 167175 - }, - { - "epoch": 135.17, - "learning_rate": 0.00012495723802664747, - "loss": 0.3234, - "step": 167200 - }, - { - "epoch": 135.19, - "learning_rate": 0.00012490097227223625, - "loss": 0.3029, - "step": 167225 - }, - { - "epoch": 135.21, - "learning_rate": 0.000124844706517825, - "loss": 0.3149, - "step": 167250 - }, - { - "epoch": 135.23, - "learning_rate": 0.00012478844076341375, - "loss": 0.3135, - "step": 167275 - }, - { - "epoch": 135.25, - "learning_rate": 0.00012473217500900253, - "loss": 0.3306, - "step": 167300 - }, - { - "epoch": 135.27, - "learning_rate": 0.00012467815988476773, - "loss": 0.3093, - "step": 167325 - }, - { - "epoch": 135.29, - "learning_rate": 0.0001246218941303565, - "loss": 0.3139, - "step": 167350 - }, - { - "epoch": 135.31, - "learning_rate": 0.00012456562837594526, - "loss": 0.3219, - "step": 167375 - }, - { - "epoch": 135.33, - "learning_rate": 0.00012450936262153403, - "loss": 0.3237, - "step": 167400 - }, - { - "epoch": 135.35, - "learning_rate": 0.00012445309686712279, - "loss": 0.3151, - "step": 167425 - }, - { - "epoch": 135.37, - "learning_rate": 0.00012439683111271156, - "loss": 0.3459, - "step": 167450 - }, - { - "epoch": 135.39, - "learning_rate": 0.00012434056535830031, - "loss": 0.3431, - "step": 167475 - }, - { - "epoch": 135.41, - "learning_rate": 0.0001242842996038891, - "loss": 0.3127, - "step": 167500 - }, - { - "epoch": 135.43, - "learning_rate": 0.00012422803384947784, - "loss": 0.313, - "step": 167525 - }, - { - "epoch": 135.45, - "learning_rate": 0.00012417176809506662, - "loss": 0.303, - "step": 167550 - }, - { - "epoch": 135.47, - "learning_rate": 0.00012411550234065537, - "loss": 0.3268, - "step": 167575 - }, - { - "epoch": 135.49, - "learning_rate": 0.00012405923658624415, - "loss": 0.3701, - "step": 167600 - }, - { - "epoch": 135.51, - "learning_rate": 0.0001240029708318329, - "loss": 0.3157, - "step": 167625 - }, - { - "epoch": 135.53, - "learning_rate": 0.00012394670507742168, - "loss": 0.2676, - "step": 167650 - }, - { - "epoch": 135.55, - "learning_rate": 0.00012389043932301043, - "loss": 0.3035, - "step": 167675 - }, - { - "epoch": 135.57, - "learning_rate": 0.0001238341735685992, - "loss": 0.3092, - "step": 167700 - }, - { - "epoch": 135.59, - "learning_rate": 0.00012377790781418796, - "loss": 0.3087, - "step": 167725 - }, - { - "epoch": 135.61, - "learning_rate": 0.00012372164205977674, - "loss": 0.3078, - "step": 167750 - }, - { - "epoch": 135.63, - "learning_rate": 0.00012366537630536552, - "loss": 0.3105, - "step": 167775 - }, - { - "epoch": 135.65, - "learning_rate": 0.00012360911055095427, - "loss": 0.3049, - "step": 167800 - }, - { - "epoch": 135.67, - "learning_rate": 0.00012355284479654305, - "loss": 0.3142, - "step": 167825 - }, - { - "epoch": 135.69, - "learning_rate": 0.0001234965790421318, - "loss": 0.3163, - "step": 167850 - }, - { - "epoch": 135.71, - "learning_rate": 0.00012344031328772058, - "loss": 0.3115, - "step": 167875 - }, - { - "epoch": 135.73, - "learning_rate": 0.00012338404753330933, - "loss": 0.313, - "step": 167900 - }, - { - "epoch": 135.75, - "learning_rate": 0.0001233277817788981, - "loss": 0.3197, - "step": 167925 - }, - { - "epoch": 135.77, - "learning_rate": 0.00012327151602448686, - "loss": 0.3004, - "step": 167950 - }, - { - "epoch": 135.79, - "learning_rate": 0.00012321525027007564, - "loss": 0.3218, - "step": 167975 - }, - { - "epoch": 135.81, - "learning_rate": 0.0001231589845156644, - "loss": 0.2861, - "step": 168000 - }, - { - "epoch": 135.81, - "eval_cer": 0.07884254078416476, - "eval_loss": 0.39860469102859497, - "eval_runtime": 150.7158, - "eval_samples_per_second": 27.821, - "eval_steps_per_second": 6.96, - "eval_wer": 0.33210440456769985, - "step": 168000 - }, - { - "epoch": 135.83, - "learning_rate": 0.00012310271876125317, - "loss": 0.2921, - "step": 168025 - }, - { - "epoch": 135.85, - "learning_rate": 0.00012304645300684192, - "loss": 0.3139, - "step": 168050 - }, - { - "epoch": 135.87, - "learning_rate": 0.00012299018725243067, - "loss": 0.3147, - "step": 168075 - }, - { - "epoch": 135.89, - "learning_rate": 0.00012293392149801945, - "loss": 0.3194, - "step": 168100 - }, - { - "epoch": 135.91, - "learning_rate": 0.0001228776557436082, - "loss": 0.3239, - "step": 168125 - }, - { - "epoch": 135.93, - "learning_rate": 0.00012282138998919698, - "loss": 0.2988, - "step": 168150 - }, - { - "epoch": 135.95, - "learning_rate": 0.00012276512423478573, - "loss": 0.3145, - "step": 168175 - }, - { - "epoch": 135.97, - "learning_rate": 0.0001227088584803745, - "loss": 0.3016, - "step": 168200 - }, - { - "epoch": 135.99, - "learning_rate": 0.00012265259272596326, - "loss": 0.2996, - "step": 168225 - }, - { - "epoch": 136.01, - "learning_rate": 0.00012259632697155204, - "loss": 0.3197, - "step": 168250 - }, - { - "epoch": 136.03, - "learning_rate": 0.0001225400612171408, - "loss": 0.3165, - "step": 168275 - }, - { - "epoch": 136.05, - "learning_rate": 0.00012248379546272957, - "loss": 0.3363, - "step": 168300 - }, - { - "epoch": 136.08, - "learning_rate": 0.00012242752970831832, - "loss": 0.3163, - "step": 168325 - }, - { - "epoch": 136.1, - "learning_rate": 0.0001223712639539071, - "loss": 0.3296, - "step": 168350 - }, - { - "epoch": 136.12, - "learning_rate": 0.00012231499819949587, - "loss": 0.2873, - "step": 168375 - }, - { - "epoch": 136.14, - "learning_rate": 0.00012225873244508463, - "loss": 0.322, - "step": 168400 - }, - { - "epoch": 136.16, - "learning_rate": 0.0001222024666906734, - "loss": 0.2893, - "step": 168425 - }, - { - "epoch": 136.18, - "learning_rate": 0.00012214620093626216, - "loss": 0.3518, - "step": 168450 - }, - { - "epoch": 136.2, - "learning_rate": 0.00012208993518185093, - "loss": 0.301, - "step": 168475 - }, - { - "epoch": 136.22, - "learning_rate": 0.00012203366942743968, - "loss": 0.335, - "step": 168500 - }, - { - "epoch": 136.24, - "learning_rate": 0.00012197740367302845, - "loss": 0.2887, - "step": 168525 - }, - { - "epoch": 136.26, - "learning_rate": 0.00012192113791861721, - "loss": 0.3269, - "step": 168550 - }, - { - "epoch": 136.28, - "learning_rate": 0.00012186487216420598, - "loss": 0.277, - "step": 168575 - }, - { - "epoch": 136.3, - "learning_rate": 0.00012180860640979474, - "loss": 0.3189, - "step": 168600 - }, - { - "epoch": 136.32, - "learning_rate": 0.00012175234065538351, - "loss": 0.2905, - "step": 168625 - }, - { - "epoch": 136.34, - "learning_rate": 0.00012169607490097227, - "loss": 0.3169, - "step": 168650 - }, - { - "epoch": 136.36, - "learning_rate": 0.00012163980914656104, - "loss": 0.3394, - "step": 168675 - }, - { - "epoch": 136.38, - "learning_rate": 0.0001215835433921498, - "loss": 0.3289, - "step": 168700 - }, - { - "epoch": 136.4, - "learning_rate": 0.00012152727763773858, - "loss": 0.3032, - "step": 168725 - }, - { - "epoch": 136.42, - "learning_rate": 0.00012147101188332733, - "loss": 0.3371, - "step": 168750 - }, - { - "epoch": 136.44, - "learning_rate": 0.0001214147461289161, - "loss": 0.3093, - "step": 168775 - }, - { - "epoch": 136.46, - "learning_rate": 0.00012135848037450486, - "loss": 0.3675, - "step": 168800 - }, - { - "epoch": 136.48, - "learning_rate": 0.00012130221462009363, - "loss": 0.2731, - "step": 168825 - }, - { - "epoch": 136.5, - "learning_rate": 0.00012124594886568239, - "loss": 0.3193, - "step": 168850 - }, - { - "epoch": 136.52, - "learning_rate": 0.00012118968311127116, - "loss": 0.2995, - "step": 168875 - }, - { - "epoch": 136.54, - "learning_rate": 0.00012113341735685992, - "loss": 0.3197, - "step": 168900 - }, - { - "epoch": 136.56, - "learning_rate": 0.00012107715160244869, - "loss": 0.286, - "step": 168925 - }, - { - "epoch": 136.58, - "learning_rate": 0.00012102088584803745, - "loss": 0.3061, - "step": 168950 - }, - { - "epoch": 136.6, - "learning_rate": 0.00012096462009362622, - "loss": 0.3494, - "step": 168975 - }, - { - "epoch": 136.62, - "learning_rate": 0.00012090835433921498, - "loss": 0.298, - "step": 169000 - }, - { - "epoch": 136.64, - "learning_rate": 0.00012085208858480375, - "loss": 0.2882, - "step": 169025 - }, - { - "epoch": 136.66, - "learning_rate": 0.00012079582283039252, - "loss": 0.3382, - "step": 169050 - }, - { - "epoch": 136.68, - "learning_rate": 0.00012073955707598128, - "loss": 0.2833, - "step": 169075 - }, - { - "epoch": 136.7, - "learning_rate": 0.00012068329132157005, - "loss": 0.2912, - "step": 169100 - }, - { - "epoch": 136.72, - "learning_rate": 0.0001206270255671588, - "loss": 0.3223, - "step": 169125 - }, - { - "epoch": 136.74, - "learning_rate": 0.00012057075981274757, - "loss": 0.3128, - "step": 169150 - }, - { - "epoch": 136.76, - "learning_rate": 0.00012051449405833633, - "loss": 0.294, - "step": 169175 - }, - { - "epoch": 136.78, - "learning_rate": 0.0001204582283039251, - "loss": 0.2779, - "step": 169200 - }, - { - "epoch": 136.8, - "learning_rate": 0.00012040196254951386, - "loss": 0.3011, - "step": 169225 - }, - { - "epoch": 136.82, - "learning_rate": 0.00012034569679510263, - "loss": 0.3261, - "step": 169250 - }, - { - "epoch": 136.84, - "learning_rate": 0.0001202894310406914, - "loss": 0.2565, - "step": 169275 - }, - { - "epoch": 136.86, - "learning_rate": 0.00012023316528628016, - "loss": 0.3077, - "step": 169300 - }, - { - "epoch": 136.88, - "learning_rate": 0.00012017689953186892, - "loss": 0.3274, - "step": 169325 - }, - { - "epoch": 136.9, - "learning_rate": 0.00012012063377745769, - "loss": 0.3226, - "step": 169350 - }, - { - "epoch": 136.92, - "learning_rate": 0.00012006436802304647, - "loss": 0.3182, - "step": 169375 - }, - { - "epoch": 136.94, - "learning_rate": 0.00012000810226863522, - "loss": 0.3158, - "step": 169400 - }, - { - "epoch": 136.96, - "learning_rate": 0.000119951836514224, - "loss": 0.3394, - "step": 169425 - }, - { - "epoch": 136.98, - "learning_rate": 0.00011989557075981275, - "loss": 0.2783, - "step": 169450 - }, - { - "epoch": 137.0, - "learning_rate": 0.00011983930500540151, - "loss": 0.3017, - "step": 169475 - }, - { - "epoch": 137.03, - "learning_rate": 0.00011978303925099028, - "loss": 0.3023, - "step": 169500 - }, - { - "epoch": 137.05, - "learning_rate": 0.00011972677349657904, - "loss": 0.2827, - "step": 169525 - }, - { - "epoch": 137.07, - "learning_rate": 0.0001196705077421678, - "loss": 0.2734, - "step": 169550 - }, - { - "epoch": 137.09, - "learning_rate": 0.00011961424198775657, - "loss": 0.3511, - "step": 169575 - }, - { - "epoch": 137.11, - "learning_rate": 0.00011955797623334534, - "loss": 0.3267, - "step": 169600 - }, - { - "epoch": 137.13, - "learning_rate": 0.0001195017104789341, - "loss": 0.2964, - "step": 169625 - }, - { - "epoch": 137.15, - "learning_rate": 0.00011944544472452288, - "loss": 0.2819, - "step": 169650 - }, - { - "epoch": 137.17, - "learning_rate": 0.00011938917897011163, - "loss": 0.3149, - "step": 169675 - }, - { - "epoch": 137.19, - "learning_rate": 0.00011933291321570041, - "loss": 0.313, - "step": 169700 - }, - { - "epoch": 137.21, - "learning_rate": 0.00011927664746128916, - "loss": 0.2858, - "step": 169725 - }, - { - "epoch": 137.23, - "learning_rate": 0.00011922038170687794, - "loss": 0.2711, - "step": 169750 - }, - { - "epoch": 137.25, - "learning_rate": 0.00011916411595246669, - "loss": 0.3047, - "step": 169775 - }, - { - "epoch": 137.27, - "learning_rate": 0.00011910785019805547, - "loss": 0.2944, - "step": 169800 - }, - { - "epoch": 137.29, - "learning_rate": 0.00011905158444364422, - "loss": 0.2697, - "step": 169825 - }, - { - "epoch": 137.31, - "learning_rate": 0.00011899531868923298, - "loss": 0.2926, - "step": 169850 - }, - { - "epoch": 137.33, - "learning_rate": 0.00011893905293482175, - "loss": 0.29, - "step": 169875 - }, - { - "epoch": 137.35, - "learning_rate": 0.00011888503781058696, - "loss": 0.2891, - "step": 169900 - }, - { - "epoch": 137.37, - "learning_rate": 0.00011882877205617573, - "loss": 0.3194, - "step": 169925 - }, - { - "epoch": 137.39, - "learning_rate": 0.00011877250630176449, - "loss": 0.3081, - "step": 169950 - }, - { - "epoch": 137.41, - "learning_rate": 0.00011871624054735327, - "loss": 0.2835, - "step": 169975 - }, - { - "epoch": 137.43, - "learning_rate": 0.00011865997479294202, - "loss": 0.2794, - "step": 170000 - }, - { - "epoch": 137.45, - "learning_rate": 0.0001186037090385308, - "loss": 0.2922, - "step": 170025 - }, - { - "epoch": 137.47, - "learning_rate": 0.00011854744328411955, - "loss": 0.3218, - "step": 170050 - }, - { - "epoch": 137.49, - "learning_rate": 0.00011849117752970833, - "loss": 0.2572, - "step": 170075 - }, - { - "epoch": 137.51, - "learning_rate": 0.00011843491177529708, - "loss": 0.306, - "step": 170100 - }, - { - "epoch": 137.53, - "learning_rate": 0.00011837864602088586, - "loss": 0.287, - "step": 170125 - }, - { - "epoch": 137.55, - "learning_rate": 0.00011832238026647461, - "loss": 0.2955, - "step": 170150 - }, - { - "epoch": 137.57, - "learning_rate": 0.00011826611451206339, - "loss": 0.278, - "step": 170175 - }, - { - "epoch": 137.59, - "learning_rate": 0.00011820984875765214, - "loss": 0.2853, - "step": 170200 - }, - { - "epoch": 137.61, - "learning_rate": 0.00011815358300324092, - "loss": 0.3193, - "step": 170225 - }, - { - "epoch": 137.63, - "learning_rate": 0.00011809731724882967, - "loss": 0.2939, - "step": 170250 - }, - { - "epoch": 137.65, - "learning_rate": 0.00011804105149441843, - "loss": 0.2987, - "step": 170275 - }, - { - "epoch": 137.67, - "learning_rate": 0.00011798478574000721, - "loss": 0.3462, - "step": 170300 - }, - { - "epoch": 137.69, - "learning_rate": 0.00011792851998559596, - "loss": 0.3188, - "step": 170325 - }, - { - "epoch": 137.71, - "learning_rate": 0.00011787225423118474, - "loss": 0.2941, - "step": 170350 - }, - { - "epoch": 137.73, - "learning_rate": 0.00011781598847677349, - "loss": 0.3043, - "step": 170375 - }, - { - "epoch": 137.75, - "learning_rate": 0.00011775972272236227, - "loss": 0.3037, - "step": 170400 - }, - { - "epoch": 137.77, - "learning_rate": 0.00011770345696795102, - "loss": 0.3143, - "step": 170425 - }, - { - "epoch": 137.79, - "learning_rate": 0.0001176471912135398, - "loss": 0.3184, - "step": 170450 - }, - { - "epoch": 137.81, - "learning_rate": 0.00011759092545912855, - "loss": 0.3059, - "step": 170475 - }, - { - "epoch": 137.83, - "learning_rate": 0.00011753465970471733, - "loss": 0.2957, - "step": 170500 - }, - { - "epoch": 137.85, - "learning_rate": 0.00011747839395030608, - "loss": 0.2845, - "step": 170525 - }, - { - "epoch": 137.87, - "learning_rate": 0.00011742212819589486, - "loss": 0.2972, - "step": 170550 - }, - { - "epoch": 137.89, - "learning_rate": 0.00011736586244148361, - "loss": 0.28, - "step": 170575 - }, - { - "epoch": 137.91, - "learning_rate": 0.00011731184731724884, - "loss": 0.3189, - "step": 170600 - }, - { - "epoch": 137.93, - "learning_rate": 0.0001172555815628376, - "loss": 0.2701, - "step": 170625 - }, - { - "epoch": 137.95, - "learning_rate": 0.00011719931580842637, - "loss": 0.3023, - "step": 170650 - }, - { - "epoch": 137.97, - "learning_rate": 0.00011714305005401513, - "loss": 0.2986, - "step": 170675 - }, - { - "epoch": 138.0, - "learning_rate": 0.00011708678429960388, - "loss": 0.2969, - "step": 170700 - }, - { - "epoch": 138.02, - "learning_rate": 0.00011703051854519266, - "loss": 0.2963, - "step": 170725 - }, - { - "epoch": 138.04, - "learning_rate": 0.00011697425279078141, - "loss": 0.2854, - "step": 170750 - }, - { - "epoch": 138.06, - "learning_rate": 0.00011691798703637019, - "loss": 0.302, - "step": 170775 - }, - { - "epoch": 138.08, - "learning_rate": 0.00011686172128195894, - "loss": 0.2673, - "step": 170800 - }, - { - "epoch": 138.1, - "learning_rate": 0.00011680545552754772, - "loss": 0.3032, - "step": 170825 - }, - { - "epoch": 138.12, - "learning_rate": 0.00011674918977313647, - "loss": 0.2525, - "step": 170850 - }, - { - "epoch": 138.14, - "learning_rate": 0.00011669292401872525, - "loss": 0.3259, - "step": 170875 - }, - { - "epoch": 138.16, - "learning_rate": 0.000116636658264314, - "loss": 0.278, - "step": 170900 - }, - { - "epoch": 138.18, - "learning_rate": 0.00011658039250990278, - "loss": 0.2929, - "step": 170925 - }, - { - "epoch": 138.2, - "learning_rate": 0.00011652412675549154, - "loss": 0.2807, - "step": 170950 - }, - { - "epoch": 138.22, - "learning_rate": 0.00011646786100108031, - "loss": 0.3071, - "step": 170975 - }, - { - "epoch": 138.24, - "learning_rate": 0.00011641159524666907, - "loss": 0.2684, - "step": 171000 - }, - { - "epoch": 138.24, - "eval_cer": 0.07738468014332207, - "eval_loss": 0.4014652967453003, - "eval_runtime": 148.1695, - "eval_samples_per_second": 28.299, - "eval_steps_per_second": 7.08, - "eval_wer": 0.3298531810766721, - "step": 171000 - }, - { - "epoch": 138.26, - "learning_rate": 0.00011635532949225784, - "loss": 0.3076, - "step": 171025 - }, - { - "epoch": 138.28, - "learning_rate": 0.0001162990637378466, - "loss": 0.2608, - "step": 171050 - }, - { - "epoch": 138.3, - "learning_rate": 0.00011624279798343535, - "loss": 0.263, - "step": 171075 - }, - { - "epoch": 138.32, - "learning_rate": 0.00011618653222902413, - "loss": 0.2851, - "step": 171100 - }, - { - "epoch": 138.34, - "learning_rate": 0.00011613026647461288, - "loss": 0.3014, - "step": 171125 - }, - { - "epoch": 138.36, - "learning_rate": 0.00011607400072020166, - "loss": 0.2999, - "step": 171150 - }, - { - "epoch": 138.38, - "learning_rate": 0.00011601773496579041, - "loss": 0.282, - "step": 171175 - }, - { - "epoch": 138.4, - "learning_rate": 0.00011596146921137919, - "loss": 0.294, - "step": 171200 - }, - { - "epoch": 138.42, - "learning_rate": 0.00011590520345696794, - "loss": 0.2917, - "step": 171225 - }, - { - "epoch": 138.44, - "learning_rate": 0.00011584893770255672, - "loss": 0.2989, - "step": 171250 - }, - { - "epoch": 138.46, - "learning_rate": 0.00011579267194814549, - "loss": 0.2784, - "step": 171275 - }, - { - "epoch": 138.48, - "learning_rate": 0.00011573640619373425, - "loss": 0.2769, - "step": 171300 - }, - { - "epoch": 138.5, - "learning_rate": 0.00011568014043932302, - "loss": 0.3011, - "step": 171325 - }, - { - "epoch": 138.52, - "learning_rate": 0.00011562387468491178, - "loss": 0.2945, - "step": 171350 - }, - { - "epoch": 138.54, - "learning_rate": 0.00011556760893050055, - "loss": 0.2648, - "step": 171375 - }, - { - "epoch": 138.56, - "learning_rate": 0.0001155113431760893, - "loss": 0.2837, - "step": 171400 - }, - { - "epoch": 138.58, - "learning_rate": 0.00011545507742167808, - "loss": 0.29, - "step": 171425 - }, - { - "epoch": 138.6, - "learning_rate": 0.00011539881166726683, - "loss": 0.2791, - "step": 171450 - }, - { - "epoch": 138.62, - "learning_rate": 0.0001153425459128556, - "loss": 0.3383, - "step": 171475 - }, - { - "epoch": 138.64, - "learning_rate": 0.00011528628015844436, - "loss": 0.2563, - "step": 171500 - }, - { - "epoch": 138.66, - "learning_rate": 0.00011523001440403313, - "loss": 0.3518, - "step": 171525 - }, - { - "epoch": 138.68, - "learning_rate": 0.00011517374864962189, - "loss": 0.2703, - "step": 171550 - }, - { - "epoch": 138.7, - "learning_rate": 0.00011511748289521066, - "loss": 0.2963, - "step": 171575 - }, - { - "epoch": 138.72, - "learning_rate": 0.00011506121714079943, - "loss": 0.2854, - "step": 171600 - }, - { - "epoch": 138.74, - "learning_rate": 0.0001150049513863882, - "loss": 0.3061, - "step": 171625 - }, - { - "epoch": 138.76, - "learning_rate": 0.00011494868563197696, - "loss": 0.2825, - "step": 171650 - }, - { - "epoch": 138.78, - "learning_rate": 0.00011489241987756572, - "loss": 0.307, - "step": 171675 - }, - { - "epoch": 138.8, - "learning_rate": 0.00011483615412315449, - "loss": 0.2979, - "step": 171700 - }, - { - "epoch": 138.82, - "learning_rate": 0.00011477988836874325, - "loss": 0.2978, - "step": 171725 - }, - { - "epoch": 138.84, - "learning_rate": 0.00011472362261433202, - "loss": 0.2819, - "step": 171750 - }, - { - "epoch": 138.86, - "learning_rate": 0.00011466735685992077, - "loss": 0.299, - "step": 171775 - }, - { - "epoch": 138.88, - "learning_rate": 0.00011461109110550955, - "loss": 0.2925, - "step": 171800 - }, - { - "epoch": 138.9, - "learning_rate": 0.0001145548253510983, - "loss": 0.2929, - "step": 171825 - }, - { - "epoch": 138.92, - "learning_rate": 0.00011449855959668708, - "loss": 0.2999, - "step": 171850 - }, - { - "epoch": 138.95, - "learning_rate": 0.00011444229384227584, - "loss": 0.2954, - "step": 171875 - }, - { - "epoch": 138.97, - "learning_rate": 0.00011438602808786461, - "loss": 0.3031, - "step": 171900 - }, - { - "epoch": 138.99, - "learning_rate": 0.00011432976233345337, - "loss": 0.2931, - "step": 171925 - }, - { - "epoch": 139.01, - "learning_rate": 0.00011427349657904214, - "loss": 0.2981, - "step": 171950 - }, - { - "epoch": 139.03, - "learning_rate": 0.0001142172308246309, - "loss": 0.2876, - "step": 171975 - }, - { - "epoch": 139.05, - "learning_rate": 0.00011416096507021967, - "loss": 0.2828, - "step": 172000 - }, - { - "epoch": 139.07, - "learning_rate": 0.00011410469931580843, - "loss": 0.2878, - "step": 172025 - }, - { - "epoch": 139.09, - "learning_rate": 0.0001140484335613972, - "loss": 0.312, - "step": 172050 - }, - { - "epoch": 139.11, - "learning_rate": 0.00011399216780698596, - "loss": 0.2955, - "step": 172075 - }, - { - "epoch": 139.13, - "learning_rate": 0.00011393590205257471, - "loss": 0.2678, - "step": 172100 - }, - { - "epoch": 139.15, - "learning_rate": 0.00011387963629816349, - "loss": 0.2801, - "step": 172125 - }, - { - "epoch": 139.17, - "learning_rate": 0.00011382337054375224, - "loss": 0.2742, - "step": 172150 - }, - { - "epoch": 139.19, - "learning_rate": 0.00011376710478934102, - "loss": 0.2767, - "step": 172175 - }, - { - "epoch": 139.21, - "learning_rate": 0.00011371083903492978, - "loss": 0.2836, - "step": 172200 - }, - { - "epoch": 139.23, - "learning_rate": 0.00011365457328051855, - "loss": 0.2982, - "step": 172225 - }, - { - "epoch": 139.25, - "learning_rate": 0.00011359830752610731, - "loss": 0.2699, - "step": 172250 - }, - { - "epoch": 139.27, - "learning_rate": 0.00011354204177169608, - "loss": 0.3034, - "step": 172275 - }, - { - "epoch": 139.29, - "learning_rate": 0.00011348577601728484, - "loss": 0.3068, - "step": 172300 - }, - { - "epoch": 139.31, - "learning_rate": 0.00011342951026287361, - "loss": 0.2779, - "step": 172325 - }, - { - "epoch": 139.33, - "learning_rate": 0.00011337324450846237, - "loss": 0.2628, - "step": 172350 - }, - { - "epoch": 139.35, - "learning_rate": 0.00011331697875405114, - "loss": 0.2489, - "step": 172375 - }, - { - "epoch": 139.37, - "learning_rate": 0.0001132607129996399, - "loss": 0.3067, - "step": 172400 - }, - { - "epoch": 139.39, - "learning_rate": 0.00011320444724522867, - "loss": 0.2742, - "step": 172425 - }, - { - "epoch": 139.41, - "learning_rate": 0.00011314818149081743, - "loss": 0.2872, - "step": 172450 - }, - { - "epoch": 139.43, - "learning_rate": 0.00011309191573640618, - "loss": 0.2746, - "step": 172475 - }, - { - "epoch": 139.45, - "learning_rate": 0.00011303564998199496, - "loss": 0.3101, - "step": 172500 - }, - { - "epoch": 139.47, - "learning_rate": 0.00011297938422758373, - "loss": 0.2742, - "step": 172525 - }, - { - "epoch": 139.49, - "learning_rate": 0.00011292311847317249, - "loss": 0.2837, - "step": 172550 - }, - { - "epoch": 139.51, - "learning_rate": 0.00011286685271876126, - "loss": 0.2966, - "step": 172575 - }, - { - "epoch": 139.53, - "learning_rate": 0.00011281058696435002, - "loss": 0.2651, - "step": 172600 - }, - { - "epoch": 139.55, - "learning_rate": 0.00011275432120993879, - "loss": 0.2917, - "step": 172625 - }, - { - "epoch": 139.57, - "learning_rate": 0.00011269805545552755, - "loss": 0.325, - "step": 172650 - }, - { - "epoch": 139.59, - "learning_rate": 0.00011264178970111632, - "loss": 0.2883, - "step": 172675 - }, - { - "epoch": 139.61, - "learning_rate": 0.00011258552394670508, - "loss": 0.318, - "step": 172700 - }, - { - "epoch": 139.63, - "learning_rate": 0.00011252925819229385, - "loss": 0.2515, - "step": 172725 - }, - { - "epoch": 139.65, - "learning_rate": 0.00011247299243788261, - "loss": 0.302, - "step": 172750 - }, - { - "epoch": 139.67, - "learning_rate": 0.00011241672668347137, - "loss": 0.3091, - "step": 172775 - }, - { - "epoch": 139.69, - "learning_rate": 0.00011236046092906014, - "loss": 0.2583, - "step": 172800 - }, - { - "epoch": 139.71, - "learning_rate": 0.0001123041951746489, - "loss": 0.287, - "step": 172825 - }, - { - "epoch": 139.73, - "learning_rate": 0.00011224792942023767, - "loss": 0.2717, - "step": 172850 - }, - { - "epoch": 139.75, - "learning_rate": 0.00011219166366582643, - "loss": 0.2837, - "step": 172875 - }, - { - "epoch": 139.77, - "learning_rate": 0.0001121353979114152, - "loss": 0.3425, - "step": 172900 - }, - { - "epoch": 139.79, - "learning_rate": 0.00011207913215700396, - "loss": 0.2964, - "step": 172925 - }, - { - "epoch": 139.81, - "learning_rate": 0.00011202286640259273, - "loss": 0.2905, - "step": 172950 - }, - { - "epoch": 139.83, - "learning_rate": 0.00011196660064818149, - "loss": 0.2925, - "step": 172975 - }, - { - "epoch": 139.85, - "learning_rate": 0.00011191033489377026, - "loss": 0.2624, - "step": 173000 - }, - { - "epoch": 139.87, - "learning_rate": 0.00011185406913935902, - "loss": 0.2889, - "step": 173025 - }, - { - "epoch": 139.89, - "learning_rate": 0.00011179780338494779, - "loss": 0.2856, - "step": 173050 - }, - { - "epoch": 139.92, - "learning_rate": 0.00011174153763053655, - "loss": 0.3082, - "step": 173075 - }, - { - "epoch": 139.94, - "learning_rate": 0.00011168527187612532, - "loss": 0.2864, - "step": 173100 - }, - { - "epoch": 139.96, - "learning_rate": 0.00011162900612171408, - "loss": 0.305, - "step": 173125 - }, - { - "epoch": 139.98, - "learning_rate": 0.00011157274036730285, - "loss": 0.2429, - "step": 173150 - }, - { - "epoch": 140.0, - "learning_rate": 0.00011151647461289161, - "loss": 0.2649, - "step": 173175 - }, - { - "epoch": 140.02, - "learning_rate": 0.00011146020885848038, - "loss": 0.2885, - "step": 173200 - }, - { - "epoch": 140.04, - "learning_rate": 0.00011140394310406914, - "loss": 0.268, - "step": 173225 - }, - { - "epoch": 140.06, - "learning_rate": 0.0001113476773496579, - "loss": 0.261, - "step": 173250 - }, - { - "epoch": 140.08, - "learning_rate": 0.00011129141159524667, - "loss": 0.2635, - "step": 173275 - }, - { - "epoch": 140.1, - "learning_rate": 0.00011123514584083544, - "loss": 0.2925, - "step": 173300 - }, - { - "epoch": 140.12, - "learning_rate": 0.0001111788800864242, - "loss": 0.258, - "step": 173325 - }, - { - "epoch": 140.14, - "learning_rate": 0.00011112261433201297, - "loss": 0.2917, - "step": 173350 - }, - { - "epoch": 140.16, - "learning_rate": 0.00011106634857760173, - "loss": 0.2612, - "step": 173375 - }, - { - "epoch": 140.18, - "learning_rate": 0.0001110100828231905, - "loss": 0.2843, - "step": 173400 - }, - { - "epoch": 140.2, - "learning_rate": 0.00011095381706877926, - "loss": 0.2835, - "step": 173425 - }, - { - "epoch": 140.22, - "learning_rate": 0.00011089755131436802, - "loss": 0.2705, - "step": 173450 - }, - { - "epoch": 140.24, - "learning_rate": 0.00011084128555995679, - "loss": 0.2501, - "step": 173475 - }, - { - "epoch": 140.26, - "learning_rate": 0.00011078501980554557, - "loss": 0.2746, - "step": 173500 - }, - { - "epoch": 140.28, - "learning_rate": 0.00011072875405113432, - "loss": 0.3089, - "step": 173525 - }, - { - "epoch": 140.3, - "learning_rate": 0.00011067248829672308, - "loss": 0.2911, - "step": 173550 - }, - { - "epoch": 140.32, - "learning_rate": 0.00011061622254231185, - "loss": 0.2676, - "step": 173575 - }, - { - "epoch": 140.34, - "learning_rate": 0.00011055995678790061, - "loss": 0.3069, - "step": 173600 - }, - { - "epoch": 140.36, - "learning_rate": 0.00011050369103348938, - "loss": 0.2712, - "step": 173625 - }, - { - "epoch": 140.38, - "learning_rate": 0.00011044742527907814, - "loss": 0.3218, - "step": 173650 - }, - { - "epoch": 140.4, - "learning_rate": 0.00011039115952466691, - "loss": 0.2947, - "step": 173675 - }, - { - "epoch": 140.42, - "learning_rate": 0.00011033489377025567, - "loss": 0.2914, - "step": 173700 - }, - { - "epoch": 140.44, - "learning_rate": 0.00011027862801584444, - "loss": 0.2393, - "step": 173725 - }, - { - "epoch": 140.46, - "learning_rate": 0.0001102223622614332, - "loss": 0.2852, - "step": 173750 - }, - { - "epoch": 140.48, - "learning_rate": 0.00011016609650702197, - "loss": 0.2695, - "step": 173775 - }, - { - "epoch": 140.5, - "learning_rate": 0.00011010983075261073, - "loss": 0.2816, - "step": 173800 - }, - { - "epoch": 140.52, - "learning_rate": 0.00011005356499819951, - "loss": 0.3011, - "step": 173825 - }, - { - "epoch": 140.54, - "learning_rate": 0.00010999729924378826, - "loss": 0.273, - "step": 173850 - }, - { - "epoch": 140.56, - "learning_rate": 0.00010994103348937704, - "loss": 0.2642, - "step": 173875 - }, - { - "epoch": 140.58, - "learning_rate": 0.00010988476773496579, - "loss": 0.3017, - "step": 173900 - }, - { - "epoch": 140.6, - "learning_rate": 0.00010982850198055456, - "loss": 0.2992, - "step": 173925 - }, - { - "epoch": 140.62, - "learning_rate": 0.00010977223622614332, - "loss": 0.2861, - "step": 173950 - }, - { - "epoch": 140.64, - "learning_rate": 0.00010971597047173209, - "loss": 0.2856, - "step": 173975 - }, - { - "epoch": 140.66, - "learning_rate": 0.00010965970471732085, - "loss": 0.3027, - "step": 174000 - }, - { - "epoch": 140.66, - "eval_cer": 0.07708181472849912, - "eval_loss": 0.4022682011127472, - "eval_runtime": 148.8918, - "eval_samples_per_second": 28.161, - "eval_steps_per_second": 7.045, - "eval_wer": 0.3271778140293638, - "step": 174000 - }, - { - "epoch": 140.68, - "learning_rate": 0.00010960343896290961, - "loss": 0.2699, - "step": 174025 - }, - { - "epoch": 140.7, - "learning_rate": 0.00010954717320849838, - "loss": 0.3009, - "step": 174050 - }, - { - "epoch": 140.72, - "learning_rate": 0.00010949090745408714, - "loss": 0.2494, - "step": 174075 - }, - { - "epoch": 140.74, - "learning_rate": 0.00010943464169967591, - "loss": 0.2995, - "step": 174100 - }, - { - "epoch": 140.76, - "learning_rate": 0.00010937837594526467, - "loss": 0.2852, - "step": 174125 - }, - { - "epoch": 140.78, - "learning_rate": 0.00010932211019085345, - "loss": 0.2718, - "step": 174150 - }, - { - "epoch": 140.8, - "learning_rate": 0.0001092658444364422, - "loss": 0.2706, - "step": 174175 - }, - { - "epoch": 140.82, - "learning_rate": 0.00010920957868203098, - "loss": 0.2943, - "step": 174200 - }, - { - "epoch": 140.84, - "learning_rate": 0.00010915331292761973, - "loss": 0.2803, - "step": 174225 - }, - { - "epoch": 140.86, - "learning_rate": 0.0001090970471732085, - "loss": 0.3043, - "step": 174250 - }, - { - "epoch": 140.89, - "learning_rate": 0.00010904078141879726, - "loss": 0.2994, - "step": 174275 - }, - { - "epoch": 140.91, - "learning_rate": 0.00010898451566438603, - "loss": 0.2499, - "step": 174300 - }, - { - "epoch": 140.93, - "learning_rate": 0.00010892824990997479, - "loss": 0.255, - "step": 174325 - }, - { - "epoch": 140.95, - "learning_rate": 0.00010887198415556356, - "loss": 0.3099, - "step": 174350 - }, - { - "epoch": 140.97, - "learning_rate": 0.00010881571840115232, - "loss": 0.2674, - "step": 174375 - }, - { - "epoch": 140.99, - "learning_rate": 0.00010875945264674109, - "loss": 0.286, - "step": 174400 - }, - { - "epoch": 141.01, - "learning_rate": 0.00010870318689232987, - "loss": 0.2941, - "step": 174425 - }, - { - "epoch": 141.03, - "learning_rate": 0.00010864692113791862, - "loss": 0.2946, - "step": 174450 - }, - { - "epoch": 141.05, - "learning_rate": 0.0001085906553835074, - "loss": 0.2516, - "step": 174475 - }, - { - "epoch": 141.07, - "learning_rate": 0.00010853438962909615, - "loss": 0.2951, - "step": 174500 - }, - { - "epoch": 141.09, - "learning_rate": 0.00010847812387468492, - "loss": 0.2711, - "step": 174525 - }, - { - "epoch": 141.11, - "learning_rate": 0.00010842185812027368, - "loss": 0.2711, - "step": 174550 - }, - { - "epoch": 141.13, - "learning_rate": 0.00010836559236586245, - "loss": 0.2735, - "step": 174575 - }, - { - "epoch": 141.15, - "learning_rate": 0.0001083093266114512, - "loss": 0.2538, - "step": 174600 - }, - { - "epoch": 141.17, - "learning_rate": 0.00010825306085703997, - "loss": 0.292, - "step": 174625 - }, - { - "epoch": 141.19, - "learning_rate": 0.00010819679510262873, - "loss": 0.2676, - "step": 174650 - }, - { - "epoch": 141.21, - "learning_rate": 0.0001081405293482175, - "loss": 0.3015, - "step": 174675 - }, - { - "epoch": 141.23, - "learning_rate": 0.00010808426359380626, - "loss": 0.2743, - "step": 174700 - }, - { - "epoch": 141.25, - "learning_rate": 0.00010802799783939503, - "loss": 0.3051, - "step": 174725 - }, - { - "epoch": 141.27, - "learning_rate": 0.00010797173208498381, - "loss": 0.2722, - "step": 174750 - }, - { - "epoch": 141.29, - "learning_rate": 0.000107917716960749, - "loss": 0.2842, - "step": 174775 - }, - { - "epoch": 141.31, - "learning_rate": 0.00010786145120633778, - "loss": 0.2956, - "step": 174800 - }, - { - "epoch": 141.33, - "learning_rate": 0.00010780518545192654, - "loss": 0.2599, - "step": 174825 - }, - { - "epoch": 141.35, - "learning_rate": 0.00010774891969751531, - "loss": 0.2926, - "step": 174850 - }, - { - "epoch": 141.37, - "learning_rate": 0.00010769265394310407, - "loss": 0.273, - "step": 174875 - }, - { - "epoch": 141.39, - "learning_rate": 0.00010763638818869284, - "loss": 0.2931, - "step": 174900 - }, - { - "epoch": 141.41, - "learning_rate": 0.0001075801224342816, - "loss": 0.2713, - "step": 174925 - }, - { - "epoch": 141.43, - "learning_rate": 0.00010752385667987037, - "loss": 0.2927, - "step": 174950 - }, - { - "epoch": 141.45, - "learning_rate": 0.00010746759092545912, - "loss": 0.2819, - "step": 174975 - }, - { - "epoch": 141.47, - "learning_rate": 0.0001074113251710479, - "loss": 0.2662, - "step": 175000 - }, - { - "epoch": 141.49, - "learning_rate": 0.00010735505941663665, - "loss": 0.2878, - "step": 175025 - }, - { - "epoch": 141.51, - "learning_rate": 0.00010729879366222542, - "loss": 0.2845, - "step": 175050 - }, - { - "epoch": 141.53, - "learning_rate": 0.0001072425279078142, - "loss": 0.2991, - "step": 175075 - }, - { - "epoch": 141.55, - "learning_rate": 0.00010718626215340295, - "loss": 0.2895, - "step": 175100 - }, - { - "epoch": 141.57, - "learning_rate": 0.00010712999639899173, - "loss": 0.2725, - "step": 175125 - }, - { - "epoch": 141.59, - "learning_rate": 0.00010707373064458048, - "loss": 0.278, - "step": 175150 - }, - { - "epoch": 141.61, - "learning_rate": 0.00010701746489016926, - "loss": 0.3198, - "step": 175175 - }, - { - "epoch": 141.63, - "learning_rate": 0.00010696119913575801, - "loss": 0.2396, - "step": 175200 - }, - { - "epoch": 141.65, - "learning_rate": 0.00010690493338134679, - "loss": 0.2867, - "step": 175225 - }, - { - "epoch": 141.67, - "learning_rate": 0.00010684866762693554, - "loss": 0.261, - "step": 175250 - }, - { - "epoch": 141.69, - "learning_rate": 0.00010679240187252432, - "loss": 0.2841, - "step": 175275 - }, - { - "epoch": 141.71, - "learning_rate": 0.00010673613611811307, - "loss": 0.2834, - "step": 175300 - }, - { - "epoch": 141.73, - "learning_rate": 0.00010667987036370185, - "loss": 0.3053, - "step": 175325 - }, - { - "epoch": 141.75, - "learning_rate": 0.0001066236046092906, - "loss": 0.266, - "step": 175350 - }, - { - "epoch": 141.77, - "learning_rate": 0.00010656733885487936, - "loss": 0.243, - "step": 175375 - }, - { - "epoch": 141.79, - "learning_rate": 0.00010651107310046814, - "loss": 0.2668, - "step": 175400 - }, - { - "epoch": 141.81, - "learning_rate": 0.00010645480734605689, - "loss": 0.2564, - "step": 175425 - }, - { - "epoch": 141.84, - "learning_rate": 0.00010639854159164567, - "loss": 0.28, - "step": 175450 - }, - { - "epoch": 141.86, - "learning_rate": 0.00010634227583723442, - "loss": 0.2736, - "step": 175475 - }, - { - "epoch": 141.88, - "learning_rate": 0.0001062860100828232, - "loss": 0.2765, - "step": 175500 - }, - { - "epoch": 141.9, - "learning_rate": 0.00010622974432841195, - "loss": 0.2498, - "step": 175525 - }, - { - "epoch": 141.92, - "learning_rate": 0.00010617347857400073, - "loss": 0.2621, - "step": 175550 - }, - { - "epoch": 141.94, - "learning_rate": 0.00010611721281958948, - "loss": 0.2964, - "step": 175575 - }, - { - "epoch": 141.96, - "learning_rate": 0.00010606094706517826, - "loss": 0.2681, - "step": 175600 - }, - { - "epoch": 141.98, - "learning_rate": 0.00010600468131076701, - "loss": 0.2661, - "step": 175625 - }, - { - "epoch": 142.0, - "learning_rate": 0.00010594841555635579, - "loss": 0.3061, - "step": 175650 - }, - { - "epoch": 142.02, - "learning_rate": 0.00010589214980194454, - "loss": 0.2647, - "step": 175675 - }, - { - "epoch": 142.04, - "learning_rate": 0.00010583588404753332, - "loss": 0.2527, - "step": 175700 - }, - { - "epoch": 142.06, - "learning_rate": 0.00010577961829312208, - "loss": 0.2711, - "step": 175725 - }, - { - "epoch": 142.08, - "learning_rate": 0.00010572335253871083, - "loss": 0.2901, - "step": 175750 - }, - { - "epoch": 142.1, - "learning_rate": 0.00010566708678429961, - "loss": 0.2703, - "step": 175775 - }, - { - "epoch": 142.12, - "learning_rate": 0.00010561082102988836, - "loss": 0.2531, - "step": 175800 - }, - { - "epoch": 142.14, - "learning_rate": 0.00010555455527547714, - "loss": 0.2782, - "step": 175825 - }, - { - "epoch": 142.16, - "learning_rate": 0.00010549828952106589, - "loss": 0.2693, - "step": 175850 - }, - { - "epoch": 142.18, - "learning_rate": 0.00010544202376665467, - "loss": 0.2651, - "step": 175875 - }, - { - "epoch": 142.2, - "learning_rate": 0.00010538575801224342, - "loss": 0.2791, - "step": 175900 - }, - { - "epoch": 142.22, - "learning_rate": 0.0001053294922578322, - "loss": 0.2897, - "step": 175925 - }, - { - "epoch": 142.24, - "learning_rate": 0.00010527322650342095, - "loss": 0.2439, - "step": 175950 - }, - { - "epoch": 142.26, - "learning_rate": 0.00010521696074900973, - "loss": 0.2884, - "step": 175975 - }, - { - "epoch": 142.28, - "learning_rate": 0.00010516069499459848, - "loss": 0.255, - "step": 176000 - }, - { - "epoch": 142.3, - "learning_rate": 0.00010510442924018726, - "loss": 0.2626, - "step": 176025 - }, - { - "epoch": 142.32, - "learning_rate": 0.00010504816348577602, - "loss": 0.2629, - "step": 176050 - }, - { - "epoch": 142.34, - "learning_rate": 0.00010499189773136479, - "loss": 0.2627, - "step": 176075 - }, - { - "epoch": 142.36, - "learning_rate": 0.00010493563197695355, - "loss": 0.2666, - "step": 176100 - }, - { - "epoch": 142.38, - "learning_rate": 0.0001048793662225423, - "loss": 0.256, - "step": 176125 - }, - { - "epoch": 142.4, - "learning_rate": 0.00010482310046813108, - "loss": 0.2422, - "step": 176150 - }, - { - "epoch": 142.42, - "learning_rate": 0.00010476683471371984, - "loss": 0.2624, - "step": 176175 - }, - { - "epoch": 142.44, - "learning_rate": 0.00010471056895930861, - "loss": 0.2484, - "step": 176200 - }, - { - "epoch": 142.46, - "learning_rate": 0.00010465430320489736, - "loss": 0.2808, - "step": 176225 - }, - { - "epoch": 142.48, - "learning_rate": 0.00010459803745048614, - "loss": 0.2721, - "step": 176250 - }, - { - "epoch": 142.5, - "learning_rate": 0.0001045417716960749, - "loss": 0.2502, - "step": 176275 - }, - { - "epoch": 142.52, - "learning_rate": 0.00010448550594166367, - "loss": 0.2818, - "step": 176300 - }, - { - "epoch": 142.54, - "learning_rate": 0.00010442924018725242, - "loss": 0.2806, - "step": 176325 - }, - { - "epoch": 142.56, - "learning_rate": 0.0001043729744328412, - "loss": 0.2663, - "step": 176350 - }, - { - "epoch": 142.58, - "learning_rate": 0.00010431670867842997, - "loss": 0.2644, - "step": 176375 - }, - { - "epoch": 142.6, - "learning_rate": 0.00010426044292401873, - "loss": 0.2705, - "step": 176400 - }, - { - "epoch": 142.62, - "learning_rate": 0.0001042041771696075, - "loss": 0.2603, - "step": 176425 - }, - { - "epoch": 142.64, - "learning_rate": 0.00010414791141519625, - "loss": 0.2746, - "step": 176450 - }, - { - "epoch": 142.66, - "learning_rate": 0.00010409164566078503, - "loss": 0.3054, - "step": 176475 - }, - { - "epoch": 142.68, - "learning_rate": 0.00010403537990637378, - "loss": 0.2514, - "step": 176500 - }, - { - "epoch": 142.7, - "learning_rate": 0.00010397911415196256, - "loss": 0.2954, - "step": 176525 - }, - { - "epoch": 142.72, - "learning_rate": 0.00010392284839755131, - "loss": 0.2764, - "step": 176550 - }, - { - "epoch": 142.74, - "learning_rate": 0.00010386658264314009, - "loss": 0.3033, - "step": 176575 - }, - { - "epoch": 142.76, - "learning_rate": 0.00010381031688872884, - "loss": 0.2734, - "step": 176600 - }, - { - "epoch": 142.78, - "learning_rate": 0.00010375405113431762, - "loss": 0.2748, - "step": 176625 - }, - { - "epoch": 142.81, - "learning_rate": 0.00010369778537990637, - "loss": 0.291, - "step": 176650 - }, - { - "epoch": 142.83, - "learning_rate": 0.00010364151962549514, - "loss": 0.2815, - "step": 176675 - }, - { - "epoch": 142.85, - "learning_rate": 0.00010358525387108391, - "loss": 0.2591, - "step": 176700 - }, - { - "epoch": 142.87, - "learning_rate": 0.00010352898811667267, - "loss": 0.2985, - "step": 176725 - }, - { - "epoch": 142.89, - "learning_rate": 0.00010347272236226144, - "loss": 0.2495, - "step": 176750 - }, - { - "epoch": 142.91, - "learning_rate": 0.0001034164566078502, - "loss": 0.2591, - "step": 176775 - }, - { - "epoch": 142.93, - "learning_rate": 0.00010336019085343897, - "loss": 0.2359, - "step": 176800 - }, - { - "epoch": 142.95, - "learning_rate": 0.00010330392509902772, - "loss": 0.3169, - "step": 176825 - }, - { - "epoch": 142.97, - "learning_rate": 0.0001032476593446165, - "loss": 0.2446, - "step": 176850 - }, - { - "epoch": 142.99, - "learning_rate": 0.00010319139359020525, - "loss": 0.251, - "step": 176875 - }, - { - "epoch": 143.01, - "learning_rate": 0.00010313512783579403, - "loss": 0.2533, - "step": 176900 - }, - { - "epoch": 143.03, - "learning_rate": 0.00010307886208138278, - "loss": 0.2458, - "step": 176925 - }, - { - "epoch": 143.05, - "learning_rate": 0.00010302259632697156, - "loss": 0.2945, - "step": 176950 - }, - { - "epoch": 143.07, - "learning_rate": 0.00010296633057256031, - "loss": 0.2787, - "step": 176975 - }, - { - "epoch": 143.09, - "learning_rate": 0.00010291006481814909, - "loss": 0.2742, - "step": 177000 - }, - { - "epoch": 143.09, - "eval_cer": 0.07704074823157397, - "eval_loss": 0.4133159816265106, - "eval_runtime": 148.921, - "eval_samples_per_second": 28.156, - "eval_steps_per_second": 7.044, - "eval_wer": 0.3272756933115824, - "step": 177000 - }, - { - "epoch": 143.11, - "learning_rate": 0.00010285379906373785, - "loss": 0.3223, - "step": 177025 - }, - { - "epoch": 143.13, - "learning_rate": 0.00010279753330932662, - "loss": 0.2516, - "step": 177050 - }, - { - "epoch": 143.15, - "learning_rate": 0.00010274126755491538, - "loss": 0.2412, - "step": 177075 - }, - { - "epoch": 143.17, - "learning_rate": 0.00010268500180050415, - "loss": 0.3262, - "step": 177100 - }, - { - "epoch": 143.19, - "learning_rate": 0.00010262873604609291, - "loss": 0.2569, - "step": 177125 - }, - { - "epoch": 143.21, - "learning_rate": 0.00010257247029168168, - "loss": 0.2536, - "step": 177150 - }, - { - "epoch": 143.23, - "learning_rate": 0.00010251620453727044, - "loss": 0.2279, - "step": 177175 - }, - { - "epoch": 143.25, - "learning_rate": 0.00010245993878285919, - "loss": 0.2628, - "step": 177200 - }, - { - "epoch": 143.27, - "learning_rate": 0.00010240367302844797, - "loss": 0.2487, - "step": 177225 - }, - { - "epoch": 143.29, - "learning_rate": 0.00010234740727403672, - "loss": 0.2353, - "step": 177250 - }, - { - "epoch": 143.31, - "learning_rate": 0.0001022911415196255, - "loss": 0.27, - "step": 177275 - }, - { - "epoch": 143.33, - "learning_rate": 0.00010223487576521426, - "loss": 0.2688, - "step": 177300 - }, - { - "epoch": 143.35, - "learning_rate": 0.00010217861001080303, - "loss": 0.2563, - "step": 177325 - }, - { - "epoch": 143.37, - "learning_rate": 0.0001021223442563918, - "loss": 0.2587, - "step": 177350 - }, - { - "epoch": 143.39, - "learning_rate": 0.00010206607850198056, - "loss": 0.2638, - "step": 177375 - }, - { - "epoch": 143.41, - "learning_rate": 0.00010201206337774577, - "loss": 0.2754, - "step": 177400 - }, - { - "epoch": 143.43, - "learning_rate": 0.00010195579762333454, - "loss": 0.296, - "step": 177425 - }, - { - "epoch": 143.45, - "learning_rate": 0.0001018995318689233, - "loss": 0.2548, - "step": 177450 - }, - { - "epoch": 143.47, - "learning_rate": 0.00010184326611451207, - "loss": 0.2865, - "step": 177475 - }, - { - "epoch": 143.49, - "learning_rate": 0.00010178700036010083, - "loss": 0.2461, - "step": 177500 - }, - { - "epoch": 143.51, - "learning_rate": 0.0001017307346056896, - "loss": 0.2623, - "step": 177525 - }, - { - "epoch": 143.53, - "learning_rate": 0.00010167446885127836, - "loss": 0.2453, - "step": 177550 - }, - { - "epoch": 143.55, - "learning_rate": 0.00010161820309686713, - "loss": 0.2594, - "step": 177575 - }, - { - "epoch": 143.57, - "learning_rate": 0.00010156193734245589, - "loss": 0.2596, - "step": 177600 - }, - { - "epoch": 143.59, - "learning_rate": 0.00010150567158804465, - "loss": 0.2489, - "step": 177625 - }, - { - "epoch": 143.61, - "learning_rate": 0.00010144940583363342, - "loss": 0.3084, - "step": 177650 - }, - { - "epoch": 143.63, - "learning_rate": 0.00010139314007922218, - "loss": 0.2514, - "step": 177675 - }, - { - "epoch": 143.65, - "learning_rate": 0.00010133687432481095, - "loss": 0.2738, - "step": 177700 - }, - { - "epoch": 143.67, - "learning_rate": 0.00010128060857039971, - "loss": 0.2646, - "step": 177725 - }, - { - "epoch": 143.69, - "learning_rate": 0.00010122659344616493, - "loss": 0.2791, - "step": 177750 - }, - { - "epoch": 143.71, - "learning_rate": 0.00010117032769175369, - "loss": 0.2591, - "step": 177775 - }, - { - "epoch": 143.73, - "learning_rate": 0.00010111406193734246, - "loss": 0.285, - "step": 177800 - }, - { - "epoch": 143.76, - "learning_rate": 0.00010105779618293122, - "loss": 0.2542, - "step": 177825 - }, - { - "epoch": 143.78, - "learning_rate": 0.00010100153042851999, - "loss": 0.2748, - "step": 177850 - }, - { - "epoch": 143.8, - "learning_rate": 0.00010094526467410875, - "loss": 0.2367, - "step": 177875 - }, - { - "epoch": 143.82, - "learning_rate": 0.00010088899891969752, - "loss": 0.2801, - "step": 177900 - }, - { - "epoch": 143.84, - "learning_rate": 0.00010083273316528628, - "loss": 0.26, - "step": 177925 - }, - { - "epoch": 143.86, - "learning_rate": 0.00010077646741087506, - "loss": 0.2576, - "step": 177950 - }, - { - "epoch": 143.88, - "learning_rate": 0.00010072020165646381, - "loss": 0.2953, - "step": 177975 - }, - { - "epoch": 143.9, - "learning_rate": 0.00010066393590205259, - "loss": 0.2709, - "step": 178000 - }, - { - "epoch": 143.92, - "learning_rate": 0.00010060767014764134, - "loss": 0.2523, - "step": 178025 - }, - { - "epoch": 143.94, - "learning_rate": 0.0001005514043932301, - "loss": 0.2694, - "step": 178050 - }, - { - "epoch": 143.96, - "learning_rate": 0.00010049513863881887, - "loss": 0.2635, - "step": 178075 - }, - { - "epoch": 143.98, - "learning_rate": 0.00010043887288440763, - "loss": 0.2893, - "step": 178100 - }, - { - "epoch": 144.0, - "learning_rate": 0.0001003826071299964, - "loss": 0.2153, - "step": 178125 - }, - { - "epoch": 144.02, - "learning_rate": 0.00010032634137558516, - "loss": 0.2666, - "step": 178150 - }, - { - "epoch": 144.04, - "learning_rate": 0.00010027007562117393, - "loss": 0.2425, - "step": 178175 - }, - { - "epoch": 144.06, - "learning_rate": 0.00010021380986676269, - "loss": 0.3232, - "step": 178200 - }, - { - "epoch": 144.08, - "learning_rate": 0.00010015754411235146, - "loss": 0.2406, - "step": 178225 - }, - { - "epoch": 144.1, - "learning_rate": 0.00010010127835794022, - "loss": 0.2781, - "step": 178250 - }, - { - "epoch": 144.12, - "learning_rate": 0.000100045012603529, - "loss": 0.2836, - "step": 178275 - }, - { - "epoch": 144.14, - "learning_rate": 9.998874684911775e-05, - "loss": 0.2649, - "step": 178300 - }, - { - "epoch": 144.16, - "learning_rate": 9.993248109470653e-05, - "loss": 0.2533, - "step": 178325 - }, - { - "epoch": 144.18, - "learning_rate": 9.987621534029528e-05, - "loss": 0.2742, - "step": 178350 - }, - { - "epoch": 144.2, - "learning_rate": 9.981994958588405e-05, - "loss": 0.2831, - "step": 178375 - }, - { - "epoch": 144.22, - "learning_rate": 9.976368383147281e-05, - "loss": 0.2591, - "step": 178400 - }, - { - "epoch": 144.24, - "learning_rate": 9.970741807706158e-05, - "loss": 0.3329, - "step": 178425 - }, - { - "epoch": 144.26, - "learning_rate": 9.965115232265034e-05, - "loss": 0.2753, - "step": 178450 - }, - { - "epoch": 144.28, - "learning_rate": 9.95948865682391e-05, - "loss": 0.2812, - "step": 178475 - }, - { - "epoch": 144.3, - "learning_rate": 9.953862081382787e-05, - "loss": 0.2858, - "step": 178500 - }, - { - "epoch": 144.32, - "learning_rate": 9.948235505941664e-05, - "loss": 0.2483, - "step": 178525 - }, - { - "epoch": 144.34, - "learning_rate": 9.942608930500541e-05, - "loss": 0.2794, - "step": 178550 - }, - { - "epoch": 144.36, - "learning_rate": 9.936982355059417e-05, - "loss": 0.2633, - "step": 178575 - }, - { - "epoch": 144.38, - "learning_rate": 9.931355779618294e-05, - "loss": 0.2647, - "step": 178600 - }, - { - "epoch": 144.4, - "learning_rate": 9.92572920417717e-05, - "loss": 0.2696, - "step": 178625 - }, - { - "epoch": 144.42, - "learning_rate": 9.920102628736047e-05, - "loss": 0.2561, - "step": 178650 - }, - { - "epoch": 144.44, - "learning_rate": 9.914476053294922e-05, - "loss": 0.2813, - "step": 178675 - }, - { - "epoch": 144.46, - "learning_rate": 9.9088494778538e-05, - "loss": 0.263, - "step": 178700 - }, - { - "epoch": 144.48, - "learning_rate": 9.903222902412675e-05, - "loss": 0.2509, - "step": 178725 - }, - { - "epoch": 144.5, - "learning_rate": 9.897596326971552e-05, - "loss": 0.2884, - "step": 178750 - }, - { - "epoch": 144.52, - "learning_rate": 9.891969751530428e-05, - "loss": 0.234, - "step": 178775 - }, - { - "epoch": 144.54, - "learning_rate": 9.886343176089305e-05, - "loss": 0.269, - "step": 178800 - }, - { - "epoch": 144.56, - "learning_rate": 9.880716600648181e-05, - "loss": 0.2357, - "step": 178825 - }, - { - "epoch": 144.58, - "learning_rate": 9.875090025207058e-05, - "loss": 0.2629, - "step": 178850 - }, - { - "epoch": 144.6, - "learning_rate": 9.869463449765936e-05, - "loss": 0.2591, - "step": 178875 - }, - { - "epoch": 144.62, - "learning_rate": 9.863836874324811e-05, - "loss": 0.2542, - "step": 178900 - }, - { - "epoch": 144.64, - "learning_rate": 9.858210298883689e-05, - "loss": 0.2394, - "step": 178925 - }, - { - "epoch": 144.66, - "learning_rate": 9.852583723442564e-05, - "loss": 0.2625, - "step": 178950 - }, - { - "epoch": 144.68, - "learning_rate": 9.846957148001442e-05, - "loss": 0.2806, - "step": 178975 - }, - { - "epoch": 144.7, - "learning_rate": 9.841330572560317e-05, - "loss": 0.2456, - "step": 179000 - }, - { - "epoch": 144.73, - "learning_rate": 9.835703997119195e-05, - "loss": 0.2521, - "step": 179025 - }, - { - "epoch": 144.75, - "learning_rate": 9.83007742167807e-05, - "loss": 0.2492, - "step": 179050 - }, - { - "epoch": 144.77, - "learning_rate": 9.824450846236947e-05, - "loss": 0.2117, - "step": 179075 - }, - { - "epoch": 144.79, - "learning_rate": 9.818824270795823e-05, - "loss": 0.2542, - "step": 179100 - }, - { - "epoch": 144.81, - "learning_rate": 9.813197695354699e-05, - "loss": 0.2675, - "step": 179125 - }, - { - "epoch": 144.83, - "learning_rate": 9.807571119913576e-05, - "loss": 0.283, - "step": 179150 - }, - { - "epoch": 144.85, - "learning_rate": 9.801944544472452e-05, - "loss": 0.2702, - "step": 179175 - }, - { - "epoch": 144.87, - "learning_rate": 9.79631796903133e-05, - "loss": 0.2926, - "step": 179200 - }, - { - "epoch": 144.89, - "learning_rate": 9.790691393590205e-05, - "loss": 0.2802, - "step": 179225 - }, - { - "epoch": 144.91, - "learning_rate": 9.785064818149083e-05, - "loss": 0.2731, - "step": 179250 - }, - { - "epoch": 144.93, - "learning_rate": 9.779438242707958e-05, - "loss": 0.2636, - "step": 179275 - }, - { - "epoch": 144.95, - "learning_rate": 9.773811667266836e-05, - "loss": 0.2672, - "step": 179300 - }, - { - "epoch": 144.97, - "learning_rate": 9.768185091825711e-05, - "loss": 0.2679, - "step": 179325 - }, - { - "epoch": 144.99, - "learning_rate": 9.762558516384589e-05, - "loss": 0.277, - "step": 179350 - }, - { - "epoch": 145.01, - "learning_rate": 9.756931940943464e-05, - "loss": 0.2467, - "step": 179375 - }, - { - "epoch": 145.03, - "learning_rate": 9.751305365502342e-05, - "loss": 0.2388, - "step": 179400 - }, - { - "epoch": 145.05, - "learning_rate": 9.745678790061217e-05, - "loss": 0.2745, - "step": 179425 - }, - { - "epoch": 145.07, - "learning_rate": 9.740052214620093e-05, - "loss": 0.2472, - "step": 179450 - }, - { - "epoch": 145.09, - "learning_rate": 9.73442563917897e-05, - "loss": 0.2608, - "step": 179475 - }, - { - "epoch": 145.11, - "learning_rate": 9.728799063737846e-05, - "loss": 0.2417, - "step": 179500 - }, - { - "epoch": 145.13, - "learning_rate": 9.723172488296724e-05, - "loss": 0.2602, - "step": 179525 - }, - { - "epoch": 145.15, - "learning_rate": 9.717545912855599e-05, - "loss": 0.265, - "step": 179550 - }, - { - "epoch": 145.17, - "learning_rate": 9.711919337414477e-05, - "loss": 0.2563, - "step": 179575 - }, - { - "epoch": 145.19, - "learning_rate": 9.706292761973352e-05, - "loss": 0.2417, - "step": 179600 - }, - { - "epoch": 145.21, - "learning_rate": 9.70066618653223e-05, - "loss": 0.2727, - "step": 179625 - }, - { - "epoch": 145.23, - "learning_rate": 9.695039611091105e-05, - "loss": 0.2765, - "step": 179650 - }, - { - "epoch": 145.25, - "learning_rate": 9.689413035649983e-05, - "loss": 0.2681, - "step": 179675 - }, - { - "epoch": 145.27, - "learning_rate": 9.683786460208858e-05, - "loss": 0.2429, - "step": 179700 - }, - { - "epoch": 145.29, - "learning_rate": 9.678159884767736e-05, - "loss": 0.2514, - "step": 179725 - }, - { - "epoch": 145.31, - "learning_rate": 9.672533309326611e-05, - "loss": 0.2567, - "step": 179750 - }, - { - "epoch": 145.33, - "learning_rate": 9.666906733885489e-05, - "loss": 0.2719, - "step": 179775 - }, - { - "epoch": 145.35, - "learning_rate": 9.661280158444364e-05, - "loss": 0.2475, - "step": 179800 - }, - { - "epoch": 145.37, - "learning_rate": 9.65565358300324e-05, - "loss": 0.2627, - "step": 179825 - }, - { - "epoch": 145.39, - "learning_rate": 9.650027007562118e-05, - "loss": 0.2742, - "step": 179850 - }, - { - "epoch": 145.41, - "learning_rate": 9.644400432120993e-05, - "loss": 0.2662, - "step": 179875 - }, - { - "epoch": 145.43, - "learning_rate": 9.638773856679871e-05, - "loss": 0.2762, - "step": 179900 - }, - { - "epoch": 145.45, - "learning_rate": 9.633147281238746e-05, - "loss": 0.2654, - "step": 179925 - }, - { - "epoch": 145.47, - "learning_rate": 9.627520705797624e-05, - "loss": 0.267, - "step": 179950 - }, - { - "epoch": 145.49, - "learning_rate": 9.6218941303565e-05, - "loss": 0.272, - "step": 179975 - }, - { - "epoch": 145.51, - "learning_rate": 9.616267554915377e-05, - "loss": 0.2339, - "step": 180000 - }, - { - "epoch": 145.51, - "eval_cer": 0.07711774791330862, - "eval_loss": 0.428690105676651, - "eval_runtime": 149.384, - "eval_samples_per_second": 28.069, - "eval_steps_per_second": 7.022, - "eval_wer": 0.3267536704730832, - "step": 180000 - }, - { - "epoch": 145.53, - "learning_rate": 9.610640979474252e-05, - "loss": 0.2665, - "step": 180025 - }, - { - "epoch": 145.55, - "learning_rate": 9.60501440403313e-05, - "loss": 0.2467, - "step": 180050 - }, - { - "epoch": 145.57, - "learning_rate": 9.599387828592005e-05, - "loss": 0.2536, - "step": 180075 - }, - { - "epoch": 145.59, - "learning_rate": 9.593761253150883e-05, - "loss": 0.2215, - "step": 180100 - }, - { - "epoch": 145.61, - "learning_rate": 9.588134677709758e-05, - "loss": 0.2676, - "step": 180125 - }, - { - "epoch": 145.63, - "learning_rate": 9.582508102268635e-05, - "loss": 0.2845, - "step": 180150 - }, - { - "epoch": 145.65, - "learning_rate": 9.576881526827513e-05, - "loss": 0.2815, - "step": 180175 - }, - { - "epoch": 145.68, - "learning_rate": 9.571254951386388e-05, - "loss": 0.2321, - "step": 180200 - }, - { - "epoch": 145.7, - "learning_rate": 9.565628375945266e-05, - "loss": 0.2314, - "step": 180225 - }, - { - "epoch": 145.72, - "learning_rate": 9.56000180050414e-05, - "loss": 0.2685, - "step": 180250 - }, - { - "epoch": 145.74, - "learning_rate": 9.554375225063019e-05, - "loss": 0.282, - "step": 180275 - }, - { - "epoch": 145.76, - "learning_rate": 9.548748649621894e-05, - "loss": 0.2542, - "step": 180300 - }, - { - "epoch": 145.78, - "learning_rate": 9.543122074180771e-05, - "loss": 0.2701, - "step": 180325 - }, - { - "epoch": 145.8, - "learning_rate": 9.537495498739647e-05, - "loss": 0.2636, - "step": 180350 - }, - { - "epoch": 145.82, - "learning_rate": 9.531868923298524e-05, - "loss": 0.3032, - "step": 180375 - }, - { - "epoch": 145.84, - "learning_rate": 9.5262423478574e-05, - "loss": 0.2669, - "step": 180400 - }, - { - "epoch": 145.86, - "learning_rate": 9.520615772416277e-05, - "loss": 0.287, - "step": 180425 - }, - { - "epoch": 145.88, - "learning_rate": 9.514989196975153e-05, - "loss": 0.2689, - "step": 180450 - }, - { - "epoch": 145.9, - "learning_rate": 9.50936262153403e-05, - "loss": 0.2868, - "step": 180475 - }, - { - "epoch": 145.92, - "learning_rate": 9.503736046092907e-05, - "loss": 0.2729, - "step": 180500 - }, - { - "epoch": 145.94, - "learning_rate": 9.498109470651782e-05, - "loss": 0.266, - "step": 180525 - }, - { - "epoch": 145.96, - "learning_rate": 9.49248289521066e-05, - "loss": 0.2661, - "step": 180550 - }, - { - "epoch": 145.98, - "learning_rate": 9.486856319769535e-05, - "loss": 0.2618, - "step": 180575 - }, - { - "epoch": 146.0, - "learning_rate": 9.481229744328413e-05, - "loss": 0.2463, - "step": 180600 - }, - { - "epoch": 146.02, - "learning_rate": 9.475603168887288e-05, - "loss": 0.2412, - "step": 180625 - }, - { - "epoch": 146.04, - "learning_rate": 9.469976593446166e-05, - "loss": 0.2517, - "step": 180650 - }, - { - "epoch": 146.06, - "learning_rate": 9.464350018005041e-05, - "loss": 0.2745, - "step": 180675 - }, - { - "epoch": 146.08, - "learning_rate": 9.458723442563919e-05, - "loss": 0.2349, - "step": 180700 - }, - { - "epoch": 146.1, - "learning_rate": 9.453096867122794e-05, - "loss": 0.2567, - "step": 180725 - }, - { - "epoch": 146.12, - "learning_rate": 9.447470291681672e-05, - "loss": 0.2081, - "step": 180750 - }, - { - "epoch": 146.14, - "learning_rate": 9.441843716240547e-05, - "loss": 0.2739, - "step": 180775 - }, - { - "epoch": 146.16, - "learning_rate": 9.436217140799425e-05, - "loss": 0.2464, - "step": 180800 - }, - { - "epoch": 146.18, - "learning_rate": 9.430590565358301e-05, - "loss": 0.2567, - "step": 180825 - }, - { - "epoch": 146.2, - "learning_rate": 9.424963989917178e-05, - "loss": 0.2657, - "step": 180850 - }, - { - "epoch": 146.22, - "learning_rate": 9.419337414476054e-05, - "loss": 0.2507, - "step": 180875 - }, - { - "epoch": 146.24, - "learning_rate": 9.413710839034929e-05, - "loss": 0.2496, - "step": 180900 - }, - { - "epoch": 146.26, - "learning_rate": 9.408084263593807e-05, - "loss": 0.2255, - "step": 180925 - }, - { - "epoch": 146.28, - "learning_rate": 9.402457688152682e-05, - "loss": 0.236, - "step": 180950 - }, - { - "epoch": 146.3, - "learning_rate": 9.39683111271156e-05, - "loss": 0.2439, - "step": 180975 - }, - { - "epoch": 146.32, - "learning_rate": 9.391204537270435e-05, - "loss": 0.2623, - "step": 181000 - }, - { - "epoch": 146.34, - "learning_rate": 9.385577961829313e-05, - "loss": 0.278, - "step": 181025 - }, - { - "epoch": 146.36, - "learning_rate": 9.379951386388188e-05, - "loss": 0.2782, - "step": 181050 - }, - { - "epoch": 146.38, - "learning_rate": 9.374324810947066e-05, - "loss": 0.2576, - "step": 181075 - }, - { - "epoch": 146.4, - "learning_rate": 9.368698235505941e-05, - "loss": 0.2764, - "step": 181100 - }, - { - "epoch": 146.42, - "learning_rate": 9.363071660064819e-05, - "loss": 0.276, - "step": 181125 - }, - { - "epoch": 146.44, - "learning_rate": 9.357445084623695e-05, - "loss": 0.2534, - "step": 181150 - }, - { - "epoch": 146.46, - "learning_rate": 9.351818509182572e-05, - "loss": 0.2563, - "step": 181175 - }, - { - "epoch": 146.48, - "learning_rate": 9.346191933741448e-05, - "loss": 0.2341, - "step": 181200 - }, - { - "epoch": 146.5, - "learning_rate": 9.340565358300323e-05, - "loss": 0.2514, - "step": 181225 - }, - { - "epoch": 146.52, - "learning_rate": 9.334938782859201e-05, - "loss": 0.2452, - "step": 181250 - }, - { - "epoch": 146.54, - "learning_rate": 9.329312207418076e-05, - "loss": 0.2607, - "step": 181275 - }, - { - "epoch": 146.56, - "learning_rate": 9.323685631976954e-05, - "loss": 0.2634, - "step": 181300 - }, - { - "epoch": 146.58, - "learning_rate": 9.318059056535829e-05, - "loss": 0.2678, - "step": 181325 - }, - { - "epoch": 146.6, - "learning_rate": 9.312432481094707e-05, - "loss": 0.228, - "step": 181350 - }, - { - "epoch": 146.62, - "learning_rate": 9.306805905653582e-05, - "loss": 0.2766, - "step": 181375 - }, - { - "epoch": 146.65, - "learning_rate": 9.30117933021246e-05, - "loss": 0.2583, - "step": 181400 - }, - { - "epoch": 146.67, - "learning_rate": 9.295552754771335e-05, - "loss": 0.2615, - "step": 181425 - }, - { - "epoch": 146.69, - "learning_rate": 9.289926179330213e-05, - "loss": 0.2496, - "step": 181450 - }, - { - "epoch": 146.71, - "learning_rate": 9.28429960388909e-05, - "loss": 0.2688, - "step": 181475 - }, - { - "epoch": 146.73, - "learning_rate": 9.278673028447966e-05, - "loss": 0.2621, - "step": 181500 - }, - { - "epoch": 146.75, - "learning_rate": 9.273046453006842e-05, - "loss": 0.2605, - "step": 181525 - }, - { - "epoch": 146.77, - "learning_rate": 9.267419877565719e-05, - "loss": 0.2803, - "step": 181550 - }, - { - "epoch": 146.79, - "learning_rate": 9.261793302124595e-05, - "loss": 0.2872, - "step": 181575 - }, - { - "epoch": 146.81, - "learning_rate": 9.25616672668347e-05, - "loss": 0.2439, - "step": 181600 - }, - { - "epoch": 146.83, - "learning_rate": 9.250540151242348e-05, - "loss": 0.2783, - "step": 181625 - }, - { - "epoch": 146.85, - "learning_rate": 9.244913575801224e-05, - "loss": 0.2359, - "step": 181650 - }, - { - "epoch": 146.87, - "learning_rate": 9.239287000360101e-05, - "loss": 0.2689, - "step": 181675 - }, - { - "epoch": 146.89, - "learning_rate": 9.233660424918977e-05, - "loss": 0.2645, - "step": 181700 - }, - { - "epoch": 146.91, - "learning_rate": 9.228033849477854e-05, - "loss": 0.2623, - "step": 181725 - }, - { - "epoch": 146.93, - "learning_rate": 9.22240727403673e-05, - "loss": 0.2612, - "step": 181750 - }, - { - "epoch": 146.95, - "learning_rate": 9.216780698595607e-05, - "loss": 0.2524, - "step": 181775 - }, - { - "epoch": 146.97, - "learning_rate": 9.211154123154484e-05, - "loss": 0.2505, - "step": 181800 - }, - { - "epoch": 146.99, - "learning_rate": 9.20552754771336e-05, - "loss": 0.2467, - "step": 181825 - }, - { - "epoch": 147.01, - "learning_rate": 9.199900972272237e-05, - "loss": 0.2356, - "step": 181850 - }, - { - "epoch": 147.03, - "learning_rate": 9.194274396831113e-05, - "loss": 0.2552, - "step": 181875 - }, - { - "epoch": 147.05, - "learning_rate": 9.18864782138999e-05, - "loss": 0.2573, - "step": 181900 - }, - { - "epoch": 147.07, - "learning_rate": 9.183021245948866e-05, - "loss": 0.2314, - "step": 181925 - }, - { - "epoch": 147.09, - "learning_rate": 9.177394670507743e-05, - "loss": 0.2382, - "step": 181950 - }, - { - "epoch": 147.11, - "learning_rate": 9.171768095066618e-05, - "loss": 0.2383, - "step": 181975 - }, - { - "epoch": 147.13, - "learning_rate": 9.166141519625496e-05, - "loss": 0.2562, - "step": 182000 - }, - { - "epoch": 147.15, - "learning_rate": 9.160514944184371e-05, - "loss": 0.2514, - "step": 182025 - }, - { - "epoch": 147.17, - "learning_rate": 9.154888368743249e-05, - "loss": 0.2235, - "step": 182050 - }, - { - "epoch": 147.19, - "learning_rate": 9.149261793302125e-05, - "loss": 0.2309, - "step": 182075 - }, - { - "epoch": 147.21, - "learning_rate": 9.143635217861002e-05, - "loss": 0.2431, - "step": 182100 - }, - { - "epoch": 147.23, - "learning_rate": 9.138008642419878e-05, - "loss": 0.2409, - "step": 182125 - }, - { - "epoch": 147.25, - "learning_rate": 9.132382066978754e-05, - "loss": 0.2604, - "step": 182150 - }, - { - "epoch": 147.27, - "learning_rate": 9.126755491537631e-05, - "loss": 0.2481, - "step": 182175 - }, - { - "epoch": 147.29, - "learning_rate": 9.121128916096507e-05, - "loss": 0.2883, - "step": 182200 - }, - { - "epoch": 147.31, - "learning_rate": 9.115502340655384e-05, - "loss": 0.2286, - "step": 182225 - }, - { - "epoch": 147.33, - "learning_rate": 9.10987576521426e-05, - "loss": 0.2696, - "step": 182250 - }, - { - "epoch": 147.35, - "learning_rate": 9.104249189773137e-05, - "loss": 0.2482, - "step": 182275 - }, - { - "epoch": 147.37, - "learning_rate": 9.098622614332012e-05, - "loss": 0.2588, - "step": 182300 - }, - { - "epoch": 147.39, - "learning_rate": 9.09299603889089e-05, - "loss": 0.2588, - "step": 182325 - }, - { - "epoch": 147.41, - "learning_rate": 9.087369463449765e-05, - "loss": 0.2528, - "step": 182350 - }, - { - "epoch": 147.43, - "learning_rate": 9.081742888008643e-05, - "loss": 0.2473, - "step": 182375 - }, - { - "epoch": 147.45, - "learning_rate": 9.076116312567519e-05, - "loss": 0.29, - "step": 182400 - }, - { - "epoch": 147.47, - "learning_rate": 9.070489737126396e-05, - "loss": 0.2481, - "step": 182425 - }, - { - "epoch": 147.49, - "learning_rate": 9.064863161685272e-05, - "loss": 0.2873, - "step": 182450 - }, - { - "epoch": 147.51, - "learning_rate": 9.059236586244149e-05, - "loss": 0.2778, - "step": 182475 - }, - { - "epoch": 147.53, - "learning_rate": 9.053610010803025e-05, - "loss": 0.2449, - "step": 182500 - }, - { - "epoch": 147.55, - "learning_rate": 9.047983435361902e-05, - "loss": 0.2394, - "step": 182525 - }, - { - "epoch": 147.57, - "learning_rate": 9.042356859920778e-05, - "loss": 0.2331, - "step": 182550 - }, - { - "epoch": 147.59, - "learning_rate": 9.0369553474973e-05, - "loss": 0.2373, - "step": 182575 - }, - { - "epoch": 147.62, - "learning_rate": 9.031328772056176e-05, - "loss": 0.2741, - "step": 182600 - }, - { - "epoch": 147.64, - "learning_rate": 9.025702196615052e-05, - "loss": 0.2569, - "step": 182625 - }, - { - "epoch": 147.66, - "learning_rate": 9.020075621173929e-05, - "loss": 0.2636, - "step": 182650 - }, - { - "epoch": 147.68, - "learning_rate": 9.014449045732805e-05, - "loss": 0.2395, - "step": 182675 - }, - { - "epoch": 147.7, - "learning_rate": 9.008822470291682e-05, - "loss": 0.2618, - "step": 182700 - }, - { - "epoch": 147.72, - "learning_rate": 9.003195894850558e-05, - "loss": 0.2482, - "step": 182725 - }, - { - "epoch": 147.74, - "learning_rate": 8.997569319409435e-05, - "loss": 0.2572, - "step": 182750 - }, - { - "epoch": 147.76, - "learning_rate": 8.991942743968311e-05, - "loss": 0.2241, - "step": 182775 - }, - { - "epoch": 147.78, - "learning_rate": 8.986316168527188e-05, - "loss": 0.2586, - "step": 182800 - }, - { - "epoch": 147.8, - "learning_rate": 8.980689593086064e-05, - "loss": 0.2482, - "step": 182825 - }, - { - "epoch": 147.82, - "learning_rate": 8.975063017644941e-05, - "loss": 0.2951, - "step": 182850 - }, - { - "epoch": 147.84, - "learning_rate": 8.969436442203817e-05, - "loss": 0.2154, - "step": 182875 - }, - { - "epoch": 147.86, - "learning_rate": 8.963809866762694e-05, - "loss": 0.2295, - "step": 182900 - }, - { - "epoch": 147.88, - "learning_rate": 8.95818329132157e-05, - "loss": 0.2438, - "step": 182925 - }, - { - "epoch": 147.9, - "learning_rate": 8.952556715880447e-05, - "loss": 0.1849, - "step": 182950 - }, - { - "epoch": 147.92, - "learning_rate": 8.946930140439323e-05, - "loss": 0.2155, - "step": 182975 - }, - { - "epoch": 147.94, - "learning_rate": 8.9413035649982e-05, - "loss": 0.2547, - "step": 183000 - }, - { - "epoch": 147.94, - "eval_cer": 0.07676868268944488, - "eval_loss": 0.4395972192287445, - "eval_runtime": 150.3968, - "eval_samples_per_second": 27.88, - "eval_steps_per_second": 6.975, - "eval_wer": 0.3253507340946166, - "step": 183000 - }, - { - "epoch": 147.96, - "learning_rate": 8.935676989557076e-05, - "loss": 0.2438, - "step": 183025 - }, - { - "epoch": 147.98, - "learning_rate": 8.930050414115954e-05, - "loss": 0.2418, - "step": 183050 - }, - { - "epoch": 148.0, - "learning_rate": 8.924423838674829e-05, - "loss": 0.2301, - "step": 183075 - }, - { - "epoch": 148.02, - "learning_rate": 8.919022326251352e-05, - "loss": 0.2259, - "step": 183100 - }, - { - "epoch": 148.04, - "learning_rate": 8.913395750810227e-05, - "loss": 0.2529, - "step": 183125 - }, - { - "epoch": 148.06, - "learning_rate": 8.907769175369103e-05, - "loss": 0.223, - "step": 183150 - }, - { - "epoch": 148.08, - "learning_rate": 8.90214259992798e-05, - "loss": 0.2741, - "step": 183175 - }, - { - "epoch": 148.1, - "learning_rate": 8.896516024486856e-05, - "loss": 0.2585, - "step": 183200 - }, - { - "epoch": 148.12, - "learning_rate": 8.890889449045733e-05, - "loss": 0.241, - "step": 183225 - }, - { - "epoch": 148.14, - "learning_rate": 8.885262873604609e-05, - "loss": 0.2538, - "step": 183250 - }, - { - "epoch": 148.16, - "learning_rate": 8.879636298163486e-05, - "loss": 0.2224, - "step": 183275 - }, - { - "epoch": 148.18, - "learning_rate": 8.874009722722362e-05, - "loss": 0.2388, - "step": 183300 - }, - { - "epoch": 148.2, - "learning_rate": 8.86838314728124e-05, - "loss": 0.2234, - "step": 183325 - }, - { - "epoch": 148.22, - "learning_rate": 8.862756571840115e-05, - "loss": 0.2426, - "step": 183350 - }, - { - "epoch": 148.24, - "learning_rate": 8.857129996398993e-05, - "loss": 0.2038, - "step": 183375 - }, - { - "epoch": 148.26, - "learning_rate": 8.851503420957868e-05, - "loss": 0.2496, - "step": 183400 - }, - { - "epoch": 148.28, - "learning_rate": 8.845876845516746e-05, - "loss": 0.2406, - "step": 183425 - }, - { - "epoch": 148.3, - "learning_rate": 8.840250270075621e-05, - "loss": 0.2573, - "step": 183450 - }, - { - "epoch": 148.32, - "learning_rate": 8.834623694634499e-05, - "loss": 0.23, - "step": 183475 - }, - { - "epoch": 148.34, - "learning_rate": 8.828997119193374e-05, - "loss": 0.2747, - "step": 183500 - }, - { - "epoch": 148.36, - "learning_rate": 8.82337054375225e-05, - "loss": 0.2621, - "step": 183525 - }, - { - "epoch": 148.38, - "learning_rate": 8.817743968311127e-05, - "loss": 0.2474, - "step": 183550 - }, - { - "epoch": 148.4, - "learning_rate": 8.812117392870003e-05, - "loss": 0.2303, - "step": 183575 - }, - { - "epoch": 148.42, - "learning_rate": 8.80649081742888e-05, - "loss": 0.2598, - "step": 183600 - }, - { - "epoch": 148.44, - "learning_rate": 8.800864241987756e-05, - "loss": 0.2554, - "step": 183625 - }, - { - "epoch": 148.46, - "learning_rate": 8.795237666546634e-05, - "loss": 0.2547, - "step": 183650 - }, - { - "epoch": 148.48, - "learning_rate": 8.78961109110551e-05, - "loss": 0.2592, - "step": 183675 - }, - { - "epoch": 148.5, - "learning_rate": 8.783984515664387e-05, - "loss": 0.2723, - "step": 183700 - }, - { - "epoch": 148.52, - "learning_rate": 8.778357940223262e-05, - "loss": 0.2315, - "step": 183725 - }, - { - "epoch": 148.54, - "learning_rate": 8.77273136478214e-05, - "loss": 0.2444, - "step": 183750 - }, - { - "epoch": 148.57, - "learning_rate": 8.767104789341015e-05, - "loss": 0.2418, - "step": 183775 - }, - { - "epoch": 148.59, - "learning_rate": 8.761478213899893e-05, - "loss": 0.2439, - "step": 183800 - }, - { - "epoch": 148.61, - "learning_rate": 8.755851638458768e-05, - "loss": 0.2374, - "step": 183825 - }, - { - "epoch": 148.63, - "learning_rate": 8.750225063017646e-05, - "loss": 0.2548, - "step": 183850 - }, - { - "epoch": 148.65, - "learning_rate": 8.744598487576521e-05, - "loss": 0.2225, - "step": 183875 - }, - { - "epoch": 148.67, - "learning_rate": 8.738971912135398e-05, - "loss": 0.2514, - "step": 183900 - }, - { - "epoch": 148.69, - "learning_rate": 8.733345336694274e-05, - "loss": 0.2674, - "step": 183925 - }, - { - "epoch": 148.71, - "learning_rate": 8.72771876125315e-05, - "loss": 0.2733, - "step": 183950 - }, - { - "epoch": 148.73, - "learning_rate": 8.722092185812028e-05, - "loss": 0.2434, - "step": 183975 - }, - { - "epoch": 148.75, - "learning_rate": 8.716465610370904e-05, - "loss": 0.2764, - "step": 184000 - }, - { - "epoch": 148.77, - "learning_rate": 8.710839034929781e-05, - "loss": 0.2095, - "step": 184025 - }, - { - "epoch": 148.79, - "learning_rate": 8.705212459488657e-05, - "loss": 0.2386, - "step": 184050 - }, - { - "epoch": 148.81, - "learning_rate": 8.699585884047534e-05, - "loss": 0.1872, - "step": 184075 - }, - { - "epoch": 148.83, - "learning_rate": 8.69395930860641e-05, - "loss": 0.253, - "step": 184100 - }, - { - "epoch": 148.85, - "learning_rate": 8.688332733165287e-05, - "loss": 0.2379, - "step": 184125 - }, - { - "epoch": 148.87, - "learning_rate": 8.682706157724162e-05, - "loss": 0.2736, - "step": 184150 - }, - { - "epoch": 148.89, - "learning_rate": 8.67707958228304e-05, - "loss": 0.2587, - "step": 184175 - }, - { - "epoch": 148.91, - "learning_rate": 8.671453006841915e-05, - "loss": 0.2599, - "step": 184200 - }, - { - "epoch": 148.93, - "learning_rate": 8.665826431400792e-05, - "loss": 0.2492, - "step": 184225 - }, - { - "epoch": 148.95, - "learning_rate": 8.660199855959668e-05, - "loss": 0.2701, - "step": 184250 - }, - { - "epoch": 148.97, - "learning_rate": 8.654573280518545e-05, - "loss": 0.2593, - "step": 184275 - }, - { - "epoch": 148.99, - "learning_rate": 8.648946705077423e-05, - "loss": 0.2218, - "step": 184300 - }, - { - "epoch": 149.01, - "learning_rate": 8.643320129636298e-05, - "loss": 0.2569, - "step": 184325 - }, - { - "epoch": 149.03, - "learning_rate": 8.637693554195176e-05, - "loss": 0.213, - "step": 184350 - }, - { - "epoch": 149.05, - "learning_rate": 8.632066978754051e-05, - "loss": 0.2683, - "step": 184375 - }, - { - "epoch": 149.07, - "learning_rate": 8.626440403312929e-05, - "loss": 0.2441, - "step": 184400 - }, - { - "epoch": 149.09, - "learning_rate": 8.620813827871804e-05, - "loss": 0.2504, - "step": 184425 - }, - { - "epoch": 149.11, - "learning_rate": 8.615187252430682e-05, - "loss": 0.2652, - "step": 184450 - }, - { - "epoch": 149.13, - "learning_rate": 8.609560676989557e-05, - "loss": 0.2908, - "step": 184475 - }, - { - "epoch": 149.15, - "learning_rate": 8.603934101548435e-05, - "loss": 0.243, - "step": 184500 - }, - { - "epoch": 149.17, - "learning_rate": 8.59830752610731e-05, - "loss": 0.2683, - "step": 184525 - }, - { - "epoch": 149.19, - "learning_rate": 8.592680950666187e-05, - "loss": 0.2351, - "step": 184550 - }, - { - "epoch": 149.21, - "learning_rate": 8.587054375225063e-05, - "loss": 0.2483, - "step": 184575 - }, - { - "epoch": 149.23, - "learning_rate": 8.581427799783939e-05, - "loss": 0.2449, - "step": 184600 - }, - { - "epoch": 149.25, - "learning_rate": 8.575801224342817e-05, - "loss": 0.2198, - "step": 184625 - }, - { - "epoch": 149.27, - "learning_rate": 8.570174648901692e-05, - "loss": 0.2365, - "step": 184650 - }, - { - "epoch": 149.29, - "learning_rate": 8.56454807346057e-05, - "loss": 0.2766, - "step": 184675 - }, - { - "epoch": 149.31, - "learning_rate": 8.558921498019445e-05, - "loss": 0.2583, - "step": 184700 - }, - { - "epoch": 149.33, - "learning_rate": 8.553294922578323e-05, - "loss": 0.2544, - "step": 184725 - }, - { - "epoch": 149.35, - "learning_rate": 8.547668347137198e-05, - "loss": 0.2424, - "step": 184750 - }, - { - "epoch": 149.37, - "learning_rate": 8.542041771696076e-05, - "loss": 0.2458, - "step": 184775 - }, - { - "epoch": 149.39, - "learning_rate": 8.536415196254951e-05, - "loss": 0.2223, - "step": 184800 - }, - { - "epoch": 149.41, - "learning_rate": 8.530788620813829e-05, - "loss": 0.2389, - "step": 184825 - }, - { - "epoch": 149.43, - "learning_rate": 8.525162045372704e-05, - "loss": 0.2231, - "step": 184850 - }, - { - "epoch": 149.45, - "learning_rate": 8.519535469931582e-05, - "loss": 0.236, - "step": 184875 - }, - { - "epoch": 149.47, - "learning_rate": 8.513908894490457e-05, - "loss": 0.2126, - "step": 184900 - }, - { - "epoch": 149.49, - "learning_rate": 8.508282319049333e-05, - "loss": 0.2418, - "step": 184925 - }, - { - "epoch": 149.51, - "learning_rate": 8.502655743608211e-05, - "loss": 0.2328, - "step": 184950 - }, - { - "epoch": 149.54, - "learning_rate": 8.497029168167086e-05, - "loss": 0.2368, - "step": 184975 - }, - { - "epoch": 149.56, - "learning_rate": 8.491402592725964e-05, - "loss": 0.227, - "step": 185000 - }, - { - "epoch": 149.58, - "learning_rate": 8.485776017284839e-05, - "loss": 0.2445, - "step": 185025 - }, - { - "epoch": 149.6, - "learning_rate": 8.480149441843717e-05, - "loss": 0.2377, - "step": 185050 - }, - { - "epoch": 149.62, - "learning_rate": 8.474522866402592e-05, - "loss": 0.2296, - "step": 185075 - }, - { - "epoch": 149.64, - "learning_rate": 8.46889629096147e-05, - "loss": 0.2326, - "step": 185100 - }, - { - "epoch": 149.66, - "learning_rate": 8.463269715520345e-05, - "loss": 0.241, - "step": 185125 - }, - { - "epoch": 149.68, - "learning_rate": 8.457643140079223e-05, - "loss": 0.2221, - "step": 185150 - }, - { - "epoch": 149.7, - "learning_rate": 8.452016564638098e-05, - "loss": 0.2295, - "step": 185175 - }, - { - "epoch": 149.72, - "learning_rate": 8.446615052214621e-05, - "loss": 0.2696, - "step": 185200 - }, - { - "epoch": 149.74, - "learning_rate": 8.440988476773496e-05, - "loss": 0.2305, - "step": 185225 - }, - { - "epoch": 149.76, - "learning_rate": 8.435361901332374e-05, - "loss": 0.2355, - "step": 185250 - }, - { - "epoch": 149.78, - "learning_rate": 8.42973532589125e-05, - "loss": 0.3044, - "step": 185275 - }, - { - "epoch": 149.8, - "learning_rate": 8.424108750450127e-05, - "loss": 0.2521, - "step": 185300 - }, - { - "epoch": 149.82, - "learning_rate": 8.418482175009003e-05, - "loss": 0.224, - "step": 185325 - }, - { - "epoch": 149.84, - "learning_rate": 8.412855599567878e-05, - "loss": 0.2408, - "step": 185350 - }, - { - "epoch": 149.86, - "learning_rate": 8.407229024126756e-05, - "loss": 0.2726, - "step": 185375 - }, - { - "epoch": 149.88, - "learning_rate": 8.401602448685631e-05, - "loss": 0.2534, - "step": 185400 - }, - { - "epoch": 149.9, - "learning_rate": 8.395975873244509e-05, - "loss": 0.2088, - "step": 185425 - }, - { - "epoch": 149.92, - "learning_rate": 8.390349297803384e-05, - "loss": 0.2246, - "step": 185450 - }, - { - "epoch": 149.94, - "learning_rate": 8.384722722362262e-05, - "loss": 0.2466, - "step": 185475 - }, - { - "epoch": 149.96, - "learning_rate": 8.379096146921137e-05, - "loss": 0.2467, - "step": 185500 - }, - { - "epoch": 149.98, - "learning_rate": 8.373469571480015e-05, - "loss": 0.2591, - "step": 185525 - }, - { - "epoch": 150.0, - "learning_rate": 8.36784299603889e-05, - "loss": 0.2049, - "step": 185550 - }, - { - "epoch": 150.02, - "learning_rate": 8.362216420597768e-05, - "loss": 0.2339, - "step": 185575 - }, - { - "epoch": 150.04, - "learning_rate": 8.356589845156644e-05, - "loss": 0.2122, - "step": 185600 - }, - { - "epoch": 150.06, - "learning_rate": 8.350963269715521e-05, - "loss": 0.2562, - "step": 185625 - }, - { - "epoch": 150.08, - "learning_rate": 8.345336694274397e-05, - "loss": 0.2575, - "step": 185650 - }, - { - "epoch": 150.1, - "learning_rate": 8.339710118833274e-05, - "loss": 0.2611, - "step": 185675 - }, - { - "epoch": 150.12, - "learning_rate": 8.33408354339215e-05, - "loss": 0.2384, - "step": 185700 - }, - { - "epoch": 150.14, - "learning_rate": 8.328456967951025e-05, - "loss": 0.2435, - "step": 185725 - }, - { - "epoch": 150.16, - "learning_rate": 8.322830392509903e-05, - "loss": 0.2407, - "step": 185750 - }, - { - "epoch": 150.18, - "learning_rate": 8.317203817068778e-05, - "loss": 0.2448, - "step": 185775 - }, - { - "epoch": 150.2, - "learning_rate": 8.311577241627656e-05, - "loss": 0.2177, - "step": 185800 - }, - { - "epoch": 150.22, - "learning_rate": 8.305950666186531e-05, - "loss": 0.2452, - "step": 185825 - }, - { - "epoch": 150.24, - "learning_rate": 8.300324090745409e-05, - "loss": 0.2237, - "step": 185850 - }, - { - "epoch": 150.26, - "learning_rate": 8.294697515304284e-05, - "loss": 0.2466, - "step": 185875 - }, - { - "epoch": 150.28, - "learning_rate": 8.289070939863162e-05, - "loss": 0.2356, - "step": 185900 - }, - { - "epoch": 150.3, - "learning_rate": 8.283444364422039e-05, - "loss": 0.2661, - "step": 185925 - }, - { - "epoch": 150.32, - "learning_rate": 8.277817788980915e-05, - "loss": 0.2332, - "step": 185950 - }, - { - "epoch": 150.34, - "learning_rate": 8.272191213539792e-05, - "loss": 0.243, - "step": 185975 - }, - { - "epoch": 150.36, - "learning_rate": 8.266564638098668e-05, - "loss": 0.2072, - "step": 186000 - }, - { - "epoch": 150.36, - "eval_cer": 0.07735388027062821, - "eval_loss": 0.4585643708705902, - "eval_runtime": 148.6768, - "eval_samples_per_second": 28.202, - "eval_steps_per_second": 7.056, - "eval_wer": 0.3288743882544861, - "step": 186000 - }, - { - "epoch": 150.38, - "learning_rate": 8.260938062657545e-05, - "loss": 0.2533, - "step": 186025 - }, - { - "epoch": 150.4, - "learning_rate": 8.255311487216421e-05, - "loss": 0.2254, - "step": 186050 - }, - { - "epoch": 150.42, - "learning_rate": 8.249684911775298e-05, - "loss": 0.2465, - "step": 186075 - }, - { - "epoch": 150.44, - "learning_rate": 8.244058336334173e-05, - "loss": 0.2551, - "step": 186100 - }, - { - "epoch": 150.46, - "learning_rate": 8.23843176089305e-05, - "loss": 0.2728, - "step": 186125 - }, - { - "epoch": 150.49, - "learning_rate": 8.232805185451926e-05, - "loss": 0.2044, - "step": 186150 - }, - { - "epoch": 150.51, - "learning_rate": 8.227178610010803e-05, - "loss": 0.2728, - "step": 186175 - }, - { - "epoch": 150.53, - "learning_rate": 8.22155203456968e-05, - "loss": 0.2426, - "step": 186200 - }, - { - "epoch": 150.55, - "learning_rate": 8.215925459128556e-05, - "loss": 0.2366, - "step": 186225 - }, - { - "epoch": 150.57, - "learning_rate": 8.210298883687433e-05, - "loss": 0.2211, - "step": 186250 - }, - { - "epoch": 150.59, - "learning_rate": 8.20467230824631e-05, - "loss": 0.2591, - "step": 186275 - }, - { - "epoch": 150.61, - "learning_rate": 8.199045732805186e-05, - "loss": 0.2458, - "step": 186300 - }, - { - "epoch": 150.63, - "learning_rate": 8.193419157364062e-05, - "loss": 0.247, - "step": 186325 - }, - { - "epoch": 150.65, - "learning_rate": 8.187792581922939e-05, - "loss": 0.2158, - "step": 186350 - }, - { - "epoch": 150.67, - "learning_rate": 8.182166006481815e-05, - "loss": 0.2425, - "step": 186375 - }, - { - "epoch": 150.69, - "learning_rate": 8.176539431040692e-05, - "loss": 0.2253, - "step": 186400 - }, - { - "epoch": 150.71, - "learning_rate": 8.170912855599567e-05, - "loss": 0.2422, - "step": 186425 - }, - { - "epoch": 150.73, - "learning_rate": 8.165286280158445e-05, - "loss": 0.2539, - "step": 186450 - }, - { - "epoch": 150.75, - "learning_rate": 8.15965970471732e-05, - "loss": 0.2591, - "step": 186475 - }, - { - "epoch": 150.77, - "learning_rate": 8.154033129276198e-05, - "loss": 0.2537, - "step": 186500 - }, - { - "epoch": 150.79, - "learning_rate": 8.148406553835074e-05, - "loss": 0.2706, - "step": 186525 - }, - { - "epoch": 150.81, - "learning_rate": 8.14277997839395e-05, - "loss": 0.2407, - "step": 186550 - }, - { - "epoch": 150.83, - "learning_rate": 8.137153402952827e-05, - "loss": 0.27, - "step": 186575 - }, - { - "epoch": 150.85, - "learning_rate": 8.131526827511704e-05, - "loss": 0.2428, - "step": 186600 - }, - { - "epoch": 150.87, - "learning_rate": 8.12590025207058e-05, - "loss": 0.2493, - "step": 186625 - }, - { - "epoch": 150.89, - "learning_rate": 8.120273676629457e-05, - "loss": 0.2124, - "step": 186650 - }, - { - "epoch": 150.91, - "learning_rate": 8.114647101188333e-05, - "loss": 0.2553, - "step": 186675 - }, - { - "epoch": 150.93, - "learning_rate": 8.10902052574721e-05, - "loss": 0.2606, - "step": 186700 - }, - { - "epoch": 150.95, - "learning_rate": 8.103393950306086e-05, - "loss": 0.2538, - "step": 186725 - }, - { - "epoch": 150.97, - "learning_rate": 8.097767374864962e-05, - "loss": 0.2262, - "step": 186750 - }, - { - "epoch": 150.99, - "learning_rate": 8.092140799423839e-05, - "loss": 0.275, - "step": 186775 - }, - { - "epoch": 151.01, - "learning_rate": 8.086514223982714e-05, - "loss": 0.2215, - "step": 186800 - }, - { - "epoch": 151.03, - "learning_rate": 8.080887648541592e-05, - "loss": 0.2329, - "step": 186825 - }, - { - "epoch": 151.05, - "learning_rate": 8.075261073100468e-05, - "loss": 0.2574, - "step": 186850 - }, - { - "epoch": 151.07, - "learning_rate": 8.069634497659345e-05, - "loss": 0.243, - "step": 186875 - }, - { - "epoch": 151.09, - "learning_rate": 8.064007922218221e-05, - "loss": 0.232, - "step": 186900 - }, - { - "epoch": 151.11, - "learning_rate": 8.058381346777098e-05, - "loss": 0.2434, - "step": 186925 - }, - { - "epoch": 151.13, - "learning_rate": 8.052754771335974e-05, - "loss": 0.242, - "step": 186950 - }, - { - "epoch": 151.15, - "learning_rate": 8.047128195894851e-05, - "loss": 0.1852, - "step": 186975 - }, - { - "epoch": 151.17, - "learning_rate": 8.041501620453727e-05, - "loss": 0.2491, - "step": 187000 - }, - { - "epoch": 151.19, - "learning_rate": 8.035875045012604e-05, - "loss": 0.2206, - "step": 187025 - }, - { - "epoch": 151.21, - "learning_rate": 8.03024846957148e-05, - "loss": 0.2376, - "step": 187050 - }, - { - "epoch": 151.23, - "learning_rate": 8.024621894130357e-05, - "loss": 0.2447, - "step": 187075 - }, - { - "epoch": 151.25, - "learning_rate": 8.018995318689233e-05, - "loss": 0.2547, - "step": 187100 - }, - { - "epoch": 151.27, - "learning_rate": 8.01336874324811e-05, - "loss": 0.2324, - "step": 187125 - }, - { - "epoch": 151.29, - "learning_rate": 8.007742167806986e-05, - "loss": 0.2326, - "step": 187150 - }, - { - "epoch": 151.31, - "learning_rate": 8.002115592365863e-05, - "loss": 0.2488, - "step": 187175 - }, - { - "epoch": 151.33, - "learning_rate": 7.996489016924739e-05, - "loss": 0.2404, - "step": 187200 - }, - { - "epoch": 151.35, - "learning_rate": 7.990862441483616e-05, - "loss": 0.2286, - "step": 187225 - }, - { - "epoch": 151.37, - "learning_rate": 7.985235866042492e-05, - "loss": 0.2559, - "step": 187250 - }, - { - "epoch": 151.39, - "learning_rate": 7.979834353619013e-05, - "loss": 0.2392, - "step": 187275 - }, - { - "epoch": 151.41, - "learning_rate": 7.97420777817789e-05, - "loss": 0.2791, - "step": 187300 - }, - { - "epoch": 151.43, - "learning_rate": 7.968581202736766e-05, - "loss": 0.2096, - "step": 187325 - }, - { - "epoch": 151.46, - "learning_rate": 7.962954627295643e-05, - "loss": 0.2229, - "step": 187350 - }, - { - "epoch": 151.48, - "learning_rate": 7.957328051854519e-05, - "loss": 0.2372, - "step": 187375 - }, - { - "epoch": 151.5, - "learning_rate": 7.951701476413396e-05, - "loss": 0.2234, - "step": 187400 - }, - { - "epoch": 151.52, - "learning_rate": 7.946074900972272e-05, - "loss": 0.1954, - "step": 187425 - }, - { - "epoch": 151.54, - "learning_rate": 7.940448325531149e-05, - "loss": 0.253, - "step": 187450 - }, - { - "epoch": 151.56, - "learning_rate": 7.934821750090025e-05, - "loss": 0.2445, - "step": 187475 - }, - { - "epoch": 151.58, - "learning_rate": 7.929195174648903e-05, - "loss": 0.2517, - "step": 187500 - }, - { - "epoch": 151.6, - "learning_rate": 7.923568599207778e-05, - "loss": 0.232, - "step": 187525 - }, - { - "epoch": 151.62, - "learning_rate": 7.917942023766656e-05, - "loss": 0.2241, - "step": 187550 - }, - { - "epoch": 151.64, - "learning_rate": 7.912315448325531e-05, - "loss": 0.2243, - "step": 187575 - }, - { - "epoch": 151.66, - "learning_rate": 7.906688872884408e-05, - "loss": 0.232, - "step": 187600 - }, - { - "epoch": 151.68, - "learning_rate": 7.901062297443284e-05, - "loss": 0.2587, - "step": 187625 - }, - { - "epoch": 151.7, - "learning_rate": 7.89543572200216e-05, - "loss": 0.244, - "step": 187650 - }, - { - "epoch": 151.72, - "learning_rate": 7.889809146561037e-05, - "loss": 0.2174, - "step": 187675 - }, - { - "epoch": 151.74, - "learning_rate": 7.884182571119914e-05, - "loss": 0.2759, - "step": 187700 - }, - { - "epoch": 151.76, - "learning_rate": 7.87855599567879e-05, - "loss": 0.2542, - "step": 187725 - }, - { - "epoch": 151.78, - "learning_rate": 7.872929420237666e-05, - "loss": 0.2479, - "step": 187750 - }, - { - "epoch": 151.8, - "learning_rate": 7.867302844796543e-05, - "loss": 0.2559, - "step": 187775 - }, - { - "epoch": 151.82, - "learning_rate": 7.86167626935542e-05, - "loss": 0.2481, - "step": 187800 - }, - { - "epoch": 151.84, - "learning_rate": 7.856049693914297e-05, - "loss": 0.2493, - "step": 187825 - }, - { - "epoch": 151.86, - "learning_rate": 7.850423118473172e-05, - "loss": 0.2427, - "step": 187850 - }, - { - "epoch": 151.88, - "learning_rate": 7.84479654303205e-05, - "loss": 0.2342, - "step": 187875 - }, - { - "epoch": 151.9, - "learning_rate": 7.839169967590925e-05, - "loss": 0.2367, - "step": 187900 - }, - { - "epoch": 151.92, - "learning_rate": 7.833543392149802e-05, - "loss": 0.2207, - "step": 187925 - }, - { - "epoch": 151.94, - "learning_rate": 7.827916816708678e-05, - "loss": 0.2621, - "step": 187950 - }, - { - "epoch": 151.96, - "learning_rate": 7.822290241267555e-05, - "loss": 0.2345, - "step": 187975 - }, - { - "epoch": 151.98, - "learning_rate": 7.816663665826431e-05, - "loss": 0.2754, - "step": 188000 - }, - { - "epoch": 152.0, - "learning_rate": 7.811037090385308e-05, - "loss": 0.2283, - "step": 188025 - }, - { - "epoch": 152.02, - "learning_rate": 7.805410514944184e-05, - "loss": 0.2487, - "step": 188050 - }, - { - "epoch": 152.04, - "learning_rate": 7.799783939503061e-05, - "loss": 0.2386, - "step": 188075 - }, - { - "epoch": 152.06, - "learning_rate": 7.794157364061939e-05, - "loss": 0.2449, - "step": 188100 - }, - { - "epoch": 152.08, - "learning_rate": 7.788530788620814e-05, - "loss": 0.2767, - "step": 188125 - }, - { - "epoch": 152.1, - "learning_rate": 7.782904213179692e-05, - "loss": 0.2534, - "step": 188150 - }, - { - "epoch": 152.12, - "learning_rate": 7.777277637738567e-05, - "loss": 0.2175, - "step": 188175 - }, - { - "epoch": 152.14, - "learning_rate": 7.771651062297444e-05, - "loss": 0.2289, - "step": 188200 - }, - { - "epoch": 152.16, - "learning_rate": 7.76602448685632e-05, - "loss": 0.1924, - "step": 188225 - }, - { - "epoch": 152.18, - "learning_rate": 7.760397911415197e-05, - "loss": 0.2595, - "step": 188250 - }, - { - "epoch": 152.2, - "learning_rate": 7.754771335974073e-05, - "loss": 0.2235, - "step": 188275 - }, - { - "epoch": 152.22, - "learning_rate": 7.749144760532949e-05, - "loss": 0.2349, - "step": 188300 - }, - { - "epoch": 152.24, - "learning_rate": 7.743518185091826e-05, - "loss": 0.2049, - "step": 188325 - }, - { - "epoch": 152.26, - "learning_rate": 7.737891609650702e-05, - "loss": 0.2321, - "step": 188350 - }, - { - "epoch": 152.28, - "learning_rate": 7.732265034209578e-05, - "loss": 0.1949, - "step": 188375 - }, - { - "epoch": 152.3, - "learning_rate": 7.726638458768455e-05, - "loss": 0.232, - "step": 188400 - }, - { - "epoch": 152.32, - "learning_rate": 7.721011883327333e-05, - "loss": 0.2478, - "step": 188425 - }, - { - "epoch": 152.34, - "learning_rate": 7.715385307886208e-05, - "loss": 0.2493, - "step": 188450 - }, - { - "epoch": 152.36, - "learning_rate": 7.709758732445086e-05, - "loss": 0.2047, - "step": 188475 - }, - { - "epoch": 152.38, - "learning_rate": 7.704132157003961e-05, - "loss": 0.2377, - "step": 188500 - }, - { - "epoch": 152.41, - "learning_rate": 7.698505581562839e-05, - "loss": 0.2217, - "step": 188525 - }, - { - "epoch": 152.43, - "learning_rate": 7.692879006121714e-05, - "loss": 0.2379, - "step": 188550 - }, - { - "epoch": 152.45, - "learning_rate": 7.687252430680592e-05, - "loss": 0.2238, - "step": 188575 - }, - { - "epoch": 152.47, - "learning_rate": 7.681625855239467e-05, - "loss": 0.2216, - "step": 188600 - }, - { - "epoch": 152.49, - "learning_rate": 7.675999279798343e-05, - "loss": 0.2229, - "step": 188625 - }, - { - "epoch": 152.51, - "learning_rate": 7.67037270435722e-05, - "loss": 0.2629, - "step": 188650 - }, - { - "epoch": 152.53, - "learning_rate": 7.664746128916096e-05, - "loss": 0.2448, - "step": 188675 - }, - { - "epoch": 152.55, - "learning_rate": 7.659119553474973e-05, - "loss": 0.2494, - "step": 188700 - }, - { - "epoch": 152.57, - "learning_rate": 7.653492978033849e-05, - "loss": 0.2113, - "step": 188725 - }, - { - "epoch": 152.59, - "learning_rate": 7.647866402592727e-05, - "loss": 0.2247, - "step": 188750 - }, - { - "epoch": 152.61, - "learning_rate": 7.642239827151602e-05, - "loss": 0.2647, - "step": 188775 - }, - { - "epoch": 152.63, - "learning_rate": 7.63661325171048e-05, - "loss": 0.2634, - "step": 188800 - }, - { - "epoch": 152.65, - "learning_rate": 7.630986676269355e-05, - "loss": 0.2549, - "step": 188825 - }, - { - "epoch": 152.67, - "learning_rate": 7.625360100828233e-05, - "loss": 0.2276, - "step": 188850 - }, - { - "epoch": 152.69, - "learning_rate": 7.619733525387108e-05, - "loss": 0.2175, - "step": 188875 - }, - { - "epoch": 152.71, - "learning_rate": 7.614106949945986e-05, - "loss": 0.2392, - "step": 188900 - }, - { - "epoch": 152.73, - "learning_rate": 7.608480374504861e-05, - "loss": 0.2177, - "step": 188925 - }, - { - "epoch": 152.75, - "learning_rate": 7.602853799063739e-05, - "loss": 0.2344, - "step": 188950 - }, - { - "epoch": 152.77, - "learning_rate": 7.597227223622614e-05, - "loss": 0.2275, - "step": 188975 - }, - { - "epoch": 152.79, - "learning_rate": 7.59160064818149e-05, - "loss": 0.2444, - "step": 189000 - }, - { - "epoch": 152.79, - "eval_cer": 0.07623481822941798, - "eval_loss": 0.45240142941474915, - "eval_runtime": 150.3487, - "eval_samples_per_second": 27.889, - "eval_steps_per_second": 6.977, - "eval_wer": 0.32388254486133766, - "step": 189000 - }, - { - "epoch": 152.81, - "learning_rate": 7.585974072740367e-05, - "loss": 0.2367, - "step": 189025 - }, - { - "epoch": 152.83, - "learning_rate": 7.580347497299243e-05, - "loss": 0.2331, - "step": 189050 - }, - { - "epoch": 152.85, - "learning_rate": 7.574720921858121e-05, - "loss": 0.2564, - "step": 189075 - }, - { - "epoch": 152.87, - "learning_rate": 7.569094346416996e-05, - "loss": 0.2473, - "step": 189100 - }, - { - "epoch": 152.89, - "learning_rate": 7.563467770975874e-05, - "loss": 0.2096, - "step": 189125 - }, - { - "epoch": 152.91, - "learning_rate": 7.55784119553475e-05, - "loss": 0.2707, - "step": 189150 - }, - { - "epoch": 152.93, - "learning_rate": 7.552214620093627e-05, - "loss": 0.2173, - "step": 189175 - }, - { - "epoch": 152.95, - "learning_rate": 7.546588044652502e-05, - "loss": 0.2174, - "step": 189200 - }, - { - "epoch": 152.97, - "learning_rate": 7.54096146921138e-05, - "loss": 0.2082, - "step": 189225 - }, - { - "epoch": 152.99, - "learning_rate": 7.535334893770255e-05, - "loss": 0.2535, - "step": 189250 - }, - { - "epoch": 153.01, - "learning_rate": 7.529708318329133e-05, - "loss": 0.2413, - "step": 189275 - }, - { - "epoch": 153.03, - "learning_rate": 7.524081742888008e-05, - "loss": 0.2138, - "step": 189300 - }, - { - "epoch": 153.05, - "learning_rate": 7.518455167446886e-05, - "loss": 0.2521, - "step": 189325 - }, - { - "epoch": 153.07, - "learning_rate": 7.512828592005761e-05, - "loss": 0.2148, - "step": 189350 - }, - { - "epoch": 153.09, - "learning_rate": 7.507202016564638e-05, - "loss": 0.22, - "step": 189375 - }, - { - "epoch": 153.11, - "learning_rate": 7.501575441123516e-05, - "loss": 0.2497, - "step": 189400 - }, - { - "epoch": 153.13, - "learning_rate": 7.49594886568239e-05, - "loss": 0.2299, - "step": 189425 - }, - { - "epoch": 153.15, - "learning_rate": 7.490322290241268e-05, - "loss": 0.2348, - "step": 189450 - }, - { - "epoch": 153.17, - "learning_rate": 7.484695714800144e-05, - "loss": 0.2554, - "step": 189475 - }, - { - "epoch": 153.19, - "learning_rate": 7.479069139359021e-05, - "loss": 0.1973, - "step": 189500 - }, - { - "epoch": 153.21, - "learning_rate": 7.473442563917897e-05, - "loss": 0.2412, - "step": 189525 - }, - { - "epoch": 153.23, - "learning_rate": 7.467815988476774e-05, - "loss": 0.2277, - "step": 189550 - }, - { - "epoch": 153.25, - "learning_rate": 7.46218941303565e-05, - "loss": 0.2222, - "step": 189575 - }, - { - "epoch": 153.27, - "learning_rate": 7.456562837594527e-05, - "loss": 0.2381, - "step": 189600 - }, - { - "epoch": 153.29, - "learning_rate": 7.450936262153402e-05, - "loss": 0.2318, - "step": 189625 - }, - { - "epoch": 153.31, - "learning_rate": 7.44530968671228e-05, - "loss": 0.2303, - "step": 189650 - }, - { - "epoch": 153.33, - "learning_rate": 7.439683111271155e-05, - "loss": 0.2455, - "step": 189675 - }, - { - "epoch": 153.35, - "learning_rate": 7.434056535830032e-05, - "loss": 0.2171, - "step": 189700 - }, - { - "epoch": 153.38, - "learning_rate": 7.42842996038891e-05, - "loss": 0.2435, - "step": 189725 - }, - { - "epoch": 153.4, - "learning_rate": 7.422803384947785e-05, - "loss": 0.2469, - "step": 189750 - }, - { - "epoch": 153.42, - "learning_rate": 7.417176809506663e-05, - "loss": 0.2263, - "step": 189775 - }, - { - "epoch": 153.44, - "learning_rate": 7.411550234065538e-05, - "loss": 0.2311, - "step": 189800 - }, - { - "epoch": 153.46, - "learning_rate": 7.405923658624416e-05, - "loss": 0.2528, - "step": 189825 - }, - { - "epoch": 153.48, - "learning_rate": 7.400297083183291e-05, - "loss": 0.2196, - "step": 189850 - }, - { - "epoch": 153.5, - "learning_rate": 7.394670507742169e-05, - "loss": 0.2193, - "step": 189875 - }, - { - "epoch": 153.52, - "learning_rate": 7.389043932301044e-05, - "loss": 0.238, - "step": 189900 - }, - { - "epoch": 153.54, - "learning_rate": 7.383417356859922e-05, - "loss": 0.2361, - "step": 189925 - }, - { - "epoch": 153.56, - "learning_rate": 7.377790781418797e-05, - "loss": 0.2492, - "step": 189950 - }, - { - "epoch": 153.58, - "learning_rate": 7.372164205977675e-05, - "loss": 0.2293, - "step": 189975 - }, - { - "epoch": 153.6, - "learning_rate": 7.36653763053655e-05, - "loss": 0.2377, - "step": 190000 - }, - { - "epoch": 153.62, - "learning_rate": 7.360911055095427e-05, - "loss": 0.2156, - "step": 190025 - }, - { - "epoch": 153.64, - "learning_rate": 7.355284479654304e-05, - "loss": 0.2152, - "step": 190050 - }, - { - "epoch": 153.66, - "learning_rate": 7.349657904213179e-05, - "loss": 0.234, - "step": 190075 - }, - { - "epoch": 153.68, - "learning_rate": 7.344031328772057e-05, - "loss": 0.2216, - "step": 190100 - }, - { - "epoch": 153.7, - "learning_rate": 7.338404753330932e-05, - "loss": 0.2155, - "step": 190125 - }, - { - "epoch": 153.72, - "learning_rate": 7.33277817788981e-05, - "loss": 0.2125, - "step": 190150 - }, - { - "epoch": 153.74, - "learning_rate": 7.327151602448685e-05, - "loss": 0.2174, - "step": 190175 - }, - { - "epoch": 153.76, - "learning_rate": 7.321525027007563e-05, - "loss": 0.1994, - "step": 190200 - }, - { - "epoch": 153.78, - "learning_rate": 7.315898451566438e-05, - "loss": 0.2014, - "step": 190225 - }, - { - "epoch": 153.8, - "learning_rate": 7.310271876125316e-05, - "loss": 0.2064, - "step": 190250 - }, - { - "epoch": 153.82, - "learning_rate": 7.304645300684191e-05, - "loss": 0.247, - "step": 190275 - }, - { - "epoch": 153.84, - "learning_rate": 7.299018725243069e-05, - "loss": 0.2307, - "step": 190300 - }, - { - "epoch": 153.86, - "learning_rate": 7.293392149801944e-05, - "loss": 0.2136, - "step": 190325 - }, - { - "epoch": 153.88, - "learning_rate": 7.287765574360822e-05, - "loss": 0.2163, - "step": 190350 - }, - { - "epoch": 153.9, - "learning_rate": 7.282138998919698e-05, - "loss": 0.2388, - "step": 190375 - }, - { - "epoch": 153.92, - "learning_rate": 7.276512423478575e-05, - "loss": 0.2372, - "step": 190400 - }, - { - "epoch": 153.94, - "learning_rate": 7.270885848037451e-05, - "loss": 0.2427, - "step": 190425 - }, - { - "epoch": 153.96, - "learning_rate": 7.265259272596326e-05, - "loss": 0.2014, - "step": 190450 - }, - { - "epoch": 153.98, - "learning_rate": 7.259632697155204e-05, - "loss": 0.2028, - "step": 190475 - }, - { - "epoch": 154.0, - "learning_rate": 7.254006121714079e-05, - "loss": 0.3995, - "step": 190500 - }, - { - "epoch": 154.02, - "learning_rate": 7.248379546272957e-05, - "loss": 0.2444, - "step": 190525 - }, - { - "epoch": 154.04, - "learning_rate": 7.242752970831832e-05, - "loss": 0.2182, - "step": 190550 - }, - { - "epoch": 154.06, - "learning_rate": 7.23712639539071e-05, - "loss": 0.2397, - "step": 190575 - }, - { - "epoch": 154.08, - "learning_rate": 7.231499819949585e-05, - "loss": 0.2091, - "step": 190600 - }, - { - "epoch": 154.1, - "learning_rate": 7.225873244508463e-05, - "loss": 0.2603, - "step": 190625 - }, - { - "epoch": 154.12, - "learning_rate": 7.220246669067338e-05, - "loss": 0.1942, - "step": 190650 - }, - { - "epoch": 154.14, - "learning_rate": 7.214620093626216e-05, - "loss": 0.2209, - "step": 190675 - }, - { - "epoch": 154.16, - "learning_rate": 7.208993518185092e-05, - "loss": 0.2305, - "step": 190700 - }, - { - "epoch": 154.18, - "learning_rate": 7.203366942743969e-05, - "loss": 0.2347, - "step": 190725 - }, - { - "epoch": 154.2, - "learning_rate": 7.197740367302845e-05, - "loss": 0.2093, - "step": 190750 - }, - { - "epoch": 154.22, - "learning_rate": 7.19211379186172e-05, - "loss": 0.2282, - "step": 190775 - }, - { - "epoch": 154.24, - "learning_rate": 7.186487216420598e-05, - "loss": 0.2018, - "step": 190800 - }, - { - "epoch": 154.26, - "learning_rate": 7.180860640979474e-05, - "loss": 0.2247, - "step": 190825 - }, - { - "epoch": 154.28, - "learning_rate": 7.175234065538351e-05, - "loss": 0.2136, - "step": 190850 - }, - { - "epoch": 154.3, - "learning_rate": 7.169607490097226e-05, - "loss": 0.2416, - "step": 190875 - }, - { - "epoch": 154.32, - "learning_rate": 7.163980914656104e-05, - "loss": 0.2178, - "step": 190900 - }, - { - "epoch": 154.35, - "learning_rate": 7.15835433921498e-05, - "loss": 0.2408, - "step": 190925 - }, - { - "epoch": 154.37, - "learning_rate": 7.152727763773857e-05, - "loss": 0.216, - "step": 190950 - }, - { - "epoch": 154.39, - "learning_rate": 7.147101188332732e-05, - "loss": 0.2245, - "step": 190975 - }, - { - "epoch": 154.41, - "learning_rate": 7.14147461289161e-05, - "loss": 0.234, - "step": 191000 - }, - { - "epoch": 154.43, - "learning_rate": 7.135848037450487e-05, - "loss": 0.2355, - "step": 191025 - }, - { - "epoch": 154.45, - "learning_rate": 7.130221462009363e-05, - "loss": 0.2217, - "step": 191050 - }, - { - "epoch": 154.47, - "learning_rate": 7.12459488656824e-05, - "loss": 0.245, - "step": 191075 - }, - { - "epoch": 154.49, - "learning_rate": 7.118968311127116e-05, - "loss": 0.2192, - "step": 191100 - }, - { - "epoch": 154.51, - "learning_rate": 7.113341735685993e-05, - "loss": 0.2443, - "step": 191125 - }, - { - "epoch": 154.53, - "learning_rate": 7.107715160244868e-05, - "loss": 0.2346, - "step": 191150 - }, - { - "epoch": 154.55, - "learning_rate": 7.102088584803746e-05, - "loss": 0.2395, - "step": 191175 - }, - { - "epoch": 154.57, - "learning_rate": 7.096462009362621e-05, - "loss": 0.2436, - "step": 191200 - }, - { - "epoch": 154.59, - "learning_rate": 7.090835433921499e-05, - "loss": 0.2365, - "step": 191225 - }, - { - "epoch": 154.61, - "learning_rate": 7.085208858480374e-05, - "loss": 0.24, - "step": 191250 - }, - { - "epoch": 154.63, - "learning_rate": 7.079582283039251e-05, - "loss": 0.2425, - "step": 191275 - }, - { - "epoch": 154.65, - "learning_rate": 7.073955707598127e-05, - "loss": 0.2055, - "step": 191300 - }, - { - "epoch": 154.67, - "learning_rate": 7.068329132157004e-05, - "loss": 0.2431, - "step": 191325 - }, - { - "epoch": 154.69, - "learning_rate": 7.062702556715881e-05, - "loss": 0.2072, - "step": 191350 - }, - { - "epoch": 154.71, - "learning_rate": 7.057075981274757e-05, - "loss": 0.2459, - "step": 191375 - }, - { - "epoch": 154.73, - "learning_rate": 7.051449405833634e-05, - "loss": 0.2247, - "step": 191400 - }, - { - "epoch": 154.75, - "learning_rate": 7.04582283039251e-05, - "loss": 0.2301, - "step": 191425 - }, - { - "epoch": 154.77, - "learning_rate": 7.040196254951387e-05, - "loss": 0.2022, - "step": 191450 - }, - { - "epoch": 154.79, - "learning_rate": 7.034569679510262e-05, - "loss": 0.2515, - "step": 191475 - }, - { - "epoch": 154.81, - "learning_rate": 7.02894310406914e-05, - "loss": 0.1996, - "step": 191500 - }, - { - "epoch": 154.83, - "learning_rate": 7.023316528628015e-05, - "loss": 0.2401, - "step": 191525 - }, - { - "epoch": 154.85, - "learning_rate": 7.017689953186893e-05, - "loss": 0.2216, - "step": 191550 - }, - { - "epoch": 154.87, - "learning_rate": 7.012063377745768e-05, - "loss": 0.2277, - "step": 191575 - }, - { - "epoch": 154.89, - "learning_rate": 7.006436802304646e-05, - "loss": 0.2025, - "step": 191600 - }, - { - "epoch": 154.91, - "learning_rate": 7.000810226863521e-05, - "loss": 0.2423, - "step": 191625 - }, - { - "epoch": 154.93, - "learning_rate": 6.995408714440043e-05, - "loss": 0.2019, - "step": 191650 - }, - { - "epoch": 154.95, - "learning_rate": 6.990007202016565e-05, - "loss": 0.2271, - "step": 191675 - }, - { - "epoch": 154.97, - "learning_rate": 6.984380626575441e-05, - "loss": 0.2214, - "step": 191700 - }, - { - "epoch": 154.99, - "learning_rate": 6.978754051134318e-05, - "loss": 0.2428, - "step": 191725 - }, - { - "epoch": 155.01, - "learning_rate": 6.973127475693194e-05, - "loss": 0.2019, - "step": 191750 - }, - { - "epoch": 155.03, - "learning_rate": 6.96750090025207e-05, - "loss": 0.23, - "step": 191775 - }, - { - "epoch": 155.05, - "learning_rate": 6.961874324810947e-05, - "loss": 0.2473, - "step": 191800 - }, - { - "epoch": 155.07, - "learning_rate": 6.956247749369824e-05, - "loss": 0.2076, - "step": 191825 - }, - { - "epoch": 155.09, - "learning_rate": 6.9506211739287e-05, - "loss": 0.2534, - "step": 191850 - }, - { - "epoch": 155.11, - "learning_rate": 6.944994598487577e-05, - "loss": 0.2278, - "step": 191875 - }, - { - "epoch": 155.13, - "learning_rate": 6.939368023046453e-05, - "loss": 0.2109, - "step": 191900 - }, - { - "epoch": 155.15, - "learning_rate": 6.93374144760533e-05, - "loss": 0.224, - "step": 191925 - }, - { - "epoch": 155.17, - "learning_rate": 6.928114872164207e-05, - "loss": 0.2067, - "step": 191950 - }, - { - "epoch": 155.19, - "learning_rate": 6.922488296723082e-05, - "loss": 0.1854, - "step": 191975 - }, - { - "epoch": 155.21, - "learning_rate": 6.916861721281959e-05, - "loss": 0.2272, - "step": 192000 - }, - { - "epoch": 155.21, - "eval_cer": 0.0758806196934386, - "eval_loss": 0.46198299527168274, - "eval_runtime": 150.7236, - "eval_samples_per_second": 27.819, - "eval_steps_per_second": 6.96, - "eval_wer": 0.32218597063621535, - "step": 192000 - }, - { - "epoch": 155.23, - "learning_rate": 6.911235145840835e-05, - "loss": 0.1919, - "step": 192025 - }, - { - "epoch": 155.25, - "learning_rate": 6.905608570399712e-05, - "loss": 0.228, - "step": 192050 - }, - { - "epoch": 155.27, - "learning_rate": 6.899981994958588e-05, - "loss": 0.1864, - "step": 192075 - }, - { - "epoch": 155.3, - "learning_rate": 6.894355419517465e-05, - "loss": 0.2503, - "step": 192100 - }, - { - "epoch": 155.32, - "learning_rate": 6.888728844076341e-05, - "loss": 0.2288, - "step": 192125 - }, - { - "epoch": 155.34, - "learning_rate": 6.883102268635218e-05, - "loss": 0.2405, - "step": 192150 - }, - { - "epoch": 155.36, - "learning_rate": 6.877475693194094e-05, - "loss": 0.226, - "step": 192175 - }, - { - "epoch": 155.38, - "learning_rate": 6.871849117752971e-05, - "loss": 0.2376, - "step": 192200 - }, - { - "epoch": 155.4, - "learning_rate": 6.866222542311847e-05, - "loss": 0.2325, - "step": 192225 - }, - { - "epoch": 155.42, - "learning_rate": 6.860595966870724e-05, - "loss": 0.2236, - "step": 192250 - }, - { - "epoch": 155.44, - "learning_rate": 6.854969391429602e-05, - "loss": 0.2091, - "step": 192275 - }, - { - "epoch": 155.46, - "learning_rate": 6.849342815988477e-05, - "loss": 0.2424, - "step": 192300 - }, - { - "epoch": 155.48, - "learning_rate": 6.843716240547355e-05, - "loss": 0.2122, - "step": 192325 - }, - { - "epoch": 155.5, - "learning_rate": 6.83808966510623e-05, - "loss": 0.2159, - "step": 192350 - }, - { - "epoch": 155.52, - "learning_rate": 6.832463089665106e-05, - "loss": 0.2481, - "step": 192375 - }, - { - "epoch": 155.54, - "learning_rate": 6.826836514223983e-05, - "loss": 0.2146, - "step": 192400 - }, - { - "epoch": 155.56, - "learning_rate": 6.821209938782859e-05, - "loss": 0.1996, - "step": 192425 - }, - { - "epoch": 155.58, - "learning_rate": 6.815583363341736e-05, - "loss": 0.2338, - "step": 192450 - }, - { - "epoch": 155.6, - "learning_rate": 6.809956787900612e-05, - "loss": 0.2209, - "step": 192475 - }, - { - "epoch": 155.62, - "learning_rate": 6.804330212459489e-05, - "loss": 0.242, - "step": 192500 - }, - { - "epoch": 155.64, - "learning_rate": 6.798703637018365e-05, - "loss": 0.2416, - "step": 192525 - }, - { - "epoch": 155.66, - "learning_rate": 6.793077061577242e-05, - "loss": 0.2224, - "step": 192550 - }, - { - "epoch": 155.68, - "learning_rate": 6.787450486136118e-05, - "loss": 0.2458, - "step": 192575 - }, - { - "epoch": 155.7, - "learning_rate": 6.781823910694996e-05, - "loss": 0.2218, - "step": 192600 - }, - { - "epoch": 155.72, - "learning_rate": 6.776197335253871e-05, - "loss": 0.2382, - "step": 192625 - }, - { - "epoch": 155.74, - "learning_rate": 6.770570759812749e-05, - "loss": 0.2254, - "step": 192650 - }, - { - "epoch": 155.76, - "learning_rate": 6.764944184371624e-05, - "loss": 0.2037, - "step": 192675 - }, - { - "epoch": 155.78, - "learning_rate": 6.7593176089305e-05, - "loss": 0.221, - "step": 192700 - }, - { - "epoch": 155.8, - "learning_rate": 6.753691033489377e-05, - "loss": 0.229, - "step": 192725 - }, - { - "epoch": 155.82, - "learning_rate": 6.748064458048253e-05, - "loss": 0.2352, - "step": 192750 - }, - { - "epoch": 155.84, - "learning_rate": 6.74243788260713e-05, - "loss": 0.2127, - "step": 192775 - }, - { - "epoch": 155.86, - "learning_rate": 6.736811307166006e-05, - "loss": 0.234, - "step": 192800 - }, - { - "epoch": 155.88, - "learning_rate": 6.731184731724883e-05, - "loss": 0.2289, - "step": 192825 - }, - { - "epoch": 155.9, - "learning_rate": 6.725558156283759e-05, - "loss": 0.2334, - "step": 192850 - }, - { - "epoch": 155.92, - "learning_rate": 6.719931580842637e-05, - "loss": 0.2458, - "step": 192875 - }, - { - "epoch": 155.94, - "learning_rate": 6.714305005401512e-05, - "loss": 0.2094, - "step": 192900 - }, - { - "epoch": 155.96, - "learning_rate": 6.70867842996039e-05, - "loss": 0.2045, - "step": 192925 - }, - { - "epoch": 155.98, - "learning_rate": 6.703051854519265e-05, - "loss": 0.2256, - "step": 192950 - }, - { - "epoch": 156.0, - "learning_rate": 6.697425279078143e-05, - "loss": 0.1937, - "step": 192975 - }, - { - "epoch": 156.02, - "learning_rate": 6.691798703637018e-05, - "loss": 0.2296, - "step": 193000 - }, - { - "epoch": 156.04, - "learning_rate": 6.686172128195896e-05, - "loss": 0.2489, - "step": 193025 - }, - { - "epoch": 156.06, - "learning_rate": 6.680545552754771e-05, - "loss": 0.2634, - "step": 193050 - }, - { - "epoch": 156.08, - "learning_rate": 6.674918977313648e-05, - "loss": 0.2301, - "step": 193075 - }, - { - "epoch": 156.1, - "learning_rate": 6.669292401872524e-05, - "loss": 0.194, - "step": 193100 - }, - { - "epoch": 156.12, - "learning_rate": 6.6636658264314e-05, - "loss": 0.2145, - "step": 193125 - }, - { - "epoch": 156.14, - "learning_rate": 6.658039250990277e-05, - "loss": 0.2503, - "step": 193150 - }, - { - "epoch": 156.16, - "learning_rate": 6.652412675549154e-05, - "loss": 0.2152, - "step": 193175 - }, - { - "epoch": 156.18, - "learning_rate": 6.646786100108031e-05, - "loss": 0.2306, - "step": 193200 - }, - { - "epoch": 156.2, - "learning_rate": 6.641159524666906e-05, - "loss": 0.22, - "step": 193225 - }, - { - "epoch": 156.22, - "learning_rate": 6.635532949225784e-05, - "loss": 0.2105, - "step": 193250 - }, - { - "epoch": 156.24, - "learning_rate": 6.62990637378466e-05, - "loss": 0.2004, - "step": 193275 - }, - { - "epoch": 156.27, - "learning_rate": 6.624279798343537e-05, - "loss": 0.2387, - "step": 193300 - }, - { - "epoch": 156.29, - "learning_rate": 6.618653222902412e-05, - "loss": 0.2132, - "step": 193325 - }, - { - "epoch": 156.31, - "learning_rate": 6.61302664746129e-05, - "loss": 0.2178, - "step": 193350 - }, - { - "epoch": 156.33, - "learning_rate": 6.607400072020165e-05, - "loss": 0.2301, - "step": 193375 - }, - { - "epoch": 156.35, - "learning_rate": 6.601773496579042e-05, - "loss": 0.2328, - "step": 193400 - }, - { - "epoch": 156.37, - "learning_rate": 6.596146921137918e-05, - "loss": 0.182, - "step": 193425 - }, - { - "epoch": 156.39, - "learning_rate": 6.590520345696795e-05, - "loss": 0.2293, - "step": 193450 - }, - { - "epoch": 156.41, - "learning_rate": 6.584893770255671e-05, - "loss": 0.2109, - "step": 193475 - }, - { - "epoch": 156.43, - "learning_rate": 6.579267194814548e-05, - "loss": 0.2151, - "step": 193500 - }, - { - "epoch": 156.45, - "learning_rate": 6.573640619373426e-05, - "loss": 0.2366, - "step": 193525 - }, - { - "epoch": 156.47, - "learning_rate": 6.568014043932301e-05, - "loss": 0.2333, - "step": 193550 - }, - { - "epoch": 156.49, - "learning_rate": 6.562387468491179e-05, - "loss": 0.2129, - "step": 193575 - }, - { - "epoch": 156.51, - "learning_rate": 6.556760893050054e-05, - "loss": 0.2277, - "step": 193600 - }, - { - "epoch": 156.53, - "learning_rate": 6.551134317608932e-05, - "loss": 0.1766, - "step": 193625 - }, - { - "epoch": 156.55, - "learning_rate": 6.545507742167807e-05, - "loss": 0.2129, - "step": 193650 - }, - { - "epoch": 156.57, - "learning_rate": 6.539881166726684e-05, - "loss": 0.2477, - "step": 193675 - }, - { - "epoch": 156.59, - "learning_rate": 6.53425459128556e-05, - "loss": 0.2421, - "step": 193700 - }, - { - "epoch": 156.61, - "learning_rate": 6.528628015844437e-05, - "loss": 0.1967, - "step": 193725 - }, - { - "epoch": 156.63, - "learning_rate": 6.523001440403313e-05, - "loss": 0.2341, - "step": 193750 - }, - { - "epoch": 156.65, - "learning_rate": 6.517374864962189e-05, - "loss": 0.1614, - "step": 193775 - }, - { - "epoch": 156.67, - "learning_rate": 6.511748289521066e-05, - "loss": 0.2197, - "step": 193800 - }, - { - "epoch": 156.69, - "learning_rate": 6.506121714079942e-05, - "loss": 0.2228, - "step": 193825 - }, - { - "epoch": 156.71, - "learning_rate": 6.50049513863882e-05, - "loss": 0.24, - "step": 193850 - }, - { - "epoch": 156.73, - "learning_rate": 6.494868563197695e-05, - "loss": 0.2053, - "step": 193875 - }, - { - "epoch": 156.75, - "learning_rate": 6.489241987756573e-05, - "loss": 0.235, - "step": 193900 - }, - { - "epoch": 156.77, - "learning_rate": 6.483615412315448e-05, - "loss": 0.1891, - "step": 193925 - }, - { - "epoch": 156.79, - "learning_rate": 6.477988836874326e-05, - "loss": 0.2285, - "step": 193950 - }, - { - "epoch": 156.81, - "learning_rate": 6.472362261433201e-05, - "loss": 0.2047, - "step": 193975 - }, - { - "epoch": 156.83, - "learning_rate": 6.466735685992079e-05, - "loss": 0.2422, - "step": 194000 - }, - { - "epoch": 156.85, - "learning_rate": 6.461109110550954e-05, - "loss": 0.2219, - "step": 194025 - }, - { - "epoch": 156.87, - "learning_rate": 6.455482535109832e-05, - "loss": 0.2377, - "step": 194050 - }, - { - "epoch": 156.89, - "learning_rate": 6.449855959668707e-05, - "loss": 0.2314, - "step": 194075 - }, - { - "epoch": 156.91, - "learning_rate": 6.444229384227585e-05, - "loss": 0.2444, - "step": 194100 - }, - { - "epoch": 156.93, - "learning_rate": 6.43860280878646e-05, - "loss": 0.1989, - "step": 194125 - }, - { - "epoch": 156.95, - "learning_rate": 6.432976233345336e-05, - "loss": 0.2266, - "step": 194150 - }, - { - "epoch": 156.97, - "learning_rate": 6.427349657904214e-05, - "loss": 0.2442, - "step": 194175 - }, - { - "epoch": 156.99, - "learning_rate": 6.421723082463089e-05, - "loss": 0.2409, - "step": 194200 - }, - { - "epoch": 157.01, - "learning_rate": 6.416096507021967e-05, - "loss": 0.2476, - "step": 194225 - }, - { - "epoch": 157.03, - "learning_rate": 6.410469931580842e-05, - "loss": 0.1957, - "step": 194250 - }, - { - "epoch": 157.05, - "learning_rate": 6.40484335613972e-05, - "loss": 0.221, - "step": 194275 - }, - { - "epoch": 157.07, - "learning_rate": 6.399216780698595e-05, - "loss": 0.2055, - "step": 194300 - }, - { - "epoch": 157.09, - "learning_rate": 6.393590205257473e-05, - "loss": 0.2165, - "step": 194325 - }, - { - "epoch": 157.11, - "learning_rate": 6.387963629816348e-05, - "loss": 0.1957, - "step": 194350 - }, - { - "epoch": 157.13, - "learning_rate": 6.382337054375226e-05, - "loss": 0.2212, - "step": 194375 - }, - { - "epoch": 157.15, - "learning_rate": 6.376710478934101e-05, - "loss": 0.2048, - "step": 194400 - }, - { - "epoch": 157.17, - "learning_rate": 6.371083903492979e-05, - "loss": 0.249, - "step": 194425 - }, - { - "epoch": 157.19, - "learning_rate": 6.365457328051854e-05, - "loss": 0.2055, - "step": 194450 - }, - { - "epoch": 157.22, - "learning_rate": 6.35983075261073e-05, - "loss": 0.231, - "step": 194475 - }, - { - "epoch": 157.24, - "learning_rate": 6.354204177169608e-05, - "loss": 0.211, - "step": 194500 - }, - { - "epoch": 157.26, - "learning_rate": 6.348577601728483e-05, - "loss": 0.2182, - "step": 194525 - }, - { - "epoch": 157.28, - "learning_rate": 6.342951026287361e-05, - "loss": 0.2143, - "step": 194550 - }, - { - "epoch": 157.3, - "learning_rate": 6.337324450846236e-05, - "loss": 0.212, - "step": 194575 - }, - { - "epoch": 157.32, - "learning_rate": 6.331697875405114e-05, - "loss": 0.2317, - "step": 194600 - }, - { - "epoch": 157.34, - "learning_rate": 6.32607129996399e-05, - "loss": 0.2148, - "step": 194625 - }, - { - "epoch": 157.36, - "learning_rate": 6.320444724522867e-05, - "loss": 0.2185, - "step": 194650 - }, - { - "epoch": 157.38, - "learning_rate": 6.314818149081742e-05, - "loss": 0.2312, - "step": 194675 - }, - { - "epoch": 157.4, - "learning_rate": 6.30919157364062e-05, - "loss": 0.2312, - "step": 194700 - }, - { - "epoch": 157.42, - "learning_rate": 6.303564998199495e-05, - "loss": 0.2471, - "step": 194725 - }, - { - "epoch": 157.44, - "learning_rate": 6.297938422758373e-05, - "loss": 0.2164, - "step": 194750 - }, - { - "epoch": 157.46, - "learning_rate": 6.292311847317248e-05, - "loss": 0.2311, - "step": 194775 - }, - { - "epoch": 157.48, - "learning_rate": 6.286685271876126e-05, - "loss": 0.2, - "step": 194800 - }, - { - "epoch": 157.5, - "learning_rate": 6.281058696435003e-05, - "loss": 0.2278, - "step": 194825 - }, - { - "epoch": 157.52, - "learning_rate": 6.275432120993878e-05, - "loss": 0.2307, - "step": 194850 - }, - { - "epoch": 157.54, - "learning_rate": 6.269805545552756e-05, - "loss": 0.2185, - "step": 194875 - }, - { - "epoch": 157.56, - "learning_rate": 6.26417897011163e-05, - "loss": 0.2261, - "step": 194900 - }, - { - "epoch": 157.58, - "learning_rate": 6.258552394670508e-05, - "loss": 0.2419, - "step": 194925 - }, - { - "epoch": 157.6, - "learning_rate": 6.252925819229384e-05, - "loss": 0.1713, - "step": 194950 - }, - { - "epoch": 157.62, - "learning_rate": 6.247299243788261e-05, - "loss": 0.2293, - "step": 194975 - }, - { - "epoch": 157.64, - "learning_rate": 6.241672668347137e-05, - "loss": 0.2102, - "step": 195000 - }, - { - "epoch": 157.64, - "eval_cer": 0.07536215516975864, - "eval_loss": 0.45333951711654663, - "eval_runtime": 150.7124, - "eval_samples_per_second": 27.821, - "eval_steps_per_second": 6.96, - "eval_wer": 0.32120717781402935, - "step": 195000 - }, - { - "epoch": 157.66, - "learning_rate": 6.236046092906013e-05, - "loss": 0.2039, - "step": 195025 - }, - { - "epoch": 157.68, - "learning_rate": 6.23041951746489e-05, - "loss": 0.1991, - "step": 195050 - }, - { - "epoch": 157.7, - "learning_rate": 6.224792942023766e-05, - "loss": 0.2326, - "step": 195075 - }, - { - "epoch": 157.72, - "learning_rate": 6.219166366582642e-05, - "loss": 0.2278, - "step": 195100 - }, - { - "epoch": 157.74, - "learning_rate": 6.21353979114152e-05, - "loss": 0.2313, - "step": 195125 - }, - { - "epoch": 157.76, - "learning_rate": 6.207913215700397e-05, - "loss": 0.2003, - "step": 195150 - }, - { - "epoch": 157.78, - "learning_rate": 6.202286640259273e-05, - "loss": 0.2438, - "step": 195175 - }, - { - "epoch": 157.8, - "learning_rate": 6.19666006481815e-05, - "loss": 0.203, - "step": 195200 - }, - { - "epoch": 157.82, - "learning_rate": 6.191033489377026e-05, - "loss": 0.2163, - "step": 195225 - }, - { - "epoch": 157.84, - "learning_rate": 6.185406913935903e-05, - "loss": 0.2048, - "step": 195250 - }, - { - "epoch": 157.86, - "learning_rate": 6.179780338494779e-05, - "loss": 0.2448, - "step": 195275 - }, - { - "epoch": 157.88, - "learning_rate": 6.174153763053656e-05, - "loss": 0.2062, - "step": 195300 - }, - { - "epoch": 157.9, - "learning_rate": 6.168527187612532e-05, - "loss": 0.2055, - "step": 195325 - }, - { - "epoch": 157.92, - "learning_rate": 6.162900612171409e-05, - "loss": 0.2309, - "step": 195350 - }, - { - "epoch": 157.94, - "learning_rate": 6.157274036730284e-05, - "loss": 0.2249, - "step": 195375 - }, - { - "epoch": 157.96, - "learning_rate": 6.15164746128916e-05, - "loss": 0.2243, - "step": 195400 - }, - { - "epoch": 157.98, - "learning_rate": 6.146020885848037e-05, - "loss": 0.2109, - "step": 195425 - }, - { - "epoch": 158.0, - "learning_rate": 6.140394310406915e-05, - "loss": 0.1838, - "step": 195450 - }, - { - "epoch": 158.02, - "learning_rate": 6.134767734965791e-05, - "loss": 0.2381, - "step": 195475 - }, - { - "epoch": 158.04, - "learning_rate": 6.129141159524668e-05, - "loss": 0.1997, - "step": 195500 - }, - { - "epoch": 158.06, - "learning_rate": 6.123514584083544e-05, - "loss": 0.2122, - "step": 195525 - }, - { - "epoch": 158.08, - "learning_rate": 6.11788800864242e-05, - "loss": 0.1902, - "step": 195550 - }, - { - "epoch": 158.1, - "learning_rate": 6.112261433201297e-05, - "loss": 0.2381, - "step": 195575 - }, - { - "epoch": 158.12, - "learning_rate": 6.106634857760173e-05, - "loss": 0.2255, - "step": 195600 - }, - { - "epoch": 158.14, - "learning_rate": 6.10100828231905e-05, - "loss": 0.1934, - "step": 195625 - }, - { - "epoch": 158.16, - "learning_rate": 6.0953817068779264e-05, - "loss": 0.212, - "step": 195650 - }, - { - "epoch": 158.19, - "learning_rate": 6.089755131436803e-05, - "loss": 0.2282, - "step": 195675 - }, - { - "epoch": 158.21, - "learning_rate": 6.0841285559956794e-05, - "loss": 0.2013, - "step": 195700 - }, - { - "epoch": 158.23, - "learning_rate": 6.078501980554555e-05, - "loss": 0.2444, - "step": 195725 - }, - { - "epoch": 158.25, - "learning_rate": 6.0728754051134316e-05, - "loss": 0.2717, - "step": 195750 - }, - { - "epoch": 158.27, - "learning_rate": 6.067248829672308e-05, - "loss": 0.2383, - "step": 195775 - }, - { - "epoch": 158.29, - "learning_rate": 6.0616222542311846e-05, - "loss": 0.174, - "step": 195800 - }, - { - "epoch": 158.31, - "learning_rate": 6.055995678790061e-05, - "loss": 0.2235, - "step": 195825 - }, - { - "epoch": 158.33, - "learning_rate": 6.0503691033489376e-05, - "loss": 0.1992, - "step": 195850 - }, - { - "epoch": 158.35, - "learning_rate": 6.044742527907814e-05, - "loss": 0.2396, - "step": 195875 - }, - { - "epoch": 158.37, - "learning_rate": 6.0391159524666905e-05, - "loss": 0.2072, - "step": 195900 - }, - { - "epoch": 158.39, - "learning_rate": 6.033489377025568e-05, - "loss": 0.2484, - "step": 195925 - }, - { - "epoch": 158.41, - "learning_rate": 6.027862801584444e-05, - "loss": 0.2344, - "step": 195950 - }, - { - "epoch": 158.43, - "learning_rate": 6.0222362261433206e-05, - "loss": 0.2205, - "step": 195975 - }, - { - "epoch": 158.45, - "learning_rate": 6.016609650702197e-05, - "loss": 0.2186, - "step": 196000 - }, - { - "epoch": 158.47, - "learning_rate": 6.0109830752610736e-05, - "loss": 0.1948, - "step": 196025 - }, - { - "epoch": 158.49, - "learning_rate": 6.00535649981995e-05, - "loss": 0.24, - "step": 196050 - }, - { - "epoch": 158.51, - "learning_rate": 5.999729924378826e-05, - "loss": 0.2104, - "step": 196075 - }, - { - "epoch": 158.53, - "learning_rate": 5.9941033489377024e-05, - "loss": 0.206, - "step": 196100 - }, - { - "epoch": 158.55, - "learning_rate": 5.988476773496579e-05, - "loss": 0.2317, - "step": 196125 - }, - { - "epoch": 158.57, - "learning_rate": 5.982850198055455e-05, - "loss": 0.2192, - "step": 196150 - }, - { - "epoch": 158.59, - "learning_rate": 5.9774486856319766e-05, - "loss": 0.1975, - "step": 196175 - }, - { - "epoch": 158.61, - "learning_rate": 5.971822110190853e-05, - "loss": 0.2098, - "step": 196200 - }, - { - "epoch": 158.63, - "learning_rate": 5.9661955347497295e-05, - "loss": 0.2464, - "step": 196225 - }, - { - "epoch": 158.65, - "learning_rate": 5.960568959308607e-05, - "loss": 0.2105, - "step": 196250 - }, - { - "epoch": 158.67, - "learning_rate": 5.954942383867483e-05, - "loss": 0.2118, - "step": 196275 - }, - { - "epoch": 158.69, - "learning_rate": 5.9493158084263597e-05, - "loss": 0.2251, - "step": 196300 - }, - { - "epoch": 158.71, - "learning_rate": 5.943689232985236e-05, - "loss": 0.2299, - "step": 196325 - }, - { - "epoch": 158.73, - "learning_rate": 5.9380626575441126e-05, - "loss": 0.2053, - "step": 196350 - }, - { - "epoch": 158.75, - "learning_rate": 5.932436082102989e-05, - "loss": 0.259, - "step": 196375 - }, - { - "epoch": 158.77, - "learning_rate": 5.9268095066618656e-05, - "loss": 0.2073, - "step": 196400 - }, - { - "epoch": 158.79, - "learning_rate": 5.921182931220742e-05, - "loss": 0.1926, - "step": 196425 - }, - { - "epoch": 158.81, - "learning_rate": 5.9155563557796185e-05, - "loss": 0.1656, - "step": 196450 - }, - { - "epoch": 158.83, - "learning_rate": 5.909929780338495e-05, - "loss": 0.2462, - "step": 196475 - }, - { - "epoch": 158.85, - "learning_rate": 5.904303204897371e-05, - "loss": 0.2064, - "step": 196500 - }, - { - "epoch": 158.87, - "learning_rate": 5.898676629456247e-05, - "loss": 0.2116, - "step": 196525 - }, - { - "epoch": 158.89, - "learning_rate": 5.8930500540151245e-05, - "loss": 0.1963, - "step": 196550 - }, - { - "epoch": 158.91, - "learning_rate": 5.887423478574001e-05, - "loss": 0.2498, - "step": 196575 - }, - { - "epoch": 158.93, - "learning_rate": 5.8817969031328774e-05, - "loss": 0.2001, - "step": 196600 - }, - { - "epoch": 158.95, - "learning_rate": 5.876170327691754e-05, - "loss": 0.2215, - "step": 196625 - }, - { - "epoch": 158.97, - "learning_rate": 5.8705437522506304e-05, - "loss": 0.2016, - "step": 196650 - }, - { - "epoch": 158.99, - "learning_rate": 5.864917176809507e-05, - "loss": 0.2508, - "step": 196675 - }, - { - "epoch": 159.01, - "learning_rate": 5.859290601368383e-05, - "loss": 0.2308, - "step": 196700 - }, - { - "epoch": 159.03, - "learning_rate": 5.85366402592726e-05, - "loss": 0.1911, - "step": 196725 - }, - { - "epoch": 159.05, - "learning_rate": 5.848037450486136e-05, - "loss": 0.2246, - "step": 196750 - }, - { - "epoch": 159.07, - "learning_rate": 5.8426359380626575e-05, - "loss": 0.2202, - "step": 196775 - }, - { - "epoch": 159.09, - "learning_rate": 5.837009362621534e-05, - "loss": 0.2251, - "step": 196800 - }, - { - "epoch": 159.11, - "learning_rate": 5.8313827871804105e-05, - "loss": 0.1669, - "step": 196825 - }, - { - "epoch": 159.14, - "learning_rate": 5.825756211739287e-05, - "loss": 0.2453, - "step": 196850 - }, - { - "epoch": 159.16, - "learning_rate": 5.820129636298164e-05, - "loss": 0.195, - "step": 196875 - }, - { - "epoch": 159.18, - "learning_rate": 5.8145030608570406e-05, - "loss": 0.2235, - "step": 196900 - }, - { - "epoch": 159.2, - "learning_rate": 5.8088764854159164e-05, - "loss": 0.2228, - "step": 196925 - }, - { - "epoch": 159.22, - "learning_rate": 5.803249909974793e-05, - "loss": 0.2062, - "step": 196950 - }, - { - "epoch": 159.24, - "learning_rate": 5.7976233345336694e-05, - "loss": 0.2005, - "step": 196975 - }, - { - "epoch": 159.26, - "learning_rate": 5.791996759092546e-05, - "loss": 0.2018, - "step": 197000 - }, - { - "epoch": 159.28, - "learning_rate": 5.7863701836514223e-05, - "loss": 0.2171, - "step": 197025 - }, - { - "epoch": 159.3, - "learning_rate": 5.780743608210299e-05, - "loss": 0.2398, - "step": 197050 - }, - { - "epoch": 159.32, - "learning_rate": 5.775117032769175e-05, - "loss": 0.1838, - "step": 197075 - }, - { - "epoch": 159.34, - "learning_rate": 5.769490457328052e-05, - "loss": 0.2108, - "step": 197100 - }, - { - "epoch": 159.36, - "learning_rate": 5.763863881886928e-05, - "loss": 0.2035, - "step": 197125 - }, - { - "epoch": 159.38, - "learning_rate": 5.758237306445805e-05, - "loss": 0.2166, - "step": 197150 - }, - { - "epoch": 159.4, - "learning_rate": 5.752610731004682e-05, - "loss": 0.2265, - "step": 197175 - }, - { - "epoch": 159.42, - "learning_rate": 5.7469841555635584e-05, - "loss": 0.2085, - "step": 197200 - }, - { - "epoch": 159.44, - "learning_rate": 5.741357580122435e-05, - "loss": 0.2277, - "step": 197225 - }, - { - "epoch": 159.46, - "learning_rate": 5.7357310046813113e-05, - "loss": 0.2095, - "step": 197250 - }, - { - "epoch": 159.48, - "learning_rate": 5.730104429240188e-05, - "loss": 0.2066, - "step": 197275 - }, - { - "epoch": 159.5, - "learning_rate": 5.7244778537990636e-05, - "loss": 0.2441, - "step": 197300 - }, - { - "epoch": 159.52, - "learning_rate": 5.71885127835794e-05, - "loss": 0.1938, - "step": 197325 - }, - { - "epoch": 159.54, - "learning_rate": 5.7132247029168166e-05, - "loss": 0.2241, - "step": 197350 - }, - { - "epoch": 159.56, - "learning_rate": 5.707598127475693e-05, - "loss": 0.2147, - "step": 197375 - }, - { - "epoch": 159.58, - "learning_rate": 5.7019715520345695e-05, - "loss": 0.2061, - "step": 197400 - }, - { - "epoch": 159.6, - "learning_rate": 5.696344976593446e-05, - "loss": 0.2328, - "step": 197425 - }, - { - "epoch": 159.62, - "learning_rate": 5.6907184011523225e-05, - "loss": 0.2262, - "step": 197450 - }, - { - "epoch": 159.64, - "learning_rate": 5.685091825711199e-05, - "loss": 0.2212, - "step": 197475 - }, - { - "epoch": 159.66, - "learning_rate": 5.679465250270076e-05, - "loss": 0.2308, - "step": 197500 - }, - { - "epoch": 159.68, - "learning_rate": 5.6738386748289526e-05, - "loss": 0.2058, - "step": 197525 - }, - { - "epoch": 159.7, - "learning_rate": 5.668212099387829e-05, - "loss": 0.2286, - "step": 197550 - }, - { - "epoch": 159.72, - "learning_rate": 5.6625855239467056e-05, - "loss": 0.2089, - "step": 197575 - }, - { - "epoch": 159.74, - "learning_rate": 5.656958948505582e-05, - "loss": 0.2438, - "step": 197600 - }, - { - "epoch": 159.76, - "learning_rate": 5.6513323730644585e-05, - "loss": 0.2046, - "step": 197625 - }, - { - "epoch": 159.78, - "learning_rate": 5.6457057976233343e-05, - "loss": 0.2079, - "step": 197650 - }, - { - "epoch": 159.8, - "learning_rate": 5.640079222182211e-05, - "loss": 0.1749, - "step": 197675 - }, - { - "epoch": 159.82, - "learning_rate": 5.634452646741087e-05, - "loss": 0.2364, - "step": 197700 - }, - { - "epoch": 159.84, - "learning_rate": 5.628826071299964e-05, - "loss": 0.1952, - "step": 197725 - }, - { - "epoch": 159.86, - "learning_rate": 5.62319949585884e-05, - "loss": 0.2134, - "step": 197750 - }, - { - "epoch": 159.88, - "learning_rate": 5.617572920417717e-05, - "loss": 0.1913, - "step": 197775 - }, - { - "epoch": 159.9, - "learning_rate": 5.611946344976593e-05, - "loss": 0.2211, - "step": 197800 - }, - { - "epoch": 159.92, - "learning_rate": 5.6063197695354704e-05, - "loss": 0.1965, - "step": 197825 - }, - { - "epoch": 159.94, - "learning_rate": 5.600693194094347e-05, - "loss": 0.2465, - "step": 197850 - }, - { - "epoch": 159.96, - "learning_rate": 5.5950666186532233e-05, - "loss": 0.243, - "step": 197875 - }, - { - "epoch": 159.98, - "learning_rate": 5.5894400432121e-05, - "loss": 0.2337, - "step": 197900 - }, - { - "epoch": 160.0, - "learning_rate": 5.583813467770976e-05, - "loss": 0.1881, - "step": 197925 - }, - { - "epoch": 160.02, - "learning_rate": 5.578186892329853e-05, - "loss": 0.2028, - "step": 197950 - }, - { - "epoch": 160.04, - "learning_rate": 5.572560316888729e-05, - "loss": 0.2267, - "step": 197975 - }, - { - "epoch": 160.06, - "learning_rate": 5.566933741447605e-05, - "loss": 0.2231, - "step": 198000 - }, - { - "epoch": 160.06, - "eval_cer": 0.07449462542221492, - "eval_loss": 0.45625007152557373, - "eval_runtime": 150.0374, - "eval_samples_per_second": 27.946, - "eval_steps_per_second": 6.992, - "eval_wer": 0.31830342577487764, - "step": 198000 - }, - { - "epoch": 160.08, - "learning_rate": 5.5613071660064815e-05, - "loss": 0.2143, - "step": 198025 - }, - { - "epoch": 160.11, - "learning_rate": 5.555680590565358e-05, - "loss": 0.2117, - "step": 198050 - }, - { - "epoch": 160.13, - "learning_rate": 5.5500540151242345e-05, - "loss": 0.2071, - "step": 198075 - }, - { - "epoch": 160.15, - "learning_rate": 5.544427439683111e-05, - "loss": 0.219, - "step": 198100 - }, - { - "epoch": 160.17, - "learning_rate": 5.5388008642419875e-05, - "loss": 0.1927, - "step": 198125 - }, - { - "epoch": 160.19, - "learning_rate": 5.5331742888008646e-05, - "loss": 0.2291, - "step": 198150 - }, - { - "epoch": 160.21, - "learning_rate": 5.527547713359741e-05, - "loss": 0.2125, - "step": 198175 - }, - { - "epoch": 160.23, - "learning_rate": 5.5219211379186176e-05, - "loss": 0.2172, - "step": 198200 - }, - { - "epoch": 160.25, - "learning_rate": 5.516294562477494e-05, - "loss": 0.2213, - "step": 198225 - }, - { - "epoch": 160.27, - "learning_rate": 5.5106679870363705e-05, - "loss": 0.2123, - "step": 198250 - }, - { - "epoch": 160.29, - "learning_rate": 5.505041411595247e-05, - "loss": 0.1807, - "step": 198275 - }, - { - "epoch": 160.31, - "learning_rate": 5.4994148361541235e-05, - "loss": 0.2112, - "step": 198300 - }, - { - "epoch": 160.33, - "learning_rate": 5.493788260713e-05, - "loss": 0.2075, - "step": 198325 - }, - { - "epoch": 160.35, - "learning_rate": 5.488161685271876e-05, - "loss": 0.2219, - "step": 198350 - }, - { - "epoch": 160.37, - "learning_rate": 5.482535109830752e-05, - "loss": 0.2084, - "step": 198375 - }, - { - "epoch": 160.39, - "learning_rate": 5.476908534389629e-05, - "loss": 0.2309, - "step": 198400 - }, - { - "epoch": 160.41, - "learning_rate": 5.471281958948505e-05, - "loss": 0.203, - "step": 198425 - }, - { - "epoch": 160.43, - "learning_rate": 5.465655383507382e-05, - "loss": 0.2272, - "step": 198450 - }, - { - "epoch": 160.45, - "learning_rate": 5.460028808066259e-05, - "loss": 0.1892, - "step": 198475 - }, - { - "epoch": 160.47, - "learning_rate": 5.4544022326251353e-05, - "loss": 0.2235, - "step": 198500 - }, - { - "epoch": 160.49, - "learning_rate": 5.448775657184012e-05, - "loss": 0.202, - "step": 198525 - }, - { - "epoch": 160.51, - "learning_rate": 5.443149081742888e-05, - "loss": 0.2377, - "step": 198550 - }, - { - "epoch": 160.53, - "learning_rate": 5.437522506301765e-05, - "loss": 0.1722, - "step": 198575 - }, - { - "epoch": 160.55, - "learning_rate": 5.431895930860641e-05, - "loss": 0.2065, - "step": 198600 - }, - { - "epoch": 160.57, - "learning_rate": 5.426269355419518e-05, - "loss": 0.1852, - "step": 198625 - }, - { - "epoch": 160.59, - "learning_rate": 5.420642779978394e-05, - "loss": 0.2182, - "step": 198650 - }, - { - "epoch": 160.61, - "learning_rate": 5.415016204537271e-05, - "loss": 0.2017, - "step": 198675 - }, - { - "epoch": 160.63, - "learning_rate": 5.409389629096147e-05, - "loss": 0.2293, - "step": 198700 - }, - { - "epoch": 160.65, - "learning_rate": 5.403763053655023e-05, - "loss": 0.2215, - "step": 198725 - }, - { - "epoch": 160.67, - "learning_rate": 5.3981364782138995e-05, - "loss": 0.2229, - "step": 198750 - }, - { - "epoch": 160.69, - "learning_rate": 5.3925099027727766e-05, - "loss": 0.2306, - "step": 198775 - }, - { - "epoch": 160.71, - "learning_rate": 5.386883327331653e-05, - "loss": 0.2306, - "step": 198800 - }, - { - "epoch": 160.73, - "learning_rate": 5.3812567518905296e-05, - "loss": 0.2359, - "step": 198825 - }, - { - "epoch": 160.75, - "learning_rate": 5.375630176449406e-05, - "loss": 0.2417, - "step": 198850 - }, - { - "epoch": 160.77, - "learning_rate": 5.3700036010082825e-05, - "loss": 0.2112, - "step": 198875 - }, - { - "epoch": 160.79, - "learning_rate": 5.364377025567159e-05, - "loss": 0.2106, - "step": 198900 - }, - { - "epoch": 160.81, - "learning_rate": 5.3587504501260355e-05, - "loss": 0.1836, - "step": 198925 - }, - { - "epoch": 160.83, - "learning_rate": 5.353123874684912e-05, - "loss": 0.2248, - "step": 198950 - }, - { - "epoch": 160.85, - "learning_rate": 5.3474972992437885e-05, - "loss": 0.2018, - "step": 198975 - }, - { - "epoch": 160.87, - "learning_rate": 5.341870723802665e-05, - "loss": 0.239, - "step": 199000 - }, - { - "epoch": 160.89, - "learning_rate": 5.3362441483615414e-05, - "loss": 0.2044, - "step": 199025 - }, - { - "epoch": 160.91, - "learning_rate": 5.330617572920418e-05, - "loss": 0.2236, - "step": 199050 - }, - { - "epoch": 160.93, - "learning_rate": 5.324990997479294e-05, - "loss": 0.2218, - "step": 199075 - }, - { - "epoch": 160.95, - "learning_rate": 5.319364422038171e-05, - "loss": 0.2156, - "step": 199100 - }, - { - "epoch": 160.97, - "learning_rate": 5.3137378465970473e-05, - "loss": 0.2013, - "step": 199125 - }, - { - "epoch": 160.99, - "learning_rate": 5.308111271155924e-05, - "loss": 0.2044, - "step": 199150 - }, - { - "epoch": 161.01, - "learning_rate": 5.3024846957148e-05, - "loss": 0.218, - "step": 199175 - }, - { - "epoch": 161.03, - "learning_rate": 5.296858120273677e-05, - "loss": 0.1846, - "step": 199200 - }, - { - "epoch": 161.05, - "learning_rate": 5.291231544832553e-05, - "loss": 0.2346, - "step": 199225 - }, - { - "epoch": 161.08, - "learning_rate": 5.28560496939143e-05, - "loss": 0.2067, - "step": 199250 - }, - { - "epoch": 161.1, - "learning_rate": 5.279978393950306e-05, - "loss": 0.2165, - "step": 199275 - }, - { - "epoch": 161.12, - "learning_rate": 5.274351818509183e-05, - "loss": 0.2015, - "step": 199300 - }, - { - "epoch": 161.14, - "learning_rate": 5.268725243068059e-05, - "loss": 0.2392, - "step": 199325 - }, - { - "epoch": 161.16, - "learning_rate": 5.2630986676269357e-05, - "loss": 0.2152, - "step": 199350 - }, - { - "epoch": 161.18, - "learning_rate": 5.257472092185812e-05, - "loss": 0.2017, - "step": 199375 - }, - { - "epoch": 161.2, - "learning_rate": 5.2518455167446886e-05, - "loss": 0.2026, - "step": 199400 - }, - { - "epoch": 161.22, - "learning_rate": 5.246218941303565e-05, - "loss": 0.2313, - "step": 199425 - }, - { - "epoch": 161.24, - "learning_rate": 5.2405923658624416e-05, - "loss": 0.2153, - "step": 199450 - }, - { - "epoch": 161.26, - "learning_rate": 5.234965790421318e-05, - "loss": 0.1926, - "step": 199475 - }, - { - "epoch": 161.28, - "learning_rate": 5.2293392149801945e-05, - "loss": 0.1938, - "step": 199500 - }, - { - "epoch": 161.3, - "learning_rate": 5.223712639539071e-05, - "loss": 0.1948, - "step": 199525 - }, - { - "epoch": 161.32, - "learning_rate": 5.2180860640979475e-05, - "loss": 0.2009, - "step": 199550 - }, - { - "epoch": 161.34, - "learning_rate": 5.212459488656824e-05, - "loss": 0.2141, - "step": 199575 - }, - { - "epoch": 161.36, - "learning_rate": 5.2068329132157005e-05, - "loss": 0.1755, - "step": 199600 - }, - { - "epoch": 161.38, - "learning_rate": 5.201206337774577e-05, - "loss": 0.2034, - "step": 199625 - }, - { - "epoch": 161.4, - "learning_rate": 5.1955797623334534e-05, - "loss": 0.2053, - "step": 199650 - }, - { - "epoch": 161.42, - "learning_rate": 5.18995318689233e-05, - "loss": 0.2017, - "step": 199675 - }, - { - "epoch": 161.44, - "learning_rate": 5.1843266114512064e-05, - "loss": 0.1859, - "step": 199700 - }, - { - "epoch": 161.46, - "learning_rate": 5.178700036010083e-05, - "loss": 0.195, - "step": 199725 - }, - { - "epoch": 161.48, - "learning_rate": 5.17307346056896e-05, - "loss": 0.1947, - "step": 199750 - }, - { - "epoch": 161.5, - "learning_rate": 5.167446885127836e-05, - "loss": 0.2052, - "step": 199775 - }, - { - "epoch": 161.52, - "learning_rate": 5.161820309686712e-05, - "loss": 0.1932, - "step": 199800 - }, - { - "epoch": 161.54, - "learning_rate": 5.156193734245589e-05, - "loss": 0.2126, - "step": 199825 - }, - { - "epoch": 161.56, - "learning_rate": 5.150567158804465e-05, - "loss": 0.2163, - "step": 199850 - }, - { - "epoch": 161.58, - "learning_rate": 5.144940583363342e-05, - "loss": 0.2018, - "step": 199875 - }, - { - "epoch": 161.6, - "learning_rate": 5.139314007922218e-05, - "loss": 0.2023, - "step": 199900 - }, - { - "epoch": 161.62, - "learning_rate": 5.133687432481095e-05, - "loss": 0.2208, - "step": 199925 - }, - { - "epoch": 161.64, - "learning_rate": 5.128060857039971e-05, - "loss": 0.2094, - "step": 199950 - }, - { - "epoch": 161.66, - "learning_rate": 5.1224342815988477e-05, - "loss": 0.2119, - "step": 199975 - }, - { - "epoch": 161.68, - "learning_rate": 5.116807706157724e-05, - "loss": 0.1994, - "step": 200000 - }, - { - "epoch": 161.7, - "learning_rate": 5.1111811307166006e-05, - "loss": 0.2172, - "step": 200025 - }, - { - "epoch": 161.72, - "learning_rate": 5.105554555275478e-05, - "loss": 0.1885, - "step": 200050 - }, - { - "epoch": 161.74, - "learning_rate": 5.099927979834354e-05, - "loss": 0.2093, - "step": 200075 - }, - { - "epoch": 161.76, - "learning_rate": 5.094301404393231e-05, - "loss": 0.197, - "step": 200100 - }, - { - "epoch": 161.78, - "learning_rate": 5.088674828952107e-05, - "loss": 0.2085, - "step": 200125 - }, - { - "epoch": 161.8, - "learning_rate": 5.083048253510983e-05, - "loss": 0.2121, - "step": 200150 - }, - { - "epoch": 161.82, - "learning_rate": 5.0774216780698595e-05, - "loss": 0.2206, - "step": 200175 - }, - { - "epoch": 161.84, - "learning_rate": 5.071795102628736e-05, - "loss": 0.1871, - "step": 200200 - }, - { - "epoch": 161.86, - "learning_rate": 5.0661685271876125e-05, - "loss": 0.2268, - "step": 200225 - }, - { - "epoch": 161.88, - "learning_rate": 5.060541951746489e-05, - "loss": 0.2047, - "step": 200250 - }, - { - "epoch": 161.9, - "learning_rate": 5.0549153763053654e-05, - "loss": 0.2072, - "step": 200275 - }, - { - "epoch": 161.92, - "learning_rate": 5.049288800864242e-05, - "loss": 0.2092, - "step": 200300 - }, - { - "epoch": 161.94, - "learning_rate": 5.0436622254231184e-05, - "loss": 0.2105, - "step": 200325 - }, - { - "epoch": 161.96, - "learning_rate": 5.038035649981995e-05, - "loss": 0.1982, - "step": 200350 - }, - { - "epoch": 161.98, - "learning_rate": 5.032409074540872e-05, - "loss": 0.2074, - "step": 200375 - }, - { - "epoch": 162.0, - "learning_rate": 5.0267824990997485e-05, - "loss": 0.2017, - "step": 200400 - }, - { - "epoch": 162.03, - "learning_rate": 5.021155923658625e-05, - "loss": 0.2278, - "step": 200425 - }, - { - "epoch": 162.05, - "learning_rate": 5.0155293482175015e-05, - "loss": 0.1947, - "step": 200450 - }, - { - "epoch": 162.07, - "learning_rate": 5.009902772776378e-05, - "loss": 0.2217, - "step": 200475 - }, - { - "epoch": 162.09, - "learning_rate": 5.004276197335254e-05, - "loss": 0.1645, - "step": 200500 - }, - { - "epoch": 162.11, - "learning_rate": 4.99864962189413e-05, - "loss": 0.2206, - "step": 200525 - }, - { - "epoch": 162.13, - "learning_rate": 4.993023046453007e-05, - "loss": 0.1874, - "step": 200550 - }, - { - "epoch": 162.15, - "learning_rate": 4.987396471011883e-05, - "loss": 0.1963, - "step": 200575 - }, - { - "epoch": 162.17, - "learning_rate": 4.9817698955707597e-05, - "loss": 0.1973, - "step": 200600 - }, - { - "epoch": 162.19, - "learning_rate": 4.976143320129636e-05, - "loss": 0.211, - "step": 200625 - }, - { - "epoch": 162.21, - "learning_rate": 4.9705167446885126e-05, - "loss": 0.1913, - "step": 200650 - }, - { - "epoch": 162.23, - "learning_rate": 4.964890169247389e-05, - "loss": 0.1771, - "step": 200675 - }, - { - "epoch": 162.25, - "learning_rate": 4.959263593806266e-05, - "loss": 0.1889, - "step": 200700 - }, - { - "epoch": 162.27, - "learning_rate": 4.953637018365143e-05, - "loss": 0.1948, - "step": 200725 - }, - { - "epoch": 162.29, - "learning_rate": 4.948010442924019e-05, - "loss": 0.1882, - "step": 200750 - }, - { - "epoch": 162.31, - "learning_rate": 4.942383867482896e-05, - "loss": 0.2305, - "step": 200775 - }, - { - "epoch": 162.33, - "learning_rate": 4.936757292041772e-05, - "loss": 0.2434, - "step": 200800 - }, - { - "epoch": 162.35, - "learning_rate": 4.9311307166006487e-05, - "loss": 0.2083, - "step": 200825 - }, - { - "epoch": 162.37, - "learning_rate": 4.9255041411595245e-05, - "loss": 0.2171, - "step": 200850 - }, - { - "epoch": 162.39, - "learning_rate": 4.919877565718401e-05, - "loss": 0.2204, - "step": 200875 - }, - { - "epoch": 162.41, - "learning_rate": 4.914476053294923e-05, - "loss": 0.2159, - "step": 200900 - }, - { - "epoch": 162.43, - "learning_rate": 4.908849477853799e-05, - "loss": 0.2106, - "step": 200925 - }, - { - "epoch": 162.45, - "learning_rate": 4.903222902412675e-05, - "loss": 0.2034, - "step": 200950 - }, - { - "epoch": 162.47, - "learning_rate": 4.8975963269715516e-05, - "loss": 0.2063, - "step": 200975 - }, - { - "epoch": 162.49, - "learning_rate": 4.891969751530428e-05, - "loss": 0.2096, - "step": 201000 - }, - { - "epoch": 162.49, - "eval_cer": 0.07474615771588144, - "eval_loss": 0.46688565611839294, - "eval_runtime": 150.852, - "eval_samples_per_second": 27.795, - "eval_steps_per_second": 6.954, - "eval_wer": 0.31830342577487764, - "step": 201000 - }, - { - "epoch": 162.51, - "learning_rate": 4.886343176089305e-05, - "loss": 0.2181, - "step": 201025 - }, - { - "epoch": 162.53, - "learning_rate": 4.880716600648182e-05, - "loss": 0.222, - "step": 201050 - }, - { - "epoch": 162.55, - "learning_rate": 4.875090025207058e-05, - "loss": 0.2604, - "step": 201075 - }, - { - "epoch": 162.57, - "learning_rate": 4.869463449765935e-05, - "loss": 0.1897, - "step": 201100 - }, - { - "epoch": 162.59, - "learning_rate": 4.863836874324811e-05, - "loss": 0.2158, - "step": 201125 - }, - { - "epoch": 162.61, - "learning_rate": 4.858210298883688e-05, - "loss": 0.1764, - "step": 201150 - }, - { - "epoch": 162.63, - "learning_rate": 4.852583723442564e-05, - "loss": 0.2127, - "step": 201175 - }, - { - "epoch": 162.65, - "learning_rate": 4.8469571480014406e-05, - "loss": 0.2119, - "step": 201200 - }, - { - "epoch": 162.67, - "learning_rate": 4.841330572560317e-05, - "loss": 0.2366, - "step": 201225 - }, - { - "epoch": 162.69, - "learning_rate": 4.8357039971191936e-05, - "loss": 0.1995, - "step": 201250 - }, - { - "epoch": 162.71, - "learning_rate": 4.8300774216780694e-05, - "loss": 0.2321, - "step": 201275 - }, - { - "epoch": 162.73, - "learning_rate": 4.824450846236946e-05, - "loss": 0.2315, - "step": 201300 - }, - { - "epoch": 162.75, - "learning_rate": 4.818824270795823e-05, - "loss": 0.2366, - "step": 201325 - }, - { - "epoch": 162.77, - "learning_rate": 4.8131976953546995e-05, - "loss": 0.1815, - "step": 201350 - }, - { - "epoch": 162.79, - "learning_rate": 4.807571119913576e-05, - "loss": 0.2202, - "step": 201375 - }, - { - "epoch": 162.81, - "learning_rate": 4.8019445444724525e-05, - "loss": 0.1994, - "step": 201400 - }, - { - "epoch": 162.83, - "learning_rate": 4.796317969031329e-05, - "loss": 0.2294, - "step": 201425 - }, - { - "epoch": 162.85, - "learning_rate": 4.7906913935902054e-05, - "loss": 0.2178, - "step": 201450 - }, - { - "epoch": 162.87, - "learning_rate": 4.785064818149082e-05, - "loss": 0.2219, - "step": 201475 - }, - { - "epoch": 162.89, - "learning_rate": 4.7794382427079584e-05, - "loss": 0.2385, - "step": 201500 - }, - { - "epoch": 162.91, - "learning_rate": 4.773811667266835e-05, - "loss": 0.2135, - "step": 201525 - }, - { - "epoch": 162.93, - "learning_rate": 4.7681850918257113e-05, - "loss": 0.1894, - "step": 201550 - }, - { - "epoch": 162.95, - "learning_rate": 4.762558516384588e-05, - "loss": 0.2315, - "step": 201575 - }, - { - "epoch": 162.97, - "learning_rate": 4.756931940943464e-05, - "loss": 0.2276, - "step": 201600 - }, - { - "epoch": 163.0, - "learning_rate": 4.75130536550234e-05, - "loss": 0.2329, - "step": 201625 - }, - { - "epoch": 163.02, - "learning_rate": 4.745678790061217e-05, - "loss": 0.2242, - "step": 201650 - }, - { - "epoch": 163.04, - "learning_rate": 4.740052214620094e-05, - "loss": 0.1868, - "step": 201675 - }, - { - "epoch": 163.06, - "learning_rate": 4.73442563917897e-05, - "loss": 0.2309, - "step": 201700 - }, - { - "epoch": 163.08, - "learning_rate": 4.728799063737847e-05, - "loss": 0.1948, - "step": 201725 - }, - { - "epoch": 163.1, - "learning_rate": 4.723172488296723e-05, - "loss": 0.2059, - "step": 201750 - }, - { - "epoch": 163.12, - "learning_rate": 4.7175459128556e-05, - "loss": 0.1922, - "step": 201775 - }, - { - "epoch": 163.14, - "learning_rate": 4.711919337414476e-05, - "loss": 0.216, - "step": 201800 - }, - { - "epoch": 163.16, - "learning_rate": 4.7062927619733526e-05, - "loss": 0.1945, - "step": 201825 - }, - { - "epoch": 163.18, - "learning_rate": 4.700666186532229e-05, - "loss": 0.2139, - "step": 201850 - }, - { - "epoch": 163.2, - "learning_rate": 4.6950396110911056e-05, - "loss": 0.2057, - "step": 201875 - }, - { - "epoch": 163.22, - "learning_rate": 4.689413035649982e-05, - "loss": 0.2023, - "step": 201900 - }, - { - "epoch": 163.24, - "learning_rate": 4.6837864602088585e-05, - "loss": 0.181, - "step": 201925 - }, - { - "epoch": 163.26, - "learning_rate": 4.678159884767735e-05, - "loss": 0.1965, - "step": 201950 - }, - { - "epoch": 163.28, - "learning_rate": 4.672533309326612e-05, - "loss": 0.1885, - "step": 201975 - }, - { - "epoch": 163.3, - "learning_rate": 4.666906733885488e-05, - "loss": 0.2403, - "step": 202000 - }, - { - "epoch": 163.32, - "learning_rate": 4.6612801584443645e-05, - "loss": 0.2078, - "step": 202025 - }, - { - "epoch": 163.34, - "learning_rate": 4.655653583003241e-05, - "loss": 0.2031, - "step": 202050 - }, - { - "epoch": 163.36, - "learning_rate": 4.6500270075621174e-05, - "loss": 0.21, - "step": 202075 - }, - { - "epoch": 163.38, - "learning_rate": 4.644400432120994e-05, - "loss": 0.2163, - "step": 202100 - }, - { - "epoch": 163.4, - "learning_rate": 4.6387738566798704e-05, - "loss": 0.1928, - "step": 202125 - }, - { - "epoch": 163.42, - "learning_rate": 4.633147281238747e-05, - "loss": 0.2349, - "step": 202150 - }, - { - "epoch": 163.44, - "learning_rate": 4.6275207057976233e-05, - "loss": 0.2285, - "step": 202175 - }, - { - "epoch": 163.46, - "learning_rate": 4.6218941303565e-05, - "loss": 0.2194, - "step": 202200 - }, - { - "epoch": 163.48, - "learning_rate": 4.616267554915376e-05, - "loss": 0.2165, - "step": 202225 - }, - { - "epoch": 163.5, - "learning_rate": 4.610640979474253e-05, - "loss": 0.2098, - "step": 202250 - }, - { - "epoch": 163.52, - "learning_rate": 4.605014404033129e-05, - "loss": 0.1859, - "step": 202275 - }, - { - "epoch": 163.54, - "learning_rate": 4.5993878285920064e-05, - "loss": 0.2116, - "step": 202300 - }, - { - "epoch": 163.56, - "learning_rate": 4.593761253150883e-05, - "loss": 0.2373, - "step": 202325 - }, - { - "epoch": 163.58, - "learning_rate": 4.588134677709759e-05, - "loss": 0.2213, - "step": 202350 - }, - { - "epoch": 163.6, - "learning_rate": 4.582508102268635e-05, - "loss": 0.2096, - "step": 202375 - }, - { - "epoch": 163.62, - "learning_rate": 4.576881526827512e-05, - "loss": 0.2153, - "step": 202400 - }, - { - "epoch": 163.64, - "learning_rate": 4.571254951386388e-05, - "loss": 0.2167, - "step": 202425 - }, - { - "epoch": 163.66, - "learning_rate": 4.5656283759452646e-05, - "loss": 0.2291, - "step": 202450 - }, - { - "epoch": 163.68, - "learning_rate": 4.560226863521786e-05, - "loss": 0.2253, - "step": 202475 - }, - { - "epoch": 163.7, - "learning_rate": 4.5546002880806624e-05, - "loss": 0.2502, - "step": 202500 - }, - { - "epoch": 163.72, - "learning_rate": 4.548973712639539e-05, - "loss": 0.1777, - "step": 202525 - }, - { - "epoch": 163.74, - "learning_rate": 4.543347137198415e-05, - "loss": 0.2006, - "step": 202550 - }, - { - "epoch": 163.76, - "learning_rate": 4.537720561757292e-05, - "loss": 0.2072, - "step": 202575 - }, - { - "epoch": 163.78, - "learning_rate": 4.532093986316169e-05, - "loss": 0.2245, - "step": 202600 - }, - { - "epoch": 163.8, - "learning_rate": 4.5264674108750454e-05, - "loss": 0.1904, - "step": 202625 - }, - { - "epoch": 163.82, - "learning_rate": 4.520840835433922e-05, - "loss": 0.1858, - "step": 202650 - }, - { - "epoch": 163.84, - "learning_rate": 4.5152142599927984e-05, - "loss": 0.2207, - "step": 202675 - }, - { - "epoch": 163.86, - "learning_rate": 4.509587684551675e-05, - "loss": 0.2185, - "step": 202700 - }, - { - "epoch": 163.88, - "learning_rate": 4.5039611091105514e-05, - "loss": 0.1909, - "step": 202725 - }, - { - "epoch": 163.9, - "learning_rate": 4.498334533669428e-05, - "loss": 0.1961, - "step": 202750 - }, - { - "epoch": 163.92, - "learning_rate": 4.4927079582283036e-05, - "loss": 0.2139, - "step": 202775 - }, - { - "epoch": 163.95, - "learning_rate": 4.48708138278718e-05, - "loss": 0.2081, - "step": 202800 - }, - { - "epoch": 163.97, - "learning_rate": 4.4814548073460566e-05, - "loss": 0.1896, - "step": 202825 - }, - { - "epoch": 163.99, - "learning_rate": 4.475828231904933e-05, - "loss": 0.1879, - "step": 202850 - }, - { - "epoch": 164.01, - "learning_rate": 4.4702016564638096e-05, - "loss": 0.1993, - "step": 202875 - }, - { - "epoch": 164.03, - "learning_rate": 4.464575081022686e-05, - "loss": 0.2381, - "step": 202900 - }, - { - "epoch": 164.05, - "learning_rate": 4.458948505581563e-05, - "loss": 0.1972, - "step": 202925 - }, - { - "epoch": 164.07, - "learning_rate": 4.45332193014044e-05, - "loss": 0.2297, - "step": 202950 - }, - { - "epoch": 164.09, - "learning_rate": 4.447695354699316e-05, - "loss": 0.1591, - "step": 202975 - }, - { - "epoch": 164.11, - "learning_rate": 4.4420687792581926e-05, - "loss": 0.1925, - "step": 203000 - }, - { - "epoch": 164.13, - "learning_rate": 4.436442203817069e-05, - "loss": 0.1655, - "step": 203025 - }, - { - "epoch": 164.15, - "learning_rate": 4.4308156283759456e-05, - "loss": 0.223, - "step": 203050 - }, - { - "epoch": 164.17, - "learning_rate": 4.425189052934822e-05, - "loss": 0.2068, - "step": 203075 - }, - { - "epoch": 164.19, - "learning_rate": 4.4195624774936986e-05, - "loss": 0.1982, - "step": 203100 - }, - { - "epoch": 164.21, - "learning_rate": 4.4139359020525744e-05, - "loss": 0.1926, - "step": 203125 - }, - { - "epoch": 164.23, - "learning_rate": 4.408309326611451e-05, - "loss": 0.1827, - "step": 203150 - }, - { - "epoch": 164.25, - "learning_rate": 4.402682751170327e-05, - "loss": 0.2055, - "step": 203175 - }, - { - "epoch": 164.27, - "learning_rate": 4.397056175729204e-05, - "loss": 0.1942, - "step": 203200 - }, - { - "epoch": 164.29, - "learning_rate": 4.39142960028808e-05, - "loss": 0.2065, - "step": 203225 - }, - { - "epoch": 164.31, - "learning_rate": 4.3858030248469574e-05, - "loss": 0.2095, - "step": 203250 - }, - { - "epoch": 164.33, - "learning_rate": 4.380176449405834e-05, - "loss": 0.2005, - "step": 203275 - }, - { - "epoch": 164.35, - "learning_rate": 4.3745498739647104e-05, - "loss": 0.2359, - "step": 203300 - }, - { - "epoch": 164.37, - "learning_rate": 4.368923298523587e-05, - "loss": 0.179, - "step": 203325 - }, - { - "epoch": 164.39, - "learning_rate": 4.3632967230824634e-05, - "loss": 0.2012, - "step": 203350 - }, - { - "epoch": 164.41, - "learning_rate": 4.35767014764134e-05, - "loss": 0.1984, - "step": 203375 - }, - { - "epoch": 164.43, - "learning_rate": 4.352043572200216e-05, - "loss": 0.1977, - "step": 203400 - }, - { - "epoch": 164.45, - "learning_rate": 4.346416996759093e-05, - "loss": 0.1622, - "step": 203425 - }, - { - "epoch": 164.47, - "learning_rate": 4.340790421317969e-05, - "loss": 0.205, - "step": 203450 - }, - { - "epoch": 164.49, - "learning_rate": 4.335163845876846e-05, - "loss": 0.1705, - "step": 203475 - }, - { - "epoch": 164.51, - "learning_rate": 4.3295372704357216e-05, - "loss": 0.1874, - "step": 203500 - }, - { - "epoch": 164.53, - "learning_rate": 4.323910694994598e-05, - "loss": 0.2105, - "step": 203525 - }, - { - "epoch": 164.55, - "learning_rate": 4.318284119553475e-05, - "loss": 0.2178, - "step": 203550 - }, - { - "epoch": 164.57, - "learning_rate": 4.312657544112352e-05, - "loss": 0.2348, - "step": 203575 - }, - { - "epoch": 164.59, - "learning_rate": 4.307030968671228e-05, - "loss": 0.2285, - "step": 203600 - }, - { - "epoch": 164.61, - "learning_rate": 4.3014043932301046e-05, - "loss": 0.2005, - "step": 203625 - }, - { - "epoch": 164.63, - "learning_rate": 4.295777817788981e-05, - "loss": 0.2259, - "step": 203650 - }, - { - "epoch": 164.65, - "learning_rate": 4.2901512423478576e-05, - "loss": 0.1709, - "step": 203675 - }, - { - "epoch": 164.67, - "learning_rate": 4.284524666906734e-05, - "loss": 0.1984, - "step": 203700 - }, - { - "epoch": 164.69, - "learning_rate": 4.2788980914656106e-05, - "loss": 0.1833, - "step": 203725 - }, - { - "epoch": 164.71, - "learning_rate": 4.273271516024487e-05, - "loss": 0.2113, - "step": 203750 - }, - { - "epoch": 164.73, - "learning_rate": 4.2676449405833635e-05, - "loss": 0.2044, - "step": 203775 - }, - { - "epoch": 164.75, - "learning_rate": 4.26201836514224e-05, - "loss": 0.2236, - "step": 203800 - }, - { - "epoch": 164.77, - "learning_rate": 4.2563917897011165e-05, - "loss": 0.2011, - "step": 203825 - }, - { - "epoch": 164.79, - "learning_rate": 4.250765214259992e-05, - "loss": 0.2171, - "step": 203850 - }, - { - "epoch": 164.81, - "learning_rate": 4.2451386388188694e-05, - "loss": 0.1913, - "step": 203875 - }, - { - "epoch": 164.83, - "learning_rate": 4.239512063377746e-05, - "loss": 0.2069, - "step": 203900 - }, - { - "epoch": 164.85, - "learning_rate": 4.2338854879366224e-05, - "loss": 0.1633, - "step": 203925 - }, - { - "epoch": 164.87, - "learning_rate": 4.228258912495499e-05, - "loss": 0.206, - "step": 203950 - }, - { - "epoch": 164.89, - "learning_rate": 4.2226323370543754e-05, - "loss": 0.1939, - "step": 203975 - }, - { - "epoch": 164.92, - "learning_rate": 4.217005761613252e-05, - "loss": 0.2173, - "step": 204000 - }, - { - "epoch": 164.92, - "eval_cer": 0.07462809153722165, - "eval_loss": 0.47042977809906006, - "eval_runtime": 151.4427, - "eval_samples_per_second": 27.687, - "eval_steps_per_second": 6.927, - "eval_wer": 0.3180097879282219, - "step": 204000 - }, - { - "epoch": 164.94, - "learning_rate": 4.211379186172128e-05, - "loss": 0.2402, - "step": 204025 - }, - { - "epoch": 164.96, - "learning_rate": 4.205752610731005e-05, - "loss": 0.2072, - "step": 204050 - }, - { - "epoch": 164.98, - "learning_rate": 4.200126035289881e-05, - "loss": 0.2063, - "step": 204075 - }, - { - "epoch": 165.0, - "learning_rate": 4.194499459848758e-05, - "loss": 0.196, - "step": 204100 - }, - { - "epoch": 165.02, - "learning_rate": 4.188872884407634e-05, - "loss": 0.1877, - "step": 204125 - }, - { - "epoch": 165.04, - "learning_rate": 4.183246308966511e-05, - "loss": 0.1892, - "step": 204150 - }, - { - "epoch": 165.06, - "learning_rate": 4.177619733525387e-05, - "loss": 0.2035, - "step": 204175 - }, - { - "epoch": 165.08, - "learning_rate": 4.171993158084264e-05, - "loss": 0.1885, - "step": 204200 - }, - { - "epoch": 165.1, - "learning_rate": 4.16636658264314e-05, - "loss": 0.2331, - "step": 204225 - }, - { - "epoch": 165.12, - "learning_rate": 4.1607400072020166e-05, - "loss": 0.1998, - "step": 204250 - }, - { - "epoch": 165.14, - "learning_rate": 4.155113431760893e-05, - "loss": 0.199, - "step": 204275 - }, - { - "epoch": 165.16, - "learning_rate": 4.1494868563197696e-05, - "loss": 0.227, - "step": 204300 - }, - { - "epoch": 165.18, - "learning_rate": 4.143860280878646e-05, - "loss": 0.2145, - "step": 204325 - }, - { - "epoch": 165.2, - "learning_rate": 4.1382337054375226e-05, - "loss": 0.1827, - "step": 204350 - }, - { - "epoch": 165.22, - "learning_rate": 4.132607129996399e-05, - "loss": 0.2053, - "step": 204375 - }, - { - "epoch": 165.24, - "learning_rate": 4.1269805545552755e-05, - "loss": 0.2036, - "step": 204400 - }, - { - "epoch": 165.26, - "learning_rate": 4.121353979114152e-05, - "loss": 0.2201, - "step": 204425 - }, - { - "epoch": 165.28, - "learning_rate": 4.1157274036730285e-05, - "loss": 0.1936, - "step": 204450 - }, - { - "epoch": 165.3, - "learning_rate": 4.110100828231905e-05, - "loss": 0.2106, - "step": 204475 - }, - { - "epoch": 165.32, - "learning_rate": 4.1044742527907814e-05, - "loss": 0.1847, - "step": 204500 - }, - { - "epoch": 165.34, - "learning_rate": 4.0988476773496586e-05, - "loss": 0.2236, - "step": 204525 - }, - { - "epoch": 165.36, - "learning_rate": 4.0932211019085344e-05, - "loss": 0.1982, - "step": 204550 - }, - { - "epoch": 165.38, - "learning_rate": 4.087594526467411e-05, - "loss": 0.2164, - "step": 204575 - }, - { - "epoch": 165.4, - "learning_rate": 4.0819679510262874e-05, - "loss": 0.1648, - "step": 204600 - }, - { - "epoch": 165.42, - "learning_rate": 4.076341375585164e-05, - "loss": 0.2193, - "step": 204625 - }, - { - "epoch": 165.44, - "learning_rate": 4.07071480014404e-05, - "loss": 0.2154, - "step": 204650 - }, - { - "epoch": 165.46, - "learning_rate": 4.065088224702917e-05, - "loss": 0.2004, - "step": 204675 - }, - { - "epoch": 165.48, - "learning_rate": 4.059461649261793e-05, - "loss": 0.2009, - "step": 204700 - }, - { - "epoch": 165.5, - "learning_rate": 4.05383507382067e-05, - "loss": 0.1868, - "step": 204725 - }, - { - "epoch": 165.52, - "learning_rate": 4.048208498379546e-05, - "loss": 0.2233, - "step": 204750 - }, - { - "epoch": 165.54, - "learning_rate": 4.042581922938423e-05, - "loss": 0.1929, - "step": 204775 - }, - { - "epoch": 165.56, - "learning_rate": 4.036955347497299e-05, - "loss": 0.2148, - "step": 204800 - }, - { - "epoch": 165.58, - "learning_rate": 4.031328772056176e-05, - "loss": 0.19, - "step": 204825 - }, - { - "epoch": 165.6, - "learning_rate": 4.025702196615053e-05, - "loss": 0.1779, - "step": 204850 - }, - { - "epoch": 165.62, - "learning_rate": 4.020075621173929e-05, - "loss": 0.1936, - "step": 204875 - }, - { - "epoch": 165.64, - "learning_rate": 4.014449045732806e-05, - "loss": 0.2117, - "step": 204900 - }, - { - "epoch": 165.66, - "learning_rate": 4.0088224702916816e-05, - "loss": 0.2124, - "step": 204925 - }, - { - "epoch": 165.68, - "learning_rate": 4.003195894850558e-05, - "loss": 0.2178, - "step": 204950 - }, - { - "epoch": 165.7, - "learning_rate": 3.9975693194094346e-05, - "loss": 0.2006, - "step": 204975 - }, - { - "epoch": 165.72, - "learning_rate": 3.991942743968311e-05, - "loss": 0.1948, - "step": 205000 - }, - { - "epoch": 165.74, - "learning_rate": 3.9863161685271875e-05, - "loss": 0.2193, - "step": 205025 - }, - { - "epoch": 165.76, - "learning_rate": 3.980689593086064e-05, - "loss": 0.1978, - "step": 205050 - }, - { - "epoch": 165.78, - "learning_rate": 3.9750630176449405e-05, - "loss": 0.2219, - "step": 205075 - }, - { - "epoch": 165.8, - "learning_rate": 3.969436442203817e-05, - "loss": 0.1989, - "step": 205100 - }, - { - "epoch": 165.82, - "learning_rate": 3.9638098667626934e-05, - "loss": 0.2189, - "step": 205125 - }, - { - "epoch": 165.84, - "learning_rate": 3.9581832913215706e-05, - "loss": 0.1913, - "step": 205150 - }, - { - "epoch": 165.86, - "learning_rate": 3.952556715880447e-05, - "loss": 0.2138, - "step": 205175 - }, - { - "epoch": 165.89, - "learning_rate": 3.9469301404393236e-05, - "loss": 0.1843, - "step": 205200 - }, - { - "epoch": 165.91, - "learning_rate": 3.9413035649982e-05, - "loss": 0.212, - "step": 205225 - }, - { - "epoch": 165.93, - "learning_rate": 3.9356769895570765e-05, - "loss": 0.1992, - "step": 205250 - }, - { - "epoch": 165.95, - "learning_rate": 3.930050414115952e-05, - "loss": 0.2029, - "step": 205275 - }, - { - "epoch": 165.97, - "learning_rate": 3.924423838674829e-05, - "loss": 0.2163, - "step": 205300 - }, - { - "epoch": 165.99, - "learning_rate": 3.918797263233705e-05, - "loss": 0.2093, - "step": 205325 - }, - { - "epoch": 166.01, - "learning_rate": 3.913170687792582e-05, - "loss": 0.191, - "step": 205350 - }, - { - "epoch": 166.03, - "learning_rate": 3.907544112351458e-05, - "loss": 0.2049, - "step": 205375 - }, - { - "epoch": 166.05, - "learning_rate": 3.901917536910335e-05, - "loss": 0.1871, - "step": 205400 - }, - { - "epoch": 166.07, - "learning_rate": 3.896290961469211e-05, - "loss": 0.1957, - "step": 205425 - }, - { - "epoch": 166.09, - "learning_rate": 3.8908894490457325e-05, - "loss": 0.19, - "step": 205450 - }, - { - "epoch": 166.11, - "learning_rate": 3.8852628736046096e-05, - "loss": 0.2078, - "step": 205475 - }, - { - "epoch": 166.13, - "learning_rate": 3.879636298163486e-05, - "loss": 0.1838, - "step": 205500 - }, - { - "epoch": 166.15, - "learning_rate": 3.8740097227223626e-05, - "loss": 0.2019, - "step": 205525 - }, - { - "epoch": 166.17, - "learning_rate": 3.868383147281239e-05, - "loss": 0.1774, - "step": 205550 - }, - { - "epoch": 166.19, - "learning_rate": 3.8627565718401155e-05, - "loss": 0.2137, - "step": 205575 - }, - { - "epoch": 166.21, - "learning_rate": 3.857129996398992e-05, - "loss": 0.2002, - "step": 205600 - }, - { - "epoch": 166.23, - "learning_rate": 3.8515034209578685e-05, - "loss": 0.1927, - "step": 205625 - }, - { - "epoch": 166.25, - "learning_rate": 3.845876845516745e-05, - "loss": 0.1999, - "step": 205650 - }, - { - "epoch": 166.27, - "learning_rate": 3.8402502700756214e-05, - "loss": 0.2, - "step": 205675 - }, - { - "epoch": 166.29, - "learning_rate": 3.834623694634497e-05, - "loss": 0.1938, - "step": 205700 - }, - { - "epoch": 166.31, - "learning_rate": 3.828997119193374e-05, - "loss": 0.2143, - "step": 205725 - }, - { - "epoch": 166.33, - "learning_rate": 3.82337054375225e-05, - "loss": 0.1971, - "step": 205750 - }, - { - "epoch": 166.35, - "learning_rate": 3.817743968311127e-05, - "loss": 0.2325, - "step": 205775 - }, - { - "epoch": 166.37, - "learning_rate": 3.812117392870004e-05, - "loss": 0.2128, - "step": 205800 - }, - { - "epoch": 166.39, - "learning_rate": 3.80649081742888e-05, - "loss": 0.1917, - "step": 205825 - }, - { - "epoch": 166.41, - "learning_rate": 3.800864241987757e-05, - "loss": 0.179, - "step": 205850 - }, - { - "epoch": 166.43, - "learning_rate": 3.795237666546633e-05, - "loss": 0.195, - "step": 205875 - }, - { - "epoch": 166.45, - "learning_rate": 3.78961109110551e-05, - "loss": 0.2235, - "step": 205900 - }, - { - "epoch": 166.47, - "learning_rate": 3.783984515664386e-05, - "loss": 0.2031, - "step": 205925 - }, - { - "epoch": 166.49, - "learning_rate": 3.778357940223263e-05, - "loss": 0.1853, - "step": 205950 - }, - { - "epoch": 166.51, - "learning_rate": 3.772731364782139e-05, - "loss": 0.2208, - "step": 205975 - }, - { - "epoch": 166.53, - "learning_rate": 3.767104789341016e-05, - "loss": 0.1579, - "step": 206000 - }, - { - "epoch": 166.55, - "learning_rate": 3.761478213899892e-05, - "loss": 0.21, - "step": 206025 - }, - { - "epoch": 166.57, - "learning_rate": 3.755851638458768e-05, - "loss": 0.202, - "step": 206050 - }, - { - "epoch": 166.59, - "learning_rate": 3.7502250630176444e-05, - "loss": 0.2098, - "step": 206075 - }, - { - "epoch": 166.61, - "learning_rate": 3.7445984875765216e-05, - "loss": 0.1852, - "step": 206100 - }, - { - "epoch": 166.63, - "learning_rate": 3.738971912135398e-05, - "loss": 0.2041, - "step": 206125 - }, - { - "epoch": 166.65, - "learning_rate": 3.7333453366942746e-05, - "loss": 0.1956, - "step": 206150 - }, - { - "epoch": 166.67, - "learning_rate": 3.727718761253151e-05, - "loss": 0.2027, - "step": 206175 - }, - { - "epoch": 166.69, - "learning_rate": 3.7220921858120275e-05, - "loss": 0.1736, - "step": 206200 - }, - { - "epoch": 166.71, - "learning_rate": 3.716465610370904e-05, - "loss": 0.217, - "step": 206225 - }, - { - "epoch": 166.73, - "learning_rate": 3.7108390349297805e-05, - "loss": 0.1787, - "step": 206250 - }, - { - "epoch": 166.75, - "learning_rate": 3.705212459488657e-05, - "loss": 0.1932, - "step": 206275 - }, - { - "epoch": 166.77, - "learning_rate": 3.6995858840475334e-05, - "loss": 0.1837, - "step": 206300 - }, - { - "epoch": 166.79, - "learning_rate": 3.69395930860641e-05, - "loss": 0.1666, - "step": 206325 - }, - { - "epoch": 166.81, - "learning_rate": 3.6883327331652864e-05, - "loss": 0.1649, - "step": 206350 - }, - { - "epoch": 166.84, - "learning_rate": 3.682706157724163e-05, - "loss": 0.1981, - "step": 206375 - }, - { - "epoch": 166.86, - "learning_rate": 3.677079582283039e-05, - "loss": 0.2142, - "step": 206400 - }, - { - "epoch": 166.88, - "learning_rate": 3.671453006841916e-05, - "loss": 0.2036, - "step": 206425 - }, - { - "epoch": 166.9, - "learning_rate": 3.665826431400792e-05, - "loss": 0.2075, - "step": 206450 - }, - { - "epoch": 166.92, - "learning_rate": 3.660199855959669e-05, - "loss": 0.2142, - "step": 206475 - }, - { - "epoch": 166.94, - "learning_rate": 3.654573280518545e-05, - "loss": 0.1761, - "step": 206500 - }, - { - "epoch": 166.96, - "learning_rate": 3.648946705077422e-05, - "loss": 0.1917, - "step": 206525 - }, - { - "epoch": 166.98, - "learning_rate": 3.643320129636298e-05, - "loss": 0.2077, - "step": 206550 - }, - { - "epoch": 167.0, - "learning_rate": 3.637693554195175e-05, - "loss": 0.1955, - "step": 206575 - }, - { - "epoch": 167.02, - "learning_rate": 3.632066978754051e-05, - "loss": 0.2168, - "step": 206600 - }, - { - "epoch": 167.04, - "learning_rate": 3.626440403312928e-05, - "loss": 0.2142, - "step": 206625 - }, - { - "epoch": 167.06, - "learning_rate": 3.620813827871804e-05, - "loss": 0.1914, - "step": 206650 - }, - { - "epoch": 167.08, - "learning_rate": 3.6151872524306806e-05, - "loss": 0.215, - "step": 206675 - }, - { - "epoch": 167.1, - "learning_rate": 3.609560676989557e-05, - "loss": 0.2052, - "step": 206700 - }, - { - "epoch": 167.12, - "learning_rate": 3.6039341015484336e-05, - "loss": 0.2032, - "step": 206725 - }, - { - "epoch": 167.14, - "learning_rate": 3.598307526107311e-05, - "loss": 0.1999, - "step": 206750 - }, - { - "epoch": 167.16, - "learning_rate": 3.5926809506661866e-05, - "loss": 0.1718, - "step": 206775 - }, - { - "epoch": 167.18, - "learning_rate": 3.587054375225063e-05, - "loss": 0.187, - "step": 206800 - }, - { - "epoch": 167.2, - "learning_rate": 3.5814277997839395e-05, - "loss": 0.2237, - "step": 206825 - }, - { - "epoch": 167.22, - "learning_rate": 3.575801224342816e-05, - "loss": 0.2192, - "step": 206850 - }, - { - "epoch": 167.24, - "learning_rate": 3.5701746489016925e-05, - "loss": 0.2003, - "step": 206875 - }, - { - "epoch": 167.26, - "learning_rate": 3.564548073460569e-05, - "loss": 0.1946, - "step": 206900 - }, - { - "epoch": 167.28, - "learning_rate": 3.5589214980194454e-05, - "loss": 0.1779, - "step": 206925 - }, - { - "epoch": 167.3, - "learning_rate": 3.553294922578322e-05, - "loss": 0.2129, - "step": 206950 - }, - { - "epoch": 167.32, - "learning_rate": 3.5476683471371984e-05, - "loss": 0.1759, - "step": 206975 - }, - { - "epoch": 167.34, - "learning_rate": 3.542041771696075e-05, - "loss": 0.1797, - "step": 207000 - }, - { - "epoch": 167.34, - "eval_cer": 0.07387349465622209, - "eval_loss": 0.46532440185546875, - "eval_runtime": 150.405, - "eval_samples_per_second": 27.878, - "eval_steps_per_second": 6.975, - "eval_wer": 0.3169004893964111, - "step": 207000 - }, - { - "epoch": 167.36, - "learning_rate": 3.5364151962549514e-05, - "loss": 0.1926, - "step": 207025 - }, - { - "epoch": 167.38, - "learning_rate": 3.530788620813828e-05, - "loss": 0.2108, - "step": 207050 - }, - { - "epoch": 167.4, - "learning_rate": 3.525162045372705e-05, - "loss": 0.2033, - "step": 207075 - }, - { - "epoch": 167.42, - "learning_rate": 3.5195354699315815e-05, - "loss": 0.215, - "step": 207100 - }, - { - "epoch": 167.44, - "learning_rate": 3.513908894490457e-05, - "loss": 0.2169, - "step": 207125 - }, - { - "epoch": 167.46, - "learning_rate": 3.508282319049334e-05, - "loss": 0.1875, - "step": 207150 - }, - { - "epoch": 167.48, - "learning_rate": 3.50265574360821e-05, - "loss": 0.2083, - "step": 207175 - }, - { - "epoch": 167.5, - "learning_rate": 3.497029168167087e-05, - "loss": 0.2057, - "step": 207200 - }, - { - "epoch": 167.52, - "learning_rate": 3.491402592725963e-05, - "loss": 0.2003, - "step": 207225 - }, - { - "epoch": 167.54, - "learning_rate": 3.48577601728484e-05, - "loss": 0.1973, - "step": 207250 - }, - { - "epoch": 167.56, - "learning_rate": 3.480149441843716e-05, - "loss": 0.183, - "step": 207275 - }, - { - "epoch": 167.58, - "learning_rate": 3.4745228664025926e-05, - "loss": 0.2074, - "step": 207300 - }, - { - "epoch": 167.6, - "learning_rate": 3.468896290961469e-05, - "loss": 0.195, - "step": 207325 - }, - { - "epoch": 167.62, - "learning_rate": 3.4632697155203456e-05, - "loss": 0.1961, - "step": 207350 - }, - { - "epoch": 167.64, - "learning_rate": 3.457643140079223e-05, - "loss": 0.2117, - "step": 207375 - }, - { - "epoch": 167.66, - "learning_rate": 3.452016564638099e-05, - "loss": 0.2127, - "step": 207400 - }, - { - "epoch": 167.68, - "learning_rate": 3.446389989196976e-05, - "loss": 0.164, - "step": 207425 - }, - { - "epoch": 167.7, - "learning_rate": 3.440763413755852e-05, - "loss": 0.2018, - "step": 207450 - }, - { - "epoch": 167.72, - "learning_rate": 3.435136838314728e-05, - "loss": 0.1931, - "step": 207475 - }, - { - "epoch": 167.74, - "learning_rate": 3.4295102628736045e-05, - "loss": 0.1934, - "step": 207500 - }, - { - "epoch": 167.76, - "learning_rate": 3.423883687432481e-05, - "loss": 0.1863, - "step": 207525 - }, - { - "epoch": 167.78, - "learning_rate": 3.4182571119913574e-05, - "loss": 0.1935, - "step": 207550 - }, - { - "epoch": 167.81, - "learning_rate": 3.412630536550234e-05, - "loss": 0.1803, - "step": 207575 - }, - { - "epoch": 167.83, - "learning_rate": 3.4070039611091104e-05, - "loss": 0.1956, - "step": 207600 - }, - { - "epoch": 167.85, - "learning_rate": 3.401377385667987e-05, - "loss": 0.1794, - "step": 207625 - }, - { - "epoch": 167.87, - "learning_rate": 3.3957508102268634e-05, - "loss": 0.2416, - "step": 207650 - }, - { - "epoch": 167.89, - "learning_rate": 3.39012423478574e-05, - "loss": 0.1805, - "step": 207675 - }, - { - "epoch": 167.91, - "learning_rate": 3.384497659344617e-05, - "loss": 0.1733, - "step": 207700 - }, - { - "epoch": 167.93, - "learning_rate": 3.3788710839034935e-05, - "loss": 0.1806, - "step": 207725 - }, - { - "epoch": 167.95, - "learning_rate": 3.37324450846237e-05, - "loss": 0.1991, - "step": 207750 - }, - { - "epoch": 167.97, - "learning_rate": 3.3676179330212464e-05, - "loss": 0.1957, - "step": 207775 - }, - { - "epoch": 167.99, - "learning_rate": 3.361991357580123e-05, - "loss": 0.1942, - "step": 207800 - }, - { - "epoch": 168.01, - "learning_rate": 3.356364782138999e-05, - "loss": 0.1886, - "step": 207825 - }, - { - "epoch": 168.03, - "learning_rate": 3.350738206697875e-05, - "loss": 0.1943, - "step": 207850 - }, - { - "epoch": 168.05, - "learning_rate": 3.345111631256752e-05, - "loss": 0.191, - "step": 207875 - }, - { - "epoch": 168.07, - "learning_rate": 3.339485055815628e-05, - "loss": 0.198, - "step": 207900 - }, - { - "epoch": 168.09, - "learning_rate": 3.3338584803745046e-05, - "loss": 0.182, - "step": 207925 - }, - { - "epoch": 168.11, - "learning_rate": 3.328231904933381e-05, - "loss": 0.2229, - "step": 207950 - }, - { - "epoch": 168.13, - "learning_rate": 3.3226053294922576e-05, - "loss": 0.1699, - "step": 207975 - }, - { - "epoch": 168.15, - "learning_rate": 3.316978754051134e-05, - "loss": 0.1911, - "step": 208000 - }, - { - "epoch": 168.17, - "learning_rate": 3.311352178610011e-05, - "loss": 0.2104, - "step": 208025 - }, - { - "epoch": 168.19, - "learning_rate": 3.305725603168888e-05, - "loss": 0.1995, - "step": 208050 - }, - { - "epoch": 168.21, - "learning_rate": 3.300099027727764e-05, - "loss": 0.1987, - "step": 208075 - }, - { - "epoch": 168.23, - "learning_rate": 3.294472452286641e-05, - "loss": 0.2129, - "step": 208100 - }, - { - "epoch": 168.25, - "learning_rate": 3.288845876845517e-05, - "loss": 0.2092, - "step": 208125 - }, - { - "epoch": 168.27, - "learning_rate": 3.2832193014043936e-05, - "loss": 0.2171, - "step": 208150 - }, - { - "epoch": 168.29, - "learning_rate": 3.27759272596327e-05, - "loss": 0.1689, - "step": 208175 - }, - { - "epoch": 168.31, - "learning_rate": 3.271966150522146e-05, - "loss": 0.2163, - "step": 208200 - }, - { - "epoch": 168.33, - "learning_rate": 3.2663395750810224e-05, - "loss": 0.1767, - "step": 208225 - }, - { - "epoch": 168.35, - "learning_rate": 3.260712999639899e-05, - "loss": 0.2149, - "step": 208250 - }, - { - "epoch": 168.37, - "learning_rate": 3.2550864241987754e-05, - "loss": 0.2043, - "step": 208275 - }, - { - "epoch": 168.39, - "learning_rate": 3.249459848757652e-05, - "loss": 0.2012, - "step": 208300 - }, - { - "epoch": 168.41, - "learning_rate": 3.243833273316528e-05, - "loss": 0.2468, - "step": 208325 - }, - { - "epoch": 168.43, - "learning_rate": 3.2382066978754055e-05, - "loss": 0.1984, - "step": 208350 - }, - { - "epoch": 168.45, - "learning_rate": 3.232580122434282e-05, - "loss": 0.2305, - "step": 208375 - }, - { - "epoch": 168.47, - "learning_rate": 3.2269535469931584e-05, - "loss": 0.2011, - "step": 208400 - }, - { - "epoch": 168.49, - "learning_rate": 3.221326971552035e-05, - "loss": 0.1946, - "step": 208425 - }, - { - "epoch": 168.51, - "learning_rate": 3.2157003961109114e-05, - "loss": 0.2048, - "step": 208450 - }, - { - "epoch": 168.53, - "learning_rate": 3.210073820669788e-05, - "loss": 0.187, - "step": 208475 - }, - { - "epoch": 168.55, - "learning_rate": 3.2044472452286644e-05, - "loss": 0.1927, - "step": 208500 - }, - { - "epoch": 168.57, - "learning_rate": 3.198820669787541e-05, - "loss": 0.1787, - "step": 208525 - }, - { - "epoch": 168.59, - "learning_rate": 3.1931940943464166e-05, - "loss": 0.1875, - "step": 208550 - }, - { - "epoch": 168.61, - "learning_rate": 3.187567518905293e-05, - "loss": 0.1975, - "step": 208575 - }, - { - "epoch": 168.63, - "learning_rate": 3.1819409434641696e-05, - "loss": 0.2049, - "step": 208600 - }, - { - "epoch": 168.65, - "learning_rate": 3.176314368023046e-05, - "loss": 0.1778, - "step": 208625 - }, - { - "epoch": 168.67, - "learning_rate": 3.1706877925819226e-05, - "loss": 0.2165, - "step": 208650 - }, - { - "epoch": 168.69, - "learning_rate": 3.1650612171408e-05, - "loss": 0.1997, - "step": 208675 - }, - { - "epoch": 168.71, - "learning_rate": 3.159434641699676e-05, - "loss": 0.1911, - "step": 208700 - }, - { - "epoch": 168.73, - "learning_rate": 3.153808066258553e-05, - "loss": 0.1659, - "step": 208725 - }, - { - "epoch": 168.76, - "learning_rate": 3.148181490817429e-05, - "loss": 0.213, - "step": 208750 - }, - { - "epoch": 168.78, - "learning_rate": 3.1425549153763056e-05, - "loss": 0.2257, - "step": 208775 - }, - { - "epoch": 168.8, - "learning_rate": 3.136928339935182e-05, - "loss": 0.2027, - "step": 208800 - }, - { - "epoch": 168.82, - "learning_rate": 3.1313017644940586e-05, - "loss": 0.2051, - "step": 208825 - }, - { - "epoch": 168.84, - "learning_rate": 3.125675189052935e-05, - "loss": 0.212, - "step": 208850 - }, - { - "epoch": 168.86, - "learning_rate": 3.1200486136118116e-05, - "loss": 0.2062, - "step": 208875 - }, - { - "epoch": 168.88, - "learning_rate": 3.114422038170688e-05, - "loss": 0.1752, - "step": 208900 - }, - { - "epoch": 168.9, - "learning_rate": 3.1087954627295645e-05, - "loss": 0.1771, - "step": 208925 - }, - { - "epoch": 168.92, - "learning_rate": 3.103168887288441e-05, - "loss": 0.1909, - "step": 208950 - }, - { - "epoch": 168.94, - "learning_rate": 3.0975423118473175e-05, - "loss": 0.1723, - "step": 208975 - }, - { - "epoch": 168.96, - "learning_rate": 3.091915736406194e-05, - "loss": 0.2065, - "step": 209000 - }, - { - "epoch": 168.98, - "learning_rate": 3.0862891609650704e-05, - "loss": 0.1911, - "step": 209025 - }, - { - "epoch": 169.0, - "learning_rate": 3.080662585523947e-05, - "loss": 0.1954, - "step": 209050 - }, - { - "epoch": 169.02, - "learning_rate": 3.0750360100828234e-05, - "loss": 0.2045, - "step": 209075 - }, - { - "epoch": 169.04, - "learning_rate": 3.0694094346417e-05, - "loss": 0.1925, - "step": 209100 - }, - { - "epoch": 169.06, - "learning_rate": 3.0637828592005764e-05, - "loss": 0.1893, - "step": 209125 - }, - { - "epoch": 169.08, - "learning_rate": 3.058156283759453e-05, - "loss": 0.1945, - "step": 209150 - }, - { - "epoch": 169.1, - "learning_rate": 3.052529708318329e-05, - "loss": 0.1925, - "step": 209175 - }, - { - "epoch": 169.12, - "learning_rate": 3.0469031328772055e-05, - "loss": 0.1575, - "step": 209200 - }, - { - "epoch": 169.14, - "learning_rate": 3.0412765574360823e-05, - "loss": 0.2029, - "step": 209225 - }, - { - "epoch": 169.16, - "learning_rate": 3.0356499819949588e-05, - "loss": 0.184, - "step": 209250 - }, - { - "epoch": 169.18, - "learning_rate": 3.0300234065538352e-05, - "loss": 0.1891, - "step": 209275 - }, - { - "epoch": 169.2, - "learning_rate": 3.0243968311127117e-05, - "loss": 0.1909, - "step": 209300 - }, - { - "epoch": 169.22, - "learning_rate": 3.0187702556715882e-05, - "loss": 0.2016, - "step": 209325 - }, - { - "epoch": 169.24, - "learning_rate": 3.0131436802304643e-05, - "loss": 0.1868, - "step": 209350 - }, - { - "epoch": 169.26, - "learning_rate": 3.0075171047893408e-05, - "loss": 0.2264, - "step": 209375 - }, - { - "epoch": 169.28, - "learning_rate": 3.0018905293482176e-05, - "loss": 0.1688, - "step": 209400 - }, - { - "epoch": 169.3, - "learning_rate": 2.996263953907094e-05, - "loss": 0.2192, - "step": 209425 - }, - { - "epoch": 169.32, - "learning_rate": 2.9908624414836154e-05, - "loss": 0.1976, - "step": 209450 - }, - { - "epoch": 169.34, - "learning_rate": 2.985235866042492e-05, - "loss": 0.1995, - "step": 209475 - }, - { - "epoch": 169.36, - "learning_rate": 2.9796092906013683e-05, - "loss": 0.2118, - "step": 209500 - }, - { - "epoch": 169.38, - "learning_rate": 2.973982715160245e-05, - "loss": 0.2228, - "step": 209525 - }, - { - "epoch": 169.4, - "learning_rate": 2.9683561397191216e-05, - "loss": 0.1806, - "step": 209550 - }, - { - "epoch": 169.42, - "learning_rate": 2.962729564277998e-05, - "loss": 0.1977, - "step": 209575 - }, - { - "epoch": 169.44, - "learning_rate": 2.9571029888368743e-05, - "loss": 0.1966, - "step": 209600 - }, - { - "epoch": 169.46, - "learning_rate": 2.9514764133957507e-05, - "loss": 0.1841, - "step": 209625 - }, - { - "epoch": 169.48, - "learning_rate": 2.9458498379546272e-05, - "loss": 0.1788, - "step": 209650 - }, - { - "epoch": 169.5, - "learning_rate": 2.9402232625135037e-05, - "loss": 0.189, - "step": 209675 - }, - { - "epoch": 169.52, - "learning_rate": 2.9345966870723805e-05, - "loss": 0.1697, - "step": 209700 - }, - { - "epoch": 169.54, - "learning_rate": 2.928970111631257e-05, - "loss": 0.2083, - "step": 209725 - }, - { - "epoch": 169.56, - "learning_rate": 2.9233435361901335e-05, - "loss": 0.2094, - "step": 209750 - }, - { - "epoch": 169.58, - "learning_rate": 2.9177169607490096e-05, - "loss": 0.2036, - "step": 209775 - }, - { - "epoch": 169.6, - "learning_rate": 2.912090385307886e-05, - "loss": 0.1829, - "step": 209800 - }, - { - "epoch": 169.62, - "learning_rate": 2.9064638098667626e-05, - "loss": 0.195, - "step": 209825 - }, - { - "epoch": 169.64, - "learning_rate": 2.9008372344256394e-05, - "loss": 0.1701, - "step": 209850 - }, - { - "epoch": 169.66, - "learning_rate": 2.895210658984516e-05, - "loss": 0.1991, - "step": 209875 - }, - { - "epoch": 169.68, - "learning_rate": 2.8895840835433924e-05, - "loss": 0.2002, - "step": 209900 - }, - { - "epoch": 169.7, - "learning_rate": 2.883957508102269e-05, - "loss": 0.199, - "step": 209925 - }, - { - "epoch": 169.73, - "learning_rate": 2.878330932661145e-05, - "loss": 0.1758, - "step": 209950 - }, - { - "epoch": 169.75, - "learning_rate": 2.8727043572200215e-05, - "loss": 0.1984, - "step": 209975 - }, - { - "epoch": 169.77, - "learning_rate": 2.867077781778898e-05, - "loss": 0.1841, - "step": 210000 - }, - { - "epoch": 169.77, - "eval_cer": 0.07372462860486843, - "eval_loss": 0.47256383299827576, - "eval_runtime": 150.2166, - "eval_samples_per_second": 27.913, - "eval_steps_per_second": 6.983, - "eval_wer": 0.3164110929853181, - "step": 210000 - }, - { - "epoch": 169.79, - "learning_rate": 2.8614512063377748e-05, - "loss": 0.2131, - "step": 210025 - }, - { - "epoch": 169.81, - "learning_rate": 2.8558246308966512e-05, - "loss": 0.2113, - "step": 210050 - }, - { - "epoch": 169.83, - "learning_rate": 2.8504231184731725e-05, - "loss": 0.2038, - "step": 210075 - }, - { - "epoch": 169.85, - "learning_rate": 2.844796543032049e-05, - "loss": 0.182, - "step": 210100 - }, - { - "epoch": 169.87, - "learning_rate": 2.8391699675909254e-05, - "loss": 0.2077, - "step": 210125 - }, - { - "epoch": 169.89, - "learning_rate": 2.8335433921498023e-05, - "loss": 0.2242, - "step": 210150 - }, - { - "epoch": 169.91, - "learning_rate": 2.8279168167086787e-05, - "loss": 0.2341, - "step": 210175 - }, - { - "epoch": 169.93, - "learning_rate": 2.822290241267555e-05, - "loss": 0.1838, - "step": 210200 - }, - { - "epoch": 169.95, - "learning_rate": 2.8166636658264314e-05, - "loss": 0.2204, - "step": 210225 - }, - { - "epoch": 169.97, - "learning_rate": 2.811037090385308e-05, - "loss": 0.1779, - "step": 210250 - }, - { - "epoch": 169.99, - "learning_rate": 2.8054105149441843e-05, - "loss": 0.224, - "step": 210275 - }, - { - "epoch": 170.01, - "learning_rate": 2.7997839395030608e-05, - "loss": 0.2022, - "step": 210300 - }, - { - "epoch": 170.03, - "learning_rate": 2.7941573640619376e-05, - "loss": 0.179, - "step": 210325 - }, - { - "epoch": 170.05, - "learning_rate": 2.788530788620814e-05, - "loss": 0.1978, - "step": 210350 - }, - { - "epoch": 170.07, - "learning_rate": 2.7829042131796902e-05, - "loss": 0.1825, - "step": 210375 - }, - { - "epoch": 170.09, - "learning_rate": 2.7772776377385667e-05, - "loss": 0.187, - "step": 210400 - }, - { - "epoch": 170.11, - "learning_rate": 2.7716510622974432e-05, - "loss": 0.1917, - "step": 210425 - }, - { - "epoch": 170.13, - "learning_rate": 2.7660244868563197e-05, - "loss": 0.2035, - "step": 210450 - }, - { - "epoch": 170.15, - "learning_rate": 2.7603979114151965e-05, - "loss": 0.1981, - "step": 210475 - }, - { - "epoch": 170.17, - "learning_rate": 2.754771335974073e-05, - "loss": 0.1971, - "step": 210500 - }, - { - "epoch": 170.19, - "learning_rate": 2.7491447605329495e-05, - "loss": 0.1822, - "step": 210525 - }, - { - "epoch": 170.21, - "learning_rate": 2.7435181850918256e-05, - "loss": 0.2026, - "step": 210550 - }, - { - "epoch": 170.23, - "learning_rate": 2.737891609650702e-05, - "loss": 0.2142, - "step": 210575 - }, - { - "epoch": 170.25, - "learning_rate": 2.7322650342095786e-05, - "loss": 0.2011, - "step": 210600 - }, - { - "epoch": 170.27, - "learning_rate": 2.726638458768455e-05, - "loss": 0.1691, - "step": 210625 - }, - { - "epoch": 170.29, - "learning_rate": 2.721011883327332e-05, - "loss": 0.1798, - "step": 210650 - }, - { - "epoch": 170.31, - "learning_rate": 2.7153853078862083e-05, - "loss": 0.1828, - "step": 210675 - }, - { - "epoch": 170.33, - "learning_rate": 2.7097587324450848e-05, - "loss": 0.1837, - "step": 210700 - }, - { - "epoch": 170.35, - "learning_rate": 2.704132157003961e-05, - "loss": 0.1976, - "step": 210725 - }, - { - "epoch": 170.37, - "learning_rate": 2.6985055815628374e-05, - "loss": 0.1898, - "step": 210750 - }, - { - "epoch": 170.39, - "learning_rate": 2.692879006121714e-05, - "loss": 0.1906, - "step": 210775 - }, - { - "epoch": 170.41, - "learning_rate": 2.6872524306805907e-05, - "loss": 0.1866, - "step": 210800 - }, - { - "epoch": 170.43, - "learning_rate": 2.6816258552394672e-05, - "loss": 0.2003, - "step": 210825 - }, - { - "epoch": 170.45, - "learning_rate": 2.6759992797983437e-05, - "loss": 0.1728, - "step": 210850 - }, - { - "epoch": 170.47, - "learning_rate": 2.6703727043572202e-05, - "loss": 0.2115, - "step": 210875 - }, - { - "epoch": 170.49, - "learning_rate": 2.6647461289160967e-05, - "loss": 0.1753, - "step": 210900 - }, - { - "epoch": 170.51, - "learning_rate": 2.6591195534749728e-05, - "loss": 0.1987, - "step": 210925 - }, - { - "epoch": 170.53, - "learning_rate": 2.6534929780338493e-05, - "loss": 0.2055, - "step": 210950 - }, - { - "epoch": 170.55, - "learning_rate": 2.647866402592726e-05, - "loss": 0.2001, - "step": 210975 - }, - { - "epoch": 170.57, - "learning_rate": 2.6422398271516026e-05, - "loss": 0.1894, - "step": 211000 - }, - { - "epoch": 170.59, - "learning_rate": 2.636613251710479e-05, - "loss": 0.2001, - "step": 211025 - }, - { - "epoch": 170.61, - "learning_rate": 2.6309866762693555e-05, - "loss": 0.1836, - "step": 211050 - }, - { - "epoch": 170.63, - "learning_rate": 2.625360100828232e-05, - "loss": 0.2091, - "step": 211075 - }, - { - "epoch": 170.65, - "learning_rate": 2.619733525387108e-05, - "loss": 0.2003, - "step": 211100 - }, - { - "epoch": 170.68, - "learning_rate": 2.614106949945985e-05, - "loss": 0.1955, - "step": 211125 - }, - { - "epoch": 170.7, - "learning_rate": 2.6084803745048615e-05, - "loss": 0.2167, - "step": 211150 - }, - { - "epoch": 170.72, - "learning_rate": 2.602853799063738e-05, - "loss": 0.2527, - "step": 211175 - }, - { - "epoch": 170.74, - "learning_rate": 2.5972272236226144e-05, - "loss": 0.1774, - "step": 211200 - }, - { - "epoch": 170.76, - "learning_rate": 2.591600648181491e-05, - "loss": 0.2093, - "step": 211225 - }, - { - "epoch": 170.78, - "learning_rate": 2.5859740727403674e-05, - "loss": 0.191, - "step": 211250 - }, - { - "epoch": 170.8, - "learning_rate": 2.580347497299244e-05, - "loss": 0.1887, - "step": 211275 - }, - { - "epoch": 170.82, - "learning_rate": 2.5747209218581203e-05, - "loss": 0.2332, - "step": 211300 - }, - { - "epoch": 170.84, - "learning_rate": 2.5690943464169968e-05, - "loss": 0.2154, - "step": 211325 - }, - { - "epoch": 170.86, - "learning_rate": 2.5634677709758733e-05, - "loss": 0.179, - "step": 211350 - }, - { - "epoch": 170.88, - "learning_rate": 2.5578411955347498e-05, - "loss": 0.2106, - "step": 211375 - }, - { - "epoch": 170.9, - "learning_rate": 2.5522146200936263e-05, - "loss": 0.195, - "step": 211400 - }, - { - "epoch": 170.92, - "learning_rate": 2.5465880446525027e-05, - "loss": 0.1931, - "step": 211425 - }, - { - "epoch": 170.94, - "learning_rate": 2.5409614692113792e-05, - "loss": 0.1685, - "step": 211450 - }, - { - "epoch": 170.96, - "learning_rate": 2.5353348937702557e-05, - "loss": 0.1464, - "step": 211475 - }, - { - "epoch": 170.98, - "learning_rate": 2.5297083183291322e-05, - "loss": 0.1778, - "step": 211500 - }, - { - "epoch": 171.0, - "learning_rate": 2.5240817428880087e-05, - "loss": 0.1819, - "step": 211525 - }, - { - "epoch": 171.02, - "learning_rate": 2.518455167446885e-05, - "loss": 0.182, - "step": 211550 - }, - { - "epoch": 171.04, - "learning_rate": 2.5128285920057616e-05, - "loss": 0.1785, - "step": 211575 - }, - { - "epoch": 171.06, - "learning_rate": 2.5072020165646384e-05, - "loss": 0.2206, - "step": 211600 - }, - { - "epoch": 171.08, - "learning_rate": 2.5015754411235146e-05, - "loss": 0.1878, - "step": 211625 - }, - { - "epoch": 171.1, - "learning_rate": 2.495948865682391e-05, - "loss": 0.1952, - "step": 211650 - }, - { - "epoch": 171.12, - "learning_rate": 2.4903222902412675e-05, - "loss": 0.1731, - "step": 211675 - }, - { - "epoch": 171.14, - "learning_rate": 2.484695714800144e-05, - "loss": 0.2236, - "step": 211700 - }, - { - "epoch": 171.16, - "learning_rate": 2.4790691393590205e-05, - "loss": 0.1688, - "step": 211725 - }, - { - "epoch": 171.18, - "learning_rate": 2.4734425639178973e-05, - "loss": 0.1948, - "step": 211750 - }, - { - "epoch": 171.2, - "learning_rate": 2.4678159884767738e-05, - "loss": 0.174, - "step": 211775 - }, - { - "epoch": 171.22, - "learning_rate": 2.46218941303565e-05, - "loss": 0.174, - "step": 211800 - }, - { - "epoch": 171.24, - "learning_rate": 2.4565628375945264e-05, - "loss": 0.1988, - "step": 211825 - }, - { - "epoch": 171.26, - "learning_rate": 2.450936262153403e-05, - "loss": 0.2113, - "step": 211850 - }, - { - "epoch": 171.28, - "learning_rate": 2.4453096867122794e-05, - "loss": 0.1769, - "step": 211875 - }, - { - "epoch": 171.3, - "learning_rate": 2.439683111271156e-05, - "loss": 0.1963, - "step": 211900 - }, - { - "epoch": 171.32, - "learning_rate": 2.4340565358300327e-05, - "loss": 0.161, - "step": 211925 - }, - { - "epoch": 171.34, - "learning_rate": 2.428429960388909e-05, - "loss": 0.1801, - "step": 211950 - }, - { - "epoch": 171.36, - "learning_rate": 2.4228033849477853e-05, - "loss": 0.1774, - "step": 211975 - }, - { - "epoch": 171.38, - "learning_rate": 2.4171768095066618e-05, - "loss": 0.1972, - "step": 212000 - }, - { - "epoch": 171.4, - "learning_rate": 2.4115502340655383e-05, - "loss": 0.208, - "step": 212025 - }, - { - "epoch": 171.42, - "learning_rate": 2.4059236586244147e-05, - "loss": 0.1966, - "step": 212050 - }, - { - "epoch": 171.44, - "learning_rate": 2.4002970831832916e-05, - "loss": 0.165, - "step": 212075 - }, - { - "epoch": 171.46, - "learning_rate": 2.394670507742168e-05, - "loss": 0.2033, - "step": 212100 - }, - { - "epoch": 171.48, - "learning_rate": 2.3890439323010445e-05, - "loss": 0.164, - "step": 212125 - }, - { - "epoch": 171.5, - "learning_rate": 2.3834173568599207e-05, - "loss": 0.2168, - "step": 212150 - }, - { - "epoch": 171.52, - "learning_rate": 2.377790781418797e-05, - "loss": 0.2013, - "step": 212175 - }, - { - "epoch": 171.54, - "learning_rate": 2.3721642059776736e-05, - "loss": 0.1935, - "step": 212200 - }, - { - "epoch": 171.56, - "learning_rate": 2.36653763053655e-05, - "loss": 0.1854, - "step": 212225 - }, - { - "epoch": 171.58, - "learning_rate": 2.360911055095427e-05, - "loss": 0.2133, - "step": 212250 - }, - { - "epoch": 171.6, - "learning_rate": 2.3552844796543034e-05, - "loss": 0.1806, - "step": 212275 - }, - { - "epoch": 171.62, - "learning_rate": 2.34965790421318e-05, - "loss": 0.1823, - "step": 212300 - }, - { - "epoch": 171.65, - "learning_rate": 2.3440313287720564e-05, - "loss": 0.2023, - "step": 212325 - }, - { - "epoch": 171.67, - "learning_rate": 2.3384047533309325e-05, - "loss": 0.1978, - "step": 212350 - }, - { - "epoch": 171.69, - "learning_rate": 2.332778177889809e-05, - "loss": 0.1572, - "step": 212375 - }, - { - "epoch": 171.71, - "learning_rate": 2.3271516024486858e-05, - "loss": 0.2218, - "step": 212400 - }, - { - "epoch": 171.73, - "learning_rate": 2.3215250270075623e-05, - "loss": 0.1984, - "step": 212425 - }, - { - "epoch": 171.75, - "learning_rate": 2.3158984515664388e-05, - "loss": 0.2029, - "step": 212450 - }, - { - "epoch": 171.77, - "learning_rate": 2.3102718761253152e-05, - "loss": 0.1627, - "step": 212475 - }, - { - "epoch": 171.79, - "learning_rate": 2.3046453006841917e-05, - "loss": 0.1642, - "step": 212500 - }, - { - "epoch": 171.81, - "learning_rate": 2.299018725243068e-05, - "loss": 0.1891, - "step": 212525 - }, - { - "epoch": 171.83, - "learning_rate": 2.2933921498019443e-05, - "loss": 0.2037, - "step": 212550 - }, - { - "epoch": 171.85, - "learning_rate": 2.287765574360821e-05, - "loss": 0.1781, - "step": 212575 - }, - { - "epoch": 171.87, - "learning_rate": 2.2821389989196976e-05, - "loss": 0.1949, - "step": 212600 - }, - { - "epoch": 171.89, - "learning_rate": 2.276512423478574e-05, - "loss": 0.1819, - "step": 212625 - }, - { - "epoch": 171.91, - "learning_rate": 2.2708858480374506e-05, - "loss": 0.1855, - "step": 212650 - }, - { - "epoch": 171.93, - "learning_rate": 2.265259272596327e-05, - "loss": 0.1808, - "step": 212675 - }, - { - "epoch": 171.95, - "learning_rate": 2.2596326971552032e-05, - "loss": 0.1994, - "step": 212700 - }, - { - "epoch": 171.97, - "learning_rate": 2.25400612171408e-05, - "loss": 0.1876, - "step": 212725 - }, - { - "epoch": 171.99, - "learning_rate": 2.2483795462729565e-05, - "loss": 0.2074, - "step": 212750 - }, - { - "epoch": 172.01, - "learning_rate": 2.242752970831833e-05, - "loss": 0.1808, - "step": 212775 - }, - { - "epoch": 172.03, - "learning_rate": 2.2371263953907095e-05, - "loss": 0.1895, - "step": 212800 - }, - { - "epoch": 172.05, - "learning_rate": 2.231499819949586e-05, - "loss": 0.1993, - "step": 212825 - }, - { - "epoch": 172.07, - "learning_rate": 2.2258732445084624e-05, - "loss": 0.2055, - "step": 212850 - }, - { - "epoch": 172.09, - "learning_rate": 2.220246669067339e-05, - "loss": 0.2277, - "step": 212875 - }, - { - "epoch": 172.11, - "learning_rate": 2.2146200936262154e-05, - "loss": 0.2017, - "step": 212900 - }, - { - "epoch": 172.13, - "learning_rate": 2.208993518185092e-05, - "loss": 0.1825, - "step": 212925 - }, - { - "epoch": 172.15, - "learning_rate": 2.2033669427439684e-05, - "loss": 0.1839, - "step": 212950 - }, - { - "epoch": 172.17, - "learning_rate": 2.197740367302845e-05, - "loss": 0.1796, - "step": 212975 - }, - { - "epoch": 172.19, - "learning_rate": 2.1921137918617213e-05, - "loss": 0.1774, - "step": 213000 - }, - { - "epoch": 172.19, - "eval_cer": 0.07383756147141259, - "eval_loss": 0.4742075204849243, - "eval_runtime": 150.533, - "eval_samples_per_second": 27.854, - "eval_steps_per_second": 6.969, - "eval_wer": 0.3161500815660685, - "step": 213000 - }, - { - "epoch": 172.21, - "learning_rate": 2.1864872164205978e-05, - "loss": 0.1943, - "step": 213025 - }, - { - "epoch": 172.23, - "learning_rate": 2.1808606409794743e-05, - "loss": 0.1907, - "step": 213050 - }, - { - "epoch": 172.25, - "learning_rate": 2.1752340655383508e-05, - "loss": 0.1743, - "step": 213075 - }, - { - "epoch": 172.27, - "learning_rate": 2.1696074900972272e-05, - "loss": 0.1985, - "step": 213100 - }, - { - "epoch": 172.29, - "learning_rate": 2.1639809146561037e-05, - "loss": 0.2295, - "step": 213125 - }, - { - "epoch": 172.31, - "learning_rate": 2.1583543392149802e-05, - "loss": 0.1958, - "step": 213150 - }, - { - "epoch": 172.33, - "learning_rate": 2.1527277637738567e-05, - "loss": 0.1732, - "step": 213175 - }, - { - "epoch": 172.35, - "learning_rate": 2.1471011883327335e-05, - "loss": 0.2084, - "step": 213200 - }, - { - "epoch": 172.37, - "learning_rate": 2.1414746128916096e-05, - "loss": 0.1851, - "step": 213225 - }, - { - "epoch": 172.39, - "learning_rate": 2.135848037450486e-05, - "loss": 0.1872, - "step": 213250 - }, - { - "epoch": 172.41, - "learning_rate": 2.1302214620093626e-05, - "loss": 0.1918, - "step": 213275 - }, - { - "epoch": 172.43, - "learning_rate": 2.124594886568239e-05, - "loss": 0.1829, - "step": 213300 - }, - { - "epoch": 172.45, - "learning_rate": 2.1189683111271156e-05, - "loss": 0.1753, - "step": 213325 - }, - { - "epoch": 172.47, - "learning_rate": 2.1133417356859924e-05, - "loss": 0.1865, - "step": 213350 - }, - { - "epoch": 172.49, - "learning_rate": 2.107715160244869e-05, - "loss": 0.1732, - "step": 213375 - }, - { - "epoch": 172.51, - "learning_rate": 2.102088584803745e-05, - "loss": 0.1706, - "step": 213400 - }, - { - "epoch": 172.53, - "learning_rate": 2.0964620093626215e-05, - "loss": 0.1697, - "step": 213425 - }, - { - "epoch": 172.55, - "learning_rate": 2.090835433921498e-05, - "loss": 0.1971, - "step": 213450 - }, - { - "epoch": 172.57, - "learning_rate": 2.0852088584803744e-05, - "loss": 0.1733, - "step": 213475 - }, - { - "epoch": 172.59, - "learning_rate": 2.079582283039251e-05, - "loss": 0.1894, - "step": 213500 - }, - { - "epoch": 172.62, - "learning_rate": 2.0739557075981277e-05, - "loss": 0.1866, - "step": 213525 - }, - { - "epoch": 172.64, - "learning_rate": 2.0683291321570042e-05, - "loss": 0.1746, - "step": 213550 - }, - { - "epoch": 172.66, - "learning_rate": 2.0627025567158804e-05, - "loss": 0.1751, - "step": 213575 - }, - { - "epoch": 172.68, - "learning_rate": 2.057075981274757e-05, - "loss": 0.1906, - "step": 213600 - }, - { - "epoch": 172.7, - "learning_rate": 2.0514494058336333e-05, - "loss": 0.1656, - "step": 213625 - }, - { - "epoch": 172.72, - "learning_rate": 2.0458228303925098e-05, - "loss": 0.1831, - "step": 213650 - }, - { - "epoch": 172.74, - "learning_rate": 2.0401962549513866e-05, - "loss": 0.1708, - "step": 213675 - }, - { - "epoch": 172.76, - "learning_rate": 2.034569679510263e-05, - "loss": 0.1831, - "step": 213700 - }, - { - "epoch": 172.78, - "learning_rate": 2.0289431040691396e-05, - "loss": 0.1732, - "step": 213725 - }, - { - "epoch": 172.8, - "learning_rate": 2.023316528628016e-05, - "loss": 0.1691, - "step": 213750 - }, - { - "epoch": 172.82, - "learning_rate": 2.0176899531868922e-05, - "loss": 0.1903, - "step": 213775 - }, - { - "epoch": 172.84, - "learning_rate": 2.0120633777457687e-05, - "loss": 0.1739, - "step": 213800 - }, - { - "epoch": 172.86, - "learning_rate": 2.006436802304645e-05, - "loss": 0.1475, - "step": 213825 - }, - { - "epoch": 172.88, - "learning_rate": 2.000810226863522e-05, - "loss": 0.1844, - "step": 213850 - }, - { - "epoch": 172.9, - "learning_rate": 1.9951836514223985e-05, - "loss": 0.1972, - "step": 213875 - }, - { - "epoch": 172.92, - "learning_rate": 1.989557075981275e-05, - "loss": 0.1912, - "step": 213900 - }, - { - "epoch": 172.94, - "learning_rate": 1.9839305005401514e-05, - "loss": 0.1762, - "step": 213925 - }, - { - "epoch": 172.96, - "learning_rate": 1.9783039250990276e-05, - "loss": 0.2016, - "step": 213950 - }, - { - "epoch": 172.98, - "learning_rate": 1.972677349657904e-05, - "loss": 0.1875, - "step": 213975 - }, - { - "epoch": 173.0, - "learning_rate": 1.967050774216781e-05, - "loss": 0.1957, - "step": 214000 - }, - { - "epoch": 173.02, - "learning_rate": 1.9614241987756573e-05, - "loss": 0.2098, - "step": 214025 - }, - { - "epoch": 173.04, - "learning_rate": 1.9557976233345338e-05, - "loss": 0.2055, - "step": 214050 - }, - { - "epoch": 173.06, - "learning_rate": 1.9501710478934103e-05, - "loss": 0.2312, - "step": 214075 - }, - { - "epoch": 173.08, - "learning_rate": 1.9445444724522868e-05, - "loss": 0.1761, - "step": 214100 - }, - { - "epoch": 173.1, - "learning_rate": 1.938917897011163e-05, - "loss": 0.2061, - "step": 214125 - }, - { - "epoch": 173.12, - "learning_rate": 1.9332913215700394e-05, - "loss": 0.1726, - "step": 214150 - }, - { - "epoch": 173.14, - "learning_rate": 1.9276647461289162e-05, - "loss": 0.1935, - "step": 214175 - }, - { - "epoch": 173.16, - "learning_rate": 1.9222632337054375e-05, - "loss": 0.1552, - "step": 214200 - }, - { - "epoch": 173.18, - "learning_rate": 1.916636658264314e-05, - "loss": 0.2189, - "step": 214225 - }, - { - "epoch": 173.2, - "learning_rate": 1.9110100828231904e-05, - "loss": 0.1777, - "step": 214250 - }, - { - "epoch": 173.22, - "learning_rate": 1.905383507382067e-05, - "loss": 0.1906, - "step": 214275 - }, - { - "epoch": 173.24, - "learning_rate": 1.8997569319409437e-05, - "loss": 0.1802, - "step": 214300 - }, - { - "epoch": 173.26, - "learning_rate": 1.8941303564998202e-05, - "loss": 0.2032, - "step": 214325 - }, - { - "epoch": 173.28, - "learning_rate": 1.8885037810586967e-05, - "loss": 0.1831, - "step": 214350 - }, - { - "epoch": 173.3, - "learning_rate": 1.882877205617573e-05, - "loss": 0.2136, - "step": 214375 - }, - { - "epoch": 173.32, - "learning_rate": 1.8772506301764493e-05, - "loss": 0.1647, - "step": 214400 - }, - { - "epoch": 173.34, - "learning_rate": 1.8716240547353258e-05, - "loss": 0.188, - "step": 214425 - }, - { - "epoch": 173.36, - "learning_rate": 1.8659974792942023e-05, - "loss": 0.1585, - "step": 214450 - }, - { - "epoch": 173.38, - "learning_rate": 1.860370903853079e-05, - "loss": 0.1829, - "step": 214475 - }, - { - "epoch": 173.4, - "learning_rate": 1.8547443284119556e-05, - "loss": 0.1478, - "step": 214500 - }, - { - "epoch": 173.42, - "learning_rate": 1.849117752970832e-05, - "loss": 0.2183, - "step": 214525 - }, - { - "epoch": 173.44, - "learning_rate": 1.8434911775297082e-05, - "loss": 0.1815, - "step": 214550 - }, - { - "epoch": 173.46, - "learning_rate": 1.8378646020885847e-05, - "loss": 0.2044, - "step": 214575 - }, - { - "epoch": 173.48, - "learning_rate": 1.832238026647461e-05, - "loss": 0.1693, - "step": 214600 - }, - { - "epoch": 173.5, - "learning_rate": 1.826611451206338e-05, - "loss": 0.1877, - "step": 214625 - }, - { - "epoch": 173.52, - "learning_rate": 1.8209848757652144e-05, - "loss": 0.1964, - "step": 214650 - }, - { - "epoch": 173.54, - "learning_rate": 1.815358300324091e-05, - "loss": 0.2049, - "step": 214675 - }, - { - "epoch": 173.57, - "learning_rate": 1.8097317248829674e-05, - "loss": 0.179, - "step": 214700 - }, - { - "epoch": 173.59, - "learning_rate": 1.8041051494418436e-05, - "loss": 0.1841, - "step": 214725 - }, - { - "epoch": 173.61, - "learning_rate": 1.79847857400072e-05, - "loss": 0.1635, - "step": 214750 - }, - { - "epoch": 173.63, - "learning_rate": 1.7928519985595965e-05, - "loss": 0.1895, - "step": 214775 - }, - { - "epoch": 173.65, - "learning_rate": 1.7872254231184733e-05, - "loss": 0.1776, - "step": 214800 - }, - { - "epoch": 173.67, - "learning_rate": 1.7815988476773498e-05, - "loss": 0.1817, - "step": 214825 - }, - { - "epoch": 173.69, - "learning_rate": 1.7759722722362263e-05, - "loss": 0.1557, - "step": 214850 - }, - { - "epoch": 173.71, - "learning_rate": 1.7703456967951028e-05, - "loss": 0.207, - "step": 214875 - }, - { - "epoch": 173.73, - "learning_rate": 1.764719121353979e-05, - "loss": 0.1831, - "step": 214900 - }, - { - "epoch": 173.75, - "learning_rate": 1.7590925459128554e-05, - "loss": 0.2335, - "step": 214925 - }, - { - "epoch": 173.77, - "learning_rate": 1.7534659704717322e-05, - "loss": 0.2001, - "step": 214950 - }, - { - "epoch": 173.79, - "learning_rate": 1.7478393950306087e-05, - "loss": 0.2077, - "step": 214975 - }, - { - "epoch": 173.81, - "learning_rate": 1.742212819589485e-05, - "loss": 0.1638, - "step": 215000 - }, - { - "epoch": 173.83, - "learning_rate": 1.7365862441483616e-05, - "loss": 0.2241, - "step": 215025 - }, - { - "epoch": 173.85, - "learning_rate": 1.730959668707238e-05, - "loss": 0.1736, - "step": 215050 - }, - { - "epoch": 173.87, - "learning_rate": 1.7253330932661143e-05, - "loss": 0.2111, - "step": 215075 - }, - { - "epoch": 173.89, - "learning_rate": 1.719706517824991e-05, - "loss": 0.1622, - "step": 215100 - }, - { - "epoch": 173.91, - "learning_rate": 1.7140799423838676e-05, - "loss": 0.1935, - "step": 215125 - }, - { - "epoch": 173.93, - "learning_rate": 1.708453366942744e-05, - "loss": 0.1882, - "step": 215150 - }, - { - "epoch": 173.95, - "learning_rate": 1.7028267915016205e-05, - "loss": 0.2091, - "step": 215175 - }, - { - "epoch": 173.97, - "learning_rate": 1.697200216060497e-05, - "loss": 0.1914, - "step": 215200 - }, - { - "epoch": 173.99, - "learning_rate": 1.6915736406193735e-05, - "loss": 0.1978, - "step": 215225 - }, - { - "epoch": 174.01, - "learning_rate": 1.6859470651782496e-05, - "loss": 0.1971, - "step": 215250 - }, - { - "epoch": 174.03, - "learning_rate": 1.6803204897371264e-05, - "loss": 0.19, - "step": 215275 - }, - { - "epoch": 174.05, - "learning_rate": 1.674693914296003e-05, - "loss": 0.1619, - "step": 215300 - }, - { - "epoch": 174.07, - "learning_rate": 1.6690673388548794e-05, - "loss": 0.1741, - "step": 215325 - }, - { - "epoch": 174.09, - "learning_rate": 1.663440763413756e-05, - "loss": 0.1616, - "step": 215350 - }, - { - "epoch": 174.11, - "learning_rate": 1.6578141879726324e-05, - "loss": 0.2239, - "step": 215375 - }, - { - "epoch": 174.13, - "learning_rate": 1.652187612531509e-05, - "loss": 0.1858, - "step": 215400 - }, - { - "epoch": 174.15, - "learning_rate": 1.6465610370903853e-05, - "loss": 0.1955, - "step": 215425 - }, - { - "epoch": 174.17, - "learning_rate": 1.6409344616492618e-05, - "loss": 0.1749, - "step": 215450 - }, - { - "epoch": 174.19, - "learning_rate": 1.6353078862081383e-05, - "loss": 0.1855, - "step": 215475 - }, - { - "epoch": 174.21, - "learning_rate": 1.6296813107670148e-05, - "loss": 0.1706, - "step": 215500 - }, - { - "epoch": 174.23, - "learning_rate": 1.6240547353258912e-05, - "loss": 0.2086, - "step": 215525 - }, - { - "epoch": 174.25, - "learning_rate": 1.6184281598847677e-05, - "loss": 0.188, - "step": 215550 - }, - { - "epoch": 174.27, - "learning_rate": 1.6128015844436442e-05, - "loss": 0.1997, - "step": 215575 - }, - { - "epoch": 174.29, - "learning_rate": 1.607175009002521e-05, - "loss": 0.1771, - "step": 215600 - }, - { - "epoch": 174.31, - "learning_rate": 1.601548433561397e-05, - "loss": 0.1922, - "step": 215625 - }, - { - "epoch": 174.33, - "learning_rate": 1.5959218581202736e-05, - "loss": 0.1818, - "step": 215650 - }, - { - "epoch": 174.35, - "learning_rate": 1.590520345696795e-05, - "loss": 0.2173, - "step": 215675 - }, - { - "epoch": 174.37, - "learning_rate": 1.5848937702556714e-05, - "loss": 0.1975, - "step": 215700 - }, - { - "epoch": 174.39, - "learning_rate": 1.579267194814548e-05, - "loss": 0.1748, - "step": 215725 - }, - { - "epoch": 174.41, - "learning_rate": 1.5736406193734247e-05, - "loss": 0.1873, - "step": 215750 - }, - { - "epoch": 174.43, - "learning_rate": 1.568014043932301e-05, - "loss": 0.1777, - "step": 215775 - }, - { - "epoch": 174.45, - "learning_rate": 1.5623874684911776e-05, - "loss": 0.2143, - "step": 215800 - }, - { - "epoch": 174.47, - "learning_rate": 1.556760893050054e-05, - "loss": 0.1641, - "step": 215825 - }, - { - "epoch": 174.49, - "learning_rate": 1.5511343176089306e-05, - "loss": 0.1788, - "step": 215850 - }, - { - "epoch": 174.51, - "learning_rate": 1.545507742167807e-05, - "loss": 0.1697, - "step": 215875 - }, - { - "epoch": 174.54, - "learning_rate": 1.5398811667266836e-05, - "loss": 0.1693, - "step": 215900 - }, - { - "epoch": 174.56, - "learning_rate": 1.53425459128556e-05, - "loss": 0.1963, - "step": 215925 - }, - { - "epoch": 174.58, - "learning_rate": 1.5286280158444365e-05, - "loss": 0.2001, - "step": 215950 - }, - { - "epoch": 174.6, - "learning_rate": 1.523001440403313e-05, - "loss": 0.1966, - "step": 215975 - }, - { - "epoch": 174.62, - "learning_rate": 1.5173748649621893e-05, - "loss": 0.1819, - "step": 216000 - }, - { - "epoch": 174.62, - "eval_cer": 0.07368869542005893, - "eval_loss": 0.4719657897949219, - "eval_runtime": 150.9063, - "eval_samples_per_second": 27.785, - "eval_steps_per_second": 6.951, - "eval_wer": 0.31491027732463295, - "step": 216000 - }, - { - "epoch": 174.64, - "learning_rate": 1.511748289521066e-05, - "loss": 0.1881, - "step": 216025 - }, - { - "epoch": 174.66, - "learning_rate": 1.5061217140799424e-05, - "loss": 0.1883, - "step": 216050 - }, - { - "epoch": 174.68, - "learning_rate": 1.500495138638819e-05, - "loss": 0.1639, - "step": 216075 - }, - { - "epoch": 174.7, - "learning_rate": 1.4950936262153404e-05, - "loss": 0.2041, - "step": 216100 - }, - { - "epoch": 174.72, - "learning_rate": 1.4894670507742168e-05, - "loss": 0.1736, - "step": 216125 - }, - { - "epoch": 174.74, - "learning_rate": 1.4838404753330931e-05, - "loss": 0.2013, - "step": 216150 - }, - { - "epoch": 174.76, - "learning_rate": 1.4782138998919698e-05, - "loss": 0.1711, - "step": 216175 - }, - { - "epoch": 174.78, - "learning_rate": 1.4725873244508463e-05, - "loss": 0.1801, - "step": 216200 - }, - { - "epoch": 174.8, - "learning_rate": 1.4669607490097227e-05, - "loss": 0.1786, - "step": 216225 - }, - { - "epoch": 174.82, - "learning_rate": 1.4613341735685992e-05, - "loss": 0.1562, - "step": 216250 - }, - { - "epoch": 174.84, - "learning_rate": 1.4557075981274757e-05, - "loss": 0.1903, - "step": 216275 - }, - { - "epoch": 174.86, - "learning_rate": 1.4500810226863522e-05, - "loss": 0.2086, - "step": 216300 - }, - { - "epoch": 174.88, - "learning_rate": 1.4444544472452288e-05, - "loss": 0.1597, - "step": 216325 - }, - { - "epoch": 174.9, - "learning_rate": 1.4388278718041051e-05, - "loss": 0.1638, - "step": 216350 - }, - { - "epoch": 174.92, - "learning_rate": 1.4332012963629816e-05, - "loss": 0.1867, - "step": 216375 - }, - { - "epoch": 174.94, - "learning_rate": 1.4275747209218583e-05, - "loss": 0.1839, - "step": 216400 - }, - { - "epoch": 174.96, - "learning_rate": 1.4219481454807346e-05, - "loss": 0.2063, - "step": 216425 - }, - { - "epoch": 174.98, - "learning_rate": 1.416321570039611e-05, - "loss": 0.1848, - "step": 216450 - }, - { - "epoch": 175.0, - "learning_rate": 1.4106949945984877e-05, - "loss": 0.2096, - "step": 216475 - }, - { - "epoch": 175.02, - "learning_rate": 1.4050684191573642e-05, - "loss": 0.2003, - "step": 216500 - }, - { - "epoch": 175.04, - "learning_rate": 1.3994418437162405e-05, - "loss": 0.1422, - "step": 216525 - }, - { - "epoch": 175.06, - "learning_rate": 1.393815268275117e-05, - "loss": 0.1863, - "step": 216550 - }, - { - "epoch": 175.08, - "learning_rate": 1.3881886928339936e-05, - "loss": 0.1946, - "step": 216575 - }, - { - "epoch": 175.1, - "learning_rate": 1.38256211739287e-05, - "loss": 0.1949, - "step": 216600 - }, - { - "epoch": 175.12, - "learning_rate": 1.3769355419517464e-05, - "loss": 0.1733, - "step": 216625 - }, - { - "epoch": 175.14, - "learning_rate": 1.371308966510623e-05, - "loss": 0.197, - "step": 216650 - }, - { - "epoch": 175.16, - "learning_rate": 1.3656823910694996e-05, - "loss": 0.1728, - "step": 216675 - }, - { - "epoch": 175.18, - "learning_rate": 1.3600558156283759e-05, - "loss": 0.2056, - "step": 216700 - }, - { - "epoch": 175.2, - "learning_rate": 1.3544292401872525e-05, - "loss": 0.1502, - "step": 216725 - }, - { - "epoch": 175.22, - "learning_rate": 1.348802664746129e-05, - "loss": 0.1941, - "step": 216750 - }, - { - "epoch": 175.24, - "learning_rate": 1.3431760893050053e-05, - "loss": 0.1666, - "step": 216775 - }, - { - "epoch": 175.26, - "learning_rate": 1.337549513863882e-05, - "loss": 0.2049, - "step": 216800 - }, - { - "epoch": 175.28, - "learning_rate": 1.3319229384227584e-05, - "loss": 0.172, - "step": 216825 - }, - { - "epoch": 175.3, - "learning_rate": 1.326296362981635e-05, - "loss": 0.1989, - "step": 216850 - }, - { - "epoch": 175.32, - "learning_rate": 1.3206697875405114e-05, - "loss": 0.1849, - "step": 216875 - }, - { - "epoch": 175.34, - "learning_rate": 1.3150432120993879e-05, - "loss": 0.1806, - "step": 216900 - }, - { - "epoch": 175.36, - "learning_rate": 1.3094166366582644e-05, - "loss": 0.196, - "step": 216925 - }, - { - "epoch": 175.38, - "learning_rate": 1.3037900612171407e-05, - "loss": 0.2048, - "step": 216950 - }, - { - "epoch": 175.4, - "learning_rate": 1.2981634857760173e-05, - "loss": 0.1698, - "step": 216975 - }, - { - "epoch": 175.42, - "learning_rate": 1.2925369103348938e-05, - "loss": 0.203, - "step": 217000 - }, - { - "epoch": 175.44, - "learning_rate": 1.2869103348937703e-05, - "loss": 0.1793, - "step": 217025 - }, - { - "epoch": 175.46, - "learning_rate": 1.2812837594526468e-05, - "loss": 0.1805, - "step": 217050 - }, - { - "epoch": 175.49, - "learning_rate": 1.2756571840115232e-05, - "loss": 0.1815, - "step": 217075 - }, - { - "epoch": 175.51, - "learning_rate": 1.2700306085703997e-05, - "loss": 0.1887, - "step": 217100 - }, - { - "epoch": 175.53, - "learning_rate": 1.2644040331292764e-05, - "loss": 0.1623, - "step": 217125 - }, - { - "epoch": 175.55, - "learning_rate": 1.2587774576881527e-05, - "loss": 0.1942, - "step": 217150 - }, - { - "epoch": 175.57, - "learning_rate": 1.2531508822470292e-05, - "loss": 0.182, - "step": 217175 - }, - { - "epoch": 175.59, - "learning_rate": 1.2475243068059058e-05, - "loss": 0.1871, - "step": 217200 - }, - { - "epoch": 175.61, - "learning_rate": 1.2418977313647821e-05, - "loss": 0.1582, - "step": 217225 - }, - { - "epoch": 175.63, - "learning_rate": 1.2362711559236586e-05, - "loss": 0.2343, - "step": 217250 - }, - { - "epoch": 175.65, - "learning_rate": 1.2306445804825352e-05, - "loss": 0.1563, - "step": 217275 - }, - { - "epoch": 175.67, - "learning_rate": 1.2250180050414117e-05, - "loss": 0.1861, - "step": 217300 - }, - { - "epoch": 175.69, - "learning_rate": 1.219391429600288e-05, - "loss": 0.1569, - "step": 217325 - }, - { - "epoch": 175.71, - "learning_rate": 1.2137648541591645e-05, - "loss": 0.1992, - "step": 217350 - }, - { - "epoch": 175.73, - "learning_rate": 1.2081382787180412e-05, - "loss": 0.1648, - "step": 217375 - }, - { - "epoch": 175.75, - "learning_rate": 1.2025117032769175e-05, - "loss": 0.2176, - "step": 217400 - }, - { - "epoch": 175.77, - "learning_rate": 1.196885127835794e-05, - "loss": 0.1642, - "step": 217425 - }, - { - "epoch": 175.79, - "learning_rate": 1.1912585523946706e-05, - "loss": 0.1833, - "step": 217450 - }, - { - "epoch": 175.81, - "learning_rate": 1.1856319769535471e-05, - "loss": 0.1236, - "step": 217475 - }, - { - "epoch": 175.83, - "learning_rate": 1.1800054015124234e-05, - "loss": 0.2161, - "step": 217500 - }, - { - "epoch": 175.85, - "learning_rate": 1.1743788260713e-05, - "loss": 0.1724, - "step": 217525 - }, - { - "epoch": 175.87, - "learning_rate": 1.1687522506301765e-05, - "loss": 0.2116, - "step": 217550 - }, - { - "epoch": 175.89, - "learning_rate": 1.1631256751890528e-05, - "loss": 0.1617, - "step": 217575 - }, - { - "epoch": 175.91, - "learning_rate": 1.1574990997479295e-05, - "loss": 0.2011, - "step": 217600 - }, - { - "epoch": 175.93, - "learning_rate": 1.151872524306806e-05, - "loss": 0.1779, - "step": 217625 - }, - { - "epoch": 175.95, - "learning_rate": 1.1462459488656824e-05, - "loss": 0.2031, - "step": 217650 - }, - { - "epoch": 175.97, - "learning_rate": 1.140619373424559e-05, - "loss": 0.1873, - "step": 217675 - }, - { - "epoch": 175.99, - "learning_rate": 1.1349927979834354e-05, - "loss": 0.2092, - "step": 217700 - }, - { - "epoch": 176.01, - "learning_rate": 1.1293662225423119e-05, - "loss": 0.1807, - "step": 217725 - }, - { - "epoch": 176.03, - "learning_rate": 1.1237396471011882e-05, - "loss": 0.2006, - "step": 217750 - }, - { - "epoch": 176.05, - "learning_rate": 1.1181130716600648e-05, - "loss": 0.1731, - "step": 217775 - }, - { - "epoch": 176.07, - "learning_rate": 1.1124864962189413e-05, - "loss": 0.181, - "step": 217800 - }, - { - "epoch": 176.09, - "learning_rate": 1.1068599207778178e-05, - "loss": 0.1835, - "step": 217825 - }, - { - "epoch": 176.11, - "learning_rate": 1.1012333453366943e-05, - "loss": 0.1713, - "step": 217850 - }, - { - "epoch": 176.13, - "learning_rate": 1.0956067698955708e-05, - "loss": 0.1701, - "step": 217875 - }, - { - "epoch": 176.15, - "learning_rate": 1.0899801944544472e-05, - "loss": 0.1906, - "step": 217900 - }, - { - "epoch": 176.17, - "learning_rate": 1.0843536190133239e-05, - "loss": 0.1964, - "step": 217925 - }, - { - "epoch": 176.19, - "learning_rate": 1.0787270435722002e-05, - "loss": 0.2402, - "step": 217950 - }, - { - "epoch": 176.21, - "learning_rate": 1.0731004681310767e-05, - "loss": 0.2083, - "step": 217975 - }, - { - "epoch": 176.23, - "learning_rate": 1.0674738926899533e-05, - "loss": 0.188, - "step": 218000 - }, - { - "epoch": 176.25, - "learning_rate": 1.0618473172488296e-05, - "loss": 0.2039, - "step": 218025 - }, - { - "epoch": 176.27, - "learning_rate": 1.0562207418077061e-05, - "loss": 0.1994, - "step": 218050 - }, - { - "epoch": 176.29, - "learning_rate": 1.0505941663665828e-05, - "loss": 0.2071, - "step": 218075 - }, - { - "epoch": 176.31, - "learning_rate": 1.0449675909254593e-05, - "loss": 0.1852, - "step": 218100 - }, - { - "epoch": 176.33, - "learning_rate": 1.0393410154843356e-05, - "loss": 0.1698, - "step": 218125 - }, - { - "epoch": 176.35, - "learning_rate": 1.033714440043212e-05, - "loss": 0.1701, - "step": 218150 - }, - { - "epoch": 176.37, - "learning_rate": 1.0280878646020887e-05, - "loss": 0.1796, - "step": 218175 - }, - { - "epoch": 176.39, - "learning_rate": 1.022461289160965e-05, - "loss": 0.1857, - "step": 218200 - }, - { - "epoch": 176.41, - "learning_rate": 1.0168347137198415e-05, - "loss": 0.1589, - "step": 218225 - }, - { - "epoch": 176.43, - "learning_rate": 1.0112081382787181e-05, - "loss": 0.2114, - "step": 218250 - }, - { - "epoch": 176.46, - "learning_rate": 1.0055815628375946e-05, - "loss": 0.1822, - "step": 218275 - }, - { - "epoch": 176.48, - "learning_rate": 9.99954987396471e-06, - "loss": 0.1705, - "step": 218300 - }, - { - "epoch": 176.5, - "learning_rate": 9.943284119553476e-06, - "loss": 0.1892, - "step": 218325 - }, - { - "epoch": 176.52, - "learning_rate": 9.88701836514224e-06, - "loss": 0.1876, - "step": 218350 - }, - { - "epoch": 176.54, - "learning_rate": 9.830752610731004e-06, - "loss": 0.1808, - "step": 218375 - }, - { - "epoch": 176.56, - "learning_rate": 9.77448685631977e-06, - "loss": 0.1856, - "step": 218400 - }, - { - "epoch": 176.58, - "learning_rate": 9.718221101908535e-06, - "loss": 0.1873, - "step": 218425 - }, - { - "epoch": 176.6, - "learning_rate": 9.6619553474973e-06, - "loss": 0.2164, - "step": 218450 - }, - { - "epoch": 176.62, - "learning_rate": 9.605689593086065e-06, - "loss": 0.1846, - "step": 218475 - }, - { - "epoch": 176.64, - "learning_rate": 9.54942383867483e-06, - "loss": 0.2001, - "step": 218500 - }, - { - "epoch": 176.66, - "learning_rate": 9.493158084263594e-06, - "loss": 0.1865, - "step": 218525 - }, - { - "epoch": 176.68, - "learning_rate": 9.436892329852359e-06, - "loss": 0.1982, - "step": 218550 - }, - { - "epoch": 176.7, - "learning_rate": 9.380626575441124e-06, - "loss": 0.1883, - "step": 218575 - }, - { - "epoch": 176.72, - "learning_rate": 9.324360821029889e-06, - "loss": 0.1713, - "step": 218600 - }, - { - "epoch": 176.74, - "learning_rate": 9.268095066618653e-06, - "loss": 0.187, - "step": 218625 - }, - { - "epoch": 176.76, - "learning_rate": 9.211829312207418e-06, - "loss": 0.2027, - "step": 218650 - }, - { - "epoch": 176.78, - "learning_rate": 9.155563557796183e-06, - "loss": 0.2009, - "step": 218675 - }, - { - "epoch": 176.8, - "learning_rate": 9.099297803384948e-06, - "loss": 0.1972, - "step": 218700 - }, - { - "epoch": 176.82, - "learning_rate": 9.043032048973714e-06, - "loss": 0.2041, - "step": 218725 - }, - { - "epoch": 176.84, - "learning_rate": 8.986766294562477e-06, - "loss": 0.1886, - "step": 218750 - }, - { - "epoch": 176.86, - "learning_rate": 8.930500540151242e-06, - "loss": 0.1983, - "step": 218775 - }, - { - "epoch": 176.88, - "learning_rate": 8.874234785740009e-06, - "loss": 0.1995, - "step": 218800 - }, - { - "epoch": 176.9, - "learning_rate": 8.817969031328772e-06, - "loss": 0.166, - "step": 218825 - }, - { - "epoch": 176.92, - "learning_rate": 8.761703276917537e-06, - "loss": 0.1773, - "step": 218850 - }, - { - "epoch": 176.94, - "learning_rate": 8.705437522506303e-06, - "loss": 0.1902, - "step": 218875 - }, - { - "epoch": 176.96, - "learning_rate": 8.649171768095068e-06, - "loss": 0.1644, - "step": 218900 - }, - { - "epoch": 176.98, - "learning_rate": 8.592906013683831e-06, - "loss": 0.192, - "step": 218925 - }, - { - "epoch": 177.0, - "learning_rate": 8.536640259272596e-06, - "loss": 0.1746, - "step": 218950 - }, - { - "epoch": 177.02, - "learning_rate": 8.480374504861362e-06, - "loss": 0.1917, - "step": 218975 - }, - { - "epoch": 177.04, - "learning_rate": 8.424108750450125e-06, - "loss": 0.1746, - "step": 219000 - }, - { - "epoch": 177.04, - "eval_cer": 0.0737554284775623, - "eval_loss": 0.4736139476299286, - "eval_runtime": 150.3634, - "eval_samples_per_second": 27.886, - "eval_steps_per_second": 6.976, - "eval_wer": 0.3153344208809135, - "step": 219000 - }, - { - "epoch": 177.06, - "learning_rate": 8.36784299603889e-06, - "loss": 0.1999, - "step": 219025 - }, - { - "epoch": 177.08, - "learning_rate": 8.311577241627657e-06, - "loss": 0.1703, - "step": 219050 - }, - { - "epoch": 177.1, - "learning_rate": 8.255311487216421e-06, - "loss": 0.2036, - "step": 219075 - }, - { - "epoch": 177.12, - "learning_rate": 8.199045732805185e-06, - "loss": 0.1426, - "step": 219100 - }, - { - "epoch": 177.14, - "learning_rate": 8.142779978393951e-06, - "loss": 0.1903, - "step": 219125 - }, - { - "epoch": 177.16, - "learning_rate": 8.086514223982716e-06, - "loss": 0.1764, - "step": 219150 - }, - { - "epoch": 177.18, - "learning_rate": 8.030248469571479e-06, - "loss": 0.2088, - "step": 219175 - }, - { - "epoch": 177.2, - "learning_rate": 7.973982715160245e-06, - "loss": 0.1767, - "step": 219200 - }, - { - "epoch": 177.22, - "learning_rate": 7.91771696074901e-06, - "loss": 0.2087, - "step": 219225 - }, - { - "epoch": 177.24, - "learning_rate": 7.861451206337775e-06, - "loss": 0.1539, - "step": 219250 - }, - { - "epoch": 177.26, - "learning_rate": 7.80518545192654e-06, - "loss": 0.2094, - "step": 219275 - }, - { - "epoch": 177.28, - "learning_rate": 7.748919697515305e-06, - "loss": 0.1763, - "step": 219300 - }, - { - "epoch": 177.3, - "learning_rate": 7.69265394310407e-06, - "loss": 0.1884, - "step": 219325 - }, - { - "epoch": 177.32, - "learning_rate": 7.636388188692834e-06, - "loss": 0.1701, - "step": 219350 - }, - { - "epoch": 177.34, - "learning_rate": 7.580122434281599e-06, - "loss": 0.1838, - "step": 219375 - }, - { - "epoch": 177.36, - "learning_rate": 7.523856679870364e-06, - "loss": 0.1782, - "step": 219400 - }, - { - "epoch": 177.38, - "learning_rate": 7.467590925459129e-06, - "loss": 0.2152, - "step": 219425 - }, - { - "epoch": 177.41, - "learning_rate": 7.411325171047893e-06, - "loss": 0.1505, - "step": 219450 - }, - { - "epoch": 177.43, - "learning_rate": 7.355059416636658e-06, - "loss": 0.1944, - "step": 219475 - }, - { - "epoch": 177.45, - "learning_rate": 7.298793662225424e-06, - "loss": 0.1892, - "step": 219500 - }, - { - "epoch": 177.47, - "learning_rate": 7.242527907814188e-06, - "loss": 0.1961, - "step": 219525 - }, - { - "epoch": 177.49, - "learning_rate": 7.1862621534029534e-06, - "loss": 0.168, - "step": 219550 - }, - { - "epoch": 177.51, - "learning_rate": 7.129996398991718e-06, - "loss": 0.1958, - "step": 219575 - }, - { - "epoch": 177.53, - "learning_rate": 7.073730644580482e-06, - "loss": 0.171, - "step": 219600 - }, - { - "epoch": 177.55, - "learning_rate": 7.017464890169248e-06, - "loss": 0.1745, - "step": 219625 - }, - { - "epoch": 177.57, - "learning_rate": 6.961199135758012e-06, - "loss": 0.1488, - "step": 219650 - }, - { - "epoch": 177.59, - "learning_rate": 6.9049333813467774e-06, - "loss": 0.2208, - "step": 219675 - }, - { - "epoch": 177.61, - "learning_rate": 6.848667626935542e-06, - "loss": 0.1821, - "step": 219700 - }, - { - "epoch": 177.63, - "learning_rate": 6.792401872524307e-06, - "loss": 0.2024, - "step": 219725 - }, - { - "epoch": 177.65, - "learning_rate": 6.736136118113072e-06, - "loss": 0.1593, - "step": 219750 - }, - { - "epoch": 177.67, - "learning_rate": 6.679870363701837e-06, - "loss": 0.2056, - "step": 219775 - }, - { - "epoch": 177.69, - "learning_rate": 6.623604609290601e-06, - "loss": 0.2001, - "step": 219800 - }, - { - "epoch": 177.71, - "learning_rate": 6.567338854879366e-06, - "loss": 0.1689, - "step": 219825 - }, - { - "epoch": 177.73, - "learning_rate": 6.511073100468131e-06, - "loss": 0.175, - "step": 219850 - }, - { - "epoch": 177.75, - "learning_rate": 6.454807346056896e-06, - "loss": 0.1894, - "step": 219875 - }, - { - "epoch": 177.77, - "learning_rate": 6.3985415916456615e-06, - "loss": 0.1865, - "step": 219900 - }, - { - "epoch": 177.79, - "learning_rate": 6.342275837234425e-06, - "loss": 0.1763, - "step": 219925 - }, - { - "epoch": 177.81, - "learning_rate": 6.286010082823191e-06, - "loss": 0.1881, - "step": 219950 - }, - { - "epoch": 177.83, - "learning_rate": 6.229744328411956e-06, - "loss": 0.1949, - "step": 219975 - }, - { - "epoch": 177.85, - "learning_rate": 6.17347857400072e-06, - "loss": 0.1876, - "step": 220000 - }, - { - "epoch": 177.87, - "learning_rate": 6.1172128195894855e-06, - "loss": 0.2061, - "step": 220025 - }, - { - "epoch": 177.89, - "learning_rate": 6.060947065178249e-06, - "loss": 0.1828, - "step": 220050 - }, - { - "epoch": 177.91, - "learning_rate": 6.004681310767015e-06, - "loss": 0.2001, - "step": 220075 - }, - { - "epoch": 177.93, - "learning_rate": 5.94841555635578e-06, - "loss": 0.1594, - "step": 220100 - }, - { - "epoch": 177.95, - "learning_rate": 5.892149801944545e-06, - "loss": 0.2194, - "step": 220125 - }, - { - "epoch": 177.97, - "learning_rate": 5.838134677709759e-06, - "loss": 0.195, - "step": 220150 - }, - { - "epoch": 177.99, - "learning_rate": 5.781868923298524e-06, - "loss": 0.2, - "step": 220175 - }, - { - "epoch": 178.01, - "learning_rate": 5.7256031688872885e-06, - "loss": 0.1975, - "step": 220200 - }, - { - "epoch": 178.03, - "learning_rate": 5.669337414476053e-06, - "loss": 0.1658, - "step": 220225 - }, - { - "epoch": 178.05, - "learning_rate": 5.613071660064818e-06, - "loss": 0.1948, - "step": 220250 - }, - { - "epoch": 178.07, - "learning_rate": 5.556805905653583e-06, - "loss": 0.1941, - "step": 220275 - }, - { - "epoch": 178.09, - "learning_rate": 5.500540151242348e-06, - "loss": 0.1834, - "step": 220300 - }, - { - "epoch": 178.11, - "learning_rate": 5.444274396831113e-06, - "loss": 0.1895, - "step": 220325 - }, - { - "epoch": 178.13, - "learning_rate": 5.388008642419877e-06, - "loss": 0.1861, - "step": 220350 - }, - { - "epoch": 178.15, - "learning_rate": 5.331742888008643e-06, - "loss": 0.1968, - "step": 220375 - }, - { - "epoch": 178.17, - "learning_rate": 5.275477133597407e-06, - "loss": 0.2075, - "step": 220400 - }, - { - "epoch": 178.19, - "learning_rate": 5.2192113791861726e-06, - "loss": 0.2248, - "step": 220425 - }, - { - "epoch": 178.21, - "learning_rate": 5.162945624774937e-06, - "loss": 0.2085, - "step": 220450 - }, - { - "epoch": 178.23, - "learning_rate": 5.106679870363701e-06, - "loss": 0.1733, - "step": 220475 - }, - { - "epoch": 178.25, - "learning_rate": 5.050414115952467e-06, - "loss": 0.1964, - "step": 220500 - }, - { - "epoch": 178.27, - "learning_rate": 4.994148361541232e-06, - "loss": 0.1939, - "step": 220525 - }, - { - "epoch": 178.29, - "learning_rate": 4.9378826071299966e-06, - "loss": 0.176, - "step": 220550 - }, - { - "epoch": 178.31, - "learning_rate": 4.881616852718761e-06, - "loss": 0.1646, - "step": 220575 - }, - { - "epoch": 178.33, - "learning_rate": 4.825351098307526e-06, - "loss": 0.1918, - "step": 220600 - }, - { - "epoch": 178.35, - "learning_rate": 4.769085343896291e-06, - "loss": 0.1864, - "step": 220625 - }, - { - "epoch": 178.38, - "learning_rate": 4.712819589485056e-06, - "loss": 0.1978, - "step": 220650 - }, - { - "epoch": 178.4, - "learning_rate": 4.6565538350738206e-06, - "loss": 0.1684, - "step": 220675 - }, - { - "epoch": 178.42, - "learning_rate": 4.600288080662585e-06, - "loss": 0.1788, - "step": 220700 - }, - { - "epoch": 178.44, - "learning_rate": 4.544022326251351e-06, - "loss": 0.199, - "step": 220725 - }, - { - "epoch": 178.46, - "learning_rate": 4.487756571840115e-06, - "loss": 0.1756, - "step": 220750 - }, - { - "epoch": 178.48, - "learning_rate": 4.431490817428881e-06, - "loss": 0.1798, - "step": 220775 - }, - { - "epoch": 178.5, - "learning_rate": 4.3752250630176446e-06, - "loss": 0.2132, - "step": 220800 - }, - { - "epoch": 178.52, - "learning_rate": 4.31895930860641e-06, - "loss": 0.222, - "step": 220825 - }, - { - "epoch": 178.54, - "learning_rate": 4.262693554195175e-06, - "loss": 0.1828, - "step": 220850 - }, - { - "epoch": 178.56, - "learning_rate": 4.206427799783939e-06, - "loss": 0.1487, - "step": 220875 - }, - { - "epoch": 178.58, - "learning_rate": 4.150162045372705e-06, - "loss": 0.189, - "step": 220900 - }, - { - "epoch": 178.6, - "learning_rate": 4.093896290961469e-06, - "loss": 0.181, - "step": 220925 - }, - { - "epoch": 178.62, - "learning_rate": 4.037630536550234e-06, - "loss": 0.2038, - "step": 220950 - }, - { - "epoch": 178.64, - "learning_rate": 3.981364782138999e-06, - "loss": 0.1737, - "step": 220975 - }, - { - "epoch": 178.66, - "learning_rate": 3.925099027727764e-06, - "loss": 0.1809, - "step": 221000 - }, - { - "epoch": 178.68, - "learning_rate": 3.868833273316529e-06, - "loss": 0.1816, - "step": 221025 - }, - { - "epoch": 178.7, - "learning_rate": 3.8125675189052934e-06, - "loss": 0.1417, - "step": 221050 - }, - { - "epoch": 178.72, - "learning_rate": 3.7563017644940586e-06, - "loss": 0.189, - "step": 221075 - }, - { - "epoch": 178.74, - "learning_rate": 3.7000360100828234e-06, - "loss": 0.1741, - "step": 221100 - }, - { - "epoch": 178.76, - "learning_rate": 3.6437702556715882e-06, - "loss": 0.1994, - "step": 221125 - }, - { - "epoch": 178.78, - "learning_rate": 3.5875045012603526e-06, - "loss": 0.1655, - "step": 221150 - }, - { - "epoch": 178.8, - "learning_rate": 3.531238746849118e-06, - "loss": 0.1752, - "step": 221175 - }, - { - "epoch": 178.82, - "learning_rate": 3.4749729924378826e-06, - "loss": 0.2023, - "step": 221200 - }, - { - "epoch": 178.84, - "learning_rate": 3.4187072380266474e-06, - "loss": 0.2079, - "step": 221225 - }, - { - "epoch": 178.86, - "learning_rate": 3.3624414836154122e-06, - "loss": 0.1955, - "step": 221250 - }, - { - "epoch": 178.88, - "learning_rate": 3.3061757292041774e-06, - "loss": 0.1915, - "step": 221275 - }, - { - "epoch": 178.9, - "learning_rate": 3.2499099747929422e-06, - "loss": 0.1881, - "step": 221300 - }, - { - "epoch": 178.92, - "learning_rate": 3.193644220381707e-06, - "loss": 0.1544, - "step": 221325 - }, - { - "epoch": 178.94, - "learning_rate": 3.1373784659704714e-06, - "loss": 0.1657, - "step": 221350 - }, - { - "epoch": 178.96, - "learning_rate": 3.0811127115592366e-06, - "loss": 0.1753, - "step": 221375 - }, - { - "epoch": 178.98, - "learning_rate": 3.0248469571480014e-06, - "loss": 0.1749, - "step": 221400 - }, - { - "epoch": 179.0, - "learning_rate": 2.9685812027367662e-06, - "loss": 0.1666, - "step": 221425 - }, - { - "epoch": 179.02, - "learning_rate": 2.912315448325531e-06, - "loss": 0.1932, - "step": 221450 - }, - { - "epoch": 179.04, - "learning_rate": 2.8560496939142963e-06, - "loss": 0.1363, - "step": 221475 - }, - { - "epoch": 179.06, - "learning_rate": 2.799783939503061e-06, - "loss": 0.2135, - "step": 221500 - }, - { - "epoch": 179.08, - "learning_rate": 2.743518185091826e-06, - "loss": 0.1944, - "step": 221525 - }, - { - "epoch": 179.1, - "learning_rate": 2.6872524306805902e-06, - "loss": 0.1993, - "step": 221550 - }, - { - "epoch": 179.12, - "learning_rate": 2.6309866762693555e-06, - "loss": 0.1866, - "step": 221575 - }, - { - "epoch": 179.14, - "learning_rate": 2.5747209218581203e-06, - "loss": 0.2085, - "step": 221600 - }, - { - "epoch": 179.16, - "learning_rate": 2.518455167446885e-06, - "loss": 0.1564, - "step": 221625 - }, - { - "epoch": 179.18, - "learning_rate": 2.46218941303565e-06, - "loss": 0.2133, - "step": 221650 - }, - { - "epoch": 179.2, - "learning_rate": 2.405923658624415e-06, - "loss": 0.1709, - "step": 221675 - }, - { - "epoch": 179.22, - "learning_rate": 2.34965790421318e-06, - "loss": 0.2061, - "step": 221700 - }, - { - "epoch": 179.24, - "learning_rate": 2.2933921498019447e-06, - "loss": 0.1763, - "step": 221725 - }, - { - "epoch": 179.26, - "learning_rate": 2.237126395390709e-06, - "loss": 0.1902, - "step": 221750 - }, - { - "epoch": 179.28, - "learning_rate": 2.1808606409794743e-06, - "loss": 0.1433, - "step": 221775 - }, - { - "epoch": 179.3, - "learning_rate": 2.124594886568239e-06, - "loss": 0.2202, - "step": 221800 - }, - { - "epoch": 179.32, - "learning_rate": 2.068329132157004e-06, - "loss": 0.1739, - "step": 221825 - }, - { - "epoch": 179.35, - "learning_rate": 2.0120633777457687e-06, - "loss": 0.1809, - "step": 221850 - }, - { - "epoch": 179.37, - "learning_rate": 1.955797623334534e-06, - "loss": 0.1522, - "step": 221875 - }, - { - "epoch": 179.39, - "learning_rate": 1.8995318689232985e-06, - "loss": 0.204, - "step": 221900 - }, - { - "epoch": 179.41, - "learning_rate": 1.8432661145120633e-06, - "loss": 0.1432, - "step": 221925 - }, - { - "epoch": 179.43, - "learning_rate": 1.7870003601008283e-06, - "loss": 0.1777, - "step": 221950 - }, - { - "epoch": 179.45, - "learning_rate": 1.730734605689593e-06, - "loss": 0.1546, - "step": 221975 - }, - { - "epoch": 179.47, - "learning_rate": 1.674468851278358e-06, - "loss": 0.2101, - "step": 222000 - }, - { - "epoch": 179.47, - "eval_cer": 0.07384269478352823, - "eval_loss": 0.4755805432796478, - "eval_runtime": 153.5849, - "eval_samples_per_second": 27.301, - "eval_steps_per_second": 6.83, - "eval_wer": 0.3161174551386623, - "step": 222000 - }, - { - "epoch": 179.49, - "learning_rate": 1.6182030968671227e-06, - "loss": 0.1692, - "step": 222025 - }, - { - "epoch": 179.51, - "learning_rate": 1.5619373424558877e-06, - "loss": 0.1836, - "step": 222050 - }, - { - "epoch": 179.53, - "learning_rate": 1.5056715880446525e-06, - "loss": 0.207, - "step": 222075 - }, - { - "epoch": 179.55, - "learning_rate": 1.4494058336334173e-06, - "loss": 0.1892, - "step": 222100 - }, - { - "epoch": 179.57, - "learning_rate": 1.393140079222182e-06, - "loss": 0.192, - "step": 222125 - }, - { - "epoch": 179.59, - "learning_rate": 1.3368743248109471e-06, - "loss": 0.2154, - "step": 222150 - }, - { - "epoch": 179.61, - "learning_rate": 1.280608570399712e-06, - "loss": 0.1862, - "step": 222175 - }, - { - "epoch": 179.63, - "learning_rate": 1.2243428159884767e-06, - "loss": 0.2028, - "step": 222200 - }, - { - "epoch": 179.65, - "learning_rate": 1.1680770615772415e-06, - "loss": 0.1858, - "step": 222225 - }, - { - "epoch": 179.67, - "learning_rate": 1.1118113071660065e-06, - "loss": 0.1751, - "step": 222250 - }, - { - "epoch": 179.69, - "learning_rate": 1.0555455527547713e-06, - "loss": 0.1573, - "step": 222275 - }, - { - "epoch": 179.71, - "learning_rate": 9.992797983435363e-07, - "loss": 0.2087, - "step": 222300 - }, - { - "epoch": 179.73, - "learning_rate": 9.430140439323011e-07, - "loss": 0.163, - "step": 222325 - }, - { - "epoch": 179.75, - "learning_rate": 8.867482895210659e-07, - "loss": 0.1921, - "step": 222350 - }, - { - "epoch": 179.77, - "learning_rate": 8.304825351098308e-07, - "loss": 0.1446, - "step": 222375 - }, - { - "epoch": 179.79, - "learning_rate": 7.742167806985956e-07, - "loss": 0.2213, - "step": 222400 - }, - { - "epoch": 179.81, - "learning_rate": 7.179510262873605e-07, - "loss": 0.1778, - "step": 222425 - }, - { - "epoch": 179.83, - "learning_rate": 6.616852718761253e-07, - "loss": 0.1908, - "step": 222450 - }, - { - "epoch": 179.85, - "learning_rate": 6.054195174648902e-07, - "loss": 0.142, - "step": 222475 - }, - { - "epoch": 179.87, - "learning_rate": 5.49153763053655e-07, - "loss": 0.1851, - "step": 222500 - }, - { - "epoch": 179.89, - "learning_rate": 4.9288800864242e-07, - "loss": 0.1485, - "step": 222525 - }, - { - "epoch": 179.91, - "learning_rate": 4.3662225423118475e-07, - "loss": 0.1964, - "step": 222550 - }, - { - "epoch": 179.93, - "learning_rate": 3.803564998199496e-07, - "loss": 0.1942, - "step": 222575 - }, - { - "epoch": 179.95, - "learning_rate": 3.2409074540871446e-07, - "loss": 0.1905, - "step": 222600 - }, - { - "epoch": 179.97, - "learning_rate": 2.678249909974793e-07, - "loss": 0.1591, - "step": 222625 - }, - { - "epoch": 179.99, - "learning_rate": 2.1155923658624413e-07, - "loss": 0.1748, - "step": 222650 - }, - { - "epoch": 180.0, - "step": 222660, - "total_flos": 2.3788341158199368e+20, - "train_loss": 0.061750437557927515, - "train_runtime": 29496.4676, - "train_samples_per_second": 60.347, - "train_steps_per_second": 7.549 + "epoch": 493.02, + "eval_cer": 0.06007625088565741, + "eval_loss": 0.41654759645462036, + "eval_runtime": 115.3904, + "eval_samples_per_second": 26.969, + "eval_steps_per_second": 3.371, + "eval_wer": 0.27991808524254447, + "step": 21200 } ], - "max_steps": 222660, - "num_train_epochs": 180, - "total_flos": 2.3788341158199368e+20, + "max_steps": 21500, + "num_train_epochs": 500, + "total_flos": 5.302246573116527e+20, "trial_name": null, "trial_params": null }