diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,17560 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 15.0, + "eval_steps": 500, + "global_step": 289695, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.01, + "learning_rate": 5.621301775147928e-07, + "loss": 9.502, + "step": 100 + }, + { + "epoch": 0.01, + "learning_rate": 1.1479289940828402e-06, + "loss": 6.5731, + "step": 200 + }, + { + "epoch": 0.02, + "learning_rate": 1.7396449704142013e-06, + "loss": 5.0687, + "step": 300 + }, + { + "epoch": 0.02, + "learning_rate": 2.331360946745562e-06, + "loss": 4.5739, + "step": 400 + }, + { + "epoch": 0.03, + "learning_rate": 2.923076923076923e-06, + "loss": 4.2504, + "step": 500 + }, + { + "epoch": 0.03, + "learning_rate": 3.5147928994082843e-06, + "loss": 3.8214, + "step": 600 + }, + { + "epoch": 0.04, + "learning_rate": 4.106508875739645e-06, + "loss": 3.698, + "step": 700 + }, + { + "epoch": 0.04, + "learning_rate": 4.698224852071006e-06, + "loss": 3.5288, + "step": 800 + }, + { + "epoch": 0.05, + "learning_rate": 5.289940828402367e-06, + "loss": 3.2917, + "step": 900 + }, + { + "epoch": 0.05, + "learning_rate": 5.881656804733727e-06, + "loss": 3.174, + "step": 1000 + }, + { + "epoch": 0.06, + "learning_rate": 6.473372781065089e-06, + "loss": 3.0224, + "step": 1100 + }, + { + "epoch": 0.06, + "learning_rate": 7.06508875739645e-06, + "loss": 3.0186, + "step": 1200 + }, + { + "epoch": 0.07, + "learning_rate": 7.656804733727812e-06, + "loss": 2.8844, + "step": 1300 + }, + { + "epoch": 0.07, + "learning_rate": 8.248520710059172e-06, + "loss": 2.8003, + "step": 1400 + }, + { + "epoch": 0.08, + "learning_rate": 8.840236686390532e-06, + "loss": 2.6516, + "step": 1500 + }, + { + "epoch": 0.08, + "learning_rate": 9.431952662721894e-06, + "loss": 2.5261, + "step": 1600 + }, + { + "epoch": 0.09, + "learning_rate": 1.0023668639053254e-05, + "loss": 2.5945, + "step": 1700 + }, + { + "epoch": 0.09, + "learning_rate": 1.0615384615384616e-05, + "loss": 2.4841, + "step": 1800 + }, + { + "epoch": 0.1, + "learning_rate": 1.1207100591715977e-05, + "loss": 2.5586, + "step": 1900 + }, + { + "epoch": 0.1, + "learning_rate": 1.1798816568047337e-05, + "loss": 2.4368, + "step": 2000 + }, + { + "epoch": 0.11, + "learning_rate": 1.2390532544378699e-05, + "loss": 2.4365, + "step": 2100 + }, + { + "epoch": 0.11, + "learning_rate": 1.2982248520710059e-05, + "loss": 2.4752, + "step": 2200 + }, + { + "epoch": 0.12, + "learning_rate": 1.3573964497041421e-05, + "loss": 2.3907, + "step": 2300 + }, + { + "epoch": 0.12, + "learning_rate": 1.4159763313609468e-05, + "loss": 2.4214, + "step": 2400 + }, + { + "epoch": 0.13, + "learning_rate": 1.4751479289940828e-05, + "loss": 2.4079, + "step": 2500 + }, + { + "epoch": 0.13, + "learning_rate": 1.5343195266272192e-05, + "loss": 2.2597, + "step": 2600 + }, + { + "epoch": 0.14, + "learning_rate": 1.593491124260355e-05, + "loss": 2.2614, + "step": 2700 + }, + { + "epoch": 0.14, + "learning_rate": 1.6526627218934912e-05, + "loss": 2.3671, + "step": 2800 + }, + { + "epoch": 0.15, + "learning_rate": 1.7118343195266274e-05, + "loss": 2.3223, + "step": 2900 + }, + { + "epoch": 0.16, + "learning_rate": 1.7710059171597633e-05, + "loss": 2.4155, + "step": 3000 + }, + { + "epoch": 0.16, + "learning_rate": 1.8301775147928995e-05, + "loss": 2.2976, + "step": 3100 + }, + { + "epoch": 0.17, + "learning_rate": 1.8893491124260353e-05, + "loss": 2.2927, + "step": 3200 + }, + { + "epoch": 0.17, + "learning_rate": 1.9485207100591715e-05, + "loss": 2.2895, + "step": 3300 + }, + { + "epoch": 0.18, + "learning_rate": 2.0076923076923077e-05, + "loss": 2.3672, + "step": 3400 + }, + { + "epoch": 0.18, + "learning_rate": 2.066863905325444e-05, + "loss": 2.2301, + "step": 3500 + }, + { + "epoch": 0.19, + "learning_rate": 2.12603550295858e-05, + "loss": 2.2593, + "step": 3600 + }, + { + "epoch": 0.19, + "learning_rate": 2.185207100591716e-05, + "loss": 2.3393, + "step": 3700 + }, + { + "epoch": 0.2, + "learning_rate": 2.2443786982248522e-05, + "loss": 2.2819, + "step": 3800 + }, + { + "epoch": 0.2, + "learning_rate": 2.3035502958579884e-05, + "loss": 2.266, + "step": 3900 + }, + { + "epoch": 0.21, + "learning_rate": 2.3627218934911242e-05, + "loss": 2.2548, + "step": 4000 + }, + { + "epoch": 0.21, + "learning_rate": 2.4218934911242604e-05, + "loss": 2.2014, + "step": 4100 + }, + { + "epoch": 0.22, + "learning_rate": 2.4810650887573966e-05, + "loss": 2.2776, + "step": 4200 + }, + { + "epoch": 0.22, + "learning_rate": 2.5402366863905325e-05, + "loss": 2.1123, + "step": 4300 + }, + { + "epoch": 0.23, + "learning_rate": 2.5994082840236687e-05, + "loss": 2.3797, + "step": 4400 + }, + { + "epoch": 0.23, + "learning_rate": 2.6585798816568045e-05, + "loss": 2.2538, + "step": 4500 + }, + { + "epoch": 0.24, + "learning_rate": 2.717751479289941e-05, + "loss": 2.2793, + "step": 4600 + }, + { + "epoch": 0.24, + "learning_rate": 2.7763313609467454e-05, + "loss": 2.231, + "step": 4700 + }, + { + "epoch": 0.25, + "learning_rate": 2.8355029585798816e-05, + "loss": 2.2729, + "step": 4800 + }, + { + "epoch": 0.25, + "learning_rate": 2.8946745562130178e-05, + "loss": 2.2386, + "step": 4900 + }, + { + "epoch": 0.26, + "learning_rate": 2.953846153846154e-05, + "loss": 2.4201, + "step": 5000 + }, + { + "epoch": 0.26, + "learning_rate": 3.01301775147929e-05, + "loss": 2.2768, + "step": 5100 + }, + { + "epoch": 0.27, + "learning_rate": 3.072189349112426e-05, + "loss": 2.2313, + "step": 5200 + }, + { + "epoch": 0.27, + "learning_rate": 3.131360946745562e-05, + "loss": 2.2918, + "step": 5300 + }, + { + "epoch": 0.28, + "learning_rate": 3.1905325443786984e-05, + "loss": 2.2836, + "step": 5400 + }, + { + "epoch": 0.28, + "learning_rate": 3.249704142011834e-05, + "loss": 2.3043, + "step": 5500 + }, + { + "epoch": 0.29, + "learning_rate": 3.30887573964497e-05, + "loss": 2.1663, + "step": 5600 + }, + { + "epoch": 0.3, + "learning_rate": 3.368047337278107e-05, + "loss": 2.2577, + "step": 5700 + }, + { + "epoch": 0.3, + "learning_rate": 3.4272189349112425e-05, + "loss": 2.1866, + "step": 5800 + }, + { + "epoch": 0.31, + "learning_rate": 3.486390532544379e-05, + "loss": 2.2416, + "step": 5900 + }, + { + "epoch": 0.31, + "learning_rate": 3.545562130177515e-05, + "loss": 2.2288, + "step": 6000 + }, + { + "epoch": 0.32, + "learning_rate": 3.6047337278106515e-05, + "loss": 2.1223, + "step": 6100 + }, + { + "epoch": 0.32, + "learning_rate": 3.6639053254437867e-05, + "loss": 2.3423, + "step": 6200 + }, + { + "epoch": 0.33, + "learning_rate": 3.723076923076923e-05, + "loss": 2.235, + "step": 6300 + }, + { + "epoch": 0.33, + "learning_rate": 3.782248520710059e-05, + "loss": 2.2591, + "step": 6400 + }, + { + "epoch": 0.34, + "learning_rate": 3.8414201183431956e-05, + "loss": 2.2002, + "step": 6500 + }, + { + "epoch": 0.34, + "learning_rate": 3.9005917159763314e-05, + "loss": 2.2121, + "step": 6600 + }, + { + "epoch": 0.35, + "learning_rate": 3.959763313609467e-05, + "loss": 2.2261, + "step": 6700 + }, + { + "epoch": 0.35, + "learning_rate": 4.018934911242604e-05, + "loss": 2.1885, + "step": 6800 + }, + { + "epoch": 0.36, + "learning_rate": 4.07810650887574e-05, + "loss": 2.1876, + "step": 6900 + }, + { + "epoch": 0.36, + "learning_rate": 4.137278106508876e-05, + "loss": 2.175, + "step": 7000 + }, + { + "epoch": 0.37, + "learning_rate": 4.196449704142012e-05, + "loss": 2.1904, + "step": 7100 + }, + { + "epoch": 0.37, + "learning_rate": 4.255621301775148e-05, + "loss": 2.0075, + "step": 7200 + }, + { + "epoch": 0.38, + "learning_rate": 4.314792899408284e-05, + "loss": 2.2386, + "step": 7300 + }, + { + "epoch": 0.38, + "learning_rate": 4.37396449704142e-05, + "loss": 2.2165, + "step": 7400 + }, + { + "epoch": 0.39, + "learning_rate": 4.433136094674556e-05, + "loss": 2.2467, + "step": 7500 + }, + { + "epoch": 0.39, + "learning_rate": 4.492307692307693e-05, + "loss": 2.254, + "step": 7600 + }, + { + "epoch": 0.4, + "learning_rate": 4.5514792899408286e-05, + "loss": 2.1702, + "step": 7700 + }, + { + "epoch": 0.4, + "learning_rate": 4.6106508875739644e-05, + "loss": 2.1327, + "step": 7800 + }, + { + "epoch": 0.41, + "learning_rate": 4.669822485207101e-05, + "loss": 2.24, + "step": 7900 + }, + { + "epoch": 0.41, + "learning_rate": 4.728994082840237e-05, + "loss": 2.1117, + "step": 8000 + }, + { + "epoch": 0.42, + "learning_rate": 4.7881656804733734e-05, + "loss": 2.2405, + "step": 8100 + }, + { + "epoch": 0.42, + "learning_rate": 4.8473372781065085e-05, + "loss": 2.1799, + "step": 8200 + }, + { + "epoch": 0.43, + "learning_rate": 4.906508875739645e-05, + "loss": 2.1877, + "step": 8300 + }, + { + "epoch": 0.43, + "learning_rate": 4.965680473372781e-05, + "loss": 2.2009, + "step": 8400 + }, + { + "epoch": 0.44, + "learning_rate": 5.0248520710059175e-05, + "loss": 2.162, + "step": 8500 + }, + { + "epoch": 0.45, + "learning_rate": 5.084023668639053e-05, + "loss": 2.2372, + "step": 8600 + }, + { + "epoch": 0.45, + "learning_rate": 5.143195266272189e-05, + "loss": 2.2015, + "step": 8700 + }, + { + "epoch": 0.46, + "learning_rate": 5.201775147928994e-05, + "loss": 2.2623, + "step": 8800 + }, + { + "epoch": 0.46, + "learning_rate": 5.26094674556213e-05, + "loss": 2.2089, + "step": 8900 + }, + { + "epoch": 0.47, + "learning_rate": 5.3201183431952666e-05, + "loss": 2.2191, + "step": 9000 + }, + { + "epoch": 0.47, + "learning_rate": 5.3792899408284025e-05, + "loss": 2.2591, + "step": 9100 + }, + { + "epoch": 0.48, + "learning_rate": 5.438461538461538e-05, + "loss": 2.1673, + "step": 9200 + }, + { + "epoch": 0.48, + "learning_rate": 5.497633136094675e-05, + "loss": 2.3361, + "step": 9300 + }, + { + "epoch": 0.49, + "learning_rate": 5.556804733727811e-05, + "loss": 2.3092, + "step": 9400 + }, + { + "epoch": 0.49, + "learning_rate": 5.615976331360947e-05, + "loss": 2.3328, + "step": 9500 + }, + { + "epoch": 0.5, + "learning_rate": 5.675147928994083e-05, + "loss": 2.1896, + "step": 9600 + }, + { + "epoch": 0.5, + "learning_rate": 5.734319526627219e-05, + "loss": 2.2207, + "step": 9700 + }, + { + "epoch": 0.51, + "learning_rate": 5.793491124260355e-05, + "loss": 2.2983, + "step": 9800 + }, + { + "epoch": 0.51, + "learning_rate": 5.8526627218934913e-05, + "loss": 2.232, + "step": 9900 + }, + { + "epoch": 0.52, + "learning_rate": 5.911834319526627e-05, + "loss": 2.3217, + "step": 10000 + }, + { + "epoch": 0.52, + "learning_rate": 5.971005917159764e-05, + "loss": 2.2792, + "step": 10100 + }, + { + "epoch": 0.53, + "learning_rate": 5.999999507283829e-05, + "loss": 2.2231, + "step": 10200 + }, + { + "epoch": 0.53, + "learning_rate": 5.999995680730862e-05, + "loss": 2.3753, + "step": 10300 + }, + { + "epoch": 0.54, + "learning_rate": 5.99998806551643e-05, + "loss": 2.2769, + "step": 10400 + }, + { + "epoch": 0.54, + "learning_rate": 5.999976661650152e-05, + "loss": 2.1685, + "step": 10500 + }, + { + "epoch": 0.55, + "learning_rate": 5.99996146914643e-05, + "loss": 2.2553, + "step": 10600 + }, + { + "epoch": 0.55, + "learning_rate": 5.999942488024448e-05, + "loss": 2.141, + "step": 10700 + }, + { + "epoch": 0.56, + "learning_rate": 5.999919718308179e-05, + "loss": 2.3038, + "step": 10800 + }, + { + "epoch": 0.56, + "learning_rate": 5.999893160026379e-05, + "loss": 2.2144, + "step": 10900 + }, + { + "epoch": 0.57, + "learning_rate": 5.999862813212587e-05, + "loss": 2.2907, + "step": 11000 + }, + { + "epoch": 0.57, + "learning_rate": 5.999828677905128e-05, + "loss": 2.2789, + "step": 11100 + }, + { + "epoch": 0.58, + "learning_rate": 5.9997907541471113e-05, + "loss": 2.2022, + "step": 11200 + }, + { + "epoch": 0.59, + "learning_rate": 5.999749041986431e-05, + "loss": 2.0724, + "step": 11300 + }, + { + "epoch": 0.59, + "learning_rate": 5.9997035414757635e-05, + "loss": 2.0722, + "step": 11400 + }, + { + "epoch": 0.6, + "learning_rate": 5.999654252672572e-05, + "loss": 2.0308, + "step": 11500 + }, + { + "epoch": 0.6, + "learning_rate": 5.999601175639101e-05, + "loss": 2.1458, + "step": 11600 + }, + { + "epoch": 0.61, + "learning_rate": 5.9995443104423844e-05, + "loss": 2.1932, + "step": 11700 + }, + { + "epoch": 0.61, + "learning_rate": 5.9994836571542334e-05, + "loss": 2.1513, + "step": 11800 + }, + { + "epoch": 0.62, + "learning_rate": 5.999419215851248e-05, + "loss": 2.0049, + "step": 11900 + }, + { + "epoch": 0.62, + "learning_rate": 5.999350986614808e-05, + "loss": 2.1251, + "step": 12000 + }, + { + "epoch": 0.63, + "learning_rate": 5.9992789695310836e-05, + "loss": 2.0781, + "step": 12100 + }, + { + "epoch": 0.63, + "learning_rate": 5.9992031646910215e-05, + "loss": 2.0652, + "step": 12200 + }, + { + "epoch": 0.64, + "learning_rate": 5.999123572190355e-05, + "loss": 2.04, + "step": 12300 + }, + { + "epoch": 0.64, + "learning_rate": 5.999040192129601e-05, + "loss": 2.0588, + "step": 12400 + }, + { + "epoch": 0.65, + "learning_rate": 5.998953024614059e-05, + "loss": 2.1285, + "step": 12500 + }, + { + "epoch": 0.65, + "learning_rate": 5.9988620697538115e-05, + "loss": 1.9282, + "step": 12600 + }, + { + "epoch": 0.66, + "learning_rate": 5.998767327663726e-05, + "loss": 2.0434, + "step": 12700 + }, + { + "epoch": 0.66, + "learning_rate": 5.9986687984634504e-05, + "loss": 1.9448, + "step": 12800 + }, + { + "epoch": 0.67, + "learning_rate": 5.998567524184435e-05, + "loss": 1.9255, + "step": 12900 + }, + { + "epoch": 0.67, + "learning_rate": 5.998461459009765e-05, + "loss": 1.9484, + "step": 13000 + }, + { + "epoch": 0.68, + "learning_rate": 5.9983516071111834e-05, + "loss": 1.9843, + "step": 13100 + }, + { + "epoch": 0.68, + "learning_rate": 5.99823796862742e-05, + "loss": 1.9812, + "step": 13200 + }, + { + "epoch": 0.69, + "learning_rate": 5.998120543701989e-05, + "loss": 2.0037, + "step": 13300 + }, + { + "epoch": 0.69, + "learning_rate": 5.997999332483183e-05, + "loss": 2.0109, + "step": 13400 + }, + { + "epoch": 0.7, + "learning_rate": 5.997874335124079e-05, + "loss": 1.9634, + "step": 13500 + }, + { + "epoch": 0.7, + "learning_rate": 5.997745551782536e-05, + "loss": 2.014, + "step": 13600 + }, + { + "epoch": 0.71, + "learning_rate": 5.997612982621192e-05, + "loss": 2.0308, + "step": 13700 + }, + { + "epoch": 0.71, + "learning_rate": 5.9974766278074676e-05, + "loss": 1.9613, + "step": 13800 + }, + { + "epoch": 0.72, + "learning_rate": 5.997336487513563e-05, + "loss": 1.9359, + "step": 13900 + }, + { + "epoch": 0.72, + "learning_rate": 5.997192561916461e-05, + "loss": 1.9366, + "step": 14000 + }, + { + "epoch": 0.73, + "learning_rate": 5.997044851197922e-05, + "loss": 2.0161, + "step": 14100 + }, + { + "epoch": 0.74, + "learning_rate": 5.99689335554449e-05, + "loss": 1.9627, + "step": 14200 + }, + { + "epoch": 0.74, + "learning_rate": 5.996738075147486e-05, + "loss": 1.989, + "step": 14300 + }, + { + "epoch": 0.75, + "learning_rate": 5.9965790102030127e-05, + "loss": 1.9321, + "step": 14400 + }, + { + "epoch": 0.75, + "learning_rate": 5.99641616091195e-05, + "loss": 1.7904, + "step": 14500 + }, + { + "epoch": 0.76, + "learning_rate": 5.996249527479962e-05, + "loss": 1.8188, + "step": 14600 + }, + { + "epoch": 0.76, + "learning_rate": 5.996079110117484e-05, + "loss": 1.9421, + "step": 14700 + }, + { + "epoch": 0.77, + "learning_rate": 5.995904909039736e-05, + "loss": 1.7732, + "step": 14800 + }, + { + "epoch": 0.77, + "learning_rate": 5.995726924466715e-05, + "loss": 1.8639, + "step": 14900 + }, + { + "epoch": 0.78, + "learning_rate": 5.99554699302807e-05, + "loss": 1.8302, + "step": 15000 + }, + { + "epoch": 0.78, + "learning_rate": 5.995361479972862e-05, + "loss": 1.9115, + "step": 15100 + }, + { + "epoch": 0.79, + "learning_rate": 5.995172184108671e-05, + "loss": 1.9075, + "step": 15200 + }, + { + "epoch": 0.79, + "learning_rate": 5.994979105674557e-05, + "loss": 1.7628, + "step": 15300 + }, + { + "epoch": 0.8, + "learning_rate": 5.9947822449143566e-05, + "loss": 1.8985, + "step": 15400 + }, + { + "epoch": 0.8, + "learning_rate": 5.9945816020766824e-05, + "loss": 1.8767, + "step": 15500 + }, + { + "epoch": 0.81, + "learning_rate": 5.994377177414925e-05, + "loss": 1.7613, + "step": 15600 + }, + { + "epoch": 0.81, + "learning_rate": 5.9941689711872495e-05, + "loss": 1.8906, + "step": 15700 + }, + { + "epoch": 0.82, + "learning_rate": 5.993956983656598e-05, + "loss": 1.7939, + "step": 15800 + }, + { + "epoch": 0.82, + "learning_rate": 5.993741215090686e-05, + "loss": 1.8201, + "step": 15900 + }, + { + "epoch": 0.83, + "learning_rate": 5.993521665762006e-05, + "loss": 1.7952, + "step": 16000 + }, + { + "epoch": 0.83, + "learning_rate": 5.993298335947824e-05, + "loss": 1.7649, + "step": 16100 + }, + { + "epoch": 0.84, + "learning_rate": 5.9930712259301815e-05, + "loss": 1.7605, + "step": 16200 + }, + { + "epoch": 0.84, + "learning_rate": 5.9928403359958925e-05, + "loss": 1.855, + "step": 16300 + }, + { + "epoch": 0.85, + "learning_rate": 5.9926056664365456e-05, + "loss": 1.7398, + "step": 16400 + }, + { + "epoch": 0.85, + "learning_rate": 5.992367217548502e-05, + "loss": 1.8579, + "step": 16500 + }, + { + "epoch": 0.86, + "learning_rate": 5.992124989632898e-05, + "loss": 1.8768, + "step": 16600 + }, + { + "epoch": 0.86, + "learning_rate": 5.991878982995638e-05, + "loss": 1.7858, + "step": 16700 + }, + { + "epoch": 0.87, + "learning_rate": 5.9916291979474026e-05, + "loss": 1.784, + "step": 16800 + }, + { + "epoch": 0.88, + "learning_rate": 5.991375634803642e-05, + "loss": 1.8008, + "step": 16900 + }, + { + "epoch": 0.88, + "learning_rate": 5.991118293884579e-05, + "loss": 1.8043, + "step": 17000 + }, + { + "epoch": 0.89, + "learning_rate": 5.990857175515206e-05, + "loss": 1.7571, + "step": 17100 + }, + { + "epoch": 0.89, + "learning_rate": 5.9905922800252854e-05, + "loss": 1.8927, + "step": 17200 + }, + { + "epoch": 0.9, + "learning_rate": 5.990323607749354e-05, + "loss": 1.7737, + "step": 17300 + }, + { + "epoch": 0.9, + "learning_rate": 5.9900511590267124e-05, + "loss": 1.7595, + "step": 17400 + }, + { + "epoch": 0.91, + "learning_rate": 5.989774934201433e-05, + "loss": 1.7205, + "step": 17500 + }, + { + "epoch": 0.91, + "learning_rate": 5.989494933622358e-05, + "loss": 1.816, + "step": 17600 + }, + { + "epoch": 0.92, + "learning_rate": 5.989211157643097e-05, + "loss": 1.7381, + "step": 17700 + }, + { + "epoch": 0.92, + "learning_rate": 5.9889236066220285e-05, + "loss": 1.8072, + "step": 17800 + }, + { + "epoch": 0.93, + "learning_rate": 5.988632280922295e-05, + "loss": 1.7647, + "step": 17900 + }, + { + "epoch": 0.93, + "learning_rate": 5.988337180911812e-05, + "loss": 1.7531, + "step": 18000 + }, + { + "epoch": 0.94, + "learning_rate": 5.9880383069632536e-05, + "loss": 1.7142, + "step": 18100 + }, + { + "epoch": 0.94, + "learning_rate": 5.987741749382682e-05, + "loss": 1.8254, + "step": 18200 + }, + { + "epoch": 0.95, + "learning_rate": 5.987435404154869e-05, + "loss": 1.8182, + "step": 18300 + }, + { + "epoch": 0.95, + "learning_rate": 5.9871252861278286e-05, + "loss": 1.7693, + "step": 18400 + }, + { + "epoch": 0.96, + "learning_rate": 5.9868113956932036e-05, + "loss": 1.7431, + "step": 18500 + }, + { + "epoch": 0.96, + "learning_rate": 5.986493733247402e-05, + "loss": 1.7961, + "step": 18600 + }, + { + "epoch": 0.97, + "learning_rate": 5.986172299191598e-05, + "loss": 1.6683, + "step": 18700 + }, + { + "epoch": 0.97, + "learning_rate": 5.985847093931726e-05, + "loss": 1.7305, + "step": 18800 + }, + { + "epoch": 0.98, + "learning_rate": 5.985518117878484e-05, + "loss": 1.7088, + "step": 18900 + }, + { + "epoch": 0.98, + "learning_rate": 5.9851853714473335e-05, + "loss": 1.6971, + "step": 19000 + }, + { + "epoch": 0.99, + "learning_rate": 5.984848855058495e-05, + "loss": 1.6925, + "step": 19100 + }, + { + "epoch": 0.99, + "learning_rate": 5.984508569136952e-05, + "loss": 1.6972, + "step": 19200 + }, + { + "epoch": 1.0, + "learning_rate": 5.984164514112447e-05, + "loss": 1.65, + "step": 19300 + }, + { + "epoch": 1.0, + "eval_accuracy": 0.6241805248136068, + "eval_cer": 0.30962444297001096, + "eval_loss": 1.6472936868667603, + "eval_runtime": 4313.7933, + "eval_samples_per_second": 3.98, + "eval_steps_per_second": 0.249, + "eval_wer": 0.5482265749073584, + "step": 19313 + }, + { + "epoch": 1.0, + "learning_rate": 5.983816690419484e-05, + "loss": 1.6502, + "step": 19400 + }, + { + "epoch": 1.01, + "learning_rate": 5.983465098497327e-05, + "loss": 1.7195, + "step": 19500 + }, + { + "epoch": 1.01, + "learning_rate": 5.983109738789995e-05, + "loss": 1.6154, + "step": 19600 + }, + { + "epoch": 1.02, + "learning_rate": 5.9827506117462686e-05, + "loss": 1.6513, + "step": 19700 + }, + { + "epoch": 1.03, + "learning_rate": 5.9823877178196866e-05, + "loss": 1.6085, + "step": 19800 + }, + { + "epoch": 1.03, + "learning_rate": 5.982021057468542e-05, + "loss": 1.557, + "step": 19900 + }, + { + "epoch": 1.04, + "learning_rate": 5.9816506311558886e-05, + "loss": 1.6473, + "step": 20000 + }, + { + "epoch": 1.04, + "learning_rate": 5.981276439349531e-05, + "loss": 1.6252, + "step": 20100 + }, + { + "epoch": 1.05, + "learning_rate": 5.980898482522034e-05, + "loss": 1.5114, + "step": 20200 + }, + { + "epoch": 1.05, + "learning_rate": 5.980516761150713e-05, + "loss": 1.4987, + "step": 20300 + }, + { + "epoch": 1.06, + "learning_rate": 5.980131275717641e-05, + "loss": 1.5771, + "step": 20400 + }, + { + "epoch": 1.06, + "learning_rate": 5.979742026709645e-05, + "loss": 1.5157, + "step": 20500 + }, + { + "epoch": 1.07, + "learning_rate": 5.9793490146183e-05, + "loss": 1.5522, + "step": 20600 + }, + { + "epoch": 1.07, + "learning_rate": 5.9789522399399387e-05, + "loss": 1.6356, + "step": 20700 + }, + { + "epoch": 1.08, + "learning_rate": 5.978551703175643e-05, + "loss": 1.5537, + "step": 20800 + }, + { + "epoch": 1.08, + "learning_rate": 5.978147404831245e-05, + "loss": 1.5864, + "step": 20900 + }, + { + "epoch": 1.09, + "learning_rate": 5.977739345417331e-05, + "loss": 1.5781, + "step": 21000 + }, + { + "epoch": 1.09, + "learning_rate": 5.9773275254492334e-05, + "loss": 1.6126, + "step": 21100 + }, + { + "epoch": 1.1, + "learning_rate": 5.9769119454470346e-05, + "loss": 1.5866, + "step": 21200 + }, + { + "epoch": 1.1, + "learning_rate": 5.9764926059355683e-05, + "loss": 1.6155, + "step": 21300 + }, + { + "epoch": 1.11, + "learning_rate": 5.976069507444411e-05, + "loss": 1.582, + "step": 21400 + }, + { + "epoch": 1.11, + "learning_rate": 5.97564265050789e-05, + "loss": 1.6416, + "step": 21500 + }, + { + "epoch": 1.12, + "learning_rate": 5.975212035665079e-05, + "loss": 1.4625, + "step": 21600 + }, + { + "epoch": 1.12, + "learning_rate": 5.9747776634597963e-05, + "loss": 1.6298, + "step": 21700 + }, + { + "epoch": 1.13, + "learning_rate": 5.9743395344406064e-05, + "loss": 1.5382, + "step": 21800 + }, + { + "epoch": 1.13, + "learning_rate": 5.973897649160815e-05, + "loss": 1.547, + "step": 21900 + }, + { + "epoch": 1.14, + "learning_rate": 5.9734520081784775e-05, + "loss": 1.567, + "step": 22000 + }, + { + "epoch": 1.14, + "learning_rate": 5.9730026120563875e-05, + "loss": 1.5915, + "step": 22100 + }, + { + "epoch": 1.15, + "learning_rate": 5.972549461362082e-05, + "loss": 1.5134, + "step": 22200 + }, + { + "epoch": 1.15, + "learning_rate": 5.972097144295192e-05, + "loss": 1.5749, + "step": 22300 + }, + { + "epoch": 1.16, + "learning_rate": 5.971636523709392e-05, + "loss": 1.5486, + "step": 22400 + }, + { + "epoch": 1.17, + "learning_rate": 5.9711721502765944e-05, + "loss": 1.5602, + "step": 22500 + }, + { + "epoch": 1.17, + "learning_rate": 5.970704024583252e-05, + "loss": 1.4998, + "step": 22600 + }, + { + "epoch": 1.18, + "learning_rate": 5.970232147220556e-05, + "loss": 1.5321, + "step": 22700 + }, + { + "epoch": 1.18, + "learning_rate": 5.969756518784433e-05, + "loss": 1.5061, + "step": 22800 + }, + { + "epoch": 1.19, + "learning_rate": 5.969277139875551e-05, + "loss": 1.5233, + "step": 22900 + }, + { + "epoch": 1.19, + "learning_rate": 5.968794011099312e-05, + "loss": 1.5719, + "step": 23000 + }, + { + "epoch": 1.2, + "learning_rate": 5.968307133065853e-05, + "loss": 1.6042, + "step": 23100 + }, + { + "epoch": 1.2, + "learning_rate": 5.9678165063900475e-05, + "loss": 1.575, + "step": 23200 + }, + { + "epoch": 1.21, + "learning_rate": 5.967322131691504e-05, + "loss": 1.6676, + "step": 23300 + }, + { + "epoch": 1.21, + "learning_rate": 5.9668240095945606e-05, + "loss": 1.5472, + "step": 23400 + }, + { + "epoch": 1.22, + "learning_rate": 5.966322140728291e-05, + "loss": 1.5739, + "step": 23500 + }, + { + "epoch": 1.22, + "learning_rate": 5.9658165257264996e-05, + "loss": 1.5337, + "step": 23600 + }, + { + "epoch": 1.23, + "learning_rate": 5.9653071652277224e-05, + "loss": 1.5106, + "step": 23700 + }, + { + "epoch": 1.23, + "learning_rate": 5.9647940598752254e-05, + "loss": 1.494, + "step": 23800 + }, + { + "epoch": 1.24, + "learning_rate": 5.964277210317004e-05, + "loss": 1.5296, + "step": 23900 + }, + { + "epoch": 1.24, + "learning_rate": 5.96375661720578e-05, + "loss": 1.5525, + "step": 24000 + }, + { + "epoch": 1.25, + "learning_rate": 5.963232281199006e-05, + "loss": 1.5075, + "step": 24100 + }, + { + "epoch": 1.25, + "learning_rate": 5.962704202958861e-05, + "loss": 1.4719, + "step": 24200 + }, + { + "epoch": 1.26, + "learning_rate": 5.9621723831522475e-05, + "loss": 1.5053, + "step": 24300 + }, + { + "epoch": 1.26, + "learning_rate": 5.961636822450795e-05, + "loss": 1.5558, + "step": 24400 + }, + { + "epoch": 1.27, + "learning_rate": 5.961097521530859e-05, + "loss": 1.5275, + "step": 24500 + }, + { + "epoch": 1.27, + "learning_rate": 5.960554481073515e-05, + "loss": 1.4672, + "step": 24600 + }, + { + "epoch": 1.28, + "learning_rate": 5.960013188062705e-05, + "loss": 1.5327, + "step": 24700 + }, + { + "epoch": 1.28, + "learning_rate": 5.9594627079708444e-05, + "loss": 1.4686, + "step": 24800 + }, + { + "epoch": 1.29, + "learning_rate": 5.958908490406165e-05, + "loss": 1.548, + "step": 24900 + }, + { + "epoch": 1.29, + "learning_rate": 5.958350536068581e-05, + "loss": 1.5065, + "step": 25000 + }, + { + "epoch": 1.3, + "learning_rate": 5.9577888456627254e-05, + "loss": 1.5478, + "step": 25100 + }, + { + "epoch": 1.3, + "learning_rate": 5.9572234198979544e-05, + "loss": 1.5496, + "step": 25200 + }, + { + "epoch": 1.31, + "learning_rate": 5.9566542594883356e-05, + "loss": 1.5035, + "step": 25300 + }, + { + "epoch": 1.32, + "learning_rate": 5.9560813651526565e-05, + "loss": 1.5482, + "step": 25400 + }, + { + "epoch": 1.32, + "learning_rate": 5.955510522366766e-05, + "loss": 1.6321, + "step": 25500 + }, + { + "epoch": 1.33, + "learning_rate": 5.954930199675307e-05, + "loss": 1.4299, + "step": 25600 + }, + { + "epoch": 1.33, + "learning_rate": 5.9543461452350854e-05, + "loss": 1.5901, + "step": 25700 + }, + { + "epoch": 1.34, + "learning_rate": 5.953758359783694e-05, + "loss": 1.425, + "step": 25800 + }, + { + "epoch": 1.34, + "learning_rate": 5.9531668440634424e-05, + "loss": 1.4047, + "step": 25900 + }, + { + "epoch": 1.35, + "learning_rate": 5.952571598821347e-05, + "loss": 1.4779, + "step": 26000 + }, + { + "epoch": 1.35, + "learning_rate": 5.951972624809139e-05, + "loss": 1.4993, + "step": 26100 + }, + { + "epoch": 1.36, + "learning_rate": 5.951369922783254e-05, + "loss": 1.4967, + "step": 26200 + }, + { + "epoch": 1.36, + "learning_rate": 5.95076349350484e-05, + "loss": 1.4111, + "step": 26300 + }, + { + "epoch": 1.37, + "learning_rate": 5.950153337739747e-05, + "loss": 1.4713, + "step": 26400 + }, + { + "epoch": 1.37, + "learning_rate": 5.949539456258536e-05, + "loss": 1.4811, + "step": 26500 + }, + { + "epoch": 1.38, + "learning_rate": 5.948921849836471e-05, + "loss": 1.4733, + "step": 26600 + }, + { + "epoch": 1.38, + "learning_rate": 5.9483005192535203e-05, + "loss": 1.4498, + "step": 26700 + }, + { + "epoch": 1.39, + "learning_rate": 5.947675465294355e-05, + "loss": 1.4915, + "step": 26800 + }, + { + "epoch": 1.39, + "learning_rate": 5.947046688748348e-05, + "loss": 1.576, + "step": 26900 + }, + { + "epoch": 1.4, + "learning_rate": 5.946414190409576e-05, + "loss": 1.4747, + "step": 27000 + }, + { + "epoch": 1.4, + "learning_rate": 5.9457779710768136e-05, + "loss": 1.4618, + "step": 27100 + }, + { + "epoch": 1.41, + "learning_rate": 5.945138031553535e-05, + "loss": 1.496, + "step": 27200 + }, + { + "epoch": 1.41, + "learning_rate": 5.944494372647913e-05, + "loss": 1.453, + "step": 27300 + }, + { + "epoch": 1.42, + "learning_rate": 5.943846995172817e-05, + "loss": 1.4488, + "step": 27400 + }, + { + "epoch": 1.42, + "learning_rate": 5.943195899945812e-05, + "loss": 1.3713, + "step": 27500 + }, + { + "epoch": 1.43, + "learning_rate": 5.942541087789161e-05, + "loss": 1.4559, + "step": 27600 + }, + { + "epoch": 1.43, + "learning_rate": 5.941882559529818e-05, + "loss": 1.5319, + "step": 27700 + }, + { + "epoch": 1.44, + "learning_rate": 5.941220315999431e-05, + "loss": 1.4513, + "step": 27800 + }, + { + "epoch": 1.44, + "learning_rate": 5.94055435803434e-05, + "loss": 1.4144, + "step": 27900 + }, + { + "epoch": 1.45, + "learning_rate": 5.939884686475576e-05, + "loss": 1.4676, + "step": 28000 + }, + { + "epoch": 1.45, + "learning_rate": 5.93921130216886e-05, + "loss": 1.4143, + "step": 28100 + }, + { + "epoch": 1.46, + "learning_rate": 5.938534205964602e-05, + "loss": 1.3961, + "step": 28200 + }, + { + "epoch": 1.47, + "learning_rate": 5.9378533987178984e-05, + "loss": 1.4351, + "step": 28300 + }, + { + "epoch": 1.47, + "learning_rate": 5.937175744825397e-05, + "loss": 1.4756, + "step": 28400 + }, + { + "epoch": 1.48, + "learning_rate": 5.936494455421633e-05, + "loss": 1.44, + "step": 28500 + }, + { + "epoch": 1.48, + "learning_rate": 5.935802594385472e-05, + "loss": 1.4426, + "step": 28600 + }, + { + "epoch": 1.49, + "learning_rate": 5.9351070257565887e-05, + "loss": 1.5183, + "step": 28700 + }, + { + "epoch": 1.49, + "learning_rate": 5.934407750413408e-05, + "loss": 1.4696, + "step": 28800 + }, + { + "epoch": 1.5, + "learning_rate": 5.9337047692390365e-05, + "loss": 1.4894, + "step": 28900 + }, + { + "epoch": 1.5, + "learning_rate": 5.932998083121263e-05, + "loss": 1.4572, + "step": 29000 + }, + { + "epoch": 1.51, + "learning_rate": 5.932287692952552e-05, + "loss": 1.4113, + "step": 29100 + }, + { + "epoch": 1.51, + "learning_rate": 5.93157359963005e-05, + "loss": 1.5115, + "step": 29200 + }, + { + "epoch": 1.52, + "learning_rate": 5.930855804055575e-05, + "loss": 1.447, + "step": 29300 + }, + { + "epoch": 1.52, + "learning_rate": 5.930134307135624e-05, + "loss": 1.3965, + "step": 29400 + }, + { + "epoch": 1.53, + "learning_rate": 5.929409109781368e-05, + "loss": 1.386, + "step": 29500 + }, + { + "epoch": 1.53, + "learning_rate": 5.92868021290865e-05, + "loss": 1.3903, + "step": 29600 + }, + { + "epoch": 1.54, + "learning_rate": 5.9279476174379853e-05, + "loss": 1.4516, + "step": 29700 + }, + { + "epoch": 1.54, + "learning_rate": 5.9272113242945624e-05, + "loss": 1.4179, + "step": 29800 + }, + { + "epoch": 1.55, + "learning_rate": 5.926471334408236e-05, + "loss": 1.4241, + "step": 29900 + }, + { + "epoch": 1.55, + "learning_rate": 5.925727648713532e-05, + "loss": 1.3328, + "step": 30000 + }, + { + "epoch": 1.56, + "learning_rate": 5.924980268149644e-05, + "loss": 1.4585, + "step": 30100 + }, + { + "epoch": 1.56, + "learning_rate": 5.9242291936604285e-05, + "loss": 1.4253, + "step": 30200 + }, + { + "epoch": 1.57, + "learning_rate": 5.923474426194411e-05, + "loss": 1.4561, + "step": 30300 + }, + { + "epoch": 1.57, + "learning_rate": 5.922715966704777e-05, + "loss": 1.4155, + "step": 30400 + }, + { + "epoch": 1.58, + "learning_rate": 5.9219538161493786e-05, + "loss": 1.3616, + "step": 30500 + }, + { + "epoch": 1.58, + "learning_rate": 5.9211879754907256e-05, + "loss": 1.3037, + "step": 30600 + }, + { + "epoch": 1.59, + "learning_rate": 5.9204184456959924e-05, + "loss": 1.4393, + "step": 30700 + }, + { + "epoch": 1.59, + "learning_rate": 5.919645227737007e-05, + "loss": 1.4787, + "step": 30800 + }, + { + "epoch": 1.6, + "learning_rate": 5.918868322590259e-05, + "loss": 1.3642, + "step": 30900 + }, + { + "epoch": 1.61, + "learning_rate": 5.918087731236893e-05, + "loss": 1.3832, + "step": 31000 + }, + { + "epoch": 1.61, + "learning_rate": 5.91730345466271e-05, + "loss": 1.435, + "step": 31100 + }, + { + "epoch": 1.62, + "learning_rate": 5.9165154938581625e-05, + "loss": 1.3421, + "step": 31200 + }, + { + "epoch": 1.62, + "learning_rate": 5.9157238498183594e-05, + "loss": 1.3711, + "step": 31300 + }, + { + "epoch": 1.63, + "learning_rate": 5.914928523543058e-05, + "loss": 1.4473, + "step": 31400 + }, + { + "epoch": 1.63, + "learning_rate": 5.9141295160366676e-05, + "loss": 1.4473, + "step": 31500 + }, + { + "epoch": 1.64, + "learning_rate": 5.913326828308247e-05, + "loss": 1.2771, + "step": 31600 + }, + { + "epoch": 1.64, + "learning_rate": 5.912520461371499e-05, + "loss": 1.3727, + "step": 31700 + }, + { + "epoch": 1.65, + "learning_rate": 5.911710416244778e-05, + "loss": 1.4304, + "step": 31800 + }, + { + "epoch": 1.65, + "learning_rate": 5.91089669395108e-05, + "loss": 1.3999, + "step": 31900 + }, + { + "epoch": 1.66, + "learning_rate": 5.910079295518046e-05, + "loss": 1.3341, + "step": 32000 + }, + { + "epoch": 1.66, + "learning_rate": 5.909258221977959e-05, + "loss": 1.3578, + "step": 32100 + }, + { + "epoch": 1.67, + "learning_rate": 5.908433474367745e-05, + "loss": 1.3354, + "step": 32200 + }, + { + "epoch": 1.67, + "learning_rate": 5.907605053728967e-05, + "loss": 1.3043, + "step": 32300 + }, + { + "epoch": 1.68, + "learning_rate": 5.90677296110783e-05, + "loss": 1.2493, + "step": 32400 + }, + { + "epoch": 1.68, + "learning_rate": 5.905937197555174e-05, + "loss": 1.4088, + "step": 32500 + }, + { + "epoch": 1.69, + "learning_rate": 5.905106176623172e-05, + "loss": 1.4173, + "step": 32600 + }, + { + "epoch": 1.69, + "learning_rate": 5.904263111061438e-05, + "loss": 1.344, + "step": 32700 + }, + { + "epoch": 1.7, + "learning_rate": 5.903416377737847e-05, + "loss": 1.3147, + "step": 32800 + }, + { + "epoch": 1.7, + "learning_rate": 5.902565977721728e-05, + "loss": 1.4387, + "step": 32900 + }, + { + "epoch": 1.71, + "learning_rate": 5.901711912087044e-05, + "loss": 1.3172, + "step": 33000 + }, + { + "epoch": 1.71, + "learning_rate": 5.9008541819123836e-05, + "loss": 1.364, + "step": 33100 + }, + { + "epoch": 1.72, + "learning_rate": 5.8999927882809645e-05, + "loss": 1.275, + "step": 33200 + }, + { + "epoch": 1.72, + "learning_rate": 5.899127732280632e-05, + "loss": 1.3297, + "step": 33300 + }, + { + "epoch": 1.73, + "learning_rate": 5.898259015003856e-05, + "loss": 1.3118, + "step": 33400 + }, + { + "epoch": 1.73, + "learning_rate": 5.897386637547728e-05, + "loss": 1.3985, + "step": 33500 + }, + { + "epoch": 1.74, + "learning_rate": 5.896510601013967e-05, + "loss": 1.4055, + "step": 33600 + }, + { + "epoch": 1.74, + "learning_rate": 5.895630906508907e-05, + "loss": 1.3629, + "step": 33700 + }, + { + "epoch": 1.75, + "learning_rate": 5.894747555143506e-05, + "loss": 1.337, + "step": 33800 + }, + { + "epoch": 1.76, + "learning_rate": 5.893860548033339e-05, + "loss": 1.3023, + "step": 33900 + }, + { + "epoch": 1.76, + "learning_rate": 5.892969886298596e-05, + "loss": 1.2466, + "step": 34000 + }, + { + "epoch": 1.77, + "learning_rate": 5.892075571064085e-05, + "loss": 1.2955, + "step": 34100 + }, + { + "epoch": 1.77, + "learning_rate": 5.891177603459227e-05, + "loss": 1.3385, + "step": 34200 + }, + { + "epoch": 1.78, + "learning_rate": 5.890275984618055e-05, + "loss": 1.3597, + "step": 34300 + }, + { + "epoch": 1.78, + "learning_rate": 5.8893707156792135e-05, + "loss": 1.2796, + "step": 34400 + }, + { + "epoch": 1.79, + "learning_rate": 5.888461797785956e-05, + "loss": 1.3459, + "step": 34500 + }, + { + "epoch": 1.79, + "learning_rate": 5.8875492320861454e-05, + "loss": 1.3587, + "step": 34600 + }, + { + "epoch": 1.8, + "learning_rate": 5.8866330197322516e-05, + "loss": 1.4192, + "step": 34700 + }, + { + "epoch": 1.8, + "learning_rate": 5.8857131618813486e-05, + "loss": 1.358, + "step": 34800 + }, + { + "epoch": 1.81, + "learning_rate": 5.8847989127526116e-05, + "loss": 1.305, + "step": 34900 + }, + { + "epoch": 1.81, + "learning_rate": 5.883871803823229e-05, + "loss": 1.3683, + "step": 35000 + }, + { + "epoch": 1.82, + "learning_rate": 5.882941052883947e-05, + "loss": 1.3466, + "step": 35100 + }, + { + "epoch": 1.82, + "learning_rate": 5.882006661110199e-05, + "loss": 1.3494, + "step": 35200 + }, + { + "epoch": 1.83, + "learning_rate": 5.881078028008705e-05, + "loss": 1.3197, + "step": 35300 + }, + { + "epoch": 1.83, + "learning_rate": 5.880136394489542e-05, + "loss": 1.3363, + "step": 35400 + }, + { + "epoch": 1.84, + "learning_rate": 5.8791911236778864e-05, + "loss": 1.441, + "step": 35500 + }, + { + "epoch": 1.84, + "learning_rate": 5.878242216767509e-05, + "loss": 1.2912, + "step": 35600 + }, + { + "epoch": 1.85, + "learning_rate": 5.8772896749567756e-05, + "loss": 1.277, + "step": 35700 + }, + { + "epoch": 1.85, + "learning_rate": 5.87633349944864e-05, + "loss": 1.3575, + "step": 35800 + }, + { + "epoch": 1.86, + "learning_rate": 5.875373691450646e-05, + "loss": 1.2954, + "step": 35900 + }, + { + "epoch": 1.86, + "learning_rate": 5.874410252174923e-05, + "loss": 1.2788, + "step": 36000 + }, + { + "epoch": 1.87, + "learning_rate": 5.87344318283819e-05, + "loss": 1.3734, + "step": 36100 + }, + { + "epoch": 1.87, + "learning_rate": 5.872472484661747e-05, + "loss": 1.3874, + "step": 36200 + }, + { + "epoch": 1.88, + "learning_rate": 5.8714981588714784e-05, + "loss": 1.4144, + "step": 36300 + }, + { + "epoch": 1.88, + "learning_rate": 5.8705202066978494e-05, + "loss": 1.3132, + "step": 36400 + }, + { + "epoch": 1.89, + "learning_rate": 5.8695386293759045e-05, + "loss": 1.3473, + "step": 36500 + }, + { + "epoch": 1.9, + "learning_rate": 5.868553428145268e-05, + "loss": 1.1999, + "step": 36600 + }, + { + "epoch": 1.9, + "learning_rate": 5.8675646042501386e-05, + "loss": 1.3309, + "step": 36700 + }, + { + "epoch": 1.91, + "learning_rate": 5.8665721589392915e-05, + "loss": 1.3468, + "step": 36800 + }, + { + "epoch": 1.91, + "learning_rate": 5.8655760934660754e-05, + "loss": 1.2338, + "step": 36900 + }, + { + "epoch": 1.92, + "learning_rate": 5.8645764090884096e-05, + "loss": 1.2547, + "step": 37000 + }, + { + "epoch": 1.92, + "learning_rate": 5.8635731070687844e-05, + "loss": 1.2999, + "step": 37100 + }, + { + "epoch": 1.93, + "learning_rate": 5.86256618867426e-05, + "loss": 1.4702, + "step": 37200 + }, + { + "epoch": 1.93, + "learning_rate": 5.8615556551764615e-05, + "loss": 1.3204, + "step": 37300 + }, + { + "epoch": 1.94, + "learning_rate": 5.8605415078515815e-05, + "loss": 1.3127, + "step": 37400 + }, + { + "epoch": 1.94, + "learning_rate": 5.8595237479803736e-05, + "loss": 1.3934, + "step": 37500 + }, + { + "epoch": 1.95, + "learning_rate": 5.858502376848158e-05, + "loss": 1.2739, + "step": 37600 + }, + { + "epoch": 1.95, + "learning_rate": 5.85747739574481e-05, + "loss": 1.3122, + "step": 37700 + }, + { + "epoch": 1.96, + "learning_rate": 5.8564488059647706e-05, + "loss": 1.35, + "step": 37800 + }, + { + "epoch": 1.96, + "learning_rate": 5.8554166088070315e-05, + "loss": 1.3605, + "step": 37900 + }, + { + "epoch": 1.97, + "learning_rate": 5.854380805575145e-05, + "loss": 1.3194, + "step": 38000 + }, + { + "epoch": 1.97, + "learning_rate": 5.8533413975772136e-05, + "loss": 1.2737, + "step": 38100 + }, + { + "epoch": 1.98, + "learning_rate": 5.852298386125897e-05, + "loss": 1.2602, + "step": 38200 + }, + { + "epoch": 1.98, + "learning_rate": 5.851262256500513e-05, + "loss": 1.3075, + "step": 38300 + }, + { + "epoch": 1.99, + "learning_rate": 5.850212078100181e-05, + "loss": 1.2872, + "step": 38400 + }, + { + "epoch": 1.99, + "learning_rate": 5.849158300198444e-05, + "loss": 1.3064, + "step": 38500 + }, + { + "epoch": 2.0, + "learning_rate": 5.8481009241261095e-05, + "loss": 1.2797, + "step": 38600 + }, + { + "epoch": 2.0, + "eval_accuracy": 0.6232878756989748, + "eval_cer": 0.23382789596773815, + "eval_loss": 1.2337921857833862, + "eval_runtime": 4874.1634, + "eval_samples_per_second": 3.522, + "eval_steps_per_second": 0.22, + "eval_wer": 0.44312687488971236, + "step": 38626 + }, + { + "epoch": 2.0, + "learning_rate": 5.847039951218522e-05, + "loss": 1.1756, + "step": 38700 + }, + { + "epoch": 2.01, + "learning_rate": 5.845975382815577e-05, + "loss": 1.2514, + "step": 38800 + }, + { + "epoch": 2.01, + "learning_rate": 5.844907220261703e-05, + "loss": 1.1599, + "step": 38900 + }, + { + "epoch": 2.02, + "learning_rate": 5.843835464905872e-05, + "loss": 1.1254, + "step": 39000 + }, + { + "epoch": 2.02, + "learning_rate": 5.842760118101592e-05, + "loss": 1.2388, + "step": 39100 + }, + { + "epoch": 2.03, + "learning_rate": 5.8416811812069056e-05, + "loss": 1.2362, + "step": 39200 + }, + { + "epoch": 2.03, + "learning_rate": 5.8405986555843916e-05, + "loss": 1.1625, + "step": 39300 + }, + { + "epoch": 2.04, + "learning_rate": 5.839512542601159e-05, + "loss": 1.2258, + "step": 39400 + }, + { + "epoch": 2.05, + "learning_rate": 5.8384228436288476e-05, + "loss": 1.2098, + "step": 39500 + }, + { + "epoch": 2.05, + "learning_rate": 5.837329560043628e-05, + "loss": 1.1358, + "step": 39600 + }, + { + "epoch": 2.06, + "learning_rate": 5.836232693226193e-05, + "loss": 1.1938, + "step": 39700 + }, + { + "epoch": 2.06, + "learning_rate": 5.835132244561766e-05, + "loss": 1.1202, + "step": 39800 + }, + { + "epoch": 2.07, + "learning_rate": 5.8340282154400905e-05, + "loss": 1.1792, + "step": 39900 + }, + { + "epoch": 2.07, + "learning_rate": 5.8329206072554335e-05, + "loss": 1.2488, + "step": 40000 + }, + { + "epoch": 2.08, + "learning_rate": 5.83180942140658e-05, + "loss": 1.1636, + "step": 40100 + }, + { + "epoch": 2.08, + "learning_rate": 5.830694659296836e-05, + "loss": 1.1551, + "step": 40200 + }, + { + "epoch": 2.09, + "learning_rate": 5.829587523394537e-05, + "loss": 1.1864, + "step": 40300 + }, + { + "epoch": 2.09, + "learning_rate": 5.8284656487183875e-05, + "loss": 1.1599, + "step": 40400 + }, + { + "epoch": 2.1, + "learning_rate": 5.82734020200416e-05, + "loss": 1.1651, + "step": 40500 + }, + { + "epoch": 2.1, + "learning_rate": 5.82621118467317e-05, + "loss": 1.1779, + "step": 40600 + }, + { + "epoch": 2.11, + "learning_rate": 5.8250785981512384e-05, + "loss": 1.1994, + "step": 40700 + }, + { + "epoch": 2.11, + "learning_rate": 5.823942443868698e-05, + "loss": 1.2254, + "step": 40800 + }, + { + "epoch": 2.12, + "learning_rate": 5.822802723260385e-05, + "loss": 1.0945, + "step": 40900 + }, + { + "epoch": 2.12, + "learning_rate": 5.8216594377656414e-05, + "loss": 1.1229, + "step": 41000 + }, + { + "epoch": 2.13, + "learning_rate": 5.820512588828308e-05, + "loss": 1.1594, + "step": 41100 + }, + { + "epoch": 2.13, + "learning_rate": 5.819362177896728e-05, + "loss": 1.1218, + "step": 41200 + }, + { + "epoch": 2.14, + "learning_rate": 5.818208206423743e-05, + "loss": 1.2261, + "step": 41300 + }, + { + "epoch": 2.14, + "learning_rate": 5.817050675866691e-05, + "loss": 1.1001, + "step": 41400 + }, + { + "epoch": 2.15, + "learning_rate": 5.815889587687405e-05, + "loss": 1.1222, + "step": 41500 + }, + { + "epoch": 2.15, + "learning_rate": 5.81472494335221e-05, + "loss": 1.108, + "step": 41600 + }, + { + "epoch": 2.16, + "learning_rate": 5.813556744331922e-05, + "loss": 1.1862, + "step": 41700 + }, + { + "epoch": 2.16, + "learning_rate": 5.812384992101847e-05, + "loss": 1.1968, + "step": 41800 + }, + { + "epoch": 2.17, + "learning_rate": 5.811209688141778e-05, + "loss": 1.1308, + "step": 41900 + }, + { + "epoch": 2.17, + "learning_rate": 5.8100308339359934e-05, + "loss": 1.2425, + "step": 42000 + }, + { + "epoch": 2.18, + "learning_rate": 5.808848430973256e-05, + "loss": 1.0727, + "step": 42100 + }, + { + "epoch": 2.19, + "learning_rate": 5.807662480746807e-05, + "loss": 1.2195, + "step": 42200 + }, + { + "epoch": 2.19, + "learning_rate": 5.806472984754373e-05, + "loss": 1.1253, + "step": 42300 + }, + { + "epoch": 2.2, + "learning_rate": 5.805279944498154e-05, + "loss": 1.226, + "step": 42400 + }, + { + "epoch": 2.2, + "learning_rate": 5.804083361484826e-05, + "loss": 1.1783, + "step": 42500 + }, + { + "epoch": 2.21, + "learning_rate": 5.802883237225542e-05, + "loss": 1.2107, + "step": 42600 + }, + { + "epoch": 2.21, + "learning_rate": 5.8016795732359265e-05, + "loss": 1.1673, + "step": 42700 + }, + { + "epoch": 2.22, + "learning_rate": 5.800472371036072e-05, + "loss": 1.168, + "step": 42800 + }, + { + "epoch": 2.22, + "learning_rate": 5.799261632150541e-05, + "loss": 1.208, + "step": 42900 + }, + { + "epoch": 2.23, + "learning_rate": 5.7980473581083634e-05, + "loss": 1.1476, + "step": 43000 + }, + { + "epoch": 2.23, + "learning_rate": 5.796829550443031e-05, + "loss": 1.1235, + "step": 43100 + }, + { + "epoch": 2.24, + "learning_rate": 5.7956082106925004e-05, + "loss": 1.1751, + "step": 43200 + }, + { + "epoch": 2.24, + "learning_rate": 5.794383340399188e-05, + "loss": 1.1916, + "step": 43300 + }, + { + "epoch": 2.25, + "learning_rate": 5.793154941109969e-05, + "loss": 1.1765, + "step": 43400 + }, + { + "epoch": 2.25, + "learning_rate": 5.791923014376177e-05, + "loss": 1.0941, + "step": 43500 + }, + { + "epoch": 2.26, + "learning_rate": 5.790687561753595e-05, + "loss": 1.1125, + "step": 43600 + }, + { + "epoch": 2.26, + "learning_rate": 5.789448584802465e-05, + "loss": 1.2128, + "step": 43700 + }, + { + "epoch": 2.27, + "learning_rate": 5.7882060850874774e-05, + "loss": 1.1037, + "step": 43800 + }, + { + "epoch": 2.27, + "learning_rate": 5.786960064177771e-05, + "loss": 1.1701, + "step": 43900 + }, + { + "epoch": 2.28, + "learning_rate": 5.785710523646931e-05, + "loss": 1.1476, + "step": 44000 + }, + { + "epoch": 2.28, + "learning_rate": 5.784457465072989e-05, + "loss": 1.1389, + "step": 44100 + }, + { + "epoch": 2.29, + "learning_rate": 5.78320089003842e-05, + "loss": 1.1858, + "step": 44200 + }, + { + "epoch": 2.29, + "learning_rate": 5.781940800130137e-05, + "loss": 1.2607, + "step": 44300 + }, + { + "epoch": 2.3, + "learning_rate": 5.7806771969394945e-05, + "loss": 1.1416, + "step": 44400 + }, + { + "epoch": 2.3, + "learning_rate": 5.779410082062283e-05, + "loss": 1.1553, + "step": 44500 + }, + { + "epoch": 2.31, + "learning_rate": 5.778139457098727e-05, + "loss": 1.1428, + "step": 44600 + }, + { + "epoch": 2.31, + "learning_rate": 5.7768653236534865e-05, + "loss": 1.1515, + "step": 44700 + }, + { + "epoch": 2.32, + "learning_rate": 5.77558768333565e-05, + "loss": 1.2046, + "step": 44800 + }, + { + "epoch": 2.32, + "learning_rate": 5.7743065377587336e-05, + "loss": 1.117, + "step": 44900 + }, + { + "epoch": 2.33, + "learning_rate": 5.773021888540684e-05, + "loss": 1.22, + "step": 45000 + }, + { + "epoch": 2.34, + "learning_rate": 5.77173373730387e-05, + "loss": 1.0883, + "step": 45100 + }, + { + "epoch": 2.34, + "learning_rate": 5.770442085675084e-05, + "loss": 1.1552, + "step": 45200 + }, + { + "epoch": 2.35, + "learning_rate": 5.769146935285536e-05, + "loss": 1.191, + "step": 45300 + }, + { + "epoch": 2.35, + "learning_rate": 5.767848287770861e-05, + "loss": 1.0745, + "step": 45400 + }, + { + "epoch": 2.36, + "learning_rate": 5.766546144771105e-05, + "loss": 1.1629, + "step": 45500 + }, + { + "epoch": 2.36, + "learning_rate": 5.765240507930729e-05, + "loss": 1.2327, + "step": 45600 + }, + { + "epoch": 2.37, + "learning_rate": 5.763931378898609e-05, + "loss": 1.2258, + "step": 45700 + }, + { + "epoch": 2.37, + "learning_rate": 5.762618759328028e-05, + "loss": 1.1294, + "step": 45800 + }, + { + "epoch": 2.38, + "learning_rate": 5.76130265087668e-05, + "loss": 1.2536, + "step": 45900 + }, + { + "epoch": 2.38, + "learning_rate": 5.759983055206664e-05, + "loss": 1.1157, + "step": 46000 + }, + { + "epoch": 2.39, + "learning_rate": 5.7586732220447036e-05, + "loss": 1.1445, + "step": 46100 + }, + { + "epoch": 2.39, + "learning_rate": 5.7573466917717874e-05, + "loss": 1.1632, + "step": 46200 + }, + { + "epoch": 2.4, + "learning_rate": 5.756016679276139e-05, + "loss": 1.1203, + "step": 46300 + }, + { + "epoch": 2.4, + "learning_rate": 5.754683186237419e-05, + "loss": 1.1151, + "step": 46400 + }, + { + "epoch": 2.41, + "learning_rate": 5.753346214339678e-05, + "loss": 1.0912, + "step": 46500 + }, + { + "epoch": 2.41, + "learning_rate": 5.752005765271365e-05, + "loss": 1.1626, + "step": 46600 + }, + { + "epoch": 2.42, + "learning_rate": 5.7506618407253175e-05, + "loss": 1.1107, + "step": 46700 + }, + { + "epoch": 2.42, + "learning_rate": 5.749314442398764e-05, + "loss": 1.109, + "step": 46800 + }, + { + "epoch": 2.43, + "learning_rate": 5.747963571993318e-05, + "loss": 1.0809, + "step": 46900 + }, + { + "epoch": 2.43, + "learning_rate": 5.746609231214979e-05, + "loss": 1.1573, + "step": 47000 + }, + { + "epoch": 2.44, + "learning_rate": 5.745251421774128e-05, + "loss": 1.0366, + "step": 47100 + }, + { + "epoch": 2.44, + "learning_rate": 5.74389014538553e-05, + "loss": 1.1549, + "step": 47200 + }, + { + "epoch": 2.45, + "learning_rate": 5.742525403768325e-05, + "loss": 1.085, + "step": 47300 + }, + { + "epoch": 2.45, + "learning_rate": 5.741157198646029e-05, + "loss": 1.1592, + "step": 47400 + }, + { + "epoch": 2.46, + "learning_rate": 5.739785531746534e-05, + "loss": 1.1038, + "step": 47500 + }, + { + "epoch": 2.46, + "learning_rate": 5.738410404802103e-05, + "loss": 1.1276, + "step": 47600 + }, + { + "epoch": 2.47, + "learning_rate": 5.7370318195493684e-05, + "loss": 1.1947, + "step": 47700 + }, + { + "epoch": 2.48, + "learning_rate": 5.7356497777293313e-05, + "loss": 1.1262, + "step": 47800 + }, + { + "epoch": 2.48, + "learning_rate": 5.7342642810873555e-05, + "loss": 1.1127, + "step": 47900 + }, + { + "epoch": 2.49, + "learning_rate": 5.7328753313731704e-05, + "loss": 1.0605, + "step": 48000 + }, + { + "epoch": 2.49, + "learning_rate": 5.731482930340865e-05, + "loss": 1.1133, + "step": 48100 + }, + { + "epoch": 2.5, + "learning_rate": 5.7300870797488876e-05, + "loss": 1.1276, + "step": 48200 + }, + { + "epoch": 2.5, + "learning_rate": 5.7286877813600414e-05, + "loss": 1.1756, + "step": 48300 + }, + { + "epoch": 2.51, + "learning_rate": 5.727285036941487e-05, + "loss": 1.2768, + "step": 48400 + }, + { + "epoch": 2.51, + "learning_rate": 5.725878848264733e-05, + "loss": 1.0529, + "step": 48500 + }, + { + "epoch": 2.52, + "learning_rate": 5.72446921710564e-05, + "loss": 1.0764, + "step": 48600 + }, + { + "epoch": 2.52, + "learning_rate": 5.723056145244416e-05, + "loss": 1.116, + "step": 48700 + }, + { + "epoch": 2.53, + "learning_rate": 5.721639634465614e-05, + "loss": 1.1171, + "step": 48800 + }, + { + "epoch": 2.53, + "learning_rate": 5.720219686558129e-05, + "loss": 1.1873, + "step": 48900 + }, + { + "epoch": 2.54, + "learning_rate": 5.718796303315198e-05, + "loss": 1.1516, + "step": 49000 + }, + { + "epoch": 2.54, + "learning_rate": 5.717369486534397e-05, + "loss": 1.1561, + "step": 49100 + }, + { + "epoch": 2.55, + "learning_rate": 5.715939238017635e-05, + "loss": 1.153, + "step": 49200 + }, + { + "epoch": 2.55, + "learning_rate": 5.71450555957116e-05, + "loss": 1.1497, + "step": 49300 + }, + { + "epoch": 2.56, + "learning_rate": 5.713068453005545e-05, + "loss": 1.1132, + "step": 49400 + }, + { + "epoch": 2.56, + "learning_rate": 5.7116279201356994e-05, + "loss": 1.1306, + "step": 49500 + }, + { + "epoch": 2.57, + "learning_rate": 5.7101839627808545e-05, + "loss": 1.1591, + "step": 49600 + }, + { + "epoch": 2.57, + "learning_rate": 5.7087365827645694e-05, + "loss": 1.1825, + "step": 49700 + }, + { + "epoch": 2.58, + "learning_rate": 5.707285781914723e-05, + "loss": 1.1536, + "step": 49800 + }, + { + "epoch": 2.58, + "learning_rate": 5.705831562063515e-05, + "loss": 1.0688, + "step": 49900 + }, + { + "epoch": 2.59, + "learning_rate": 5.704388518326552e-05, + "loss": 1.1515, + "step": 50000 + }, + { + "epoch": 2.59, + "learning_rate": 5.702927500130608e-05, + "loss": 1.1314, + "step": 50100 + }, + { + "epoch": 2.6, + "learning_rate": 5.701477729645006e-05, + "loss": 1.1567, + "step": 50200 + }, + { + "epoch": 2.6, + "learning_rate": 5.700009920411118e-05, + "loss": 1.1368, + "step": 50300 + }, + { + "epoch": 2.61, + "learning_rate": 5.698538701364476e-05, + "loss": 1.0618, + "step": 50400 + }, + { + "epoch": 2.61, + "learning_rate": 5.697064074363065e-05, + "loss": 1.082, + "step": 50500 + }, + { + "epoch": 2.62, + "learning_rate": 5.6955860412691743e-05, + "loss": 1.0973, + "step": 50600 + }, + { + "epoch": 2.63, + "learning_rate": 5.694104603949398e-05, + "loss": 1.2041, + "step": 50700 + }, + { + "epoch": 2.63, + "learning_rate": 5.692619764274625e-05, + "loss": 0.982, + "step": 50800 + }, + { + "epoch": 2.64, + "learning_rate": 5.691131524120044e-05, + "loss": 1.073, + "step": 50900 + }, + { + "epoch": 2.64, + "learning_rate": 5.689639885365136e-05, + "loss": 1.1153, + "step": 51000 + }, + { + "epoch": 2.65, + "learning_rate": 5.688144849893676e-05, + "loss": 1.2138, + "step": 51100 + }, + { + "epoch": 2.65, + "learning_rate": 5.686646419593728e-05, + "loss": 1.1121, + "step": 51200 + }, + { + "epoch": 2.66, + "learning_rate": 5.685144596357642e-05, + "loss": 1.162, + "step": 51300 + }, + { + "epoch": 2.66, + "learning_rate": 5.6836393820820555e-05, + "loss": 1.1484, + "step": 51400 + }, + { + "epoch": 2.67, + "learning_rate": 5.6821307786678865e-05, + "loss": 1.1192, + "step": 51500 + }, + { + "epoch": 2.67, + "learning_rate": 5.680618788020332e-05, + "loss": 1.1031, + "step": 51600 + }, + { + "epoch": 2.68, + "learning_rate": 5.67910341204887e-05, + "loss": 1.088, + "step": 51700 + }, + { + "epoch": 2.68, + "learning_rate": 5.677584652667252e-05, + "loss": 1.1462, + "step": 51800 + }, + { + "epoch": 2.69, + "learning_rate": 5.676062511793503e-05, + "loss": 1.2101, + "step": 51900 + }, + { + "epoch": 2.69, + "learning_rate": 5.674536991349917e-05, + "loss": 1.0907, + "step": 52000 + }, + { + "epoch": 2.7, + "learning_rate": 5.6730080932630566e-05, + "loss": 1.1004, + "step": 52100 + }, + { + "epoch": 2.7, + "learning_rate": 5.6714758194637505e-05, + "loss": 1.1093, + "step": 52200 + }, + { + "epoch": 2.71, + "learning_rate": 5.669940171887092e-05, + "loss": 1.1207, + "step": 52300 + }, + { + "epoch": 2.71, + "learning_rate": 5.6684011524724305e-05, + "loss": 1.016, + "step": 52400 + }, + { + "epoch": 2.72, + "learning_rate": 5.6668587631633796e-05, + "loss": 1.1161, + "step": 52500 + }, + { + "epoch": 2.72, + "learning_rate": 5.6653130059078044e-05, + "loss": 1.1093, + "step": 52600 + }, + { + "epoch": 2.73, + "learning_rate": 5.663763882657824e-05, + "loss": 1.1251, + "step": 52700 + }, + { + "epoch": 2.73, + "learning_rate": 5.66221139536981e-05, + "loss": 1.1405, + "step": 52800 + }, + { + "epoch": 2.74, + "learning_rate": 5.660655546004383e-05, + "loss": 1.0735, + "step": 52900 + }, + { + "epoch": 2.74, + "learning_rate": 5.6590963365264046e-05, + "loss": 1.171, + "step": 53000 + }, + { + "epoch": 2.75, + "learning_rate": 5.657533768904985e-05, + "loss": 1.1539, + "step": 53100 + }, + { + "epoch": 2.75, + "learning_rate": 5.6559678451134755e-05, + "loss": 1.1414, + "step": 53200 + }, + { + "epoch": 2.76, + "learning_rate": 5.65439856712946e-05, + "loss": 1.1534, + "step": 53300 + }, + { + "epoch": 2.76, + "learning_rate": 5.652825936934766e-05, + "loss": 1.1381, + "step": 53400 + }, + { + "epoch": 2.77, + "learning_rate": 5.6512499565154486e-05, + "loss": 1.1861, + "step": 53500 + }, + { + "epoch": 2.78, + "learning_rate": 5.649686437715548e-05, + "loss": 1.1615, + "step": 53600 + }, + { + "epoch": 2.78, + "learning_rate": 5.648119639246426e-05, + "loss": 1.2778, + "step": 53700 + }, + { + "epoch": 2.79, + "learning_rate": 5.646533686977088e-05, + "loss": 1.2387, + "step": 53800 + }, + { + "epoch": 2.79, + "learning_rate": 5.64494439242954e-05, + "loss": 1.1014, + "step": 53900 + }, + { + "epoch": 2.8, + "learning_rate": 5.643351757610886e-05, + "loss": 1.1069, + "step": 54000 + }, + { + "epoch": 2.8, + "learning_rate": 5.641755784532446e-05, + "loss": 1.2293, + "step": 54100 + }, + { + "epoch": 2.81, + "learning_rate": 5.6401564752097556e-05, + "loss": 1.1891, + "step": 54200 + }, + { + "epoch": 2.81, + "learning_rate": 5.638553831662567e-05, + "loss": 1.1197, + "step": 54300 + }, + { + "epoch": 2.82, + "learning_rate": 5.63694785591484e-05, + "loss": 1.152, + "step": 54400 + }, + { + "epoch": 2.82, + "learning_rate": 5.635338549994743e-05, + "loss": 1.1227, + "step": 54500 + }, + { + "epoch": 2.83, + "learning_rate": 5.6337259159346516e-05, + "loss": 1.1376, + "step": 54600 + }, + { + "epoch": 2.83, + "learning_rate": 5.632109955771144e-05, + "loss": 1.0894, + "step": 54700 + }, + { + "epoch": 2.84, + "learning_rate": 5.630490671544997e-05, + "loss": 1.1708, + "step": 54800 + }, + { + "epoch": 2.84, + "learning_rate": 5.6288680653011886e-05, + "loss": 1.1858, + "step": 54900 + }, + { + "epoch": 2.85, + "learning_rate": 5.627242139088889e-05, + "loss": 1.1409, + "step": 55000 + }, + { + "epoch": 2.85, + "learning_rate": 5.625612894961463e-05, + "loss": 1.1009, + "step": 55100 + }, + { + "epoch": 2.86, + "learning_rate": 5.623980334976465e-05, + "loss": 1.0752, + "step": 55200 + }, + { + "epoch": 2.86, + "learning_rate": 5.622344461195637e-05, + "loss": 1.0932, + "step": 55300 + }, + { + "epoch": 2.87, + "learning_rate": 5.6207052756849046e-05, + "loss": 1.1308, + "step": 55400 + }, + { + "epoch": 2.87, + "learning_rate": 5.61906278051438e-05, + "loss": 1.0719, + "step": 55500 + }, + { + "epoch": 2.88, + "learning_rate": 5.6174169777583507e-05, + "loss": 1.0901, + "step": 55600 + }, + { + "epoch": 2.88, + "learning_rate": 5.615767869495282e-05, + "loss": 1.1567, + "step": 55700 + }, + { + "epoch": 2.89, + "learning_rate": 5.614115457807816e-05, + "loss": 1.163, + "step": 55800 + }, + { + "epoch": 2.89, + "learning_rate": 5.612459744782764e-05, + "loss": 1.1562, + "step": 55900 + }, + { + "epoch": 2.9, + "learning_rate": 5.6108007325111084e-05, + "loss": 1.209, + "step": 56000 + }, + { + "epoch": 2.9, + "learning_rate": 5.609138423087998e-05, + "loss": 1.0763, + "step": 56100 + }, + { + "epoch": 2.91, + "learning_rate": 5.607472818612743e-05, + "loss": 1.1295, + "step": 56200 + }, + { + "epoch": 2.92, + "learning_rate": 5.6058039211888196e-05, + "loss": 1.0759, + "step": 56300 + }, + { + "epoch": 2.92, + "learning_rate": 5.6041317329238584e-05, + "loss": 1.1202, + "step": 56400 + }, + { + "epoch": 2.93, + "learning_rate": 5.602456255929648e-05, + "loss": 1.0674, + "step": 56500 + }, + { + "epoch": 2.93, + "learning_rate": 5.6007774923221296e-05, + "loss": 1.0632, + "step": 56600 + }, + { + "epoch": 2.94, + "learning_rate": 5.599095444221395e-05, + "loss": 1.1333, + "step": 56700 + }, + { + "epoch": 2.94, + "learning_rate": 5.597410113751684e-05, + "loss": 1.1168, + "step": 56800 + }, + { + "epoch": 2.95, + "learning_rate": 5.595721503041383e-05, + "loss": 1.0455, + "step": 56900 + }, + { + "epoch": 2.95, + "learning_rate": 5.594029614223019e-05, + "loss": 1.0849, + "step": 57000 + }, + { + "epoch": 2.96, + "learning_rate": 5.5923344494332596e-05, + "loss": 1.063, + "step": 57100 + }, + { + "epoch": 2.96, + "learning_rate": 5.59063601081291e-05, + "loss": 1.1484, + "step": 57200 + }, + { + "epoch": 2.97, + "learning_rate": 5.5889343005069104e-05, + "loss": 1.0446, + "step": 57300 + }, + { + "epoch": 2.97, + "learning_rate": 5.58722932066433e-05, + "loss": 1.0936, + "step": 57400 + }, + { + "epoch": 2.98, + "learning_rate": 5.585521073438371e-05, + "loss": 1.0569, + "step": 57500 + }, + { + "epoch": 2.98, + "learning_rate": 5.58380956098636e-05, + "loss": 1.0789, + "step": 57600 + }, + { + "epoch": 2.99, + "learning_rate": 5.5821119493699745e-05, + "loss": 1.1029, + "step": 57700 + }, + { + "epoch": 2.99, + "learning_rate": 5.580393945552586e-05, + "loss": 1.1352, + "step": 57800 + }, + { + "epoch": 3.0, + "learning_rate": 5.578672682984138e-05, + "loss": 1.1338, + "step": 57900 + }, + { + "epoch": 3.0, + "eval_accuracy": 0.625636722390494, + "eval_cer": 0.21062439120798454, + "eval_loss": 1.1177055835723877, + "eval_runtime": 4150.3314, + "eval_samples_per_second": 4.137, + "eval_steps_per_second": 0.259, + "eval_wer": 0.4081524616199047, + "step": 57939 + }, + { + "epoch": 3.0, + "learning_rate": 5.576948163838394e-05, + "loss": 1.0508, + "step": 58000 + }, + { + "epoch": 3.01, + "learning_rate": 5.57522039029323e-05, + "loss": 0.9576, + "step": 58100 + }, + { + "epoch": 3.01, + "learning_rate": 5.573489364530633e-05, + "loss": 0.9834, + "step": 58200 + }, + { + "epoch": 3.02, + "learning_rate": 5.5717550887366955e-05, + "loss": 0.9367, + "step": 58300 + }, + { + "epoch": 3.02, + "learning_rate": 5.570017565101615e-05, + "loss": 0.9954, + "step": 58400 + }, + { + "epoch": 3.03, + "learning_rate": 5.5682767958196926e-05, + "loss": 1.0304, + "step": 58500 + }, + { + "epoch": 3.03, + "learning_rate": 5.5665327830893254e-05, + "loss": 1.0092, + "step": 58600 + }, + { + "epoch": 3.04, + "learning_rate": 5.5647855291130065e-05, + "loss": 0.9443, + "step": 58700 + }, + { + "epoch": 3.04, + "learning_rate": 5.563035036097326e-05, + "loss": 1.0192, + "step": 58800 + }, + { + "epoch": 3.05, + "learning_rate": 5.561281306252962e-05, + "loss": 0.8802, + "step": 58900 + }, + { + "epoch": 3.05, + "learning_rate": 5.5595243417946795e-05, + "loss": 0.9751, + "step": 59000 + }, + { + "epoch": 3.06, + "learning_rate": 5.557764144941329e-05, + "loss": 0.9979, + "step": 59100 + }, + { + "epoch": 3.07, + "learning_rate": 5.5560007179158455e-05, + "loss": 1.154, + "step": 59200 + }, + { + "epoch": 3.07, + "learning_rate": 5.554234062945241e-05, + "loss": 1.0513, + "step": 59300 + }, + { + "epoch": 3.08, + "learning_rate": 5.5524641822606034e-05, + "loss": 1.058, + "step": 59400 + }, + { + "epoch": 3.08, + "learning_rate": 5.550691078097098e-05, + "loss": 1.0706, + "step": 59500 + }, + { + "epoch": 3.09, + "learning_rate": 5.5489147526939555e-05, + "loss": 0.9358, + "step": 59600 + }, + { + "epoch": 3.09, + "learning_rate": 5.5471530196651304e-05, + "loss": 1.031, + "step": 59700 + }, + { + "epoch": 3.1, + "learning_rate": 5.545370290673039e-05, + "loss": 1.0824, + "step": 59800 + }, + { + "epoch": 3.1, + "learning_rate": 5.5436022225004696e-05, + "loss": 1.074, + "step": 59900 + }, + { + "epoch": 3.11, + "learning_rate": 5.541813098835151e-05, + "loss": 1.0516, + "step": 60000 + }, + { + "epoch": 3.11, + "learning_rate": 5.540020765142099e-05, + "loss": 1.0641, + "step": 60100 + }, + { + "epoch": 3.12, + "learning_rate": 5.5382252236848324e-05, + "loss": 1.0567, + "step": 60200 + }, + { + "epoch": 3.12, + "learning_rate": 5.53642647673092e-05, + "loss": 1.0981, + "step": 60300 + }, + { + "epoch": 3.13, + "learning_rate": 5.5346245265519796e-05, + "loss": 1.1005, + "step": 60400 + }, + { + "epoch": 3.13, + "learning_rate": 5.532819375423673e-05, + "loss": 1.0853, + "step": 60500 + }, + { + "epoch": 3.14, + "learning_rate": 5.5310110256257084e-05, + "loss": 0.9992, + "step": 60600 + }, + { + "epoch": 3.14, + "learning_rate": 5.5291994794418285e-05, + "loss": 1.1045, + "step": 60700 + }, + { + "epoch": 3.15, + "learning_rate": 5.5273847391598166e-05, + "loss": 1.0457, + "step": 60800 + }, + { + "epoch": 3.15, + "learning_rate": 5.525566807071487e-05, + "loss": 1.0527, + "step": 60900 + }, + { + "epoch": 3.16, + "learning_rate": 5.523745685472687e-05, + "loss": 0.9843, + "step": 61000 + }, + { + "epoch": 3.16, + "learning_rate": 5.52192137666329e-05, + "loss": 1.0711, + "step": 61100 + }, + { + "epoch": 3.17, + "learning_rate": 5.520093882947196e-05, + "loss": 1.0931, + "step": 61200 + }, + { + "epoch": 3.17, + "learning_rate": 5.518263206632327e-05, + "loss": 1.1513, + "step": 61300 + }, + { + "epoch": 3.18, + "learning_rate": 5.5164293500306235e-05, + "loss": 0.9855, + "step": 61400 + }, + { + "epoch": 3.18, + "learning_rate": 5.514592315458043e-05, + "loss": 1.061, + "step": 61500 + }, + { + "epoch": 3.19, + "learning_rate": 5.512752105234555e-05, + "loss": 1.039, + "step": 61600 + }, + { + "epoch": 3.19, + "learning_rate": 5.510908721684143e-05, + "loss": 1.013, + "step": 61700 + }, + { + "epoch": 3.2, + "learning_rate": 5.509062167134794e-05, + "loss": 1.0715, + "step": 61800 + }, + { + "epoch": 3.21, + "learning_rate": 5.507212443918502e-05, + "loss": 1.0883, + "step": 61900 + }, + { + "epoch": 3.21, + "learning_rate": 5.505359554371262e-05, + "loss": 1.0697, + "step": 62000 + }, + { + "epoch": 3.22, + "learning_rate": 5.503503500833068e-05, + "loss": 1.1306, + "step": 62100 + }, + { + "epoch": 3.22, + "learning_rate": 5.5016442856479085e-05, + "loss": 0.9879, + "step": 62200 + }, + { + "epoch": 3.23, + "learning_rate": 5.499781911163767e-05, + "loss": 1.0714, + "step": 62300 + }, + { + "epoch": 3.23, + "learning_rate": 5.4979163797326156e-05, + "loss": 0.9911, + "step": 62400 + }, + { + "epoch": 3.24, + "learning_rate": 5.4960476937104125e-05, + "loss": 0.9638, + "step": 62500 + }, + { + "epoch": 3.24, + "learning_rate": 5.494175855457102e-05, + "loss": 1.0626, + "step": 62600 + }, + { + "epoch": 3.25, + "learning_rate": 5.4923008673366064e-05, + "loss": 1.0843, + "step": 62700 + }, + { + "epoch": 3.25, + "learning_rate": 5.490422731716829e-05, + "loss": 0.9651, + "step": 62800 + }, + { + "epoch": 3.26, + "learning_rate": 5.488541450969646e-05, + "loss": 1.0842, + "step": 62900 + }, + { + "epoch": 3.26, + "learning_rate": 5.486657027470906e-05, + "loss": 1.0361, + "step": 63000 + }, + { + "epoch": 3.27, + "learning_rate": 5.484769463600427e-05, + "loss": 1.0038, + "step": 63100 + }, + { + "epoch": 3.27, + "learning_rate": 5.482897684285779e-05, + "loss": 1.0452, + "step": 63200 + }, + { + "epoch": 3.28, + "learning_rate": 5.481003878171305e-05, + "loss": 0.9425, + "step": 63300 + }, + { + "epoch": 3.28, + "learning_rate": 5.479106938824391e-05, + "loss": 0.9516, + "step": 63400 + }, + { + "epoch": 3.29, + "learning_rate": 5.4772068686406616e-05, + "loss": 0.9714, + "step": 63500 + }, + { + "epoch": 3.29, + "learning_rate": 5.4753036700196934e-05, + "loss": 1.0238, + "step": 63600 + }, + { + "epoch": 3.3, + "learning_rate": 5.473397345365017e-05, + "loss": 1.0053, + "step": 63700 + }, + { + "epoch": 3.3, + "learning_rate": 5.4714878970841077e-05, + "loss": 0.9941, + "step": 63800 + }, + { + "epoch": 3.31, + "learning_rate": 5.469575327588386e-05, + "loss": 1.0312, + "step": 63900 + }, + { + "epoch": 3.31, + "learning_rate": 5.4676596392932154e-05, + "loss": 1.0646, + "step": 64000 + }, + { + "epoch": 3.32, + "learning_rate": 5.4657408346178975e-05, + "loss": 0.9859, + "step": 64100 + }, + { + "epoch": 3.32, + "learning_rate": 5.4638189159856704e-05, + "loss": 0.9635, + "step": 64200 + }, + { + "epoch": 3.33, + "learning_rate": 5.461893885823703e-05, + "loss": 0.9991, + "step": 64300 + }, + { + "epoch": 3.33, + "learning_rate": 5.459965746563094e-05, + "loss": 0.969, + "step": 64400 + }, + { + "epoch": 3.34, + "learning_rate": 5.458034500638871e-05, + "loss": 0.995, + "step": 64500 + }, + { + "epoch": 3.34, + "learning_rate": 5.456100150489981e-05, + "loss": 1.001, + "step": 64600 + }, + { + "epoch": 3.35, + "learning_rate": 5.454162698559296e-05, + "loss": 0.9856, + "step": 64700 + }, + { + "epoch": 3.36, + "learning_rate": 5.452222147293601e-05, + "loss": 1.0488, + "step": 64800 + }, + { + "epoch": 3.36, + "learning_rate": 5.450278499143597e-05, + "loss": 1.0627, + "step": 64900 + }, + { + "epoch": 3.37, + "learning_rate": 5.448331756563896e-05, + "loss": 1.0156, + "step": 65000 + }, + { + "epoch": 3.37, + "learning_rate": 5.446381922013018e-05, + "loss": 1.0151, + "step": 65100 + }, + { + "epoch": 3.38, + "learning_rate": 5.4444289979533864e-05, + "loss": 0.9805, + "step": 65200 + }, + { + "epoch": 3.38, + "learning_rate": 5.442472986851329e-05, + "loss": 0.9225, + "step": 65300 + }, + { + "epoch": 3.39, + "learning_rate": 5.4405138911770695e-05, + "loss": 1.0183, + "step": 65400 + }, + { + "epoch": 3.39, + "learning_rate": 5.43855171340473e-05, + "loss": 1.0395, + "step": 65500 + }, + { + "epoch": 3.4, + "learning_rate": 5.4365864560123205e-05, + "loss": 1.0325, + "step": 65600 + }, + { + "epoch": 3.4, + "learning_rate": 5.434618121481745e-05, + "loss": 0.9621, + "step": 65700 + }, + { + "epoch": 3.41, + "learning_rate": 5.43264671229879e-05, + "loss": 0.9145, + "step": 65800 + }, + { + "epoch": 3.41, + "learning_rate": 5.4306722309531284e-05, + "loss": 0.9692, + "step": 65900 + }, + { + "epoch": 3.42, + "learning_rate": 5.4286946799383085e-05, + "loss": 0.8968, + "step": 66000 + }, + { + "epoch": 3.42, + "learning_rate": 5.426714061751759e-05, + "loss": 0.9248, + "step": 66100 + }, + { + "epoch": 3.43, + "learning_rate": 5.424730378894781e-05, + "loss": 0.9828, + "step": 66200 + }, + { + "epoch": 3.43, + "learning_rate": 5.422743633872546e-05, + "loss": 0.9811, + "step": 66300 + }, + { + "epoch": 3.44, + "learning_rate": 5.4207538291940906e-05, + "loss": 0.9537, + "step": 66400 + }, + { + "epoch": 3.44, + "learning_rate": 5.418760967372319e-05, + "loss": 1.0041, + "step": 66500 + }, + { + "epoch": 3.45, + "learning_rate": 5.416765050923993e-05, + "loss": 1.0955, + "step": 66600 + }, + { + "epoch": 3.45, + "learning_rate": 5.4147660823697346e-05, + "loss": 0.9946, + "step": 66700 + }, + { + "epoch": 3.46, + "learning_rate": 5.4127640642340194e-05, + "loss": 0.986, + "step": 66800 + }, + { + "epoch": 3.46, + "learning_rate": 5.4107589990451726e-05, + "loss": 0.8793, + "step": 66900 + }, + { + "epoch": 3.47, + "learning_rate": 5.408750889335369e-05, + "loss": 1.0332, + "step": 67000 + }, + { + "epoch": 3.47, + "learning_rate": 5.4067397376406305e-05, + "loss": 0.9489, + "step": 67100 + }, + { + "epoch": 3.48, + "learning_rate": 5.4047255465008156e-05, + "loss": 0.9779, + "step": 67200 + }, + { + "epoch": 3.48, + "learning_rate": 5.402708318459625e-05, + "loss": 1.0407, + "step": 67300 + }, + { + "epoch": 3.49, + "learning_rate": 5.4006880560645956e-05, + "loss": 0.9063, + "step": 67400 + }, + { + "epoch": 3.5, + "learning_rate": 5.398664761867092e-05, + "loss": 0.92, + "step": 67500 + }, + { + "epoch": 3.5, + "learning_rate": 5.3966384384223105e-05, + "loss": 1.0103, + "step": 67600 + }, + { + "epoch": 3.51, + "learning_rate": 5.394609088289273e-05, + "loss": 0.9764, + "step": 67700 + }, + { + "epoch": 3.51, + "learning_rate": 5.392576714030825e-05, + "loss": 0.9779, + "step": 67800 + }, + { + "epoch": 3.52, + "learning_rate": 5.390541318213627e-05, + "loss": 0.9238, + "step": 67900 + }, + { + "epoch": 3.52, + "learning_rate": 5.388502903408159e-05, + "loss": 0.9526, + "step": 68000 + }, + { + "epoch": 3.53, + "learning_rate": 5.386461472188714e-05, + "loss": 1.0248, + "step": 68100 + }, + { + "epoch": 3.53, + "learning_rate": 5.38441702713339e-05, + "loss": 0.93, + "step": 68200 + }, + { + "epoch": 3.54, + "learning_rate": 5.382369570824096e-05, + "loss": 0.9105, + "step": 68300 + }, + { + "epoch": 3.54, + "learning_rate": 5.380319105846542e-05, + "loss": 1.0037, + "step": 68400 + }, + { + "epoch": 3.55, + "learning_rate": 5.378265634790238e-05, + "loss": 1.0091, + "step": 68500 + }, + { + "epoch": 3.55, + "learning_rate": 5.3762091602484886e-05, + "loss": 0.9353, + "step": 68600 + }, + { + "epoch": 3.56, + "learning_rate": 5.374149684818393e-05, + "loss": 0.9854, + "step": 68700 + }, + { + "epoch": 3.56, + "learning_rate": 5.372087211100842e-05, + "loss": 0.9115, + "step": 68800 + }, + { + "epoch": 3.57, + "learning_rate": 5.3700217417005085e-05, + "loss": 0.8826, + "step": 68900 + }, + { + "epoch": 3.57, + "learning_rate": 5.367953279225852e-05, + "loss": 0.9315, + "step": 69000 + }, + { + "epoch": 3.58, + "learning_rate": 5.3658818262891106e-05, + "loss": 0.9321, + "step": 69100 + }, + { + "epoch": 3.58, + "learning_rate": 5.363828144695367e-05, + "loss": 1.0095, + "step": 69200 + }, + { + "epoch": 3.59, + "learning_rate": 5.361750748525558e-05, + "loss": 1.0853, + "step": 69300 + }, + { + "epoch": 3.59, + "learning_rate": 5.359670369726771e-05, + "loss": 1.0438, + "step": 69400 + }, + { + "epoch": 3.6, + "learning_rate": 5.3575870109262955e-05, + "loss": 0.9615, + "step": 69500 + }, + { + "epoch": 3.6, + "learning_rate": 5.355500674755181e-05, + "loss": 1.0223, + "step": 69600 + }, + { + "epoch": 3.61, + "learning_rate": 5.353411363848239e-05, + "loss": 0.9982, + "step": 69700 + }, + { + "epoch": 3.61, + "learning_rate": 5.351319080844037e-05, + "loss": 0.9757, + "step": 69800 + }, + { + "epoch": 3.62, + "learning_rate": 5.349223828384896e-05, + "loss": 0.9835, + "step": 69900 + }, + { + "epoch": 3.62, + "learning_rate": 5.347125609116888e-05, + "loss": 0.9905, + "step": 70000 + }, + { + "epoch": 3.63, + "learning_rate": 5.345024425689829e-05, + "loss": 0.8798, + "step": 70100 + }, + { + "epoch": 3.63, + "learning_rate": 5.342920280757282e-05, + "loss": 0.9783, + "step": 70200 + }, + { + "epoch": 3.64, + "learning_rate": 5.340813176976549e-05, + "loss": 1.0385, + "step": 70300 + }, + { + "epoch": 3.65, + "learning_rate": 5.338703117008666e-05, + "loss": 0.9933, + "step": 70400 + }, + { + "epoch": 3.65, + "learning_rate": 5.336590103518407e-05, + "loss": 0.9996, + "step": 70500 + }, + { + "epoch": 3.66, + "learning_rate": 5.334474139174272e-05, + "loss": 1.0044, + "step": 70600 + }, + { + "epoch": 3.66, + "learning_rate": 5.332376430358462e-05, + "loss": 1.1097, + "step": 70700 + }, + { + "epoch": 3.67, + "learning_rate": 5.330254601768781e-05, + "loss": 0.9849, + "step": 70800 + }, + { + "epoch": 3.67, + "learning_rate": 5.32812983032626e-05, + "loss": 1.07, + "step": 70900 + }, + { + "epoch": 3.68, + "learning_rate": 5.3260021187142476e-05, + "loss": 0.9453, + "step": 71000 + }, + { + "epoch": 3.68, + "learning_rate": 5.3238714696198105e-05, + "loss": 0.9546, + "step": 71100 + }, + { + "epoch": 3.69, + "learning_rate": 5.321737885733719e-05, + "loss": 0.9472, + "step": 71200 + }, + { + "epoch": 3.69, + "learning_rate": 5.319601369750453e-05, + "loss": 0.9841, + "step": 71300 + }, + { + "epoch": 3.7, + "learning_rate": 5.317461924368196e-05, + "loss": 1.0296, + "step": 71400 + }, + { + "epoch": 3.7, + "learning_rate": 5.315319552288831e-05, + "loss": 1.0366, + "step": 71500 + }, + { + "epoch": 3.71, + "learning_rate": 5.313174256217934e-05, + "loss": 1.0427, + "step": 71600 + }, + { + "epoch": 3.71, + "learning_rate": 5.3110260388647755e-05, + "loss": 0.991, + "step": 71700 + }, + { + "epoch": 3.72, + "learning_rate": 5.308874902942318e-05, + "loss": 0.9768, + "step": 71800 + }, + { + "epoch": 3.72, + "learning_rate": 5.306742406109498e-05, + "loss": 1.0361, + "step": 71900 + }, + { + "epoch": 3.73, + "learning_rate": 5.304585470319904e-05, + "loss": 0.9672, + "step": 72000 + }, + { + "epoch": 3.73, + "learning_rate": 5.302425624094733e-05, + "loss": 0.9892, + "step": 72100 + }, + { + "epoch": 3.74, + "learning_rate": 5.30026287016163e-05, + "loss": 1.0636, + "step": 72200 + }, + { + "epoch": 3.74, + "learning_rate": 5.298097211251914e-05, + "loss": 1.0009, + "step": 72300 + }, + { + "epoch": 3.75, + "learning_rate": 5.295928650100572e-05, + "loss": 0.9696, + "step": 72400 + }, + { + "epoch": 3.75, + "learning_rate": 5.2937571894462544e-05, + "loss": 0.923, + "step": 72500 + }, + { + "epoch": 3.76, + "learning_rate": 5.291582832031276e-05, + "loss": 1.0612, + "step": 72600 + }, + { + "epoch": 3.76, + "learning_rate": 5.2894055806016084e-05, + "loss": 0.9948, + "step": 72700 + }, + { + "epoch": 3.77, + "learning_rate": 5.28722543790688e-05, + "loss": 0.9445, + "step": 72800 + }, + { + "epoch": 3.77, + "learning_rate": 5.2850424067003664e-05, + "loss": 1.0116, + "step": 72900 + }, + { + "epoch": 3.78, + "learning_rate": 5.282856489738995e-05, + "loss": 0.9842, + "step": 73000 + }, + { + "epoch": 3.79, + "learning_rate": 5.280667689783335e-05, + "loss": 0.9368, + "step": 73100 + }, + { + "epoch": 3.79, + "learning_rate": 5.2784760095976e-05, + "loss": 1.0701, + "step": 73200 + }, + { + "epoch": 3.8, + "learning_rate": 5.276281451949638e-05, + "loss": 1.029, + "step": 73300 + }, + { + "epoch": 3.8, + "learning_rate": 5.27408401961093e-05, + "loss": 0.9274, + "step": 73400 + }, + { + "epoch": 3.81, + "learning_rate": 5.271883715356591e-05, + "loss": 0.9563, + "step": 73500 + }, + { + "epoch": 3.81, + "learning_rate": 5.2696805419653604e-05, + "loss": 1.0421, + "step": 73600 + }, + { + "epoch": 3.82, + "learning_rate": 5.267474502219601e-05, + "loss": 0.9467, + "step": 73700 + }, + { + "epoch": 3.82, + "learning_rate": 5.2652877021039474e-05, + "loss": 1.0449, + "step": 73800 + }, + { + "epoch": 3.83, + "learning_rate": 5.263075966604667e-05, + "loss": 1.0646, + "step": 73900 + }, + { + "epoch": 3.83, + "learning_rate": 5.2608613730917035e-05, + "loss": 1.0097, + "step": 74000 + }, + { + "epoch": 3.84, + "learning_rate": 5.258643924361842e-05, + "loss": 0.8886, + "step": 74100 + }, + { + "epoch": 3.84, + "learning_rate": 5.2564236232154755e-05, + "loss": 1.0571, + "step": 74200 + }, + { + "epoch": 3.85, + "learning_rate": 5.254200472456597e-05, + "loss": 1.0357, + "step": 74300 + }, + { + "epoch": 3.85, + "learning_rate": 5.251974474892799e-05, + "loss": 1.0421, + "step": 74400 + }, + { + "epoch": 3.86, + "learning_rate": 5.24974563333527e-05, + "loss": 1.0463, + "step": 74500 + }, + { + "epoch": 3.86, + "learning_rate": 5.2475139505987886e-05, + "loss": 0.9742, + "step": 74600 + }, + { + "epoch": 3.87, + "learning_rate": 5.245279429501722e-05, + "loss": 1.007, + "step": 74700 + }, + { + "epoch": 3.87, + "learning_rate": 5.243042072866024e-05, + "loss": 0.9713, + "step": 74800 + }, + { + "epoch": 3.88, + "learning_rate": 5.240801883517226e-05, + "loss": 1.0107, + "step": 74900 + }, + { + "epoch": 3.88, + "learning_rate": 5.2385588642844396e-05, + "loss": 0.9962, + "step": 75000 + }, + { + "epoch": 3.89, + "learning_rate": 5.2363130180003475e-05, + "loss": 0.9331, + "step": 75100 + }, + { + "epoch": 3.89, + "learning_rate": 5.2340643475012054e-05, + "loss": 0.9714, + "step": 75200 + }, + { + "epoch": 3.9, + "learning_rate": 5.2318128556268335e-05, + "loss": 1.0285, + "step": 75300 + }, + { + "epoch": 3.9, + "learning_rate": 5.229558545220618e-05, + "loss": 0.9754, + "step": 75400 + }, + { + "epoch": 3.91, + "learning_rate": 5.2273014191294996e-05, + "loss": 0.891, + "step": 75500 + }, + { + "epoch": 3.91, + "learning_rate": 5.225041480203981e-05, + "loss": 0.9843, + "step": 75600 + }, + { + "epoch": 3.92, + "learning_rate": 5.222778731298113e-05, + "loss": 0.9306, + "step": 75700 + }, + { + "epoch": 3.92, + "learning_rate": 5.220513175269497e-05, + "loss": 0.9514, + "step": 75800 + }, + { + "epoch": 3.93, + "learning_rate": 5.2182448149792764e-05, + "loss": 0.9658, + "step": 75900 + }, + { + "epoch": 3.94, + "learning_rate": 5.21597365329214e-05, + "loss": 0.9659, + "step": 76000 + }, + { + "epoch": 3.94, + "learning_rate": 5.213699693076313e-05, + "loss": 0.9714, + "step": 76100 + }, + { + "epoch": 3.95, + "learning_rate": 5.211422937203554e-05, + "loss": 0.9627, + "step": 76200 + }, + { + "epoch": 3.95, + "learning_rate": 5.2091433885491534e-05, + "loss": 1.0028, + "step": 76300 + }, + { + "epoch": 3.96, + "learning_rate": 5.206861049991928e-05, + "loss": 0.9826, + "step": 76400 + }, + { + "epoch": 3.96, + "learning_rate": 5.204575924414218e-05, + "loss": 1.0277, + "step": 76500 + }, + { + "epoch": 3.97, + "learning_rate": 5.2022880147018836e-05, + "loss": 0.9574, + "step": 76600 + }, + { + "epoch": 3.97, + "learning_rate": 5.1999973237442996e-05, + "loss": 0.9756, + "step": 76700 + }, + { + "epoch": 3.98, + "learning_rate": 5.197703854434355e-05, + "loss": 1.0119, + "step": 76800 + }, + { + "epoch": 3.98, + "learning_rate": 5.195407609668448e-05, + "loss": 0.8842, + "step": 76900 + }, + { + "epoch": 3.99, + "learning_rate": 5.19310859234648e-05, + "loss": 1.0501, + "step": 77000 + }, + { + "epoch": 3.99, + "learning_rate": 5.1908068053718536e-05, + "loss": 0.93, + "step": 77100 + }, + { + "epoch": 4.0, + "learning_rate": 5.188502251651471e-05, + "loss": 1.0311, + "step": 77200 + }, + { + "epoch": 4.0, + "eval_accuracy": 0.6242595235321529, + "eval_cer": 0.20671776990367557, + "eval_loss": 1.060347318649292, + "eval_runtime": 4478.7305, + "eval_samples_per_second": 3.833, + "eval_steps_per_second": 0.24, + "eval_wer": 0.39638844773836834, + "step": 77252 + }, + { + "epoch": 4.0, + "learning_rate": 5.1861949340957276e-05, + "loss": 0.9968, + "step": 77300 + }, + { + "epoch": 4.01, + "learning_rate": 5.1838848556185096e-05, + "loss": 0.9948, + "step": 77400 + }, + { + "epoch": 4.01, + "learning_rate": 5.1815720191371896e-05, + "loss": 0.8875, + "step": 77500 + }, + { + "epoch": 4.02, + "learning_rate": 5.179256427572623e-05, + "loss": 0.7775, + "step": 77600 + }, + { + "epoch": 4.02, + "learning_rate": 5.176938083849145e-05, + "loss": 0.9335, + "step": 77700 + }, + { + "epoch": 4.03, + "learning_rate": 5.1746169908945666e-05, + "loss": 0.9498, + "step": 77800 + }, + { + "epoch": 4.03, + "learning_rate": 5.1722931516401704e-05, + "loss": 0.8583, + "step": 77900 + }, + { + "epoch": 4.04, + "learning_rate": 5.169966569020706e-05, + "loss": 0.8926, + "step": 78000 + }, + { + "epoch": 4.04, + "learning_rate": 5.167637245974391e-05, + "loss": 0.9, + "step": 78100 + }, + { + "epoch": 4.05, + "learning_rate": 5.165305185442901e-05, + "loss": 0.8565, + "step": 78200 + }, + { + "epoch": 4.05, + "learning_rate": 5.162970390371369e-05, + "loss": 0.9534, + "step": 78300 + }, + { + "epoch": 4.06, + "learning_rate": 5.160632863708382e-05, + "loss": 0.845, + "step": 78400 + }, + { + "epoch": 4.06, + "learning_rate": 5.158292608405978e-05, + "loss": 0.9558, + "step": 78500 + }, + { + "epoch": 4.07, + "learning_rate": 5.155949627419638e-05, + "loss": 0.9293, + "step": 78600 + }, + { + "epoch": 4.07, + "learning_rate": 5.153603923708288e-05, + "loss": 0.9034, + "step": 78700 + }, + { + "epoch": 4.08, + "learning_rate": 5.15125550023429e-05, + "loss": 0.8865, + "step": 78800 + }, + { + "epoch": 4.09, + "learning_rate": 5.1489043599634436e-05, + "loss": 0.8646, + "step": 78900 + }, + { + "epoch": 4.09, + "learning_rate": 5.146550505864977e-05, + "loss": 0.8272, + "step": 79000 + }, + { + "epoch": 4.1, + "learning_rate": 5.144193940911546e-05, + "loss": 0.8763, + "step": 79100 + }, + { + "epoch": 4.1, + "learning_rate": 5.1418346680792324e-05, + "loss": 0.9321, + "step": 79200 + }, + { + "epoch": 4.11, + "learning_rate": 5.139472690347535e-05, + "loss": 0.8672, + "step": 79300 + }, + { + "epoch": 4.11, + "learning_rate": 5.1371080106993684e-05, + "loss": 0.9223, + "step": 79400 + }, + { + "epoch": 4.12, + "learning_rate": 5.134740632121062e-05, + "loss": 0.882, + "step": 79500 + }, + { + "epoch": 4.12, + "learning_rate": 5.132370557602351e-05, + "loss": 0.9213, + "step": 79600 + }, + { + "epoch": 4.13, + "learning_rate": 5.1299977901363765e-05, + "loss": 0.8625, + "step": 79700 + }, + { + "epoch": 4.13, + "learning_rate": 5.127622332719681e-05, + "loss": 0.8876, + "step": 79800 + }, + { + "epoch": 4.14, + "learning_rate": 5.125244188352203e-05, + "loss": 0.8432, + "step": 79900 + }, + { + "epoch": 4.14, + "learning_rate": 5.122863360037275e-05, + "loss": 0.8954, + "step": 80000 + }, + { + "epoch": 4.15, + "learning_rate": 5.1204798507816184e-05, + "loss": 0.866, + "step": 80100 + }, + { + "epoch": 4.15, + "learning_rate": 5.118093663595341e-05, + "loss": 0.8963, + "step": 80200 + }, + { + "epoch": 4.16, + "learning_rate": 5.115704801491933e-05, + "loss": 0.8805, + "step": 80300 + }, + { + "epoch": 4.16, + "learning_rate": 5.113313267488261e-05, + "loss": 0.8865, + "step": 80400 + }, + { + "epoch": 4.17, + "learning_rate": 5.110919064604567e-05, + "loss": 0.931, + "step": 80500 + }, + { + "epoch": 4.17, + "learning_rate": 5.108546177737918e-05, + "loss": 0.8367, + "step": 80600 + }, + { + "epoch": 4.18, + "learning_rate": 5.106146672781685e-05, + "loss": 0.909, + "step": 80700 + }, + { + "epoch": 4.18, + "learning_rate": 5.103744507996043e-05, + "loss": 0.9418, + "step": 80800 + }, + { + "epoch": 4.19, + "learning_rate": 5.10133968641466e-05, + "loss": 0.907, + "step": 80900 + }, + { + "epoch": 4.19, + "learning_rate": 5.09893221107456e-05, + "loss": 0.9852, + "step": 81000 + }, + { + "epoch": 4.2, + "learning_rate": 5.096522085016115e-05, + "loss": 0.8823, + "step": 81100 + }, + { + "epoch": 4.2, + "learning_rate": 5.0941093112830474e-05, + "loss": 0.9136, + "step": 81200 + }, + { + "epoch": 4.21, + "learning_rate": 5.0917180601869215e-05, + "loss": 0.9733, + "step": 81300 + }, + { + "epoch": 4.21, + "learning_rate": 5.089300026649806e-05, + "loss": 1.003, + "step": 81400 + }, + { + "epoch": 4.22, + "learning_rate": 5.086879354558726e-05, + "loss": 0.9774, + "step": 81500 + }, + { + "epoch": 4.23, + "learning_rate": 5.084456046970721e-05, + "loss": 0.9474, + "step": 81600 + }, + { + "epoch": 4.23, + "learning_rate": 5.08203010694616e-05, + "loss": 0.9164, + "step": 81700 + }, + { + "epoch": 4.24, + "learning_rate": 5.0796015375487355e-05, + "loss": 1.0097, + "step": 81800 + }, + { + "epoch": 4.24, + "learning_rate": 5.0771703418454614e-05, + "loss": 0.9588, + "step": 81900 + }, + { + "epoch": 4.25, + "learning_rate": 5.0747608740709825e-05, + "loss": 0.8867, + "step": 82000 + }, + { + "epoch": 4.25, + "learning_rate": 5.072324461156706e-05, + "loss": 0.8906, + "step": 82100 + }, + { + "epoch": 4.26, + "learning_rate": 5.06988543112672e-05, + "loss": 0.8889, + "step": 82200 + }, + { + "epoch": 4.26, + "learning_rate": 5.0674437870612466e-05, + "loss": 0.9173, + "step": 82300 + }, + { + "epoch": 4.27, + "learning_rate": 5.064999532043813e-05, + "loss": 0.9074, + "step": 82400 + }, + { + "epoch": 4.27, + "learning_rate": 5.062552669161242e-05, + "loss": 0.8503, + "step": 82500 + }, + { + "epoch": 4.28, + "learning_rate": 5.060103201503648e-05, + "loss": 1.0082, + "step": 82600 + }, + { + "epoch": 4.28, + "learning_rate": 5.0576511321644386e-05, + "loss": 0.9588, + "step": 82700 + }, + { + "epoch": 4.29, + "learning_rate": 5.055196464240304e-05, + "loss": 0.9177, + "step": 82800 + }, + { + "epoch": 4.29, + "learning_rate": 5.052739200831218e-05, + "loss": 0.9282, + "step": 82900 + }, + { + "epoch": 4.3, + "learning_rate": 5.050279345040432e-05, + "loss": 0.934, + "step": 83000 + }, + { + "epoch": 4.3, + "learning_rate": 5.0478168999744686e-05, + "loss": 0.9055, + "step": 83100 + }, + { + "epoch": 4.31, + "learning_rate": 5.045351868743125e-05, + "loss": 0.9463, + "step": 83200 + }, + { + "epoch": 4.31, + "learning_rate": 5.04288425445946e-05, + "loss": 0.9407, + "step": 83300 + }, + { + "epoch": 4.32, + "learning_rate": 5.040414060239797e-05, + "loss": 0.9587, + "step": 83400 + }, + { + "epoch": 4.32, + "learning_rate": 5.037941289203718e-05, + "loss": 0.8661, + "step": 83500 + }, + { + "epoch": 4.33, + "learning_rate": 5.035465944474056e-05, + "loss": 0.9441, + "step": 83600 + }, + { + "epoch": 4.33, + "learning_rate": 5.0329880291768995e-05, + "loss": 0.8675, + "step": 83700 + }, + { + "epoch": 4.34, + "learning_rate": 5.030507546441578e-05, + "loss": 0.9416, + "step": 83800 + }, + { + "epoch": 4.34, + "learning_rate": 5.0280244994006676e-05, + "loss": 0.8766, + "step": 83900 + }, + { + "epoch": 4.35, + "learning_rate": 5.0255388911899795e-05, + "loss": 0.9028, + "step": 84000 + }, + { + "epoch": 4.35, + "learning_rate": 5.023050724948562e-05, + "loss": 0.8647, + "step": 84100 + }, + { + "epoch": 4.36, + "learning_rate": 5.0205849236663635e-05, + "loss": 0.9969, + "step": 84200 + }, + { + "epoch": 4.36, + "learning_rate": 5.018091676295394e-05, + "loss": 0.9579, + "step": 84300 + }, + { + "epoch": 4.37, + "learning_rate": 5.0155958802987014e-05, + "loss": 0.9138, + "step": 84400 + }, + { + "epoch": 4.38, + "learning_rate": 5.013097538828198e-05, + "loss": 0.9941, + "step": 84500 + }, + { + "epoch": 4.38, + "learning_rate": 5.01059665503901e-05, + "loss": 0.9895, + "step": 84600 + }, + { + "epoch": 4.39, + "learning_rate": 5.00809323208948e-05, + "loss": 0.9051, + "step": 84700 + }, + { + "epoch": 4.39, + "learning_rate": 5.0055872731411486e-05, + "loss": 0.8826, + "step": 84800 + }, + { + "epoch": 4.4, + "learning_rate": 5.0030787813587655e-05, + "loss": 0.9454, + "step": 84900 + }, + { + "epoch": 4.4, + "learning_rate": 5.000567759910279e-05, + "loss": 0.9397, + "step": 85000 + }, + { + "epoch": 4.41, + "learning_rate": 4.998054211966828e-05, + "loss": 0.9275, + "step": 85100 + }, + { + "epoch": 4.41, + "learning_rate": 4.995538140702746e-05, + "loss": 0.9587, + "step": 85200 + }, + { + "epoch": 4.42, + "learning_rate": 4.993019549295551e-05, + "loss": 0.9904, + "step": 85300 + }, + { + "epoch": 4.42, + "learning_rate": 4.9904984409259446e-05, + "loss": 0.9545, + "step": 85400 + }, + { + "epoch": 4.43, + "learning_rate": 4.987974818777807e-05, + "loss": 0.9598, + "step": 85500 + }, + { + "epoch": 4.43, + "learning_rate": 4.985448686038193e-05, + "loss": 0.8992, + "step": 85600 + }, + { + "epoch": 4.44, + "learning_rate": 4.982920045897325e-05, + "loss": 0.9731, + "step": 85700 + }, + { + "epoch": 4.44, + "learning_rate": 4.9803889015486e-05, + "loss": 0.8847, + "step": 85800 + }, + { + "epoch": 4.45, + "learning_rate": 4.977855256188567e-05, + "loss": 0.9499, + "step": 85900 + }, + { + "epoch": 4.45, + "learning_rate": 4.975319113016941e-05, + "loss": 0.9343, + "step": 86000 + }, + { + "epoch": 4.46, + "learning_rate": 4.972780475236591e-05, + "loss": 0.9115, + "step": 86100 + }, + { + "epoch": 4.46, + "learning_rate": 4.970239346053532e-05, + "loss": 0.9117, + "step": 86200 + }, + { + "epoch": 4.47, + "learning_rate": 4.967721177156708e-05, + "loss": 0.9186, + "step": 86300 + }, + { + "epoch": 4.47, + "learning_rate": 4.965175099632768e-05, + "loss": 0.9145, + "step": 86400 + }, + { + "epoch": 4.48, + "learning_rate": 4.962626540310865e-05, + "loss": 0.9075, + "step": 86500 + }, + { + "epoch": 4.48, + "learning_rate": 4.960075502409547e-05, + "loss": 0.9366, + "step": 86600 + }, + { + "epoch": 4.49, + "learning_rate": 4.9575219891504906e-05, + "loss": 0.8687, + "step": 86700 + }, + { + "epoch": 4.49, + "learning_rate": 4.9549660037585e-05, + "loss": 1.0142, + "step": 86800 + }, + { + "epoch": 4.5, + "learning_rate": 4.952407549461501e-05, + "loss": 0.9499, + "step": 86900 + }, + { + "epoch": 4.5, + "learning_rate": 4.949846629490537e-05, + "loss": 0.94, + "step": 87000 + }, + { + "epoch": 4.51, + "learning_rate": 4.947283247079767e-05, + "loss": 0.8782, + "step": 87100 + }, + { + "epoch": 4.52, + "learning_rate": 4.944717405466456e-05, + "loss": 0.9052, + "step": 87200 + }, + { + "epoch": 4.52, + "learning_rate": 4.942149107890979e-05, + "loss": 0.9292, + "step": 87300 + }, + { + "epoch": 4.53, + "learning_rate": 4.9395783575968085e-05, + "loss": 0.9317, + "step": 87400 + }, + { + "epoch": 4.53, + "learning_rate": 4.93700515783052e-05, + "loss": 0.9255, + "step": 87500 + }, + { + "epoch": 4.54, + "learning_rate": 4.934429511841776e-05, + "loss": 0.9532, + "step": 87600 + }, + { + "epoch": 4.54, + "learning_rate": 4.931851422883334e-05, + "loss": 0.8874, + "step": 87700 + }, + { + "epoch": 4.55, + "learning_rate": 4.929270894211032e-05, + "loss": 0.9602, + "step": 87800 + }, + { + "epoch": 4.55, + "learning_rate": 4.926687929083793e-05, + "loss": 0.9681, + "step": 87900 + }, + { + "epoch": 4.56, + "learning_rate": 4.9241025307636126e-05, + "loss": 0.8903, + "step": 88000 + }, + { + "epoch": 4.56, + "learning_rate": 4.921514702515565e-05, + "loss": 0.8892, + "step": 88100 + }, + { + "epoch": 4.57, + "learning_rate": 4.918924447607787e-05, + "loss": 0.9924, + "step": 88200 + }, + { + "epoch": 4.57, + "learning_rate": 4.916357708079473e-05, + "loss": 0.9151, + "step": 88300 + }, + { + "epoch": 4.58, + "learning_rate": 4.913762633853836e-05, + "loss": 0.9054, + "step": 88400 + }, + { + "epoch": 4.58, + "learning_rate": 4.911165142758471e-05, + "loss": 0.8564, + "step": 88500 + }, + { + "epoch": 4.59, + "learning_rate": 4.9085652380737236e-05, + "loss": 0.9039, + "step": 88600 + }, + { + "epoch": 4.59, + "learning_rate": 4.905962923082983e-05, + "loss": 0.9499, + "step": 88700 + }, + { + "epoch": 4.6, + "learning_rate": 4.903358201072683e-05, + "loss": 0.912, + "step": 88800 + }, + { + "epoch": 4.6, + "learning_rate": 4.9007510753323004e-05, + "loss": 0.9318, + "step": 88900 + }, + { + "epoch": 4.61, + "learning_rate": 4.898141549154344e-05, + "loss": 1.0008, + "step": 89000 + }, + { + "epoch": 4.61, + "learning_rate": 4.895529625834356e-05, + "loss": 0.915, + "step": 89100 + }, + { + "epoch": 4.62, + "learning_rate": 4.892915308670907e-05, + "loss": 0.96, + "step": 89200 + }, + { + "epoch": 4.62, + "learning_rate": 4.890298600965587e-05, + "loss": 0.9005, + "step": 89300 + }, + { + "epoch": 4.63, + "learning_rate": 4.887679506023009e-05, + "loss": 0.9833, + "step": 89400 + }, + { + "epoch": 4.63, + "learning_rate": 4.885058027150798e-05, + "loss": 0.9122, + "step": 89500 + }, + { + "epoch": 4.64, + "learning_rate": 4.88246041802769e-05, + "loss": 0.8953, + "step": 89600 + }, + { + "epoch": 4.64, + "learning_rate": 4.879834204987772e-05, + "loss": 1.0277, + "step": 89700 + }, + { + "epoch": 4.65, + "learning_rate": 4.877205617925967e-05, + "loss": 0.9414, + "step": 89800 + }, + { + "epoch": 4.65, + "learning_rate": 4.874574660161886e-05, + "loss": 1.0195, + "step": 89900 + }, + { + "epoch": 4.66, + "learning_rate": 4.8719413350181386e-05, + "loss": 0.913, + "step": 90000 + }, + { + "epoch": 4.67, + "learning_rate": 4.869305645820321e-05, + "loss": 0.9354, + "step": 90100 + }, + { + "epoch": 4.67, + "learning_rate": 4.866667595897016e-05, + "loss": 0.8649, + "step": 90200 + }, + { + "epoch": 4.68, + "learning_rate": 4.864027188579789e-05, + "loss": 0.8968, + "step": 90300 + }, + { + "epoch": 4.68, + "learning_rate": 4.86138442720318e-05, + "loss": 0.9678, + "step": 90400 + }, + { + "epoch": 4.69, + "learning_rate": 4.858739315104703e-05, + "loss": 0.8485, + "step": 90500 + }, + { + "epoch": 4.69, + "learning_rate": 4.856091855624842e-05, + "loss": 0.8886, + "step": 90600 + }, + { + "epoch": 4.7, + "learning_rate": 4.8534420521070446e-05, + "loss": 0.8262, + "step": 90700 + }, + { + "epoch": 4.7, + "learning_rate": 4.850789907897717e-05, + "loss": 0.8408, + "step": 90800 + }, + { + "epoch": 4.71, + "learning_rate": 4.848135426346224e-05, + "loss": 0.8686, + "step": 90900 + }, + { + "epoch": 4.71, + "learning_rate": 4.84547861080488e-05, + "loss": 0.9004, + "step": 91000 + }, + { + "epoch": 4.72, + "learning_rate": 4.8428194646289495e-05, + "loss": 0.9077, + "step": 91100 + }, + { + "epoch": 4.72, + "learning_rate": 4.840157991176638e-05, + "loss": 0.8231, + "step": 91200 + }, + { + "epoch": 4.73, + "learning_rate": 4.837494193809091e-05, + "loss": 0.8458, + "step": 91300 + }, + { + "epoch": 4.73, + "learning_rate": 4.834828075890389e-05, + "loss": 0.9483, + "step": 91400 + }, + { + "epoch": 4.74, + "learning_rate": 4.832159640787542e-05, + "loss": 0.8433, + "step": 91500 + }, + { + "epoch": 4.74, + "learning_rate": 4.8294888918704895e-05, + "loss": 0.9254, + "step": 91600 + }, + { + "epoch": 4.75, + "learning_rate": 4.8268158325120896e-05, + "loss": 0.9304, + "step": 91700 + }, + { + "epoch": 4.75, + "learning_rate": 4.824140466088119e-05, + "loss": 0.9286, + "step": 91800 + }, + { + "epoch": 4.76, + "learning_rate": 4.821462795977268e-05, + "loss": 0.9325, + "step": 91900 + }, + { + "epoch": 4.76, + "learning_rate": 4.818782825561138e-05, + "loss": 0.9492, + "step": 92000 + }, + { + "epoch": 4.77, + "learning_rate": 4.816100558224233e-05, + "loss": 0.9017, + "step": 92100 + }, + { + "epoch": 4.77, + "learning_rate": 4.813415997353961e-05, + "loss": 0.931, + "step": 92200 + }, + { + "epoch": 4.78, + "learning_rate": 4.810729146340621e-05, + "loss": 0.8489, + "step": 92300 + }, + { + "epoch": 4.78, + "learning_rate": 4.808040008577411e-05, + "loss": 0.86, + "step": 92400 + }, + { + "epoch": 4.79, + "learning_rate": 4.8053485874604096e-05, + "loss": 0.946, + "step": 92500 + }, + { + "epoch": 4.79, + "learning_rate": 4.802654886388586e-05, + "loss": 0.7644, + "step": 92600 + }, + { + "epoch": 4.8, + "learning_rate": 4.799958908763784e-05, + "loss": 0.9249, + "step": 92700 + }, + { + "epoch": 4.81, + "learning_rate": 4.797260657990725e-05, + "loss": 0.8402, + "step": 92800 + }, + { + "epoch": 4.81, + "learning_rate": 4.794560137477e-05, + "loss": 0.9012, + "step": 92900 + }, + { + "epoch": 4.82, + "learning_rate": 4.791857350633065e-05, + "loss": 0.8346, + "step": 93000 + }, + { + "epoch": 4.82, + "learning_rate": 4.7891523008722423e-05, + "loss": 0.9424, + "step": 93100 + }, + { + "epoch": 4.83, + "learning_rate": 4.786444991610708e-05, + "loss": 0.8269, + "step": 93200 + }, + { + "epoch": 4.83, + "learning_rate": 4.783735426267492e-05, + "loss": 0.8904, + "step": 93300 + }, + { + "epoch": 4.84, + "learning_rate": 4.7810236082644764e-05, + "loss": 0.8982, + "step": 93400 + }, + { + "epoch": 4.84, + "learning_rate": 4.778309541026386e-05, + "loss": 0.9415, + "step": 93500 + }, + { + "epoch": 4.85, + "learning_rate": 4.775593227980785e-05, + "loss": 0.9349, + "step": 93600 + }, + { + "epoch": 4.85, + "learning_rate": 4.772874672558077e-05, + "loss": 0.8556, + "step": 93700 + }, + { + "epoch": 4.86, + "learning_rate": 4.770153878191494e-05, + "loss": 0.8097, + "step": 93800 + }, + { + "epoch": 4.86, + "learning_rate": 4.767430848317098e-05, + "loss": 0.9081, + "step": 93900 + }, + { + "epoch": 4.87, + "learning_rate": 4.764705586373774e-05, + "loss": 0.906, + "step": 94000 + }, + { + "epoch": 4.87, + "learning_rate": 4.7619780958032244e-05, + "loss": 0.8773, + "step": 94100 + }, + { + "epoch": 4.88, + "learning_rate": 4.759248380049966e-05, + "loss": 0.8273, + "step": 94200 + }, + { + "epoch": 4.88, + "learning_rate": 4.75651644256133e-05, + "loss": 0.9172, + "step": 94300 + }, + { + "epoch": 4.89, + "learning_rate": 4.7538096393143614e-05, + "loss": 0.7936, + "step": 94400 + }, + { + "epoch": 4.89, + "learning_rate": 4.75107329083939e-05, + "loss": 0.919, + "step": 94500 + }, + { + "epoch": 4.9, + "learning_rate": 4.748334730953268e-05, + "loss": 0.9955, + "step": 94600 + }, + { + "epoch": 4.9, + "learning_rate": 4.745593963114494e-05, + "loss": 0.8785, + "step": 94700 + }, + { + "epoch": 4.91, + "learning_rate": 4.742850990784352e-05, + "loss": 0.8939, + "step": 94800 + }, + { + "epoch": 4.91, + "learning_rate": 4.740105817426913e-05, + "loss": 0.9731, + "step": 94900 + }, + { + "epoch": 4.92, + "learning_rate": 4.737358446509026e-05, + "loss": 0.9154, + "step": 95000 + }, + { + "epoch": 4.92, + "learning_rate": 4.7346088815003146e-05, + "loss": 0.9898, + "step": 95100 + }, + { + "epoch": 4.93, + "learning_rate": 4.731857125873174e-05, + "loss": 0.8608, + "step": 95200 + }, + { + "epoch": 4.93, + "learning_rate": 4.7291031831027673e-05, + "loss": 0.9947, + "step": 95300 + }, + { + "epoch": 4.94, + "learning_rate": 4.7263470566670175e-05, + "loss": 0.9944, + "step": 95400 + }, + { + "epoch": 4.94, + "learning_rate": 4.723588750046607e-05, + "loss": 0.974, + "step": 95500 + }, + { + "epoch": 4.95, + "learning_rate": 4.72082826672497e-05, + "loss": 0.9666, + "step": 95600 + }, + { + "epoch": 4.96, + "learning_rate": 4.71806561018829e-05, + "loss": 0.9483, + "step": 95700 + }, + { + "epoch": 4.96, + "learning_rate": 4.715300783925497e-05, + "loss": 0.8933, + "step": 95800 + }, + { + "epoch": 4.97, + "learning_rate": 4.712533791428258e-05, + "loss": 0.8743, + "step": 95900 + }, + { + "epoch": 4.97, + "learning_rate": 4.709764636190978e-05, + "loss": 0.8872, + "step": 96000 + }, + { + "epoch": 4.98, + "learning_rate": 4.7069933217107946e-05, + "loss": 0.8391, + "step": 96100 + }, + { + "epoch": 4.98, + "learning_rate": 4.7042198514875675e-05, + "loss": 0.853, + "step": 96200 + }, + { + "epoch": 4.99, + "learning_rate": 4.7014442290238824e-05, + "loss": 0.8739, + "step": 96300 + }, + { + "epoch": 4.99, + "learning_rate": 4.698666457825043e-05, + "loss": 0.848, + "step": 96400 + }, + { + "epoch": 5.0, + "learning_rate": 4.6958865413990646e-05, + "loss": 0.942, + "step": 96500 + }, + { + "epoch": 5.0, + "eval_accuracy": 0.6235030288909599, + "eval_cer": 0.19120704340010636, + "eval_loss": 0.9764400720596313, + "eval_runtime": 4323.3286, + "eval_samples_per_second": 3.971, + "eval_steps_per_second": 0.248, + "eval_wer": 0.3744662078701253, + "step": 96565 + }, + { + "epoch": 5.0, + "learning_rate": 4.6931044832566745e-05, + "loss": 0.8896, + "step": 96600 + }, + { + "epoch": 5.01, + "learning_rate": 4.690320286911302e-05, + "loss": 0.802, + "step": 96700 + }, + { + "epoch": 5.01, + "learning_rate": 4.6875339558790795e-05, + "loss": 0.8266, + "step": 96800 + }, + { + "epoch": 5.02, + "learning_rate": 4.684745493678833e-05, + "loss": 0.7704, + "step": 96900 + }, + { + "epoch": 5.02, + "learning_rate": 4.681954903832079e-05, + "loss": 0.8544, + "step": 97000 + }, + { + "epoch": 5.03, + "learning_rate": 4.679162189863024e-05, + "loss": 0.8739, + "step": 97100 + }, + { + "epoch": 5.03, + "learning_rate": 4.6763673552985575e-05, + "loss": 0.9071, + "step": 97200 + }, + { + "epoch": 5.04, + "learning_rate": 4.673570403668242e-05, + "loss": 0.8233, + "step": 97300 + }, + { + "epoch": 5.04, + "learning_rate": 4.670771338504319e-05, + "loss": 0.7495, + "step": 97400 + }, + { + "epoch": 5.05, + "learning_rate": 4.667970163341696e-05, + "loss": 0.7638, + "step": 97500 + }, + { + "epoch": 5.05, + "learning_rate": 4.665166881717948e-05, + "loss": 0.8591, + "step": 97600 + }, + { + "epoch": 5.06, + "learning_rate": 4.662361497173306e-05, + "loss": 0.8176, + "step": 97700 + }, + { + "epoch": 5.06, + "learning_rate": 4.659554013250661e-05, + "loss": 0.7969, + "step": 97800 + }, + { + "epoch": 5.07, + "learning_rate": 4.656744433495552e-05, + "loss": 0.7673, + "step": 97900 + }, + { + "epoch": 5.07, + "learning_rate": 4.653932761456166e-05, + "loss": 0.794, + "step": 98000 + }, + { + "epoch": 5.08, + "learning_rate": 4.651119000683336e-05, + "loss": 0.7859, + "step": 98100 + }, + { + "epoch": 5.08, + "learning_rate": 4.6483031547305264e-05, + "loss": 0.845, + "step": 98200 + }, + { + "epoch": 5.09, + "learning_rate": 4.645485227153838e-05, + "loss": 0.742, + "step": 98300 + }, + { + "epoch": 5.1, + "learning_rate": 4.6426652215120025e-05, + "loss": 0.7588, + "step": 98400 + }, + { + "epoch": 5.1, + "learning_rate": 4.6398431413663716e-05, + "loss": 0.7491, + "step": 98500 + }, + { + "epoch": 5.11, + "learning_rate": 4.637018990280921e-05, + "loss": 0.7376, + "step": 98600 + }, + { + "epoch": 5.11, + "learning_rate": 4.634192771822238e-05, + "loss": 0.7825, + "step": 98700 + }, + { + "epoch": 5.12, + "learning_rate": 4.631364489559525e-05, + "loss": 0.7606, + "step": 98800 + }, + { + "epoch": 5.12, + "learning_rate": 4.628534147064586e-05, + "loss": 0.7506, + "step": 98900 + }, + { + "epoch": 5.13, + "learning_rate": 4.6257017479118326e-05, + "loss": 0.7978, + "step": 99000 + }, + { + "epoch": 5.13, + "learning_rate": 4.6228672956782684e-05, + "loss": 0.7532, + "step": 99100 + }, + { + "epoch": 5.14, + "learning_rate": 4.6200307939434916e-05, + "loss": 0.7597, + "step": 99200 + }, + { + "epoch": 5.14, + "learning_rate": 4.617192246289689e-05, + "loss": 0.8297, + "step": 99300 + }, + { + "epoch": 5.15, + "learning_rate": 4.614351656301632e-05, + "loss": 0.7436, + "step": 99400 + }, + { + "epoch": 5.15, + "learning_rate": 4.611509027566669e-05, + "loss": 0.8071, + "step": 99500 + }, + { + "epoch": 5.16, + "learning_rate": 4.608664363674727e-05, + "loss": 0.7963, + "step": 99600 + }, + { + "epoch": 5.16, + "learning_rate": 4.605817668218298e-05, + "loss": 0.7603, + "step": 99700 + }, + { + "epoch": 5.17, + "learning_rate": 4.602968944792444e-05, + "loss": 0.7347, + "step": 99800 + }, + { + "epoch": 5.17, + "learning_rate": 4.6001181969947854e-05, + "loss": 0.8433, + "step": 99900 + }, + { + "epoch": 5.18, + "learning_rate": 4.5972654284255e-05, + "loss": 0.7755, + "step": 100000 + }, + { + "epoch": 5.18, + "learning_rate": 4.59441064268732e-05, + "loss": 0.8077, + "step": 100100 + }, + { + "epoch": 5.19, + "learning_rate": 4.59155384338552e-05, + "loss": 0.7763, + "step": 100200 + }, + { + "epoch": 5.19, + "learning_rate": 4.588723632157926e-05, + "loss": 0.7931, + "step": 100300 + }, + { + "epoch": 5.2, + "learning_rate": 4.585862836600463e-05, + "loss": 0.8006, + "step": 100400 + }, + { + "epoch": 5.2, + "learning_rate": 4.5830000382743106e-05, + "loss": 0.789, + "step": 100500 + }, + { + "epoch": 5.21, + "learning_rate": 4.580135240794865e-05, + "loss": 0.7526, + "step": 100600 + }, + { + "epoch": 5.21, + "learning_rate": 4.5772684477800504e-05, + "loss": 0.7726, + "step": 100700 + }, + { + "epoch": 5.22, + "learning_rate": 4.574399662850304e-05, + "loss": 0.7832, + "step": 100800 + }, + { + "epoch": 5.22, + "learning_rate": 4.571528889628585e-05, + "loss": 0.8115, + "step": 100900 + }, + { + "epoch": 5.23, + "learning_rate": 4.5686561317403605e-05, + "loss": 0.7478, + "step": 101000 + }, + { + "epoch": 5.23, + "learning_rate": 4.565781392813605e-05, + "loss": 0.7625, + "step": 101100 + }, + { + "epoch": 5.24, + "learning_rate": 4.562904676478795e-05, + "loss": 0.8037, + "step": 101200 + }, + { + "epoch": 5.25, + "learning_rate": 4.5600259863689036e-05, + "loss": 0.8188, + "step": 101300 + }, + { + "epoch": 5.25, + "learning_rate": 4.557145326119396e-05, + "loss": 0.7661, + "step": 101400 + }, + { + "epoch": 5.26, + "learning_rate": 4.554262699368227e-05, + "loss": 0.7966, + "step": 101500 + }, + { + "epoch": 5.26, + "learning_rate": 4.551378109755835e-05, + "loss": 0.7572, + "step": 101600 + }, + { + "epoch": 5.27, + "learning_rate": 4.548491560925134e-05, + "loss": 0.7894, + "step": 101700 + }, + { + "epoch": 5.27, + "learning_rate": 4.5456030565215174e-05, + "loss": 0.793, + "step": 101800 + }, + { + "epoch": 5.28, + "learning_rate": 4.542712600192843e-05, + "loss": 0.8103, + "step": 101900 + }, + { + "epoch": 5.28, + "learning_rate": 4.539820195589439e-05, + "loss": 0.7329, + "step": 102000 + }, + { + "epoch": 5.29, + "learning_rate": 4.536925846364088e-05, + "loss": 0.8594, + "step": 102100 + }, + { + "epoch": 5.29, + "learning_rate": 4.534029556172036e-05, + "loss": 0.7805, + "step": 102200 + }, + { + "epoch": 5.3, + "learning_rate": 4.531131328670971e-05, + "loss": 0.9, + "step": 102300 + }, + { + "epoch": 5.3, + "learning_rate": 4.528231167521037e-05, + "loss": 0.8412, + "step": 102400 + }, + { + "epoch": 5.31, + "learning_rate": 4.525329076384813e-05, + "loss": 0.7814, + "step": 102500 + }, + { + "epoch": 5.31, + "learning_rate": 4.5224250589273174e-05, + "loss": 0.7831, + "step": 102600 + }, + { + "epoch": 5.32, + "learning_rate": 4.5195191188160034e-05, + "loss": 0.7809, + "step": 102700 + }, + { + "epoch": 5.32, + "learning_rate": 4.5166112597207505e-05, + "loss": 0.7722, + "step": 102800 + }, + { + "epoch": 5.33, + "learning_rate": 4.513701485313862e-05, + "loss": 0.7847, + "step": 102900 + }, + { + "epoch": 5.33, + "learning_rate": 4.5107897992700585e-05, + "loss": 0.8117, + "step": 103000 + }, + { + "epoch": 5.34, + "learning_rate": 4.5079344958207595e-05, + "loss": 0.8499, + "step": 103100 + }, + { + "epoch": 5.34, + "learning_rate": 4.505019035586476e-05, + "loss": 0.8759, + "step": 103200 + }, + { + "epoch": 5.35, + "learning_rate": 4.5021016746802494e-05, + "loss": 0.7639, + "step": 103300 + }, + { + "epoch": 5.35, + "learning_rate": 4.4991824167863794e-05, + "loss": 0.798, + "step": 103400 + }, + { + "epoch": 5.36, + "learning_rate": 4.49626126559157e-05, + "loss": 0.8245, + "step": 103500 + }, + { + "epoch": 5.36, + "learning_rate": 4.4933382247849054e-05, + "loss": 0.7966, + "step": 103600 + }, + { + "epoch": 5.37, + "learning_rate": 4.490413298057865e-05, + "loss": 0.7965, + "step": 103700 + }, + { + "epoch": 5.37, + "learning_rate": 4.487486489104305e-05, + "loss": 0.8178, + "step": 103800 + }, + { + "epoch": 5.38, + "learning_rate": 4.4845578016204604e-05, + "loss": 0.7432, + "step": 103900 + }, + { + "epoch": 5.38, + "learning_rate": 4.481627239304939e-05, + "loss": 0.8282, + "step": 104000 + }, + { + "epoch": 5.39, + "learning_rate": 4.4786948058587156e-05, + "loss": 0.8101, + "step": 104100 + }, + { + "epoch": 5.4, + "learning_rate": 4.475760504985128e-05, + "loss": 0.7412, + "step": 104200 + }, + { + "epoch": 5.4, + "learning_rate": 4.472824340389871e-05, + "loss": 0.7656, + "step": 104300 + }, + { + "epoch": 5.41, + "learning_rate": 4.4698863157809955e-05, + "loss": 0.7442, + "step": 104400 + }, + { + "epoch": 5.41, + "learning_rate": 4.4669464348689005e-05, + "loss": 0.8096, + "step": 104500 + }, + { + "epoch": 5.42, + "learning_rate": 4.4640047013663293e-05, + "loss": 0.8049, + "step": 104600 + }, + { + "epoch": 5.42, + "learning_rate": 4.461061118988365e-05, + "loss": 0.7463, + "step": 104700 + }, + { + "epoch": 5.43, + "learning_rate": 4.458115691452425e-05, + "loss": 0.7635, + "step": 104800 + }, + { + "epoch": 5.43, + "learning_rate": 4.455168422478256e-05, + "loss": 0.7464, + "step": 104900 + }, + { + "epoch": 5.44, + "learning_rate": 4.452219315787934e-05, + "loss": 0.7944, + "step": 105000 + }, + { + "epoch": 5.44, + "learning_rate": 4.4492683751058506e-05, + "loss": 0.7778, + "step": 105100 + }, + { + "epoch": 5.45, + "learning_rate": 4.446315604158718e-05, + "loss": 0.8076, + "step": 105200 + }, + { + "epoch": 5.45, + "learning_rate": 4.4433610066755576e-05, + "loss": 0.8433, + "step": 105300 + }, + { + "epoch": 5.46, + "learning_rate": 4.440404586387698e-05, + "loss": 0.8064, + "step": 105400 + }, + { + "epoch": 5.46, + "learning_rate": 4.43744634702877e-05, + "loss": 0.8567, + "step": 105500 + }, + { + "epoch": 5.47, + "learning_rate": 4.434515901855278e-05, + "loss": 0.805, + "step": 105600 + }, + { + "epoch": 5.47, + "learning_rate": 4.431554053661747e-05, + "loss": 0.8769, + "step": 105700 + }, + { + "epoch": 5.48, + "learning_rate": 4.428590397574387e-05, + "loss": 0.8037, + "step": 105800 + }, + { + "epoch": 5.48, + "learning_rate": 4.425624937335967e-05, + "loss": 0.7936, + "step": 105900 + }, + { + "epoch": 5.49, + "learning_rate": 4.4226576766915335e-05, + "loss": 0.7728, + "step": 106000 + }, + { + "epoch": 5.49, + "learning_rate": 4.419688619388409e-05, + "loss": 0.7778, + "step": 106100 + }, + { + "epoch": 5.5, + "learning_rate": 4.4167177691761816e-05, + "loss": 0.787, + "step": 106200 + }, + { + "epoch": 5.5, + "learning_rate": 4.413745129806707e-05, + "loss": 0.7842, + "step": 106300 + }, + { + "epoch": 5.51, + "learning_rate": 4.4107707050340954e-05, + "loss": 0.7803, + "step": 106400 + }, + { + "epoch": 5.51, + "learning_rate": 4.4077944986147186e-05, + "loss": 0.8602, + "step": 106500 + }, + { + "epoch": 5.52, + "learning_rate": 4.4048165143071936e-05, + "loss": 0.7886, + "step": 106600 + }, + { + "epoch": 5.52, + "learning_rate": 4.401836755872383e-05, + "loss": 0.7533, + "step": 106700 + }, + { + "epoch": 5.53, + "learning_rate": 4.3988552270733925e-05, + "loss": 0.7682, + "step": 106800 + }, + { + "epoch": 5.54, + "learning_rate": 4.395871931675561e-05, + "loss": 0.7694, + "step": 106900 + }, + { + "epoch": 5.54, + "learning_rate": 4.392886873446459e-05, + "loss": 0.7936, + "step": 107000 + }, + { + "epoch": 5.55, + "learning_rate": 4.389900056155885e-05, + "loss": 0.8758, + "step": 107100 + }, + { + "epoch": 5.55, + "learning_rate": 4.3869114835758554e-05, + "loss": 0.823, + "step": 107200 + }, + { + "epoch": 5.56, + "learning_rate": 4.383921159480607e-05, + "loss": 0.7796, + "step": 107300 + }, + { + "epoch": 5.56, + "learning_rate": 4.380929087646588e-05, + "loss": 0.7798, + "step": 107400 + }, + { + "epoch": 5.57, + "learning_rate": 4.37793527185245e-05, + "loss": 0.7862, + "step": 107500 + }, + { + "epoch": 5.57, + "learning_rate": 4.374939715879054e-05, + "loss": 0.8475, + "step": 107600 + }, + { + "epoch": 5.58, + "learning_rate": 4.3719424235094515e-05, + "loss": 0.7653, + "step": 107700 + }, + { + "epoch": 5.58, + "learning_rate": 4.368943398528891e-05, + "loss": 0.7646, + "step": 107800 + }, + { + "epoch": 5.59, + "learning_rate": 4.365942644724808e-05, + "loss": 0.7898, + "step": 107900 + }, + { + "epoch": 5.59, + "learning_rate": 4.362940165886822e-05, + "loss": 0.8598, + "step": 108000 + }, + { + "epoch": 5.6, + "learning_rate": 4.359935965806729e-05, + "loss": 0.8077, + "step": 108100 + }, + { + "epoch": 5.6, + "learning_rate": 4.356930048278501e-05, + "loss": 0.7643, + "step": 108200 + }, + { + "epoch": 5.61, + "learning_rate": 4.3539224170982786e-05, + "loss": 0.8222, + "step": 108300 + }, + { + "epoch": 5.61, + "learning_rate": 4.350913076064366e-05, + "loss": 0.8024, + "step": 108400 + }, + { + "epoch": 5.62, + "learning_rate": 4.347902028977225e-05, + "loss": 0.7986, + "step": 108500 + }, + { + "epoch": 5.62, + "learning_rate": 4.344889279639476e-05, + "loss": 0.7564, + "step": 108600 + }, + { + "epoch": 5.63, + "learning_rate": 4.3418748318558855e-05, + "loss": 0.7893, + "step": 108700 + }, + { + "epoch": 5.63, + "learning_rate": 4.3388586894333674e-05, + "loss": 0.7863, + "step": 108800 + }, + { + "epoch": 5.64, + "learning_rate": 4.335840856180974e-05, + "loss": 0.9097, + "step": 108900 + }, + { + "epoch": 5.64, + "learning_rate": 4.332821335909894e-05, + "loss": 0.8541, + "step": 109000 + }, + { + "epoch": 5.65, + "learning_rate": 4.329800132433446e-05, + "loss": 0.8332, + "step": 109100 + }, + { + "epoch": 5.65, + "learning_rate": 4.326777249567075e-05, + "loss": 0.8675, + "step": 109200 + }, + { + "epoch": 5.66, + "learning_rate": 4.3237526911283444e-05, + "loss": 0.7923, + "step": 109300 + }, + { + "epoch": 5.66, + "learning_rate": 4.320726460936939e-05, + "loss": 0.822, + "step": 109400 + }, + { + "epoch": 5.67, + "learning_rate": 4.31769856281465e-05, + "loss": 0.8198, + "step": 109500 + }, + { + "epoch": 5.67, + "learning_rate": 4.314669000585375e-05, + "loss": 0.7492, + "step": 109600 + }, + { + "epoch": 5.68, + "learning_rate": 4.311637778075118e-05, + "loss": 0.7917, + "step": 109700 + }, + { + "epoch": 5.69, + "learning_rate": 4.308604899111973e-05, + "loss": 0.7732, + "step": 109800 + }, + { + "epoch": 5.69, + "learning_rate": 4.305570367526132e-05, + "loss": 0.8391, + "step": 109900 + }, + { + "epoch": 5.7, + "learning_rate": 4.30253418714987e-05, + "loss": 0.8007, + "step": 110000 + }, + { + "epoch": 5.7, + "learning_rate": 4.2994963618175476e-05, + "loss": 0.7709, + "step": 110100 + }, + { + "epoch": 5.71, + "learning_rate": 4.296456895365598e-05, + "loss": 0.817, + "step": 110200 + }, + { + "epoch": 5.71, + "learning_rate": 4.293415791632533e-05, + "loss": 0.7481, + "step": 110300 + }, + { + "epoch": 5.72, + "learning_rate": 4.290403489903577e-05, + "loss": 0.7823, + "step": 110400 + }, + { + "epoch": 5.72, + "learning_rate": 4.287359139409021e-05, + "loss": 0.7768, + "step": 110500 + }, + { + "epoch": 5.73, + "learning_rate": 4.284313163122803e-05, + "loss": 0.8416, + "step": 110600 + }, + { + "epoch": 5.73, + "learning_rate": 4.2812655648916536e-05, + "loss": 0.7178, + "step": 110700 + }, + { + "epoch": 5.74, + "learning_rate": 4.278216348564351e-05, + "loss": 0.7738, + "step": 110800 + }, + { + "epoch": 5.74, + "learning_rate": 4.275165517991717e-05, + "loss": 0.7242, + "step": 110900 + }, + { + "epoch": 5.75, + "learning_rate": 4.2721130770266116e-05, + "loss": 0.7984, + "step": 111000 + }, + { + "epoch": 5.75, + "learning_rate": 4.2690590295239283e-05, + "loss": 0.8005, + "step": 111100 + }, + { + "epoch": 5.76, + "learning_rate": 4.266003379340593e-05, + "loss": 0.749, + "step": 111200 + }, + { + "epoch": 5.76, + "learning_rate": 4.2629461303355474e-05, + "loss": 0.7994, + "step": 111300 + }, + { + "epoch": 5.77, + "learning_rate": 4.259887286369763e-05, + "loss": 0.7662, + "step": 111400 + }, + { + "epoch": 5.77, + "learning_rate": 4.2568268513062164e-05, + "loss": 0.792, + "step": 111500 + }, + { + "epoch": 5.78, + "learning_rate": 4.253764829009899e-05, + "loss": 0.8394, + "step": 111600 + }, + { + "epoch": 5.78, + "learning_rate": 4.2507012233478036e-05, + "loss": 0.7875, + "step": 111700 + }, + { + "epoch": 5.79, + "learning_rate": 4.247636038188925e-05, + "loss": 0.7232, + "step": 111800 + }, + { + "epoch": 5.79, + "learning_rate": 4.244569277404252e-05, + "loss": 0.7161, + "step": 111900 + }, + { + "epoch": 5.8, + "learning_rate": 4.241500944866763e-05, + "loss": 0.6989, + "step": 112000 + }, + { + "epoch": 5.8, + "learning_rate": 4.23843104445142e-05, + "loss": 0.7476, + "step": 112100 + }, + { + "epoch": 5.81, + "learning_rate": 4.235359580035168e-05, + "loss": 0.7298, + "step": 112200 + }, + { + "epoch": 5.81, + "learning_rate": 4.232286555496925e-05, + "loss": 0.7839, + "step": 112300 + }, + { + "epoch": 5.82, + "learning_rate": 4.229211974717579e-05, + "loss": 0.7747, + "step": 112400 + }, + { + "epoch": 5.83, + "learning_rate": 4.2261358415799854e-05, + "loss": 0.8086, + "step": 112500 + }, + { + "epoch": 5.83, + "learning_rate": 4.223058159968958e-05, + "loss": 0.7591, + "step": 112600 + }, + { + "epoch": 5.84, + "learning_rate": 4.219978933771267e-05, + "loss": 0.7889, + "step": 112700 + }, + { + "epoch": 5.84, + "learning_rate": 4.216898166875633e-05, + "loss": 0.8414, + "step": 112800 + }, + { + "epoch": 5.85, + "learning_rate": 4.2138158631727236e-05, + "loss": 0.7773, + "step": 112900 + }, + { + "epoch": 5.85, + "learning_rate": 4.210732026555146e-05, + "loss": 0.737, + "step": 113000 + }, + { + "epoch": 5.86, + "learning_rate": 4.207677522129677e-05, + "loss": 0.8243, + "step": 113100 + }, + { + "epoch": 5.86, + "learning_rate": 4.204590646600264e-05, + "loss": 0.774, + "step": 113200 + }, + { + "epoch": 5.87, + "learning_rate": 4.201502249806608e-05, + "loss": 0.8191, + "step": 113300 + }, + { + "epoch": 5.87, + "learning_rate": 4.198412335649009e-05, + "loss": 0.7554, + "step": 113400 + }, + { + "epoch": 5.88, + "learning_rate": 4.1953209080296875e-05, + "loss": 0.7577, + "step": 113500 + }, + { + "epoch": 5.88, + "learning_rate": 4.1922279708527705e-05, + "loss": 0.766, + "step": 113600 + }, + { + "epoch": 5.89, + "learning_rate": 4.189164479892727e-05, + "loss": 0.7521, + "step": 113700 + }, + { + "epoch": 5.89, + "learning_rate": 4.1860685503187196e-05, + "loss": 0.6928, + "step": 113800 + }, + { + "epoch": 5.9, + "learning_rate": 4.182971122871818e-05, + "loss": 0.7394, + "step": 113900 + }, + { + "epoch": 5.9, + "learning_rate": 4.179872201463731e-05, + "loss": 0.7885, + "step": 114000 + }, + { + "epoch": 5.91, + "learning_rate": 4.176771790008051e-05, + "loss": 0.7045, + "step": 114100 + }, + { + "epoch": 5.91, + "learning_rate": 4.173669892420254e-05, + "loss": 0.7222, + "step": 114200 + }, + { + "epoch": 5.92, + "learning_rate": 4.170566512617692e-05, + "loss": 0.7956, + "step": 114300 + }, + { + "epoch": 5.92, + "learning_rate": 4.1674616545195893e-05, + "loss": 0.7408, + "step": 114400 + }, + { + "epoch": 5.93, + "learning_rate": 4.1643553220470364e-05, + "loss": 0.7018, + "step": 114500 + }, + { + "epoch": 5.93, + "learning_rate": 4.161247519122987e-05, + "loss": 0.7406, + "step": 114600 + }, + { + "epoch": 5.94, + "learning_rate": 4.1581382496722515e-05, + "loss": 0.7798, + "step": 114700 + }, + { + "epoch": 5.94, + "learning_rate": 4.155027517621491e-05, + "loss": 0.8111, + "step": 114800 + }, + { + "epoch": 5.95, + "learning_rate": 4.151915326899216e-05, + "loss": 0.7038, + "step": 114900 + }, + { + "epoch": 5.95, + "learning_rate": 4.148801681435775e-05, + "loss": 0.7191, + "step": 115000 + }, + { + "epoch": 5.96, + "learning_rate": 4.14568658516336e-05, + "loss": 0.7988, + "step": 115100 + }, + { + "epoch": 5.96, + "learning_rate": 4.142570042015989e-05, + "loss": 0.8082, + "step": 115200 + }, + { + "epoch": 5.97, + "learning_rate": 4.1394520559295136e-05, + "loss": 0.7372, + "step": 115300 + }, + { + "epoch": 5.98, + "learning_rate": 4.136332630841599e-05, + "loss": 0.7898, + "step": 115400 + }, + { + "epoch": 5.98, + "learning_rate": 4.133211770691738e-05, + "loss": 0.7048, + "step": 115500 + }, + { + "epoch": 5.99, + "learning_rate": 4.130089479421226e-05, + "loss": 0.7423, + "step": 115600 + }, + { + "epoch": 5.99, + "learning_rate": 4.126965760973172e-05, + "loss": 0.7438, + "step": 115700 + }, + { + "epoch": 6.0, + "learning_rate": 4.1238406192924864e-05, + "loss": 0.766, + "step": 115800 + }, + { + "epoch": 6.0, + "eval_accuracy": 0.6219183218779124, + "eval_cer": 0.16595752690448964, + "eval_loss": 0.8587498664855957, + "eval_runtime": 4247.0817, + "eval_samples_per_second": 4.042, + "eval_steps_per_second": 0.253, + "eval_wer": 0.343897417798953, + "step": 115878 + }, + { + "epoch": 6.0, + "learning_rate": 4.120714058325875e-05, + "loss": 0.6504, + "step": 115900 + }, + { + "epoch": 6.01, + "learning_rate": 4.117586082021838e-05, + "loss": 0.683, + "step": 116000 + }, + { + "epoch": 6.01, + "learning_rate": 4.114456694330662e-05, + "loss": 0.6041, + "step": 116100 + }, + { + "epoch": 6.02, + "learning_rate": 4.111325899204415e-05, + "loss": 0.6508, + "step": 116200 + }, + { + "epoch": 6.02, + "learning_rate": 4.108193700596945e-05, + "loss": 0.6381, + "step": 116300 + }, + { + "epoch": 6.03, + "learning_rate": 4.1050601024638724e-05, + "loss": 0.6473, + "step": 116400 + }, + { + "epoch": 6.03, + "learning_rate": 4.1019251087625804e-05, + "loss": 0.7016, + "step": 116500 + }, + { + "epoch": 6.04, + "learning_rate": 4.098788723452219e-05, + "loss": 0.6773, + "step": 116600 + }, + { + "epoch": 6.04, + "learning_rate": 4.09568233507913e-05, + "loss": 0.6768, + "step": 116700 + }, + { + "epoch": 6.05, + "learning_rate": 4.092543192252339e-05, + "loss": 0.6799, + "step": 116800 + }, + { + "epoch": 6.05, + "learning_rate": 4.0894026696647956e-05, + "loss": 0.7135, + "step": 116900 + }, + { + "epoch": 6.06, + "learning_rate": 4.086260771282636e-05, + "loss": 0.675, + "step": 117000 + }, + { + "epoch": 6.06, + "learning_rate": 4.083117501073725e-05, + "loss": 0.6726, + "step": 117100 + }, + { + "epoch": 6.07, + "learning_rate": 4.079972863007666e-05, + "loss": 0.6296, + "step": 117200 + }, + { + "epoch": 6.07, + "learning_rate": 4.0768268610557875e-05, + "loss": 0.6291, + "step": 117300 + }, + { + "epoch": 6.08, + "learning_rate": 4.0736794991911404e-05, + "loss": 0.6297, + "step": 117400 + }, + { + "epoch": 6.08, + "learning_rate": 4.070530781388494e-05, + "loss": 0.5904, + "step": 117500 + }, + { + "epoch": 6.09, + "learning_rate": 4.067380711624329e-05, + "loss": 0.6298, + "step": 117600 + }, + { + "epoch": 6.09, + "learning_rate": 4.0642292938768317e-05, + "loss": 0.6538, + "step": 117700 + }, + { + "epoch": 6.1, + "learning_rate": 4.0610765321258955e-05, + "loss": 0.7108, + "step": 117800 + }, + { + "epoch": 6.1, + "learning_rate": 4.057922430353108e-05, + "loss": 0.6498, + "step": 117900 + }, + { + "epoch": 6.11, + "learning_rate": 4.0547669925417485e-05, + "loss": 0.5904, + "step": 118000 + }, + { + "epoch": 6.12, + "learning_rate": 4.051610222676785e-05, + "loss": 0.7362, + "step": 118100 + }, + { + "epoch": 6.12, + "learning_rate": 4.048452124744868e-05, + "loss": 0.7146, + "step": 118200 + }, + { + "epoch": 6.13, + "learning_rate": 4.0452927027343234e-05, + "loss": 0.641, + "step": 118300 + }, + { + "epoch": 6.13, + "learning_rate": 4.0421319606351514e-05, + "loss": 0.7092, + "step": 118400 + }, + { + "epoch": 6.14, + "learning_rate": 4.038969902439018e-05, + "loss": 0.6569, + "step": 118500 + }, + { + "epoch": 6.14, + "learning_rate": 4.035806532139253e-05, + "loss": 0.6219, + "step": 118600 + }, + { + "epoch": 6.15, + "learning_rate": 4.032641853730839e-05, + "loss": 0.6279, + "step": 118700 + }, + { + "epoch": 6.15, + "learning_rate": 4.0294758712104154e-05, + "loss": 0.6412, + "step": 118800 + }, + { + "epoch": 6.16, + "learning_rate": 4.0263085885762665e-05, + "loss": 0.7391, + "step": 118900 + }, + { + "epoch": 6.16, + "learning_rate": 4.023140009828318e-05, + "loss": 0.6782, + "step": 119000 + }, + { + "epoch": 6.17, + "learning_rate": 4.019970138968134e-05, + "loss": 0.6498, + "step": 119100 + }, + { + "epoch": 6.17, + "learning_rate": 4.016798979998907e-05, + "loss": 0.6338, + "step": 119200 + }, + { + "epoch": 6.18, + "learning_rate": 4.013626536925463e-05, + "loss": 0.6382, + "step": 119300 + }, + { + "epoch": 6.18, + "learning_rate": 4.0104528137542415e-05, + "loss": 0.7003, + "step": 119400 + }, + { + "epoch": 6.19, + "learning_rate": 4.007277814493305e-05, + "loss": 0.6801, + "step": 119500 + }, + { + "epoch": 6.19, + "learning_rate": 4.004101543152322e-05, + "loss": 0.721, + "step": 119600 + }, + { + "epoch": 6.2, + "learning_rate": 4.000924003742575e-05, + "loss": 0.578, + "step": 119700 + }, + { + "epoch": 6.2, + "learning_rate": 3.997745200276939e-05, + "loss": 0.6042, + "step": 119800 + }, + { + "epoch": 6.21, + "learning_rate": 3.994565136769892e-05, + "loss": 0.6644, + "step": 119900 + }, + { + "epoch": 6.21, + "learning_rate": 3.9913838172375014e-05, + "loss": 0.6669, + "step": 120000 + }, + { + "epoch": 6.22, + "learning_rate": 3.98820124569742e-05, + "loss": 0.6534, + "step": 120100 + }, + { + "epoch": 6.22, + "learning_rate": 3.985017426168883e-05, + "loss": 0.618, + "step": 120200 + }, + { + "epoch": 6.23, + "learning_rate": 3.9818323626727004e-05, + "loss": 0.6918, + "step": 120300 + }, + { + "epoch": 6.23, + "learning_rate": 3.9786460592312535e-05, + "loss": 0.6987, + "step": 120400 + }, + { + "epoch": 6.24, + "learning_rate": 3.9754585198684906e-05, + "loss": 0.6486, + "step": 120500 + }, + { + "epoch": 6.24, + "learning_rate": 3.972269748609919e-05, + "loss": 0.6118, + "step": 120600 + }, + { + "epoch": 6.25, + "learning_rate": 3.969079749482602e-05, + "loss": 0.6117, + "step": 120700 + }, + { + "epoch": 6.25, + "learning_rate": 3.9658885265151575e-05, + "loss": 0.6317, + "step": 120800 + }, + { + "epoch": 6.26, + "learning_rate": 3.9626960837377425e-05, + "loss": 0.6415, + "step": 120900 + }, + { + "epoch": 6.27, + "learning_rate": 3.959502425182059e-05, + "loss": 0.6018, + "step": 121000 + }, + { + "epoch": 6.27, + "learning_rate": 3.956307554881345e-05, + "loss": 0.7095, + "step": 121100 + }, + { + "epoch": 6.28, + "learning_rate": 3.953111476870364e-05, + "loss": 0.5965, + "step": 121200 + }, + { + "epoch": 6.28, + "learning_rate": 3.949914195185409e-05, + "loss": 0.6149, + "step": 121300 + }, + { + "epoch": 6.29, + "learning_rate": 3.9467157138642925e-05, + "loss": 0.6564, + "step": 121400 + }, + { + "epoch": 6.29, + "learning_rate": 3.9435160369463393e-05, + "loss": 0.6621, + "step": 121500 + }, + { + "epoch": 6.3, + "learning_rate": 3.9403151684723886e-05, + "loss": 0.7013, + "step": 121600 + }, + { + "epoch": 6.3, + "learning_rate": 3.9371131124847796e-05, + "loss": 0.704, + "step": 121700 + }, + { + "epoch": 6.31, + "learning_rate": 3.933909873027355e-05, + "loss": 0.6063, + "step": 121800 + }, + { + "epoch": 6.31, + "learning_rate": 3.93070545414545e-05, + "loss": 0.6725, + "step": 121900 + }, + { + "epoch": 6.32, + "learning_rate": 3.92749985988589e-05, + "loss": 0.6381, + "step": 122000 + }, + { + "epoch": 6.32, + "learning_rate": 3.924325167737658e-05, + "loss": 0.6149, + "step": 122100 + }, + { + "epoch": 6.33, + "learning_rate": 3.92111724652194e-05, + "loss": 0.6111, + "step": 122200 + }, + { + "epoch": 6.33, + "learning_rate": 3.917908162037409e-05, + "loss": 0.6689, + "step": 122300 + }, + { + "epoch": 6.34, + "learning_rate": 3.914697918336782e-05, + "loss": 0.6897, + "step": 122400 + }, + { + "epoch": 6.34, + "learning_rate": 3.911486519474241e-05, + "loss": 0.6236, + "step": 122500 + }, + { + "epoch": 6.35, + "learning_rate": 3.908273969505425e-05, + "loss": 0.6442, + "step": 122600 + }, + { + "epoch": 6.35, + "learning_rate": 3.905060272487429e-05, + "loss": 0.6472, + "step": 122700 + }, + { + "epoch": 6.36, + "learning_rate": 3.9018454324787946e-05, + "loss": 0.6484, + "step": 122800 + }, + { + "epoch": 6.36, + "learning_rate": 3.8986294535395086e-05, + "loss": 0.6062, + "step": 122900 + }, + { + "epoch": 6.37, + "learning_rate": 3.895412339730995e-05, + "loss": 0.6842, + "step": 123000 + }, + { + "epoch": 6.37, + "learning_rate": 3.892194095116111e-05, + "loss": 0.6999, + "step": 123100 + }, + { + "epoch": 6.38, + "learning_rate": 3.888974723759143e-05, + "loss": 0.6224, + "step": 123200 + }, + { + "epoch": 6.38, + "learning_rate": 3.8857542297258e-05, + "loss": 0.6343, + "step": 123300 + }, + { + "epoch": 6.39, + "learning_rate": 3.882532617083206e-05, + "loss": 0.643, + "step": 123400 + }, + { + "epoch": 6.39, + "learning_rate": 3.879309889899903e-05, + "loss": 0.64, + "step": 123500 + }, + { + "epoch": 6.4, + "learning_rate": 3.876086052245835e-05, + "loss": 0.7578, + "step": 123600 + }, + { + "epoch": 6.41, + "learning_rate": 3.872861108192354e-05, + "loss": 0.6281, + "step": 123700 + }, + { + "epoch": 6.41, + "learning_rate": 3.869635061812203e-05, + "loss": 0.6344, + "step": 123800 + }, + { + "epoch": 6.42, + "learning_rate": 3.866407917179524e-05, + "loss": 0.6059, + "step": 123900 + }, + { + "epoch": 6.42, + "learning_rate": 3.8631796783698384e-05, + "loss": 0.6236, + "step": 124000 + }, + { + "epoch": 6.43, + "learning_rate": 3.8599503494600566e-05, + "loss": 0.6006, + "step": 124100 + }, + { + "epoch": 6.43, + "learning_rate": 3.856719934528461e-05, + "loss": 0.657, + "step": 124200 + }, + { + "epoch": 6.44, + "learning_rate": 3.8534884376547066e-05, + "loss": 0.6742, + "step": 124300 + }, + { + "epoch": 6.44, + "learning_rate": 3.850255862919816e-05, + "loss": 0.6213, + "step": 124400 + }, + { + "epoch": 6.45, + "learning_rate": 3.847022214406172e-05, + "loss": 0.5855, + "step": 124500 + }, + { + "epoch": 6.45, + "learning_rate": 3.843787496197515e-05, + "loss": 0.5984, + "step": 124600 + }, + { + "epoch": 6.46, + "learning_rate": 3.8405517123789315e-05, + "loss": 0.6884, + "step": 124700 + }, + { + "epoch": 6.46, + "learning_rate": 3.837314867036861e-05, + "loss": 0.5899, + "step": 124800 + }, + { + "epoch": 6.47, + "learning_rate": 3.834076964259078e-05, + "loss": 0.7443, + "step": 124900 + }, + { + "epoch": 6.47, + "learning_rate": 3.830838008134694e-05, + "loss": 0.6178, + "step": 125000 + }, + { + "epoch": 6.48, + "learning_rate": 3.8276304079883395e-05, + "loss": 0.6905, + "step": 125100 + }, + { + "epoch": 6.48, + "learning_rate": 3.8243893678747906e-05, + "loss": 0.6043, + "step": 125200 + }, + { + "epoch": 6.49, + "learning_rate": 3.8211472866489994e-05, + "loss": 0.6439, + "step": 125300 + }, + { + "epoch": 6.49, + "learning_rate": 3.817904168405355e-05, + "loss": 0.6254, + "step": 125400 + }, + { + "epoch": 6.5, + "learning_rate": 3.814660017239555e-05, + "loss": 0.6638, + "step": 125500 + }, + { + "epoch": 6.5, + "learning_rate": 3.811414837248603e-05, + "loss": 0.5851, + "step": 125600 + }, + { + "epoch": 6.51, + "learning_rate": 3.8081686325308004e-05, + "loss": 0.5789, + "step": 125700 + }, + { + "epoch": 6.51, + "learning_rate": 3.804921407185743e-05, + "loss": 0.6397, + "step": 125800 + }, + { + "epoch": 6.52, + "learning_rate": 3.801673165314318e-05, + "loss": 0.5918, + "step": 125900 + }, + { + "epoch": 6.52, + "learning_rate": 3.798423911018691e-05, + "loss": 0.6261, + "step": 126000 + }, + { + "epoch": 6.53, + "learning_rate": 3.795173648402312e-05, + "loss": 0.6259, + "step": 126100 + }, + { + "epoch": 6.53, + "learning_rate": 3.791922381569901e-05, + "loss": 0.6493, + "step": 126200 + }, + { + "epoch": 6.54, + "learning_rate": 3.788670114627447e-05, + "loss": 0.6243, + "step": 126300 + }, + { + "epoch": 6.54, + "learning_rate": 3.785416851682201e-05, + "loss": 0.5652, + "step": 126400 + }, + { + "epoch": 6.55, + "learning_rate": 3.782195144287454e-05, + "loss": 0.6096, + "step": 126500 + }, + { + "epoch": 6.56, + "learning_rate": 3.778939911520906e-05, + "loss": 0.5848, + "step": 126600 + }, + { + "epoch": 6.56, + "learning_rate": 3.775683695039735e-05, + "loss": 0.608, + "step": 126700 + }, + { + "epoch": 6.57, + "learning_rate": 3.7724264989561774e-05, + "loss": 0.5728, + "step": 126800 + }, + { + "epoch": 6.57, + "learning_rate": 3.769168327383713e-05, + "loss": 0.617, + "step": 126900 + }, + { + "epoch": 6.58, + "learning_rate": 3.7659091844370494e-05, + "loss": 0.6545, + "step": 127000 + }, + { + "epoch": 6.58, + "learning_rate": 3.7626490742321226e-05, + "loss": 0.6609, + "step": 127100 + }, + { + "epoch": 6.59, + "learning_rate": 3.75938800088609e-05, + "loss": 0.6689, + "step": 127200 + }, + { + "epoch": 6.59, + "learning_rate": 3.756125968517324e-05, + "loss": 0.5786, + "step": 127300 + }, + { + "epoch": 6.6, + "learning_rate": 3.752862981245411e-05, + "loss": 0.6583, + "step": 127400 + }, + { + "epoch": 6.6, + "learning_rate": 3.7495990431911404e-05, + "loss": 0.6339, + "step": 127500 + }, + { + "epoch": 6.61, + "learning_rate": 3.746334158476506e-05, + "loss": 0.634, + "step": 127600 + }, + { + "epoch": 6.61, + "learning_rate": 3.74306833122469e-05, + "loss": 0.6532, + "step": 127700 + }, + { + "epoch": 6.62, + "learning_rate": 3.739801565560075e-05, + "loss": 0.6319, + "step": 127800 + }, + { + "epoch": 6.62, + "learning_rate": 3.736533865608219e-05, + "loss": 0.7002, + "step": 127900 + }, + { + "epoch": 6.63, + "learning_rate": 3.733265235495866e-05, + "loss": 0.621, + "step": 128000 + }, + { + "epoch": 6.63, + "learning_rate": 3.729995679350934e-05, + "loss": 0.6048, + "step": 128100 + }, + { + "epoch": 6.64, + "learning_rate": 3.726725201302507e-05, + "loss": 0.7234, + "step": 128200 + }, + { + "epoch": 6.64, + "learning_rate": 3.723453805480838e-05, + "loss": 0.6741, + "step": 128300 + }, + { + "epoch": 6.65, + "learning_rate": 3.720181496017335e-05, + "loss": 0.6612, + "step": 128400 + }, + { + "epoch": 6.65, + "learning_rate": 3.716908277044563e-05, + "loss": 0.6609, + "step": 128500 + }, + { + "epoch": 6.66, + "learning_rate": 3.713634152696233e-05, + "loss": 0.6778, + "step": 128600 + }, + { + "epoch": 6.66, + "learning_rate": 3.710359127107201e-05, + "loss": 0.6509, + "step": 128700 + }, + { + "epoch": 6.67, + "learning_rate": 3.70708320441346e-05, + "loss": 0.6462, + "step": 128800 + }, + { + "epoch": 6.67, + "learning_rate": 3.703806388752138e-05, + "loss": 0.6561, + "step": 128900 + }, + { + "epoch": 6.68, + "learning_rate": 3.7005286842614876e-05, + "loss": 0.6187, + "step": 129000 + }, + { + "epoch": 6.68, + "learning_rate": 3.6972500950808875e-05, + "loss": 0.6868, + "step": 129100 + }, + { + "epoch": 6.69, + "learning_rate": 3.6939706253508306e-05, + "loss": 0.628, + "step": 129200 + }, + { + "epoch": 6.69, + "learning_rate": 3.6906902792129243e-05, + "loss": 0.6163, + "step": 129300 + }, + { + "epoch": 6.7, + "learning_rate": 3.68740906080988e-05, + "loss": 0.5937, + "step": 129400 + }, + { + "epoch": 6.71, + "learning_rate": 3.684126974285513e-05, + "loss": 0.681, + "step": 129500 + }, + { + "epoch": 6.71, + "learning_rate": 3.680844023784734e-05, + "loss": 0.631, + "step": 129600 + }, + { + "epoch": 6.72, + "learning_rate": 3.6775602134535455e-05, + "loss": 0.6824, + "step": 129700 + }, + { + "epoch": 6.72, + "learning_rate": 3.674275547439035e-05, + "loss": 0.6407, + "step": 129800 + }, + { + "epoch": 6.73, + "learning_rate": 3.670990029889371e-05, + "loss": 0.6186, + "step": 129900 + }, + { + "epoch": 6.73, + "learning_rate": 3.667736532784086e-05, + "loss": 0.669, + "step": 130000 + }, + { + "epoch": 6.74, + "learning_rate": 3.664449333024725e-05, + "loss": 0.62, + "step": 130100 + }, + { + "epoch": 6.74, + "learning_rate": 3.6611612941396287e-05, + "loss": 0.7114, + "step": 130200 + }, + { + "epoch": 6.75, + "learning_rate": 3.6578724202812236e-05, + "loss": 0.6253, + "step": 130300 + }, + { + "epoch": 6.75, + "learning_rate": 3.6545827156029946e-05, + "loss": 0.6395, + "step": 130400 + }, + { + "epoch": 6.76, + "learning_rate": 3.6512921842594716e-05, + "loss": 0.6544, + "step": 130500 + }, + { + "epoch": 6.76, + "learning_rate": 3.64800083040623e-05, + "loss": 0.6112, + "step": 130600 + }, + { + "epoch": 6.77, + "learning_rate": 3.644708658199887e-05, + "loss": 0.6396, + "step": 130700 + }, + { + "epoch": 6.77, + "learning_rate": 3.6414156717980885e-05, + "loss": 0.6016, + "step": 130800 + }, + { + "epoch": 6.78, + "learning_rate": 3.638121875359511e-05, + "loss": 0.5658, + "step": 130900 + }, + { + "epoch": 6.78, + "learning_rate": 3.634827273043853e-05, + "loss": 0.6806, + "step": 131000 + }, + { + "epoch": 6.79, + "learning_rate": 3.6315318690118336e-05, + "loss": 0.6453, + "step": 131100 + }, + { + "epoch": 6.79, + "learning_rate": 3.6282356674251795e-05, + "loss": 0.6659, + "step": 131200 + }, + { + "epoch": 6.8, + "learning_rate": 3.624938672446629e-05, + "loss": 0.6963, + "step": 131300 + }, + { + "epoch": 6.8, + "learning_rate": 3.6216408882399205e-05, + "loss": 0.6495, + "step": 131400 + }, + { + "epoch": 6.81, + "learning_rate": 3.6183423189697887e-05, + "loss": 0.5949, + "step": 131500 + }, + { + "epoch": 6.81, + "learning_rate": 3.615042968801961e-05, + "loss": 0.6344, + "step": 131600 + }, + { + "epoch": 6.82, + "learning_rate": 3.6117428419031506e-05, + "loss": 0.654, + "step": 131700 + }, + { + "epoch": 6.82, + "learning_rate": 3.608441942441051e-05, + "loss": 0.7161, + "step": 131800 + }, + { + "epoch": 6.83, + "learning_rate": 3.605140274584331e-05, + "loss": 0.6516, + "step": 131900 + }, + { + "epoch": 6.83, + "learning_rate": 3.601837842502632e-05, + "loss": 0.6429, + "step": 132000 + }, + { + "epoch": 6.84, + "learning_rate": 3.598534650366557e-05, + "loss": 0.6813, + "step": 132100 + }, + { + "epoch": 6.85, + "learning_rate": 3.5952307023476735e-05, + "loss": 0.6645, + "step": 132200 + }, + { + "epoch": 6.85, + "learning_rate": 3.591926002618499e-05, + "loss": 0.6393, + "step": 132300 + }, + { + "epoch": 6.86, + "learning_rate": 3.5886205553525036e-05, + "loss": 0.5708, + "step": 132400 + }, + { + "epoch": 6.86, + "learning_rate": 3.585314364724099e-05, + "loss": 0.5741, + "step": 132500 + }, + { + "epoch": 6.87, + "learning_rate": 3.5820074349086376e-05, + "loss": 0.6672, + "step": 132600 + }, + { + "epoch": 6.87, + "learning_rate": 3.5786997700824056e-05, + "loss": 0.7122, + "step": 132700 + }, + { + "epoch": 6.88, + "learning_rate": 3.575391374422614e-05, + "loss": 0.6256, + "step": 132800 + }, + { + "epoch": 6.88, + "learning_rate": 3.5720822521074014e-05, + "loss": 0.6111, + "step": 132900 + }, + { + "epoch": 6.89, + "learning_rate": 3.56877240731582e-05, + "loss": 0.6476, + "step": 133000 + }, + { + "epoch": 6.89, + "learning_rate": 3.5654618442278394e-05, + "loss": 0.5478, + "step": 133100 + }, + { + "epoch": 6.9, + "learning_rate": 3.5621505670243285e-05, + "loss": 0.5939, + "step": 133200 + }, + { + "epoch": 6.9, + "learning_rate": 3.5588385798870666e-05, + "loss": 0.6257, + "step": 133300 + }, + { + "epoch": 6.91, + "learning_rate": 3.555525886998725e-05, + "loss": 0.6488, + "step": 133400 + }, + { + "epoch": 6.91, + "learning_rate": 3.552212492542866e-05, + "loss": 0.6461, + "step": 133500 + }, + { + "epoch": 6.92, + "learning_rate": 3.54889840070394e-05, + "loss": 0.6159, + "step": 133600 + }, + { + "epoch": 6.92, + "learning_rate": 3.545583615667276e-05, + "loss": 0.6886, + "step": 133700 + }, + { + "epoch": 6.93, + "learning_rate": 3.542268141619081e-05, + "loss": 0.5951, + "step": 133800 + }, + { + "epoch": 6.93, + "learning_rate": 3.5389519827464286e-05, + "loss": 0.6032, + "step": 133900 + }, + { + "epoch": 6.94, + "learning_rate": 3.535635143237261e-05, + "loss": 0.6592, + "step": 134000 + }, + { + "epoch": 6.94, + "learning_rate": 3.532317627280376e-05, + "loss": 0.6893, + "step": 134100 + }, + { + "epoch": 6.95, + "learning_rate": 3.5289994390654305e-05, + "loss": 0.6331, + "step": 134200 + }, + { + "epoch": 6.95, + "learning_rate": 3.525680582782927e-05, + "loss": 0.6415, + "step": 134300 + }, + { + "epoch": 6.96, + "learning_rate": 3.522394261098223e-05, + "loss": 0.6603, + "step": 134400 + }, + { + "epoch": 6.96, + "learning_rate": 3.5190740878315674e-05, + "loss": 0.5925, + "step": 134500 + }, + { + "epoch": 6.97, + "learning_rate": 3.5157532590319715e-05, + "loss": 0.6227, + "step": 134600 + }, + { + "epoch": 6.97, + "learning_rate": 3.512431778893271e-05, + "loss": 0.6268, + "step": 134700 + }, + { + "epoch": 6.98, + "learning_rate": 3.509109651610129e-05, + "loss": 0.6578, + "step": 134800 + }, + { + "epoch": 6.98, + "learning_rate": 3.505786881378021e-05, + "loss": 0.5979, + "step": 134900 + }, + { + "epoch": 6.99, + "learning_rate": 3.5024634723932385e-05, + "loss": 0.6515, + "step": 135000 + }, + { + "epoch": 7.0, + "learning_rate": 3.499139428852877e-05, + "loss": 0.6007, + "step": 135100 + }, + { + "epoch": 7.0, + "eval_accuracy": 0.6233020736253495, + "eval_cer": 0.1471199137926978, + "eval_loss": 0.7827567458152771, + "eval_runtime": 4701.066, + "eval_samples_per_second": 3.652, + "eval_steps_per_second": 0.228, + "eval_wer": 0.3108699488265396, + "step": 135191 + }, + { + "epoch": 7.0, + "learning_rate": 3.4958147549548344e-05, + "loss": 0.6295, + "step": 135200 + }, + { + "epoch": 7.01, + "learning_rate": 3.492489454897807e-05, + "loss": 0.4985, + "step": 135300 + }, + { + "epoch": 7.01, + "learning_rate": 3.4891635328812754e-05, + "loss": 0.5288, + "step": 135400 + }, + { + "epoch": 7.02, + "learning_rate": 3.485836993105514e-05, + "loss": 0.5136, + "step": 135500 + }, + { + "epoch": 7.02, + "learning_rate": 3.48250983977157e-05, + "loss": 0.5103, + "step": 135600 + }, + { + "epoch": 7.03, + "learning_rate": 3.479182077081272e-05, + "loss": 0.6064, + "step": 135700 + }, + { + "epoch": 7.03, + "learning_rate": 3.4758537092372105e-05, + "loss": 0.5331, + "step": 135800 + }, + { + "epoch": 7.04, + "learning_rate": 3.472524740442749e-05, + "loss": 0.5674, + "step": 135900 + }, + { + "epoch": 7.04, + "learning_rate": 3.469195174902002e-05, + "loss": 0.5853, + "step": 136000 + }, + { + "epoch": 7.05, + "learning_rate": 3.465865016819843e-05, + "loss": 0.5743, + "step": 136100 + }, + { + "epoch": 7.05, + "learning_rate": 3.462534270401891e-05, + "loss": 0.5413, + "step": 136200 + }, + { + "epoch": 7.06, + "learning_rate": 3.4592029398545105e-05, + "loss": 0.4956, + "step": 136300 + }, + { + "epoch": 7.06, + "learning_rate": 3.455871029384801e-05, + "loss": 0.5276, + "step": 136400 + }, + { + "epoch": 7.07, + "learning_rate": 3.452538543200594e-05, + "loss": 0.5519, + "step": 136500 + }, + { + "epoch": 7.07, + "learning_rate": 3.449205485510451e-05, + "loss": 0.5254, + "step": 136600 + }, + { + "epoch": 7.08, + "learning_rate": 3.445871860523654e-05, + "loss": 0.5327, + "step": 136700 + }, + { + "epoch": 7.08, + "learning_rate": 3.442537672450202e-05, + "loss": 0.5509, + "step": 136800 + }, + { + "epoch": 7.09, + "learning_rate": 3.4392029255008035e-05, + "loss": 0.4957, + "step": 136900 + }, + { + "epoch": 7.09, + "learning_rate": 3.435867623886872e-05, + "loss": 0.531, + "step": 137000 + }, + { + "epoch": 7.1, + "learning_rate": 3.432531771820526e-05, + "loss": 0.5403, + "step": 137100 + }, + { + "epoch": 7.1, + "learning_rate": 3.429195373514574e-05, + "loss": 0.5113, + "step": 137200 + }, + { + "epoch": 7.11, + "learning_rate": 3.4258584331825185e-05, + "loss": 0.5026, + "step": 137300 + }, + { + "epoch": 7.11, + "learning_rate": 3.422520955038543e-05, + "loss": 0.5408, + "step": 137400 + }, + { + "epoch": 7.12, + "learning_rate": 3.419182943297513e-05, + "loss": 0.4939, + "step": 137500 + }, + { + "epoch": 7.12, + "learning_rate": 3.415844402174967e-05, + "loss": 0.5522, + "step": 137600 + }, + { + "epoch": 7.13, + "learning_rate": 3.412505335887109e-05, + "loss": 0.5576, + "step": 137700 + }, + { + "epoch": 7.14, + "learning_rate": 3.4091657486508125e-05, + "loss": 0.5742, + "step": 137800 + }, + { + "epoch": 7.14, + "learning_rate": 3.4058256446836035e-05, + "loss": 0.5466, + "step": 137900 + }, + { + "epoch": 7.15, + "learning_rate": 3.402485028203664e-05, + "loss": 0.5434, + "step": 138000 + }, + { + "epoch": 7.15, + "learning_rate": 3.399143903429819e-05, + "loss": 0.5741, + "step": 138100 + }, + { + "epoch": 7.16, + "learning_rate": 3.395835693351336e-05, + "loss": 0.5013, + "step": 138200 + }, + { + "epoch": 7.16, + "learning_rate": 3.3924935696263814e-05, + "loss": 0.5658, + "step": 138300 + }, + { + "epoch": 7.17, + "learning_rate": 3.389150950225627e-05, + "loss": 0.5626, + "step": 138400 + }, + { + "epoch": 7.17, + "learning_rate": 3.3858078393704255e-05, + "loss": 0.5064, + "step": 138500 + }, + { + "epoch": 7.18, + "learning_rate": 3.3824642412827605e-05, + "loss": 0.5213, + "step": 138600 + }, + { + "epoch": 7.18, + "learning_rate": 3.379120160185222e-05, + "loss": 0.5777, + "step": 138700 + }, + { + "epoch": 7.19, + "learning_rate": 3.375775600301014e-05, + "loss": 0.5134, + "step": 138800 + }, + { + "epoch": 7.19, + "learning_rate": 3.3724305658539445e-05, + "loss": 0.5304, + "step": 138900 + }, + { + "epoch": 7.2, + "learning_rate": 3.3690850610684195e-05, + "loss": 0.5252, + "step": 139000 + }, + { + "epoch": 7.2, + "learning_rate": 3.365739090169441e-05, + "loss": 0.5443, + "step": 139100 + }, + { + "epoch": 7.21, + "learning_rate": 3.362392657382598e-05, + "loss": 0.5533, + "step": 139200 + }, + { + "epoch": 7.21, + "learning_rate": 3.359045766934066e-05, + "loss": 0.6242, + "step": 139300 + }, + { + "epoch": 7.22, + "learning_rate": 3.355731898720051e-05, + "loss": 0.5322, + "step": 139400 + }, + { + "epoch": 7.22, + "learning_rate": 3.352384110100111e-05, + "loss": 0.6311, + "step": 139500 + }, + { + "epoch": 7.23, + "learning_rate": 3.3490358764581634e-05, + "loss": 0.5272, + "step": 139600 + }, + { + "epoch": 7.23, + "learning_rate": 3.345687202022657e-05, + "loss": 0.6052, + "step": 139700 + }, + { + "epoch": 7.24, + "learning_rate": 3.342338091022594e-05, + "loss": 0.5603, + "step": 139800 + }, + { + "epoch": 7.24, + "learning_rate": 3.338988547687533e-05, + "loss": 0.578, + "step": 139900 + }, + { + "epoch": 7.25, + "learning_rate": 3.335638576247572e-05, + "loss": 0.5756, + "step": 140000 + }, + { + "epoch": 7.25, + "learning_rate": 3.3322881809333544e-05, + "loss": 0.523, + "step": 140100 + }, + { + "epoch": 7.26, + "learning_rate": 3.328937365976057e-05, + "loss": 0.6046, + "step": 140200 + }, + { + "epoch": 7.26, + "learning_rate": 3.3255861356073875e-05, + "loss": 0.5995, + "step": 140300 + }, + { + "epoch": 7.27, + "learning_rate": 3.322234494059578e-05, + "loss": 0.5843, + "step": 140400 + }, + { + "epoch": 7.27, + "learning_rate": 3.3188824455653793e-05, + "loss": 0.5643, + "step": 140500 + }, + { + "epoch": 7.28, + "learning_rate": 3.315529994358056e-05, + "loss": 0.5653, + "step": 140600 + }, + { + "epoch": 7.29, + "learning_rate": 3.312177144671381e-05, + "loss": 0.5712, + "step": 140700 + }, + { + "epoch": 7.29, + "learning_rate": 3.3088239007396345e-05, + "loss": 0.5376, + "step": 140800 + }, + { + "epoch": 7.3, + "learning_rate": 3.305470266797588e-05, + "loss": 0.6073, + "step": 140900 + }, + { + "epoch": 7.3, + "learning_rate": 3.302116247080511e-05, + "loss": 0.5558, + "step": 141000 + }, + { + "epoch": 7.31, + "learning_rate": 3.298761845824156e-05, + "loss": 0.5691, + "step": 141100 + }, + { + "epoch": 7.31, + "learning_rate": 3.2954070672647615e-05, + "loss": 0.5601, + "step": 141200 + }, + { + "epoch": 7.32, + "learning_rate": 3.2920519156390386e-05, + "loss": 0.5355, + "step": 141300 + }, + { + "epoch": 7.32, + "learning_rate": 3.288696395184172e-05, + "loss": 0.5195, + "step": 141400 + }, + { + "epoch": 7.33, + "learning_rate": 3.285340510137811e-05, + "loss": 0.5234, + "step": 141500 + }, + { + "epoch": 7.33, + "learning_rate": 3.281984264738067e-05, + "loss": 0.512, + "step": 141600 + }, + { + "epoch": 7.34, + "learning_rate": 3.278627663223504e-05, + "loss": 0.5434, + "step": 141700 + }, + { + "epoch": 7.34, + "learning_rate": 3.275270709833138e-05, + "loss": 0.6089, + "step": 141800 + }, + { + "epoch": 7.35, + "learning_rate": 3.271913408806427e-05, + "loss": 0.5515, + "step": 141900 + }, + { + "epoch": 7.35, + "learning_rate": 3.268555764383271e-05, + "loss": 0.5667, + "step": 142000 + }, + { + "epoch": 7.36, + "learning_rate": 3.2651977808040025e-05, + "loss": 0.5399, + "step": 142100 + }, + { + "epoch": 7.36, + "learning_rate": 3.26183946230938e-05, + "loss": 0.5176, + "step": 142200 + }, + { + "epoch": 7.37, + "learning_rate": 3.2584808131405875e-05, + "loss": 0.5678, + "step": 142300 + }, + { + "epoch": 7.37, + "learning_rate": 3.255121837539227e-05, + "loss": 0.5264, + "step": 142400 + }, + { + "epoch": 7.38, + "learning_rate": 3.251762539747312e-05, + "loss": 0.5497, + "step": 142500 + }, + { + "epoch": 7.38, + "learning_rate": 3.2484029240072605e-05, + "loss": 0.5119, + "step": 142600 + }, + { + "epoch": 7.39, + "learning_rate": 3.245042994561896e-05, + "loss": 0.502, + "step": 142700 + }, + { + "epoch": 7.39, + "learning_rate": 3.241682755654436e-05, + "loss": 0.5123, + "step": 142800 + }, + { + "epoch": 7.4, + "learning_rate": 3.238322211528488e-05, + "loss": 0.5582, + "step": 142900 + }, + { + "epoch": 7.4, + "learning_rate": 3.234961366428048e-05, + "loss": 0.5432, + "step": 143000 + }, + { + "epoch": 7.41, + "learning_rate": 3.231600224597489e-05, + "loss": 0.5886, + "step": 143100 + }, + { + "epoch": 7.41, + "learning_rate": 3.22823879028156e-05, + "loss": 0.546, + "step": 143200 + }, + { + "epoch": 7.42, + "learning_rate": 3.22487706772538e-05, + "loss": 0.5494, + "step": 143300 + }, + { + "epoch": 7.43, + "learning_rate": 3.2215150611744304e-05, + "loss": 0.5608, + "step": 143400 + }, + { + "epoch": 7.43, + "learning_rate": 3.218152774874554e-05, + "loss": 0.5305, + "step": 143500 + }, + { + "epoch": 7.44, + "learning_rate": 3.214790213071942e-05, + "loss": 0.538, + "step": 143600 + }, + { + "epoch": 7.44, + "learning_rate": 3.21142738001314e-05, + "loss": 0.5307, + "step": 143700 + }, + { + "epoch": 7.45, + "learning_rate": 3.2080642799450296e-05, + "loss": 0.5585, + "step": 143800 + }, + { + "epoch": 7.45, + "learning_rate": 3.2047009171148365e-05, + "loss": 0.5091, + "step": 143900 + }, + { + "epoch": 7.46, + "learning_rate": 3.20133729577011e-05, + "loss": 0.5686, + "step": 144000 + }, + { + "epoch": 7.46, + "learning_rate": 3.1979734201587344e-05, + "loss": 0.4615, + "step": 144100 + }, + { + "epoch": 7.47, + "learning_rate": 3.1946092945289095e-05, + "loss": 0.5033, + "step": 144200 + }, + { + "epoch": 7.47, + "learning_rate": 3.1912449231291525e-05, + "loss": 0.5426, + "step": 144300 + }, + { + "epoch": 7.48, + "learning_rate": 3.1878803102082905e-05, + "loss": 0.5009, + "step": 144400 + }, + { + "epoch": 7.48, + "learning_rate": 3.184515460015456e-05, + "loss": 0.5021, + "step": 144500 + }, + { + "epoch": 7.49, + "learning_rate": 3.1811503768000836e-05, + "loss": 0.5141, + "step": 144600 + }, + { + "epoch": 7.49, + "learning_rate": 3.1777850648118965e-05, + "loss": 0.5724, + "step": 144700 + }, + { + "epoch": 7.5, + "learning_rate": 3.174419528300912e-05, + "loss": 0.509, + "step": 144800 + }, + { + "epoch": 7.5, + "learning_rate": 3.171053771517428e-05, + "loss": 0.5749, + "step": 144900 + }, + { + "epoch": 7.51, + "learning_rate": 3.167687798712022e-05, + "loss": 0.5917, + "step": 145000 + }, + { + "epoch": 7.51, + "learning_rate": 3.1643216141355446e-05, + "loss": 0.5789, + "step": 145100 + }, + { + "epoch": 7.52, + "learning_rate": 3.1609552220391134e-05, + "loss": 0.5656, + "step": 145200 + }, + { + "epoch": 7.52, + "learning_rate": 3.157588626674106e-05, + "loss": 0.5222, + "step": 145300 + }, + { + "epoch": 7.53, + "learning_rate": 3.154221832292161e-05, + "loss": 0.4999, + "step": 145400 + }, + { + "epoch": 7.53, + "learning_rate": 3.150854843145163e-05, + "loss": 0.5091, + "step": 145500 + }, + { + "epoch": 7.54, + "learning_rate": 3.147487663485249e-05, + "loss": 0.5375, + "step": 145600 + }, + { + "epoch": 7.54, + "learning_rate": 3.14412029756479e-05, + "loss": 0.544, + "step": 145700 + }, + { + "epoch": 7.55, + "learning_rate": 3.1407527496363964e-05, + "loss": 0.5443, + "step": 145800 + }, + { + "epoch": 7.55, + "learning_rate": 3.137385023952908e-05, + "loss": 0.523, + "step": 145900 + }, + { + "epoch": 7.56, + "learning_rate": 3.1340171247673866e-05, + "loss": 0.5427, + "step": 146000 + }, + { + "epoch": 7.56, + "learning_rate": 3.130649056333117e-05, + "loss": 0.5186, + "step": 146100 + }, + { + "epoch": 7.57, + "learning_rate": 3.127280822903595e-05, + "loss": 0.5422, + "step": 146200 + }, + { + "epoch": 7.58, + "learning_rate": 3.123912428732525e-05, + "loss": 0.5579, + "step": 146300 + }, + { + "epoch": 7.58, + "learning_rate": 3.120543878073816e-05, + "loss": 0.5969, + "step": 146400 + }, + { + "epoch": 7.59, + "learning_rate": 3.117175175181571e-05, + "loss": 0.5286, + "step": 146500 + }, + { + "epoch": 7.59, + "learning_rate": 3.11380632431009e-05, + "loss": 0.5439, + "step": 146600 + }, + { + "epoch": 7.6, + "learning_rate": 3.1104373297138574e-05, + "loss": 0.4923, + "step": 146700 + }, + { + "epoch": 7.6, + "learning_rate": 3.1070681956475386e-05, + "loss": 0.5593, + "step": 146800 + }, + { + "epoch": 7.61, + "learning_rate": 3.1036989263659765e-05, + "loss": 0.5485, + "step": 146900 + }, + { + "epoch": 7.61, + "learning_rate": 3.1003295261241835e-05, + "loss": 0.4644, + "step": 147000 + }, + { + "epoch": 7.62, + "learning_rate": 3.096959999177339e-05, + "loss": 0.5179, + "step": 147100 + }, + { + "epoch": 7.62, + "learning_rate": 3.0935903497807787e-05, + "loss": 0.5253, + "step": 147200 + }, + { + "epoch": 7.63, + "learning_rate": 3.09022058219e-05, + "loss": 0.5904, + "step": 147300 + }, + { + "epoch": 7.63, + "learning_rate": 3.086850700660642e-05, + "loss": 0.5803, + "step": 147400 + }, + { + "epoch": 7.64, + "learning_rate": 3.0834807094484923e-05, + "loss": 0.5077, + "step": 147500 + }, + { + "epoch": 7.64, + "learning_rate": 3.080110612809474e-05, + "loss": 0.5093, + "step": 147600 + }, + { + "epoch": 7.65, + "learning_rate": 3.0767404149996474e-05, + "loss": 0.5708, + "step": 147700 + }, + { + "epoch": 7.65, + "learning_rate": 3.073370120275196e-05, + "loss": 0.5837, + "step": 147800 + }, + { + "epoch": 7.66, + "learning_rate": 3.069999732892429e-05, + "loss": 0.5114, + "step": 147900 + }, + { + "epoch": 7.66, + "learning_rate": 3.066629257107772e-05, + "loss": 0.5691, + "step": 148000 + }, + { + "epoch": 7.67, + "learning_rate": 3.06325869717776e-05, + "loss": 0.5233, + "step": 148100 + }, + { + "epoch": 7.67, + "learning_rate": 3.059888057359037e-05, + "loss": 0.5256, + "step": 148200 + }, + { + "epoch": 7.68, + "learning_rate": 3.056517341908348e-05, + "loss": 0.4868, + "step": 148300 + }, + { + "epoch": 7.68, + "learning_rate": 3.05314655508253e-05, + "loss": 0.4624, + "step": 148400 + }, + { + "epoch": 7.69, + "learning_rate": 3.0497757011385136e-05, + "loss": 0.5497, + "step": 148500 + }, + { + "epoch": 7.69, + "learning_rate": 3.046404784333313e-05, + "loss": 0.5332, + "step": 148600 + }, + { + "epoch": 7.7, + "learning_rate": 3.043033808924023e-05, + "loss": 0.4968, + "step": 148700 + }, + { + "epoch": 7.7, + "learning_rate": 3.03969648972041e-05, + "loss": 0.5009, + "step": 148800 + }, + { + "epoch": 7.71, + "learning_rate": 3.036325410354333e-05, + "loss": 0.5167, + "step": 148900 + }, + { + "epoch": 7.72, + "learning_rate": 3.032954285113297e-05, + "loss": 0.5391, + "step": 149000 + }, + { + "epoch": 7.72, + "learning_rate": 3.0295831182546564e-05, + "loss": 0.5178, + "step": 149100 + }, + { + "epoch": 7.73, + "learning_rate": 3.0262119140358223e-05, + "loss": 0.4955, + "step": 149200 + }, + { + "epoch": 7.73, + "learning_rate": 3.0228406767142517e-05, + "loss": 0.5166, + "step": 149300 + }, + { + "epoch": 7.74, + "learning_rate": 3.0194694105474417e-05, + "loss": 0.5033, + "step": 149400 + }, + { + "epoch": 7.74, + "learning_rate": 3.016098119792928e-05, + "loss": 0.526, + "step": 149500 + }, + { + "epoch": 7.75, + "learning_rate": 3.0127268087082767e-05, + "loss": 0.4734, + "step": 149600 + }, + { + "epoch": 7.75, + "learning_rate": 3.0093554815510786e-05, + "loss": 0.5994, + "step": 149700 + }, + { + "epoch": 7.76, + "learning_rate": 3.0059841425789465e-05, + "loss": 0.5695, + "step": 149800 + }, + { + "epoch": 7.76, + "learning_rate": 3.0026127960495065e-05, + "loss": 0.5684, + "step": 149900 + }, + { + "epoch": 7.77, + "learning_rate": 2.999241446220394e-05, + "loss": 0.5203, + "step": 150000 + }, + { + "epoch": 7.77, + "learning_rate": 2.9958700973492515e-05, + "loss": 0.5049, + "step": 150100 + }, + { + "epoch": 7.78, + "learning_rate": 2.9924987536937187e-05, + "loss": 0.5597, + "step": 150200 + }, + { + "epoch": 7.78, + "learning_rate": 2.9891274195114258e-05, + "loss": 0.5307, + "step": 150300 + }, + { + "epoch": 7.79, + "learning_rate": 2.985756099059995e-05, + "loss": 0.6372, + "step": 150400 + }, + { + "epoch": 7.79, + "learning_rate": 2.98238479659703e-05, + "loss": 0.5117, + "step": 150500 + }, + { + "epoch": 7.8, + "learning_rate": 2.979013516380112e-05, + "loss": 0.5675, + "step": 150600 + }, + { + "epoch": 7.8, + "learning_rate": 2.975642262666791e-05, + "loss": 0.5168, + "step": 150700 + }, + { + "epoch": 7.81, + "learning_rate": 2.9722710397145888e-05, + "loss": 0.4552, + "step": 150800 + }, + { + "epoch": 7.81, + "learning_rate": 2.968899851780984e-05, + "loss": 0.4923, + "step": 150900 + }, + { + "epoch": 7.82, + "learning_rate": 2.9655287031234145e-05, + "loss": 0.5883, + "step": 151000 + }, + { + "epoch": 7.82, + "learning_rate": 2.9621575979992654e-05, + "loss": 0.5095, + "step": 151100 + }, + { + "epoch": 7.83, + "learning_rate": 2.9587865406658684e-05, + "loss": 0.471, + "step": 151200 + }, + { + "epoch": 7.83, + "learning_rate": 2.955415535380494e-05, + "loss": 0.5369, + "step": 151300 + }, + { + "epoch": 7.84, + "learning_rate": 2.95204458640035e-05, + "loss": 0.5351, + "step": 151400 + }, + { + "epoch": 7.84, + "learning_rate": 2.948673697982568e-05, + "loss": 0.4888, + "step": 151500 + }, + { + "epoch": 7.85, + "learning_rate": 2.9453028743842065e-05, + "loss": 0.513, + "step": 151600 + }, + { + "epoch": 7.85, + "learning_rate": 2.9419658270515565e-05, + "loss": 0.5295, + "step": 151700 + }, + { + "epoch": 7.86, + "learning_rate": 2.9385951451084732e-05, + "loss": 0.5496, + "step": 151800 + }, + { + "epoch": 7.87, + "learning_rate": 2.935224540712904e-05, + "loss": 0.5873, + "step": 151900 + }, + { + "epoch": 7.87, + "learning_rate": 2.9318540181215486e-05, + "loss": 0.5711, + "step": 152000 + }, + { + "epoch": 7.88, + "learning_rate": 2.9284835815910026e-05, + "loss": 0.5278, + "step": 152100 + }, + { + "epoch": 7.88, + "learning_rate": 2.9251469383788377e-05, + "loss": 0.5717, + "step": 152200 + }, + { + "epoch": 7.89, + "learning_rate": 2.9217766857724506e-05, + "loss": 0.5137, + "step": 152300 + }, + { + "epoch": 7.89, + "learning_rate": 2.918406531953426e-05, + "loss": 0.5104, + "step": 152400 + }, + { + "epoch": 7.9, + "learning_rate": 2.9150364811778914e-05, + "loss": 0.5148, + "step": 152500 + }, + { + "epoch": 7.9, + "learning_rate": 2.9116665377018474e-05, + "loss": 0.5313, + "step": 152600 + }, + { + "epoch": 7.91, + "learning_rate": 2.9082967057811593e-05, + "loss": 0.557, + "step": 152700 + }, + { + "epoch": 7.91, + "learning_rate": 2.9049269896715514e-05, + "loss": 0.4987, + "step": 152800 + }, + { + "epoch": 7.92, + "learning_rate": 2.9015573936285985e-05, + "loss": 0.5586, + "step": 152900 + }, + { + "epoch": 7.92, + "learning_rate": 2.8981879219077276e-05, + "loss": 0.4819, + "step": 153000 + }, + { + "epoch": 7.93, + "learning_rate": 2.894818578764208e-05, + "loss": 0.5112, + "step": 153100 + }, + { + "epoch": 7.93, + "learning_rate": 2.891449368453146e-05, + "loss": 0.5051, + "step": 153200 + }, + { + "epoch": 7.94, + "learning_rate": 2.888080295229478e-05, + "loss": 0.537, + "step": 153300 + }, + { + "epoch": 7.94, + "learning_rate": 2.884711363347972e-05, + "loss": 0.5448, + "step": 153400 + }, + { + "epoch": 7.95, + "learning_rate": 2.881342577063213e-05, + "loss": 0.5341, + "step": 153500 + }, + { + "epoch": 7.95, + "learning_rate": 2.8779739406296072e-05, + "loss": 0.5011, + "step": 153600 + }, + { + "epoch": 7.96, + "learning_rate": 2.874605458301364e-05, + "loss": 0.5377, + "step": 153700 + }, + { + "epoch": 7.96, + "learning_rate": 2.8712371343325056e-05, + "loss": 0.5191, + "step": 153800 + }, + { + "epoch": 7.97, + "learning_rate": 2.8678689729768497e-05, + "loss": 0.5079, + "step": 153900 + }, + { + "epoch": 7.97, + "learning_rate": 2.8645009784880118e-05, + "loss": 0.4986, + "step": 154000 + }, + { + "epoch": 7.98, + "learning_rate": 2.8611331551193937e-05, + "loss": 0.5484, + "step": 154100 + }, + { + "epoch": 7.98, + "learning_rate": 2.8577655071241823e-05, + "loss": 0.5133, + "step": 154200 + }, + { + "epoch": 7.99, + "learning_rate": 2.8543980387553435e-05, + "loss": 0.4963, + "step": 154300 + }, + { + "epoch": 7.99, + "learning_rate": 2.8510307542656163e-05, + "loss": 0.5091, + "step": 154400 + }, + { + "epoch": 8.0, + "learning_rate": 2.8476636579075073e-05, + "loss": 0.5041, + "step": 154500 + }, + { + "epoch": 8.0, + "eval_accuracy": 0.623841230778192, + "eval_cer": 0.13118756205561125, + "eval_loss": 0.7133947610855103, + "eval_runtime": 4120.7514, + "eval_samples_per_second": 4.166, + "eval_steps_per_second": 0.26, + "eval_wer": 0.2833774483853891, + "step": 154504 + }, + { + "epoch": 8.0, + "learning_rate": 2.844296753933284e-05, + "loss": 0.4175, + "step": 154600 + }, + { + "epoch": 8.01, + "learning_rate": 2.8409300465949734e-05, + "loss": 0.3852, + "step": 154700 + }, + { + "epoch": 8.02, + "learning_rate": 2.8375635401443522e-05, + "loss": 0.4678, + "step": 154800 + }, + { + "epoch": 8.02, + "learning_rate": 2.8341972388329465e-05, + "loss": 0.4266, + "step": 154900 + }, + { + "epoch": 8.03, + "learning_rate": 2.8308311469120194e-05, + "loss": 0.441, + "step": 155000 + }, + { + "epoch": 8.03, + "learning_rate": 2.8274652686325706e-05, + "loss": 0.4787, + "step": 155100 + }, + { + "epoch": 8.04, + "learning_rate": 2.824099608245331e-05, + "loss": 0.483, + "step": 155200 + }, + { + "epoch": 8.04, + "learning_rate": 2.820734170000758e-05, + "loss": 0.4796, + "step": 155300 + }, + { + "epoch": 8.05, + "learning_rate": 2.817368958149024e-05, + "loss": 0.4281, + "step": 155400 + }, + { + "epoch": 8.05, + "learning_rate": 2.8140039769400184e-05, + "loss": 0.4397, + "step": 155500 + }, + { + "epoch": 8.06, + "learning_rate": 2.8106392306233402e-05, + "loss": 0.3527, + "step": 155600 + }, + { + "epoch": 8.06, + "learning_rate": 2.80727472344829e-05, + "loss": 0.4499, + "step": 155700 + }, + { + "epoch": 8.07, + "learning_rate": 2.8039104596638653e-05, + "loss": 0.4868, + "step": 155800 + }, + { + "epoch": 8.07, + "learning_rate": 2.8005464435187584e-05, + "loss": 0.4762, + "step": 155900 + }, + { + "epoch": 8.08, + "learning_rate": 2.7971826792613493e-05, + "loss": 0.4406, + "step": 156000 + }, + { + "epoch": 8.08, + "learning_rate": 2.7938191711396987e-05, + "loss": 0.4422, + "step": 156100 + }, + { + "epoch": 8.09, + "learning_rate": 2.790455923401542e-05, + "loss": 0.4997, + "step": 156200 + }, + { + "epoch": 8.09, + "learning_rate": 2.7870929402942894e-05, + "loss": 0.4919, + "step": 156300 + }, + { + "epoch": 8.1, + "learning_rate": 2.7837302260650145e-05, + "loss": 0.4381, + "step": 156400 + }, + { + "epoch": 8.1, + "learning_rate": 2.7803677849604532e-05, + "loss": 0.402, + "step": 156500 + }, + { + "epoch": 8.11, + "learning_rate": 2.7770056212269943e-05, + "loss": 0.4214, + "step": 156600 + }, + { + "epoch": 8.11, + "learning_rate": 2.7736437391106766e-05, + "loss": 0.4431, + "step": 156700 + }, + { + "epoch": 8.12, + "learning_rate": 2.7703157573907592e-05, + "loss": 0.4752, + "step": 156800 + }, + { + "epoch": 8.12, + "learning_rate": 2.7669544483233218e-05, + "loss": 0.4246, + "step": 156900 + }, + { + "epoch": 8.13, + "learning_rate": 2.763593433566541e-05, + "loss": 0.4097, + "step": 157000 + }, + { + "epoch": 8.13, + "learning_rate": 2.7602327173650067e-05, + "loss": 0.4304, + "step": 157100 + }, + { + "epoch": 8.14, + "learning_rate": 2.7568723039629306e-05, + "loss": 0.4245, + "step": 157200 + }, + { + "epoch": 8.14, + "learning_rate": 2.753512197604139e-05, + "loss": 0.4365, + "step": 157300 + }, + { + "epoch": 8.15, + "learning_rate": 2.750152402532076e-05, + "loss": 0.4264, + "step": 157400 + }, + { + "epoch": 8.16, + "learning_rate": 2.7467929229897886e-05, + "loss": 0.4054, + "step": 157500 + }, + { + "epoch": 8.16, + "learning_rate": 2.7434337632199273e-05, + "loss": 0.4363, + "step": 157600 + }, + { + "epoch": 8.17, + "learning_rate": 2.7400749274647358e-05, + "loss": 0.4259, + "step": 157700 + }, + { + "epoch": 8.17, + "learning_rate": 2.736716419966053e-05, + "loss": 0.4341, + "step": 157800 + }, + { + "epoch": 8.18, + "learning_rate": 2.7333582449652996e-05, + "loss": 0.4196, + "step": 157900 + }, + { + "epoch": 8.18, + "learning_rate": 2.7300004067034788e-05, + "loss": 0.4334, + "step": 158000 + }, + { + "epoch": 8.19, + "learning_rate": 2.7266429094211676e-05, + "loss": 0.4092, + "step": 158100 + }, + { + "epoch": 8.19, + "learning_rate": 2.7232857573585115e-05, + "loss": 0.4511, + "step": 158200 + }, + { + "epoch": 8.2, + "learning_rate": 2.71992895475522e-05, + "loss": 0.4676, + "step": 158300 + }, + { + "epoch": 8.2, + "learning_rate": 2.7166060685748846e-05, + "loss": 0.4574, + "step": 158400 + }, + { + "epoch": 8.21, + "learning_rate": 2.7132499740073298e-05, + "loss": 0.4556, + "step": 158500 + }, + { + "epoch": 8.21, + "learning_rate": 2.7098942415732214e-05, + "loss": 0.4002, + "step": 158600 + }, + { + "epoch": 8.22, + "learning_rate": 2.7065388755104753e-05, + "loss": 0.4303, + "step": 158700 + }, + { + "epoch": 8.22, + "learning_rate": 2.7031838800565487e-05, + "loss": 0.4455, + "step": 158800 + }, + { + "epoch": 8.23, + "learning_rate": 2.6998292594484267e-05, + "loss": 0.4663, + "step": 158900 + }, + { + "epoch": 8.23, + "learning_rate": 2.6964750179226225e-05, + "loss": 0.5129, + "step": 159000 + }, + { + "epoch": 8.24, + "learning_rate": 2.6931211597151706e-05, + "loss": 0.4733, + "step": 159100 + }, + { + "epoch": 8.24, + "learning_rate": 2.6897676890616234e-05, + "loss": 0.5034, + "step": 159200 + }, + { + "epoch": 8.25, + "learning_rate": 2.6864146101970402e-05, + "loss": 0.4488, + "step": 159300 + }, + { + "epoch": 8.25, + "learning_rate": 2.683061927355987e-05, + "loss": 0.4588, + "step": 159400 + }, + { + "epoch": 8.26, + "learning_rate": 2.6797096447725313e-05, + "loss": 0.4206, + "step": 159500 + }, + { + "epoch": 8.26, + "learning_rate": 2.6763577666802343e-05, + "loss": 0.4115, + "step": 159600 + }, + { + "epoch": 8.27, + "learning_rate": 2.673006297312144e-05, + "loss": 0.4476, + "step": 159700 + }, + { + "epoch": 8.27, + "learning_rate": 2.6696552409007948e-05, + "loss": 0.4332, + "step": 159800 + }, + { + "epoch": 8.28, + "learning_rate": 2.6663046016781997e-05, + "loss": 0.4789, + "step": 159900 + }, + { + "epoch": 8.28, + "learning_rate": 2.662954383875844e-05, + "loss": 0.4759, + "step": 160000 + }, + { + "epoch": 8.29, + "learning_rate": 2.659604591724679e-05, + "loss": 0.4541, + "step": 160100 + }, + { + "epoch": 8.29, + "learning_rate": 2.6562552294551216e-05, + "loss": 0.4329, + "step": 160200 + }, + { + "epoch": 8.3, + "learning_rate": 2.652906301297044e-05, + "loss": 0.4267, + "step": 160300 + }, + { + "epoch": 8.31, + "learning_rate": 2.6495578114797732e-05, + "loss": 0.438, + "step": 160400 + }, + { + "epoch": 8.31, + "learning_rate": 2.646209764232076e-05, + "loss": 0.4356, + "step": 160500 + }, + { + "epoch": 8.32, + "learning_rate": 2.6428621637821668e-05, + "loss": 0.4229, + "step": 160600 + }, + { + "epoch": 8.32, + "learning_rate": 2.6395150143576924e-05, + "loss": 0.4587, + "step": 160700 + }, + { + "epoch": 8.33, + "learning_rate": 2.6361683201857322e-05, + "loss": 0.5384, + "step": 160800 + }, + { + "epoch": 8.33, + "learning_rate": 2.6328220854927878e-05, + "loss": 0.446, + "step": 160900 + }, + { + "epoch": 8.34, + "learning_rate": 2.6294763145047826e-05, + "loss": 0.4512, + "step": 161000 + }, + { + "epoch": 8.34, + "learning_rate": 2.626131011447054e-05, + "loss": 0.4071, + "step": 161100 + }, + { + "epoch": 8.35, + "learning_rate": 2.6227861805443477e-05, + "loss": 0.491, + "step": 161200 + }, + { + "epoch": 8.35, + "learning_rate": 2.6194418260208166e-05, + "loss": 0.4912, + "step": 161300 + }, + { + "epoch": 8.36, + "learning_rate": 2.6160979521000047e-05, + "loss": 0.4527, + "step": 161400 + }, + { + "epoch": 8.36, + "learning_rate": 2.6127545630048568e-05, + "loss": 0.4221, + "step": 161500 + }, + { + "epoch": 8.37, + "learning_rate": 2.6094116629577e-05, + "loss": 0.4288, + "step": 161600 + }, + { + "epoch": 8.37, + "learning_rate": 2.6060692561802487e-05, + "loss": 0.4415, + "step": 161700 + }, + { + "epoch": 8.38, + "learning_rate": 2.602727346893589e-05, + "loss": 0.4692, + "step": 161800 + }, + { + "epoch": 8.38, + "learning_rate": 2.5993859393181815e-05, + "loss": 0.3856, + "step": 161900 + }, + { + "epoch": 8.39, + "learning_rate": 2.5960450376738544e-05, + "loss": 0.4803, + "step": 162000 + }, + { + "epoch": 8.39, + "learning_rate": 2.592704646179795e-05, + "loss": 0.4437, + "step": 162100 + }, + { + "epoch": 8.4, + "learning_rate": 2.5893647690545464e-05, + "loss": 0.423, + "step": 162200 + }, + { + "epoch": 8.4, + "learning_rate": 2.586025410516002e-05, + "loss": 0.4138, + "step": 162300 + }, + { + "epoch": 8.41, + "learning_rate": 2.5826865747814024e-05, + "loss": 0.3996, + "step": 162400 + }, + { + "epoch": 8.41, + "learning_rate": 2.5793482660673265e-05, + "loss": 0.4284, + "step": 162500 + }, + { + "epoch": 8.42, + "learning_rate": 2.5760104885896854e-05, + "loss": 0.4264, + "step": 162600 + }, + { + "epoch": 8.42, + "learning_rate": 2.5726732465637236e-05, + "loss": 0.4415, + "step": 162700 + }, + { + "epoch": 8.43, + "learning_rate": 2.5693365442040062e-05, + "loss": 0.4576, + "step": 162800 + }, + { + "epoch": 8.43, + "learning_rate": 2.566000385724419e-05, + "loss": 0.4432, + "step": 162900 + }, + { + "epoch": 8.44, + "learning_rate": 2.5626647753381574e-05, + "loss": 0.3915, + "step": 163000 + }, + { + "epoch": 8.45, + "learning_rate": 2.559329717257729e-05, + "loss": 0.436, + "step": 163100 + }, + { + "epoch": 8.45, + "learning_rate": 2.5559952156949416e-05, + "loss": 0.4346, + "step": 163200 + }, + { + "epoch": 8.46, + "learning_rate": 2.5526612748609e-05, + "loss": 0.3681, + "step": 163300 + }, + { + "epoch": 8.46, + "learning_rate": 2.5493278989660026e-05, + "loss": 0.4642, + "step": 163400 + }, + { + "epoch": 8.47, + "learning_rate": 2.5459950922199312e-05, + "loss": 0.4078, + "step": 163500 + }, + { + "epoch": 8.47, + "learning_rate": 2.5426628588316506e-05, + "loss": 0.4157, + "step": 163600 + }, + { + "epoch": 8.48, + "learning_rate": 2.5393312030094033e-05, + "loss": 0.4477, + "step": 163700 + }, + { + "epoch": 8.48, + "learning_rate": 2.5360001289607003e-05, + "loss": 0.4093, + "step": 163800 + }, + { + "epoch": 8.49, + "learning_rate": 2.5326696408923168e-05, + "loss": 0.4422, + "step": 163900 + }, + { + "epoch": 8.49, + "learning_rate": 2.529339743010291e-05, + "loss": 0.4586, + "step": 164000 + }, + { + "epoch": 8.5, + "learning_rate": 2.5260104395199132e-05, + "loss": 0.3854, + "step": 164100 + }, + { + "epoch": 8.5, + "learning_rate": 2.522681734625726e-05, + "loss": 0.4227, + "step": 164200 + }, + { + "epoch": 8.51, + "learning_rate": 2.5193536325315116e-05, + "loss": 0.4431, + "step": 164300 + }, + { + "epoch": 8.51, + "learning_rate": 2.516026137440295e-05, + "loss": 0.4253, + "step": 164400 + }, + { + "epoch": 8.52, + "learning_rate": 2.512699253554332e-05, + "loss": 0.4602, + "step": 164500 + }, + { + "epoch": 8.52, + "learning_rate": 2.5093729850751086e-05, + "loss": 0.4894, + "step": 164600 + }, + { + "epoch": 8.53, + "learning_rate": 2.506047336203332e-05, + "loss": 0.4152, + "step": 164700 + }, + { + "epoch": 8.53, + "learning_rate": 2.5027223111389274e-05, + "loss": 0.4815, + "step": 164800 + }, + { + "epoch": 8.54, + "learning_rate": 2.4993979140810328e-05, + "loss": 0.4675, + "step": 164900 + }, + { + "epoch": 8.54, + "learning_rate": 2.4960741492279928e-05, + "loss": 0.4584, + "step": 165000 + }, + { + "epoch": 8.55, + "learning_rate": 2.492751020777352e-05, + "loss": 0.4197, + "step": 165100 + }, + { + "epoch": 8.55, + "learning_rate": 2.4894285329258538e-05, + "loss": 0.4777, + "step": 165200 + }, + { + "epoch": 8.56, + "learning_rate": 2.486139905094485e-05, + "loss": 0.4601, + "step": 165300 + }, + { + "epoch": 8.56, + "learning_rate": 2.4828187045175914e-05, + "loss": 0.4749, + "step": 165400 + }, + { + "epoch": 8.57, + "learning_rate": 2.4794981570832536e-05, + "loss": 0.4526, + "step": 165500 + }, + { + "epoch": 8.57, + "learning_rate": 2.476178266984953e-05, + "loss": 0.4477, + "step": 165600 + }, + { + "epoch": 8.58, + "learning_rate": 2.4728590384153438e-05, + "loss": 0.4511, + "step": 165700 + }, + { + "epoch": 8.58, + "learning_rate": 2.4695404755662414e-05, + "loss": 0.4447, + "step": 165800 + }, + { + "epoch": 8.59, + "learning_rate": 2.4662225826286235e-05, + "loss": 0.4394, + "step": 165900 + }, + { + "epoch": 8.6, + "learning_rate": 2.4629053637926187e-05, + "loss": 0.4015, + "step": 166000 + }, + { + "epoch": 8.6, + "learning_rate": 2.4595888232475087e-05, + "loss": 0.4373, + "step": 166100 + }, + { + "epoch": 8.61, + "learning_rate": 2.4562729651817142e-05, + "loss": 0.4236, + "step": 166200 + }, + { + "epoch": 8.61, + "learning_rate": 2.4529577937827954e-05, + "loss": 0.3912, + "step": 166300 + }, + { + "epoch": 8.62, + "learning_rate": 2.4496433132374473e-05, + "loss": 0.4464, + "step": 166400 + }, + { + "epoch": 8.62, + "learning_rate": 2.446329527731491e-05, + "loss": 0.5125, + "step": 166500 + }, + { + "epoch": 8.63, + "learning_rate": 2.4430164414498676e-05, + "loss": 0.4599, + "step": 166600 + }, + { + "epoch": 8.63, + "learning_rate": 2.439704058576638e-05, + "loss": 0.4262, + "step": 166700 + }, + { + "epoch": 8.64, + "learning_rate": 2.436392383294975e-05, + "loss": 0.4223, + "step": 166800 + }, + { + "epoch": 8.64, + "learning_rate": 2.433081419787155e-05, + "loss": 0.4537, + "step": 166900 + }, + { + "epoch": 8.65, + "learning_rate": 2.4297711722345604e-05, + "loss": 0.4085, + "step": 167000 + }, + { + "epoch": 8.65, + "learning_rate": 2.4264616448176637e-05, + "loss": 0.4349, + "step": 167100 + }, + { + "epoch": 8.66, + "learning_rate": 2.4231528417160304e-05, + "loss": 0.4658, + "step": 167200 + }, + { + "epoch": 8.66, + "learning_rate": 2.419844767108313e-05, + "loss": 0.4801, + "step": 167300 + }, + { + "epoch": 8.67, + "learning_rate": 2.4165374251722427e-05, + "loss": 0.4308, + "step": 167400 + }, + { + "epoch": 8.67, + "learning_rate": 2.4132638824743865e-05, + "loss": 0.483, + "step": 167500 + }, + { + "epoch": 8.68, + "learning_rate": 2.409958010980184e-05, + "loss": 0.4433, + "step": 167600 + }, + { + "epoch": 8.68, + "learning_rate": 2.406652884643502e-05, + "loss": 0.4464, + "step": 167700 + }, + { + "epoch": 8.69, + "learning_rate": 2.4033485076383488e-05, + "loss": 0.4448, + "step": 167800 + }, + { + "epoch": 8.69, + "learning_rate": 2.4000448841377867e-05, + "loss": 0.4246, + "step": 167900 + }, + { + "epoch": 8.7, + "learning_rate": 2.3967750432079663e-05, + "loss": 0.5037, + "step": 168000 + }, + { + "epoch": 8.7, + "learning_rate": 2.3934729315928343e-05, + "loss": 0.4366, + "step": 168100 + }, + { + "epoch": 8.71, + "learning_rate": 2.3901715859540486e-05, + "loss": 0.4372, + "step": 168200 + }, + { + "epoch": 8.71, + "learning_rate": 2.386871010460843e-05, + "loss": 0.5103, + "step": 168300 + }, + { + "epoch": 8.72, + "learning_rate": 2.3835712092814762e-05, + "loss": 0.4388, + "step": 168400 + }, + { + "epoch": 8.72, + "learning_rate": 2.3802721865832324e-05, + "loss": 0.3981, + "step": 168500 + }, + { + "epoch": 8.73, + "learning_rate": 2.3769739465324093e-05, + "loss": 0.4546, + "step": 168600 + }, + { + "epoch": 8.74, + "learning_rate": 2.3736764932943204e-05, + "loss": 0.4217, + "step": 168700 + }, + { + "epoch": 8.74, + "learning_rate": 2.370379831033281e-05, + "loss": 0.4197, + "step": 168800 + }, + { + "epoch": 8.75, + "learning_rate": 2.3670839639126102e-05, + "loss": 0.4467, + "step": 168900 + }, + { + "epoch": 8.75, + "learning_rate": 2.363788896094621e-05, + "loss": 0.5078, + "step": 169000 + }, + { + "epoch": 8.76, + "learning_rate": 2.3604946317406204e-05, + "loss": 0.4327, + "step": 169100 + }, + { + "epoch": 8.76, + "learning_rate": 2.357201175010898e-05, + "loss": 0.4614, + "step": 169200 + }, + { + "epoch": 8.77, + "learning_rate": 2.353908530064722e-05, + "loss": 0.4342, + "step": 169300 + }, + { + "epoch": 8.77, + "learning_rate": 2.35061670106034e-05, + "loss": 0.4709, + "step": 169400 + }, + { + "epoch": 8.78, + "learning_rate": 2.347325692154964e-05, + "loss": 0.4878, + "step": 169500 + }, + { + "epoch": 8.78, + "learning_rate": 2.344035507504776e-05, + "loss": 0.4265, + "step": 169600 + }, + { + "epoch": 8.79, + "learning_rate": 2.3407461512649116e-05, + "loss": 0.4399, + "step": 169700 + }, + { + "epoch": 8.79, + "learning_rate": 2.337457627589463e-05, + "loss": 0.4227, + "step": 169800 + }, + { + "epoch": 8.8, + "learning_rate": 2.33416994063147e-05, + "loss": 0.4234, + "step": 169900 + }, + { + "epoch": 8.8, + "learning_rate": 2.3308830945429175e-05, + "loss": 0.4312, + "step": 170000 + }, + { + "epoch": 8.81, + "learning_rate": 2.3275970934747265e-05, + "loss": 0.4391, + "step": 170100 + }, + { + "epoch": 8.81, + "learning_rate": 2.3243119415767508e-05, + "loss": 0.4591, + "step": 170200 + }, + { + "epoch": 8.82, + "learning_rate": 2.3210276429977734e-05, + "loss": 0.433, + "step": 170300 + }, + { + "epoch": 8.82, + "learning_rate": 2.3177442018854995e-05, + "loss": 0.4178, + "step": 170400 + }, + { + "epoch": 8.83, + "learning_rate": 2.3144616223865488e-05, + "loss": 0.4094, + "step": 170500 + }, + { + "epoch": 8.83, + "learning_rate": 2.3111799086464552e-05, + "loss": 0.4256, + "step": 170600 + }, + { + "epoch": 8.84, + "learning_rate": 2.3079318689284015e-05, + "loss": 0.3786, + "step": 170700 + }, + { + "epoch": 8.84, + "learning_rate": 2.3046518903772723e-05, + "loss": 0.4336, + "step": 170800 + }, + { + "epoch": 8.85, + "learning_rate": 2.3013727899736035e-05, + "loss": 0.4592, + "step": 170900 + }, + { + "epoch": 8.85, + "learning_rate": 2.2980945718585346e-05, + "loss": 0.4094, + "step": 171000 + }, + { + "epoch": 8.86, + "learning_rate": 2.2948172401720915e-05, + "loss": 0.4502, + "step": 171100 + }, + { + "epoch": 8.86, + "learning_rate": 2.2915407990531787e-05, + "loss": 0.4912, + "step": 171200 + }, + { + "epoch": 8.87, + "learning_rate": 2.288265252639579e-05, + "loss": 0.4287, + "step": 171300 + }, + { + "epoch": 8.87, + "learning_rate": 2.2849906050679424e-05, + "loss": 0.4383, + "step": 171400 + }, + { + "epoch": 8.88, + "learning_rate": 2.2817168604737877e-05, + "loss": 0.4662, + "step": 171500 + }, + { + "epoch": 8.89, + "learning_rate": 2.2784440229914887e-05, + "loss": 0.4573, + "step": 171600 + }, + { + "epoch": 8.89, + "learning_rate": 2.2751720967542756e-05, + "loss": 0.4446, + "step": 171700 + }, + { + "epoch": 8.9, + "learning_rate": 2.2719010858942296e-05, + "loss": 0.4817, + "step": 171800 + }, + { + "epoch": 8.9, + "learning_rate": 2.2686309945422734e-05, + "loss": 0.4742, + "step": 171900 + }, + { + "epoch": 8.91, + "learning_rate": 2.2653618268281693e-05, + "loss": 0.4296, + "step": 172000 + }, + { + "epoch": 8.91, + "learning_rate": 2.262093586880512e-05, + "loss": 0.452, + "step": 172100 + }, + { + "epoch": 8.92, + "learning_rate": 2.2588262788267276e-05, + "loss": 0.4447, + "step": 172200 + }, + { + "epoch": 8.92, + "learning_rate": 2.2555599067930625e-05, + "loss": 0.4559, + "step": 172300 + }, + { + "epoch": 8.93, + "learning_rate": 2.2522944749045826e-05, + "loss": 0.4478, + "step": 172400 + }, + { + "epoch": 8.93, + "learning_rate": 2.249029987285165e-05, + "loss": 0.4827, + "step": 172500 + }, + { + "epoch": 8.94, + "learning_rate": 2.245766448057495e-05, + "loss": 0.4839, + "step": 172600 + }, + { + "epoch": 8.94, + "learning_rate": 2.2425038613430612e-05, + "loss": 0.4112, + "step": 172700 + }, + { + "epoch": 8.95, + "learning_rate": 2.2392422312621486e-05, + "loss": 0.4452, + "step": 172800 + }, + { + "epoch": 8.95, + "learning_rate": 2.2359815619338324e-05, + "loss": 0.418, + "step": 172900 + }, + { + "epoch": 8.96, + "learning_rate": 2.2327218574759757e-05, + "loss": 0.4824, + "step": 173000 + }, + { + "epoch": 8.96, + "learning_rate": 2.2294631220052258e-05, + "loss": 0.4024, + "step": 173100 + }, + { + "epoch": 8.97, + "learning_rate": 2.2262053596370023e-05, + "loss": 0.3932, + "step": 173200 + }, + { + "epoch": 8.97, + "learning_rate": 2.2229485744854963e-05, + "loss": 0.4221, + "step": 173300 + }, + { + "epoch": 8.98, + "learning_rate": 2.2196927706636672e-05, + "loss": 0.4589, + "step": 173400 + }, + { + "epoch": 8.98, + "learning_rate": 2.2164704955756062e-05, + "loss": 0.4389, + "step": 173500 + }, + { + "epoch": 8.99, + "learning_rate": 2.2132166568311804e-05, + "loss": 0.4138, + "step": 173600 + }, + { + "epoch": 8.99, + "learning_rate": 2.2099638117067632e-05, + "loss": 0.4401, + "step": 173700 + }, + { + "epoch": 9.0, + "learning_rate": 2.206711964310336e-05, + "loss": 0.4503, + "step": 173800 + }, + { + "epoch": 9.0, + "eval_accuracy": 0.6238725390260951, + "eval_cer": 0.11975474210746738, + "eval_loss": 0.6584149599075317, + "eval_runtime": 4766.8269, + "eval_samples_per_second": 3.602, + "eval_steps_per_second": 0.225, + "eval_wer": 0.26746661961061113, + "step": 173817 + }, + { + "epoch": 9.0, + "learning_rate": 2.203461118748622e-05, + "loss": 0.3225, + "step": 173900 + }, + { + "epoch": 9.01, + "learning_rate": 2.200211279127078e-05, + "loss": 0.3775, + "step": 174000 + }, + { + "epoch": 9.01, + "learning_rate": 2.1969624495498885e-05, + "loss": 0.3479, + "step": 174100 + }, + { + "epoch": 9.02, + "learning_rate": 2.1937146341199673e-05, + "loss": 0.351, + "step": 174200 + }, + { + "epoch": 9.03, + "learning_rate": 2.1904678369389446e-05, + "loss": 0.38, + "step": 174300 + }, + { + "epoch": 9.03, + "learning_rate": 2.1872220621071627e-05, + "loss": 0.3347, + "step": 174400 + }, + { + "epoch": 9.04, + "learning_rate": 2.183977313723676e-05, + "loss": 0.3999, + "step": 174500 + }, + { + "epoch": 9.04, + "learning_rate": 2.1807335958862414e-05, + "loss": 0.4183, + "step": 174600 + }, + { + "epoch": 9.05, + "learning_rate": 2.177490912691315e-05, + "loss": 0.3779, + "step": 174700 + }, + { + "epoch": 9.05, + "learning_rate": 2.1742492682340444e-05, + "loss": 0.3699, + "step": 174800 + }, + { + "epoch": 9.06, + "learning_rate": 2.171008666608267e-05, + "loss": 0.3813, + "step": 174900 + }, + { + "epoch": 9.06, + "learning_rate": 2.1677691119065036e-05, + "loss": 0.3502, + "step": 175000 + }, + { + "epoch": 9.07, + "learning_rate": 2.1645306082199527e-05, + "loss": 0.3529, + "step": 175100 + }, + { + "epoch": 9.07, + "learning_rate": 2.1612931596384818e-05, + "loss": 0.3358, + "step": 175200 + }, + { + "epoch": 9.08, + "learning_rate": 2.1580567702506325e-05, + "loss": 0.3796, + "step": 175300 + }, + { + "epoch": 9.08, + "learning_rate": 2.1548537921280166e-05, + "loss": 0.3693, + "step": 175400 + }, + { + "epoch": 9.09, + "learning_rate": 2.1516195226937784e-05, + "loss": 0.3381, + "step": 175500 + }, + { + "epoch": 9.09, + "learning_rate": 2.1483863246698893e-05, + "loss": 0.3414, + "step": 175600 + }, + { + "epoch": 9.1, + "learning_rate": 2.1451542021395203e-05, + "loss": 0.3965, + "step": 175700 + }, + { + "epoch": 9.1, + "learning_rate": 2.141923159184484e-05, + "loss": 0.3863, + "step": 175800 + }, + { + "epoch": 9.11, + "learning_rate": 2.1386931998852268e-05, + "loss": 0.3401, + "step": 175900 + }, + { + "epoch": 9.11, + "learning_rate": 2.1354643283208293e-05, + "loss": 0.3604, + "step": 176000 + }, + { + "epoch": 9.12, + "learning_rate": 2.132236548568998e-05, + "loss": 0.3471, + "step": 176100 + }, + { + "epoch": 9.12, + "learning_rate": 2.1290098647060624e-05, + "loss": 0.3806, + "step": 176200 + }, + { + "epoch": 9.13, + "learning_rate": 2.1257842808069625e-05, + "loss": 0.3954, + "step": 176300 + }, + { + "epoch": 9.13, + "learning_rate": 2.122559800945255e-05, + "loss": 0.3644, + "step": 176400 + }, + { + "epoch": 9.14, + "learning_rate": 2.1193364291930984e-05, + "loss": 0.3391, + "step": 176500 + }, + { + "epoch": 9.14, + "learning_rate": 2.1161141696212546e-05, + "loss": 0.42, + "step": 176600 + }, + { + "epoch": 9.15, + "learning_rate": 2.11289302629908e-05, + "loss": 0.3518, + "step": 176700 + }, + { + "epoch": 9.15, + "learning_rate": 2.1096730032945197e-05, + "loss": 0.3345, + "step": 176800 + }, + { + "epoch": 9.16, + "learning_rate": 2.1064541046741054e-05, + "loss": 0.3439, + "step": 176900 + }, + { + "epoch": 9.16, + "learning_rate": 2.1032363345029494e-05, + "loss": 0.3435, + "step": 177000 + }, + { + "epoch": 9.17, + "learning_rate": 2.1000196968447383e-05, + "loss": 0.4107, + "step": 177100 + }, + { + "epoch": 9.18, + "learning_rate": 2.096804195761727e-05, + "loss": 0.3455, + "step": 177200 + }, + { + "epoch": 9.18, + "learning_rate": 2.0935898353147377e-05, + "loss": 0.3637, + "step": 177300 + }, + { + "epoch": 9.19, + "learning_rate": 2.0903766195631494e-05, + "loss": 0.3595, + "step": 177400 + }, + { + "epoch": 9.19, + "learning_rate": 2.0871645525648998e-05, + "loss": 0.3716, + "step": 177500 + }, + { + "epoch": 9.2, + "learning_rate": 2.0839536383764687e-05, + "loss": 0.3503, + "step": 177600 + }, + { + "epoch": 9.2, + "learning_rate": 2.0807438810528874e-05, + "loss": 0.3734, + "step": 177700 + }, + { + "epoch": 9.21, + "learning_rate": 2.077535284647721e-05, + "loss": 0.386, + "step": 177800 + }, + { + "epoch": 9.21, + "learning_rate": 2.0743278532130727e-05, + "loss": 0.3812, + "step": 177900 + }, + { + "epoch": 9.22, + "learning_rate": 2.0711215907995708e-05, + "loss": 0.4289, + "step": 178000 + }, + { + "epoch": 9.22, + "learning_rate": 2.0679165014563682e-05, + "loss": 0.3529, + "step": 178100 + }, + { + "epoch": 9.23, + "learning_rate": 2.064712589231138e-05, + "loss": 0.4035, + "step": 178200 + }, + { + "epoch": 9.23, + "learning_rate": 2.0615098581700666e-05, + "loss": 0.3737, + "step": 178300 + }, + { + "epoch": 9.24, + "learning_rate": 2.058308312317845e-05, + "loss": 0.3675, + "step": 178400 + }, + { + "epoch": 9.24, + "learning_rate": 2.0551079557176714e-05, + "loss": 0.3668, + "step": 178500 + }, + { + "epoch": 9.25, + "learning_rate": 2.0519087924112416e-05, + "loss": 0.3633, + "step": 178600 + }, + { + "epoch": 9.25, + "learning_rate": 2.048710826438744e-05, + "loss": 0.3432, + "step": 178700 + }, + { + "epoch": 9.26, + "learning_rate": 2.0455140618388525e-05, + "loss": 0.4205, + "step": 178800 + }, + { + "epoch": 9.26, + "learning_rate": 2.0423185026487273e-05, + "loss": 0.3651, + "step": 178900 + }, + { + "epoch": 9.27, + "learning_rate": 2.039124152904005e-05, + "loss": 0.3716, + "step": 179000 + }, + { + "epoch": 9.27, + "learning_rate": 2.0359310166387934e-05, + "loss": 0.3673, + "step": 179100 + }, + { + "epoch": 9.28, + "learning_rate": 2.032739097885671e-05, + "loss": 0.3872, + "step": 179200 + }, + { + "epoch": 9.28, + "learning_rate": 2.0295484006756757e-05, + "loss": 0.3107, + "step": 179300 + }, + { + "epoch": 9.29, + "learning_rate": 2.026358929038303e-05, + "loss": 0.4159, + "step": 179400 + }, + { + "epoch": 9.29, + "learning_rate": 2.023170687001503e-05, + "loss": 0.3565, + "step": 179500 + }, + { + "epoch": 9.3, + "learning_rate": 2.0199836785916712e-05, + "loss": 0.3406, + "step": 179600 + }, + { + "epoch": 9.3, + "learning_rate": 2.0167979078336443e-05, + "loss": 0.3878, + "step": 179700 + }, + { + "epoch": 9.31, + "learning_rate": 2.0136133787506974e-05, + "loss": 0.3569, + "step": 179800 + }, + { + "epoch": 9.31, + "learning_rate": 2.010430095364538e-05, + "loss": 0.3783, + "step": 179900 + }, + { + "epoch": 9.32, + "learning_rate": 2.007279875832696e-05, + "loss": 0.3457, + "step": 180000 + }, + { + "epoch": 9.33, + "learning_rate": 2.0040990833416912e-05, + "loss": 0.3422, + "step": 180100 + }, + { + "epoch": 9.33, + "learning_rate": 2.000919548562972e-05, + "loss": 0.4037, + "step": 180200 + }, + { + "epoch": 9.34, + "learning_rate": 1.9977412755119382e-05, + "loss": 0.3384, + "step": 180300 + }, + { + "epoch": 9.34, + "learning_rate": 1.9945642682023955e-05, + "loss": 0.3697, + "step": 180400 + }, + { + "epoch": 9.35, + "learning_rate": 1.9913885306465514e-05, + "loss": 0.3503, + "step": 180500 + }, + { + "epoch": 9.35, + "learning_rate": 1.988214066855009e-05, + "loss": 0.4168, + "step": 180600 + }, + { + "epoch": 9.36, + "learning_rate": 1.9850408808367656e-05, + "loss": 0.4272, + "step": 180700 + }, + { + "epoch": 9.36, + "learning_rate": 1.9818689765992013e-05, + "loss": 0.3656, + "step": 180800 + }, + { + "epoch": 9.37, + "learning_rate": 1.978698358148079e-05, + "loss": 0.3384, + "step": 180900 + }, + { + "epoch": 9.37, + "learning_rate": 1.975529029487538e-05, + "loss": 0.3568, + "step": 181000 + }, + { + "epoch": 9.38, + "learning_rate": 1.97236099462009e-05, + "loss": 0.3738, + "step": 181100 + }, + { + "epoch": 9.38, + "learning_rate": 1.969194257546609e-05, + "loss": 0.3403, + "step": 181200 + }, + { + "epoch": 9.39, + "learning_rate": 1.9660288222663328e-05, + "loss": 0.3645, + "step": 181300 + }, + { + "epoch": 9.39, + "learning_rate": 1.9628646927768566e-05, + "loss": 0.3755, + "step": 181400 + }, + { + "epoch": 9.4, + "learning_rate": 1.9597018730741227e-05, + "loss": 0.3855, + "step": 181500 + }, + { + "epoch": 9.4, + "learning_rate": 1.9565403671524213e-05, + "loss": 0.3379, + "step": 181600 + }, + { + "epoch": 9.41, + "learning_rate": 1.953380179004384e-05, + "loss": 0.3888, + "step": 181700 + }, + { + "epoch": 9.41, + "learning_rate": 1.9502213126209773e-05, + "loss": 0.3963, + "step": 181800 + }, + { + "epoch": 9.42, + "learning_rate": 1.9470637719914997e-05, + "loss": 0.3638, + "step": 181900 + }, + { + "epoch": 9.42, + "learning_rate": 1.943907561103573e-05, + "loss": 0.3669, + "step": 182000 + }, + { + "epoch": 9.43, + "learning_rate": 1.9407526839431414e-05, + "loss": 0.3706, + "step": 182100 + }, + { + "epoch": 9.43, + "learning_rate": 1.9375991444944646e-05, + "loss": 0.4036, + "step": 182200 + }, + { + "epoch": 9.44, + "learning_rate": 1.9344469467401135e-05, + "loss": 0.3972, + "step": 182300 + }, + { + "epoch": 9.44, + "learning_rate": 1.9312960946609643e-05, + "loss": 0.3526, + "step": 182400 + }, + { + "epoch": 9.45, + "learning_rate": 1.9281465922361907e-05, + "loss": 0.3695, + "step": 182500 + }, + { + "epoch": 9.45, + "learning_rate": 1.924998443443267e-05, + "loss": 0.3589, + "step": 182600 + }, + { + "epoch": 9.46, + "learning_rate": 1.9218516522579544e-05, + "loss": 0.4098, + "step": 182700 + }, + { + "epoch": 9.47, + "learning_rate": 1.918706222654303e-05, + "loss": 0.3642, + "step": 182800 + }, + { + "epoch": 9.47, + "learning_rate": 1.9155621586046376e-05, + "loss": 0.3603, + "step": 182900 + }, + { + "epoch": 9.48, + "learning_rate": 1.9124194640795647e-05, + "loss": 0.3952, + "step": 183000 + }, + { + "epoch": 9.48, + "learning_rate": 1.9092781430479568e-05, + "loss": 0.389, + "step": 183100 + }, + { + "epoch": 9.49, + "learning_rate": 1.906138199476956e-05, + "loss": 0.3789, + "step": 183200 + }, + { + "epoch": 9.49, + "learning_rate": 1.9030310161023346e-05, + "loss": 0.4149, + "step": 183300 + }, + { + "epoch": 9.5, + "learning_rate": 1.899893825473489e-05, + "loss": 0.3683, + "step": 183400 + }, + { + "epoch": 9.5, + "learning_rate": 1.8967580241566007e-05, + "loss": 0.365, + "step": 183500 + }, + { + "epoch": 9.51, + "learning_rate": 1.8936236161118374e-05, + "loss": 0.3279, + "step": 183600 + }, + { + "epoch": 9.51, + "learning_rate": 1.890490605297609e-05, + "loss": 0.354, + "step": 183700 + }, + { + "epoch": 9.52, + "learning_rate": 1.887358995670561e-05, + "loss": 0.3564, + "step": 183800 + }, + { + "epoch": 9.52, + "learning_rate": 1.8842287911855683e-05, + "loss": 0.3445, + "step": 183900 + }, + { + "epoch": 9.53, + "learning_rate": 1.8810999957957303e-05, + "loss": 0.3781, + "step": 184000 + }, + { + "epoch": 9.53, + "learning_rate": 1.8780038802682546e-05, + "loss": 0.3788, + "step": 184100 + }, + { + "epoch": 9.54, + "learning_rate": 1.874877900731403e-05, + "loss": 0.3954, + "step": 184200 + }, + { + "epoch": 9.54, + "learning_rate": 1.8717533420988445e-05, + "loss": 0.3442, + "step": 184300 + }, + { + "epoch": 9.55, + "learning_rate": 1.868630208316549e-05, + "loss": 0.3862, + "step": 184400 + }, + { + "epoch": 9.55, + "learning_rate": 1.865508503328687e-05, + "loss": 0.4042, + "step": 184500 + }, + { + "epoch": 9.56, + "learning_rate": 1.8623882310776267e-05, + "loss": 0.4147, + "step": 184600 + }, + { + "epoch": 9.56, + "learning_rate": 1.8592693955039243e-05, + "loss": 0.3573, + "step": 184700 + }, + { + "epoch": 9.57, + "learning_rate": 1.856152000546323e-05, + "loss": 0.4193, + "step": 184800 + }, + { + "epoch": 9.57, + "learning_rate": 1.8530360501417476e-05, + "loss": 0.3744, + "step": 184900 + }, + { + "epoch": 9.58, + "learning_rate": 1.849921548225297e-05, + "loss": 0.3508, + "step": 185000 + }, + { + "epoch": 9.58, + "learning_rate": 1.8468084987302406e-05, + "loss": 0.3633, + "step": 185100 + }, + { + "epoch": 9.59, + "learning_rate": 1.843696905588014e-05, + "loss": 0.3627, + "step": 185200 + }, + { + "epoch": 9.59, + "learning_rate": 1.8405867727282152e-05, + "loss": 0.2985, + "step": 185300 + }, + { + "epoch": 9.6, + "learning_rate": 1.8374781040785968e-05, + "loss": 0.3724, + "step": 185400 + }, + { + "epoch": 9.6, + "learning_rate": 1.8343709035650604e-05, + "loss": 0.383, + "step": 185500 + }, + { + "epoch": 9.61, + "learning_rate": 1.831265175111657e-05, + "loss": 0.3862, + "step": 185600 + }, + { + "epoch": 9.62, + "learning_rate": 1.8281609226405757e-05, + "loss": 0.3485, + "step": 185700 + }, + { + "epoch": 9.62, + "learning_rate": 1.825058150072144e-05, + "loss": 0.3734, + "step": 185800 + }, + { + "epoch": 9.63, + "learning_rate": 1.8219568613248178e-05, + "loss": 0.3766, + "step": 185900 + }, + { + "epoch": 9.63, + "learning_rate": 1.818857060315181e-05, + "loss": 0.4136, + "step": 186000 + }, + { + "epoch": 9.64, + "learning_rate": 1.8157587509579373e-05, + "loss": 0.3742, + "step": 186100 + }, + { + "epoch": 9.64, + "learning_rate": 1.8126619371659096e-05, + "loss": 0.3298, + "step": 186200 + }, + { + "epoch": 9.65, + "learning_rate": 1.809566622850028e-05, + "loss": 0.3685, + "step": 186300 + }, + { + "epoch": 9.65, + "learning_rate": 1.8064728119193307e-05, + "loss": 0.3969, + "step": 186400 + }, + { + "epoch": 9.66, + "learning_rate": 1.8033805082809584e-05, + "loss": 0.3978, + "step": 186500 + }, + { + "epoch": 9.66, + "learning_rate": 1.800289715840148e-05, + "loss": 0.3523, + "step": 186600 + }, + { + "epoch": 9.67, + "learning_rate": 1.7972004385002256e-05, + "loss": 0.4137, + "step": 186700 + }, + { + "epoch": 9.67, + "learning_rate": 1.794112680162605e-05, + "loss": 0.3297, + "step": 186800 + }, + { + "epoch": 9.68, + "learning_rate": 1.7910264447267835e-05, + "loss": 0.3601, + "step": 186900 + }, + { + "epoch": 9.68, + "learning_rate": 1.7879417360903327e-05, + "loss": 0.3419, + "step": 187000 + }, + { + "epoch": 9.69, + "learning_rate": 1.7848585581489e-05, + "loss": 0.354, + "step": 187100 + }, + { + "epoch": 9.69, + "learning_rate": 1.781776914796193e-05, + "loss": 0.3734, + "step": 187200 + }, + { + "epoch": 9.7, + "learning_rate": 1.778696809923987e-05, + "loss": 0.3652, + "step": 187300 + }, + { + "epoch": 9.7, + "learning_rate": 1.7756182474221125e-05, + "loss": 0.3254, + "step": 187400 + }, + { + "epoch": 9.71, + "learning_rate": 1.7725412311784528e-05, + "loss": 0.3193, + "step": 187500 + }, + { + "epoch": 9.71, + "learning_rate": 1.769465765078936e-05, + "loss": 0.3591, + "step": 187600 + }, + { + "epoch": 9.72, + "learning_rate": 1.7663918530075347e-05, + "loss": 0.4299, + "step": 187700 + }, + { + "epoch": 9.72, + "learning_rate": 1.7633194988462597e-05, + "loss": 0.4245, + "step": 187800 + }, + { + "epoch": 9.73, + "learning_rate": 1.7602487064751533e-05, + "loss": 0.3599, + "step": 187900 + }, + { + "epoch": 9.73, + "learning_rate": 1.757179479772283e-05, + "loss": 0.4007, + "step": 188000 + }, + { + "epoch": 9.74, + "learning_rate": 1.7541118226137437e-05, + "loss": 0.3497, + "step": 188100 + }, + { + "epoch": 9.74, + "learning_rate": 1.751045738873645e-05, + "loss": 0.3746, + "step": 188200 + }, + { + "epoch": 9.75, + "learning_rate": 1.7479812324241106e-05, + "loss": 0.3302, + "step": 188300 + }, + { + "epoch": 9.76, + "learning_rate": 1.7449183071352713e-05, + "loss": 0.3491, + "step": 188400 + }, + { + "epoch": 9.76, + "learning_rate": 1.7418569668752622e-05, + "loss": 0.3873, + "step": 188500 + }, + { + "epoch": 9.77, + "learning_rate": 1.7387972155102155e-05, + "loss": 0.3782, + "step": 188600 + }, + { + "epoch": 9.77, + "learning_rate": 1.7357390569042582e-05, + "loss": 0.3721, + "step": 188700 + }, + { + "epoch": 9.78, + "learning_rate": 1.7326824949195045e-05, + "loss": 0.3975, + "step": 188800 + }, + { + "epoch": 9.78, + "learning_rate": 1.7296275334160536e-05, + "loss": 0.3531, + "step": 188900 + }, + { + "epoch": 9.79, + "learning_rate": 1.7265741762519817e-05, + "loss": 0.3696, + "step": 189000 + }, + { + "epoch": 9.79, + "learning_rate": 1.723522427283339e-05, + "loss": 0.3453, + "step": 189100 + }, + { + "epoch": 9.8, + "learning_rate": 1.72047229036415e-05, + "loss": 0.4007, + "step": 189200 + }, + { + "epoch": 9.8, + "learning_rate": 1.7174237693463946e-05, + "loss": 0.3284, + "step": 189300 + }, + { + "epoch": 9.81, + "learning_rate": 1.7143768680800162e-05, + "loss": 0.3874, + "step": 189400 + }, + { + "epoch": 9.81, + "learning_rate": 1.711331590412916e-05, + "loss": 0.3517, + "step": 189500 + }, + { + "epoch": 9.82, + "learning_rate": 1.708287940190941e-05, + "loss": 0.4294, + "step": 189600 + }, + { + "epoch": 9.82, + "learning_rate": 1.705245921257881e-05, + "loss": 0.3419, + "step": 189700 + }, + { + "epoch": 9.83, + "learning_rate": 1.7022055374554687e-05, + "loss": 0.3833, + "step": 189800 + }, + { + "epoch": 9.83, + "learning_rate": 1.699166792623373e-05, + "loss": 0.3834, + "step": 189900 + }, + { + "epoch": 9.84, + "learning_rate": 1.6961296905991925e-05, + "loss": 0.396, + "step": 190000 + }, + { + "epoch": 9.84, + "learning_rate": 1.6930942352184447e-05, + "loss": 0.3701, + "step": 190100 + }, + { + "epoch": 9.85, + "learning_rate": 1.6900604303145766e-05, + "loss": 0.3537, + "step": 190200 + }, + { + "epoch": 9.85, + "learning_rate": 1.687028279718947e-05, + "loss": 0.3376, + "step": 190300 + }, + { + "epoch": 9.86, + "learning_rate": 1.6839977872608245e-05, + "loss": 0.3158, + "step": 190400 + }, + { + "epoch": 9.86, + "learning_rate": 1.6809689567673844e-05, + "loss": 0.3283, + "step": 190500 + }, + { + "epoch": 9.87, + "learning_rate": 1.6779720554525263e-05, + "loss": 0.3579, + "step": 190600 + }, + { + "epoch": 9.87, + "learning_rate": 1.674946543646535e-05, + "loss": 0.308, + "step": 190700 + }, + { + "epoch": 9.88, + "learning_rate": 1.671922705235941e-05, + "loss": 0.39, + "step": 190800 + }, + { + "epoch": 9.88, + "learning_rate": 1.668900544039517e-05, + "loss": 0.3776, + "step": 190900 + }, + { + "epoch": 9.89, + "learning_rate": 1.665880063873918e-05, + "loss": 0.3698, + "step": 191000 + }, + { + "epoch": 9.89, + "learning_rate": 1.6628612685536766e-05, + "loss": 0.3641, + "step": 191100 + }, + { + "epoch": 9.9, + "learning_rate": 1.6598441618911917e-05, + "loss": 0.3387, + "step": 191200 + }, + { + "epoch": 9.91, + "learning_rate": 1.656828747696738e-05, + "loss": 0.3966, + "step": 191300 + }, + { + "epoch": 9.91, + "learning_rate": 1.6538150297784475e-05, + "loss": 0.3669, + "step": 191400 + }, + { + "epoch": 9.92, + "learning_rate": 1.650803011942312e-05, + "loss": 0.3289, + "step": 191500 + }, + { + "epoch": 9.92, + "learning_rate": 1.6477926979921732e-05, + "loss": 0.3889, + "step": 191600 + }, + { + "epoch": 9.93, + "learning_rate": 1.6447840917297262e-05, + "loss": 0.3857, + "step": 191700 + }, + { + "epoch": 9.93, + "learning_rate": 1.641777196954506e-05, + "loss": 0.3726, + "step": 191800 + }, + { + "epoch": 9.94, + "learning_rate": 1.6387720174638858e-05, + "loss": 0.3447, + "step": 191900 + }, + { + "epoch": 9.94, + "learning_rate": 1.6357685570530748e-05, + "loss": 0.3672, + "step": 192000 + }, + { + "epoch": 9.95, + "learning_rate": 1.632766819515109e-05, + "loss": 0.342, + "step": 192100 + }, + { + "epoch": 9.95, + "learning_rate": 1.6297668086408505e-05, + "loss": 0.3357, + "step": 192200 + }, + { + "epoch": 9.96, + "learning_rate": 1.6267685282189795e-05, + "loss": 0.3342, + "step": 192300 + }, + { + "epoch": 9.96, + "learning_rate": 1.6237719820359914e-05, + "loss": 0.3357, + "step": 192400 + }, + { + "epoch": 9.97, + "learning_rate": 1.6207771738761918e-05, + "loss": 0.3392, + "step": 192500 + }, + { + "epoch": 9.97, + "learning_rate": 1.6177841075216897e-05, + "loss": 0.3754, + "step": 192600 + }, + { + "epoch": 9.98, + "learning_rate": 1.6147927867523954e-05, + "loss": 0.3334, + "step": 192700 + }, + { + "epoch": 9.98, + "learning_rate": 1.6118032153460186e-05, + "loss": 0.422, + "step": 192800 + }, + { + "epoch": 9.99, + "learning_rate": 1.608815397078051e-05, + "loss": 0.3799, + "step": 192900 + }, + { + "epoch": 9.99, + "learning_rate": 1.6058293357217788e-05, + "loss": 0.3258, + "step": 193000 + }, + { + "epoch": 10.0, + "learning_rate": 1.6028450350482634e-05, + "loss": 0.3423, + "step": 193100 + }, + { + "epoch": 10.0, + "eval_accuracy": 0.6243996825489282, + "eval_cer": 0.11433102286469878, + "eval_loss": 0.6315078735351562, + "eval_runtime": 3868.8283, + "eval_samples_per_second": 4.438, + "eval_steps_per_second": 0.277, + "eval_wer": 0.2548555967296041, + "step": 193130 + }, + { + "epoch": 10.0, + "learning_rate": 1.5998624988263486e-05, + "loss": 0.3581, + "step": 193200 + }, + { + "epoch": 10.01, + "learning_rate": 1.5968817308226438e-05, + "loss": 0.3215, + "step": 193300 + }, + { + "epoch": 10.01, + "learning_rate": 1.5939027348015272e-05, + "loss": 0.2873, + "step": 193400 + }, + { + "epoch": 10.02, + "learning_rate": 1.590925514525143e-05, + "loss": 0.2765, + "step": 193500 + }, + { + "epoch": 10.02, + "learning_rate": 1.5879500737533894e-05, + "loss": 0.3225, + "step": 193600 + }, + { + "epoch": 10.03, + "learning_rate": 1.584976416243916e-05, + "loss": 0.3119, + "step": 193700 + }, + { + "epoch": 10.03, + "learning_rate": 1.5820045457521215e-05, + "loss": 0.2835, + "step": 193800 + }, + { + "epoch": 10.04, + "learning_rate": 1.5790344660311507e-05, + "loss": 0.3561, + "step": 193900 + }, + { + "epoch": 10.05, + "learning_rate": 1.576066180831885e-05, + "loss": 0.2817, + "step": 194000 + }, + { + "epoch": 10.05, + "learning_rate": 1.5730996939029353e-05, + "loss": 0.3193, + "step": 194100 + }, + { + "epoch": 10.06, + "learning_rate": 1.5701942850049104e-05, + "loss": 0.355, + "step": 194200 + }, + { + "epoch": 10.06, + "learning_rate": 1.5672313697014618e-05, + "loss": 0.3135, + "step": 194300 + }, + { + "epoch": 10.07, + "learning_rate": 1.5642702638257175e-05, + "loss": 0.2976, + "step": 194400 + }, + { + "epoch": 10.07, + "learning_rate": 1.5613109711172243e-05, + "loss": 0.3064, + "step": 194500 + }, + { + "epoch": 10.08, + "learning_rate": 1.5583534953132413e-05, + "loss": 0.3202, + "step": 194600 + }, + { + "epoch": 10.08, + "learning_rate": 1.5553978401487322e-05, + "loss": 0.2833, + "step": 194700 + }, + { + "epoch": 10.09, + "learning_rate": 1.5524440093563608e-05, + "loss": 0.2937, + "step": 194800 + }, + { + "epoch": 10.09, + "learning_rate": 1.5494920066664872e-05, + "loss": 0.3587, + "step": 194900 + }, + { + "epoch": 10.1, + "learning_rate": 1.5465418358071634e-05, + "loss": 0.3132, + "step": 195000 + }, + { + "epoch": 10.1, + "learning_rate": 1.5435935005041284e-05, + "loss": 0.3295, + "step": 195100 + }, + { + "epoch": 10.11, + "learning_rate": 1.5406470044808013e-05, + "loss": 0.3304, + "step": 195200 + }, + { + "epoch": 10.11, + "learning_rate": 1.5377023514582793e-05, + "loss": 0.2938, + "step": 195300 + }, + { + "epoch": 10.12, + "learning_rate": 1.534759545155333e-05, + "loss": 0.3199, + "step": 195400 + }, + { + "epoch": 10.12, + "learning_rate": 1.5318185892883997e-05, + "loss": 0.2592, + "step": 195500 + }, + { + "epoch": 10.13, + "learning_rate": 1.5288794875715802e-05, + "loss": 0.2936, + "step": 195600 + }, + { + "epoch": 10.13, + "learning_rate": 1.5259422437166327e-05, + "loss": 0.3087, + "step": 195700 + }, + { + "epoch": 10.14, + "learning_rate": 1.5230068614329726e-05, + "loss": 0.2909, + "step": 195800 + }, + { + "epoch": 10.14, + "learning_rate": 1.5200733444276598e-05, + "loss": 0.3524, + "step": 195900 + }, + { + "epoch": 10.15, + "learning_rate": 1.5171416964054005e-05, + "loss": 0.2767, + "step": 196000 + }, + { + "epoch": 10.15, + "learning_rate": 1.51421192106854e-05, + "loss": 0.2691, + "step": 196100 + }, + { + "epoch": 10.16, + "learning_rate": 1.5113132918063264e-05, + "loss": 0.3269, + "step": 196200 + }, + { + "epoch": 10.16, + "learning_rate": 1.5083872541187148e-05, + "loss": 0.3216, + "step": 196300 + }, + { + "epoch": 10.17, + "learning_rate": 1.505463100172392e-05, + "loss": 0.2961, + "step": 196400 + }, + { + "epoch": 10.17, + "learning_rate": 1.5025408336602395e-05, + "loss": 0.3803, + "step": 196500 + }, + { + "epoch": 10.18, + "learning_rate": 1.4996204582727553e-05, + "loss": 0.3175, + "step": 196600 + }, + { + "epoch": 10.18, + "learning_rate": 1.4967019776980495e-05, + "loss": 0.3132, + "step": 196700 + }, + { + "epoch": 10.19, + "learning_rate": 1.4937853956218389e-05, + "loss": 0.2971, + "step": 196800 + }, + { + "epoch": 10.2, + "learning_rate": 1.490870715727443e-05, + "loss": 0.3315, + "step": 196900 + }, + { + "epoch": 10.2, + "learning_rate": 1.487957941695779e-05, + "loss": 0.2903, + "step": 197000 + }, + { + "epoch": 10.21, + "learning_rate": 1.485047077205357e-05, + "loss": 0.3587, + "step": 197100 + }, + { + "epoch": 10.21, + "learning_rate": 1.4821381259322743e-05, + "loss": 0.3223, + "step": 197200 + }, + { + "epoch": 10.22, + "learning_rate": 1.479231091550217e-05, + "loss": 0.3002, + "step": 197300 + }, + { + "epoch": 10.22, + "learning_rate": 1.4763259777304434e-05, + "loss": 0.286, + "step": 197400 + }, + { + "epoch": 10.23, + "learning_rate": 1.4734227881417905e-05, + "loss": 0.2775, + "step": 197500 + }, + { + "epoch": 10.23, + "learning_rate": 1.470521526450664e-05, + "loss": 0.2704, + "step": 197600 + }, + { + "epoch": 10.24, + "learning_rate": 1.4676221963210378e-05, + "loss": 0.3099, + "step": 197700 + }, + { + "epoch": 10.24, + "learning_rate": 1.464724801414441e-05, + "loss": 0.3033, + "step": 197800 + }, + { + "epoch": 10.25, + "learning_rate": 1.461829345389962e-05, + "loss": 0.3045, + "step": 197900 + }, + { + "epoch": 10.25, + "learning_rate": 1.458935831904242e-05, + "loss": 0.3258, + "step": 198000 + }, + { + "epoch": 10.26, + "learning_rate": 1.4560442646114664e-05, + "loss": 0.3397, + "step": 198100 + }, + { + "epoch": 10.26, + "learning_rate": 1.4531546471633646e-05, + "loss": 0.3002, + "step": 198200 + }, + { + "epoch": 10.27, + "learning_rate": 1.4502669832091999e-05, + "loss": 0.2697, + "step": 198300 + }, + { + "epoch": 10.27, + "learning_rate": 1.4473812763957734e-05, + "loss": 0.307, + "step": 198400 + }, + { + "epoch": 10.28, + "learning_rate": 1.4444975303674124e-05, + "loss": 0.3387, + "step": 198500 + }, + { + "epoch": 10.28, + "learning_rate": 1.4416157487659675e-05, + "loss": 0.2841, + "step": 198600 + }, + { + "epoch": 10.29, + "learning_rate": 1.4387359352308091e-05, + "loss": 0.3334, + "step": 198700 + }, + { + "epoch": 10.29, + "learning_rate": 1.4358580933988215e-05, + "loss": 0.3319, + "step": 198800 + }, + { + "epoch": 10.3, + "learning_rate": 1.4329822269044001e-05, + "loss": 0.2294, + "step": 198900 + }, + { + "epoch": 10.3, + "learning_rate": 1.4301083393794444e-05, + "loss": 0.2971, + "step": 199000 + }, + { + "epoch": 10.31, + "learning_rate": 1.4272364344533554e-05, + "loss": 0.2742, + "step": 199100 + }, + { + "epoch": 10.31, + "learning_rate": 1.4243665157530306e-05, + "loss": 0.2903, + "step": 199200 + }, + { + "epoch": 10.32, + "learning_rate": 1.4214985869028581e-05, + "loss": 0.3247, + "step": 199300 + }, + { + "epoch": 10.32, + "learning_rate": 1.4186326515247136e-05, + "loss": 0.3236, + "step": 199400 + }, + { + "epoch": 10.33, + "learning_rate": 1.4157687132379558e-05, + "loss": 0.3346, + "step": 199500 + }, + { + "epoch": 10.34, + "learning_rate": 1.412906775659421e-05, + "loss": 0.3009, + "step": 199600 + }, + { + "epoch": 10.34, + "learning_rate": 1.410046842403416e-05, + "loss": 0.3295, + "step": 199700 + }, + { + "epoch": 10.35, + "learning_rate": 1.4071889170817241e-05, + "loss": 0.2926, + "step": 199800 + }, + { + "epoch": 10.35, + "learning_rate": 1.4043330033035832e-05, + "loss": 0.2931, + "step": 199900 + }, + { + "epoch": 10.36, + "learning_rate": 1.4014791046756971e-05, + "loss": 0.2827, + "step": 200000 + }, + { + "epoch": 10.36, + "learning_rate": 1.3986272248022211e-05, + "loss": 0.355, + "step": 200100 + }, + { + "epoch": 10.37, + "learning_rate": 1.3957773672847655e-05, + "loss": 0.332, + "step": 200200 + }, + { + "epoch": 10.37, + "learning_rate": 1.3929295357223843e-05, + "loss": 0.3049, + "step": 200300 + }, + { + "epoch": 10.38, + "learning_rate": 1.3900837337115686e-05, + "loss": 0.3135, + "step": 200400 + }, + { + "epoch": 10.38, + "learning_rate": 1.3872399648462538e-05, + "loss": 0.2836, + "step": 200500 + }, + { + "epoch": 10.39, + "learning_rate": 1.3843982327178035e-05, + "loss": 0.2951, + "step": 200600 + }, + { + "epoch": 10.39, + "learning_rate": 1.3815585409150106e-05, + "loss": 0.2727, + "step": 200700 + }, + { + "epoch": 10.4, + "learning_rate": 1.3787208930240872e-05, + "loss": 0.3089, + "step": 200800 + }, + { + "epoch": 10.4, + "learning_rate": 1.3758852926286713e-05, + "loss": 0.3056, + "step": 200900 + }, + { + "epoch": 10.41, + "learning_rate": 1.3730517433098098e-05, + "loss": 0.3409, + "step": 201000 + }, + { + "epoch": 10.41, + "learning_rate": 1.3702202486459613e-05, + "loss": 0.2777, + "step": 201100 + }, + { + "epoch": 10.42, + "learning_rate": 1.3673908122129891e-05, + "loss": 0.3029, + "step": 201200 + }, + { + "epoch": 10.42, + "learning_rate": 1.364563437584157e-05, + "loss": 0.3321, + "step": 201300 + }, + { + "epoch": 10.43, + "learning_rate": 1.3617381283301254e-05, + "loss": 0.3083, + "step": 201400 + }, + { + "epoch": 10.43, + "learning_rate": 1.3589148880189462e-05, + "loss": 0.3129, + "step": 201500 + }, + { + "epoch": 10.44, + "learning_rate": 1.3560937202160583e-05, + "loss": 0.2745, + "step": 201600 + }, + { + "epoch": 10.44, + "learning_rate": 1.3532746284842839e-05, + "loss": 0.3623, + "step": 201700 + }, + { + "epoch": 10.45, + "learning_rate": 1.350457616383822e-05, + "loss": 0.3104, + "step": 201800 + }, + { + "epoch": 10.45, + "learning_rate": 1.3476426874722471e-05, + "loss": 0.3299, + "step": 201900 + }, + { + "epoch": 10.46, + "learning_rate": 1.3448298453045012e-05, + "loss": 0.3284, + "step": 202000 + }, + { + "epoch": 10.46, + "learning_rate": 1.342047190592984e-05, + "loss": 0.3088, + "step": 202100 + }, + { + "epoch": 10.47, + "learning_rate": 1.3392385116111598e-05, + "loss": 0.3102, + "step": 202200 + }, + { + "epoch": 10.47, + "learning_rate": 1.3364319299867036e-05, + "loss": 0.2955, + "step": 202300 + }, + { + "epoch": 10.48, + "learning_rate": 1.3336274492640198e-05, + "loss": 0.3074, + "step": 202400 + }, + { + "epoch": 10.49, + "learning_rate": 1.3308250729848547e-05, + "loss": 0.2815, + "step": 202500 + }, + { + "epoch": 10.49, + "learning_rate": 1.328024804688299e-05, + "loss": 0.3451, + "step": 202600 + }, + { + "epoch": 10.5, + "learning_rate": 1.3252266479107804e-05, + "loss": 0.2783, + "step": 202700 + }, + { + "epoch": 10.5, + "learning_rate": 1.3224306061860598e-05, + "loss": 0.3012, + "step": 202800 + }, + { + "epoch": 10.51, + "learning_rate": 1.3196366830452284e-05, + "loss": 0.2491, + "step": 202900 + }, + { + "epoch": 10.51, + "learning_rate": 1.3168448820167e-05, + "loss": 0.3271, + "step": 203000 + }, + { + "epoch": 10.52, + "learning_rate": 1.3140552066262101e-05, + "loss": 0.2614, + "step": 203100 + }, + { + "epoch": 10.52, + "learning_rate": 1.3112676603968081e-05, + "loss": 0.2749, + "step": 203200 + }, + { + "epoch": 10.53, + "learning_rate": 1.3084822468488564e-05, + "loss": 0.2651, + "step": 203300 + }, + { + "epoch": 10.53, + "learning_rate": 1.305698969500022e-05, + "loss": 0.3279, + "step": 203400 + }, + { + "epoch": 10.54, + "learning_rate": 1.3029178318652762e-05, + "loss": 0.3055, + "step": 203500 + }, + { + "epoch": 10.54, + "learning_rate": 1.3001388374568865e-05, + "loss": 0.3167, + "step": 203600 + }, + { + "epoch": 10.55, + "learning_rate": 1.2973619897844144e-05, + "loss": 0.309, + "step": 203700 + }, + { + "epoch": 10.55, + "learning_rate": 1.294587292354709e-05, + "loss": 0.2698, + "step": 203800 + }, + { + "epoch": 10.56, + "learning_rate": 1.2918147486719083e-05, + "loss": 0.3068, + "step": 203900 + }, + { + "epoch": 10.56, + "learning_rate": 1.2890443622374242e-05, + "loss": 0.2657, + "step": 204000 + }, + { + "epoch": 10.57, + "learning_rate": 1.2862761365499468e-05, + "loss": 0.3267, + "step": 204100 + }, + { + "epoch": 10.57, + "learning_rate": 1.2835100751054406e-05, + "loss": 0.3417, + "step": 204200 + }, + { + "epoch": 10.58, + "learning_rate": 1.2807461813971333e-05, + "loss": 0.3366, + "step": 204300 + }, + { + "epoch": 10.58, + "learning_rate": 1.2779844589155138e-05, + "loss": 0.2962, + "step": 204400 + }, + { + "epoch": 10.59, + "learning_rate": 1.2752249111483316e-05, + "loss": 0.2521, + "step": 204500 + }, + { + "epoch": 10.59, + "learning_rate": 1.272467541580591e-05, + "loss": 0.2986, + "step": 204600 + }, + { + "epoch": 10.6, + "learning_rate": 1.269712353694543e-05, + "loss": 0.2991, + "step": 204700 + }, + { + "epoch": 10.6, + "learning_rate": 1.2669593509696813e-05, + "loss": 0.309, + "step": 204800 + }, + { + "epoch": 10.61, + "learning_rate": 1.264208536882746e-05, + "loss": 0.2833, + "step": 204900 + }, + { + "epoch": 10.61, + "learning_rate": 1.2614599149077086e-05, + "loss": 0.2626, + "step": 205000 + }, + { + "epoch": 10.62, + "learning_rate": 1.2587134885157746e-05, + "loss": 0.2807, + "step": 205100 + }, + { + "epoch": 10.62, + "learning_rate": 1.2559692611753726e-05, + "loss": 0.3143, + "step": 205200 + }, + { + "epoch": 10.63, + "learning_rate": 1.2532272363521598e-05, + "loss": 0.2939, + "step": 205300 + }, + { + "epoch": 10.64, + "learning_rate": 1.2504874175090084e-05, + "loss": 0.324, + "step": 205400 + }, + { + "epoch": 10.64, + "learning_rate": 1.2477498081060055e-05, + "loss": 0.3235, + "step": 205500 + }, + { + "epoch": 10.65, + "learning_rate": 1.2450144116004476e-05, + "loss": 0.3101, + "step": 205600 + }, + { + "epoch": 10.65, + "learning_rate": 1.2422812314468368e-05, + "loss": 0.3213, + "step": 205700 + }, + { + "epoch": 10.66, + "learning_rate": 1.239550271096876e-05, + "loss": 0.327, + "step": 205800 + }, + { + "epoch": 10.66, + "learning_rate": 1.2368215339994643e-05, + "loss": 0.275, + "step": 205900 + }, + { + "epoch": 10.67, + "learning_rate": 1.2340950236006963e-05, + "loss": 0.3248, + "step": 206000 + }, + { + "epoch": 10.67, + "learning_rate": 1.2313707433438492e-05, + "loss": 0.3304, + "step": 206100 + }, + { + "epoch": 10.68, + "learning_rate": 1.2286486966693875e-05, + "loss": 0.3151, + "step": 206200 + }, + { + "epoch": 10.68, + "learning_rate": 1.225928887014953e-05, + "loss": 0.3125, + "step": 206300 + }, + { + "epoch": 10.69, + "learning_rate": 1.2232113178153658e-05, + "loss": 0.2852, + "step": 206400 + }, + { + "epoch": 10.69, + "learning_rate": 1.2204959925026115e-05, + "loss": 0.2412, + "step": 206500 + }, + { + "epoch": 10.7, + "learning_rate": 1.2177829145058446e-05, + "loss": 0.2797, + "step": 206600 + }, + { + "epoch": 10.7, + "learning_rate": 1.2150720872513833e-05, + "loss": 0.2782, + "step": 206700 + }, + { + "epoch": 10.71, + "learning_rate": 1.2123635141627013e-05, + "loss": 0.3174, + "step": 206800 + }, + { + "epoch": 10.71, + "learning_rate": 1.2096571986604239e-05, + "loss": 0.2844, + "step": 206900 + }, + { + "epoch": 10.72, + "learning_rate": 1.2069531441623265e-05, + "loss": 0.2779, + "step": 207000 + }, + { + "epoch": 10.72, + "learning_rate": 1.2042513540833324e-05, + "loss": 0.3101, + "step": 207100 + }, + { + "epoch": 10.73, + "learning_rate": 1.2015518318355022e-05, + "loss": 0.3275, + "step": 207200 + }, + { + "epoch": 10.73, + "learning_rate": 1.19885458082803e-05, + "loss": 0.2881, + "step": 207300 + }, + { + "epoch": 10.74, + "learning_rate": 1.196159604467247e-05, + "loss": 0.3021, + "step": 207400 + }, + { + "epoch": 10.74, + "learning_rate": 1.1934669061566085e-05, + "loss": 0.3556, + "step": 207500 + }, + { + "epoch": 10.75, + "learning_rate": 1.1907764892966942e-05, + "loss": 0.2849, + "step": 207600 + }, + { + "epoch": 10.75, + "learning_rate": 1.188088357285199e-05, + "loss": 0.331, + "step": 207700 + }, + { + "epoch": 10.76, + "learning_rate": 1.1854025135169383e-05, + "loss": 0.2932, + "step": 207800 + }, + { + "epoch": 10.76, + "learning_rate": 1.1827457855504407e-05, + "loss": 0.2993, + "step": 207900 + }, + { + "epoch": 10.77, + "learning_rate": 1.1800645054745122e-05, + "loss": 0.2928, + "step": 208000 + }, + { + "epoch": 10.78, + "learning_rate": 1.1773855237750498e-05, + "loss": 0.3574, + "step": 208100 + }, + { + "epoch": 10.78, + "learning_rate": 1.1747088438353123e-05, + "loss": 0.2846, + "step": 208200 + }, + { + "epoch": 10.79, + "learning_rate": 1.17206120136211e-05, + "loss": 0.3218, + "step": 208300 + }, + { + "epoch": 10.79, + "learning_rate": 1.1693891119780737e-05, + "loss": 0.3094, + "step": 208400 + }, + { + "epoch": 10.8, + "learning_rate": 1.1667193344523416e-05, + "loss": 0.2953, + "step": 208500 + }, + { + "epoch": 10.8, + "learning_rate": 1.1640518721565466e-05, + "loss": 0.2743, + "step": 208600 + }, + { + "epoch": 10.81, + "learning_rate": 1.1613867284593965e-05, + "loss": 0.3647, + "step": 208700 + }, + { + "epoch": 10.81, + "learning_rate": 1.1587239067266727e-05, + "loss": 0.3406, + "step": 208800 + }, + { + "epoch": 10.82, + "learning_rate": 1.1560634103212217e-05, + "loss": 0.3039, + "step": 208900 + }, + { + "epoch": 10.82, + "learning_rate": 1.1534052426029587e-05, + "loss": 0.2903, + "step": 209000 + }, + { + "epoch": 10.83, + "learning_rate": 1.1507494069288513e-05, + "loss": 0.3347, + "step": 209100 + }, + { + "epoch": 10.83, + "learning_rate": 1.1480959066529258e-05, + "loss": 0.2897, + "step": 209200 + }, + { + "epoch": 10.84, + "learning_rate": 1.1454447451262576e-05, + "loss": 0.2908, + "step": 209300 + }, + { + "epoch": 10.84, + "learning_rate": 1.1427959256969724e-05, + "loss": 0.2682, + "step": 209400 + }, + { + "epoch": 10.85, + "learning_rate": 1.1401494517102318e-05, + "loss": 0.3303, + "step": 209500 + }, + { + "epoch": 10.85, + "learning_rate": 1.1375053265082388e-05, + "loss": 0.3095, + "step": 209600 + }, + { + "epoch": 10.86, + "learning_rate": 1.1348635534302324e-05, + "loss": 0.2782, + "step": 209700 + }, + { + "epoch": 10.86, + "learning_rate": 1.1322241358124778e-05, + "loss": 0.2991, + "step": 209800 + }, + { + "epoch": 10.87, + "learning_rate": 1.1295870769882651e-05, + "loss": 0.268, + "step": 209900 + }, + { + "epoch": 10.87, + "learning_rate": 1.1269523802879065e-05, + "loss": 0.2727, + "step": 210000 + }, + { + "epoch": 10.88, + "learning_rate": 1.1243200490387337e-05, + "loss": 0.2808, + "step": 210100 + }, + { + "epoch": 10.88, + "learning_rate": 1.1216900865650885e-05, + "loss": 0.3068, + "step": 210200 + }, + { + "epoch": 10.89, + "learning_rate": 1.1190624961883181e-05, + "loss": 0.2887, + "step": 210300 + }, + { + "epoch": 10.89, + "learning_rate": 1.1164372812267814e-05, + "loss": 0.2723, + "step": 210400 + }, + { + "epoch": 10.9, + "learning_rate": 1.1138144449958318e-05, + "loss": 0.3043, + "step": 210500 + }, + { + "epoch": 10.9, + "learning_rate": 1.1111939908078203e-05, + "loss": 0.3369, + "step": 210600 + }, + { + "epoch": 10.91, + "learning_rate": 1.10857592197209e-05, + "loss": 0.283, + "step": 210700 + }, + { + "epoch": 10.91, + "learning_rate": 1.1059602417949706e-05, + "loss": 0.3219, + "step": 210800 + }, + { + "epoch": 10.92, + "learning_rate": 1.103346953579776e-05, + "loss": 0.2987, + "step": 210900 + }, + { + "epoch": 10.93, + "learning_rate": 1.1007360606267994e-05, + "loss": 0.3782, + "step": 211000 + }, + { + "epoch": 10.93, + "learning_rate": 1.098127566233308e-05, + "loss": 0.2543, + "step": 211100 + }, + { + "epoch": 10.94, + "learning_rate": 1.095521473693541e-05, + "loss": 0.3168, + "step": 211200 + }, + { + "epoch": 10.94, + "learning_rate": 1.092917786298704e-05, + "loss": 0.3239, + "step": 211300 + }, + { + "epoch": 10.95, + "learning_rate": 1.0903425081940498e-05, + "loss": 0.2929, + "step": 211400 + }, + { + "epoch": 10.95, + "learning_rate": 1.087743616817101e-05, + "loss": 0.3091, + "step": 211500 + }, + { + "epoch": 10.96, + "learning_rate": 1.0851471404076525e-05, + "loss": 0.2931, + "step": 211600 + }, + { + "epoch": 10.96, + "learning_rate": 1.0825530822447652e-05, + "loss": 0.3156, + "step": 211700 + }, + { + "epoch": 10.97, + "learning_rate": 1.0799614456044466e-05, + "loss": 0.2806, + "step": 211800 + }, + { + "epoch": 10.97, + "learning_rate": 1.0773722337596453e-05, + "loss": 0.2978, + "step": 211900 + }, + { + "epoch": 10.98, + "learning_rate": 1.0747854499802492e-05, + "loss": 0.2772, + "step": 212000 + }, + { + "epoch": 10.98, + "learning_rate": 1.0722010975330786e-05, + "loss": 0.3246, + "step": 212100 + }, + { + "epoch": 10.99, + "learning_rate": 1.0696191796818838e-05, + "loss": 0.304, + "step": 212200 + }, + { + "epoch": 10.99, + "learning_rate": 1.0670396996873405e-05, + "loss": 0.27, + "step": 212300 + }, + { + "epoch": 11.0, + "learning_rate": 1.0644626608070454e-05, + "loss": 0.3004, + "step": 212400 + }, + { + "epoch": 11.0, + "eval_accuracy": 0.6237065325023299, + "eval_cer": 0.10729138726936488, + "eval_loss": 0.6110624074935913, + "eval_runtime": 3860.9494, + "eval_samples_per_second": 4.447, + "eval_steps_per_second": 0.278, + "eval_wer": 0.24484442091641667, + "step": 212443 + }, + { + "epoch": 11.0, + "learning_rate": 1.0618880662955127e-05, + "loss": 0.2614, + "step": 212500 + }, + { + "epoch": 11.01, + "learning_rate": 1.0593159194041692e-05, + "loss": 0.28, + "step": 212600 + }, + { + "epoch": 11.01, + "learning_rate": 1.0567462233813507e-05, + "loss": 0.2401, + "step": 212700 + }, + { + "epoch": 11.02, + "learning_rate": 1.0541789814722985e-05, + "loss": 0.2585, + "step": 212800 + }, + { + "epoch": 11.02, + "learning_rate": 1.0516141969191534e-05, + "loss": 0.2988, + "step": 212900 + }, + { + "epoch": 11.03, + "learning_rate": 1.049051872960954e-05, + "loss": 0.2261, + "step": 213000 + }, + { + "epoch": 11.03, + "learning_rate": 1.046492012833631e-05, + "loss": 0.2124, + "step": 213100 + }, + { + "epoch": 11.04, + "learning_rate": 1.0439601814780665e-05, + "loss": 0.2704, + "step": 213200 + }, + { + "epoch": 11.04, + "learning_rate": 1.0414052339889268e-05, + "loss": 0.2479, + "step": 213300 + }, + { + "epoch": 11.05, + "learning_rate": 1.0388527599875197e-05, + "loss": 0.2429, + "step": 213400 + }, + { + "epoch": 11.05, + "learning_rate": 1.036302762697336e-05, + "loss": 0.2513, + "step": 213500 + }, + { + "epoch": 11.06, + "learning_rate": 1.0337552453387392e-05, + "loss": 0.2474, + "step": 213600 + }, + { + "epoch": 11.07, + "learning_rate": 1.031210211128961e-05, + "loss": 0.2806, + "step": 213700 + }, + { + "epoch": 11.07, + "learning_rate": 1.0286676632820973e-05, + "loss": 0.2689, + "step": 213800 + }, + { + "epoch": 11.08, + "learning_rate": 1.0261276050091035e-05, + "loss": 0.2038, + "step": 213900 + }, + { + "epoch": 11.08, + "learning_rate": 1.0235900395177912e-05, + "loss": 0.2609, + "step": 214000 + }, + { + "epoch": 11.09, + "learning_rate": 1.0210549700128234e-05, + "loss": 0.2602, + "step": 214100 + }, + { + "epoch": 11.09, + "learning_rate": 1.0185223996957123e-05, + "loss": 0.265, + "step": 214200 + }, + { + "epoch": 11.1, + "learning_rate": 1.0159923317648125e-05, + "loss": 0.2521, + "step": 214300 + }, + { + "epoch": 11.1, + "learning_rate": 1.013464769415319e-05, + "loss": 0.279, + "step": 214400 + }, + { + "epoch": 11.11, + "learning_rate": 1.0109397158392622e-05, + "loss": 0.2393, + "step": 214500 + }, + { + "epoch": 11.11, + "learning_rate": 1.008417174225505e-05, + "loss": 0.2723, + "step": 214600 + }, + { + "epoch": 11.12, + "learning_rate": 1.0058971477597368e-05, + "loss": 0.2334, + "step": 214700 + }, + { + "epoch": 11.12, + "learning_rate": 1.0033796396244706e-05, + "loss": 0.2477, + "step": 214800 + }, + { + "epoch": 11.13, + "learning_rate": 1.0008646529990411e-05, + "loss": 0.2546, + "step": 214900 + }, + { + "epoch": 11.13, + "learning_rate": 9.983521910595981e-06, + "loss": 0.2627, + "step": 215000 + }, + { + "epoch": 11.14, + "learning_rate": 9.95842256979098e-06, + "loss": 0.2431, + "step": 215100 + }, + { + "epoch": 11.14, + "learning_rate": 9.933348539273131e-06, + "loss": 0.2065, + "step": 215200 + }, + { + "epoch": 11.15, + "learning_rate": 9.908299850708132e-06, + "loss": 0.2921, + "step": 215300 + }, + { + "epoch": 11.15, + "learning_rate": 9.883276535729706e-06, + "loss": 0.2411, + "step": 215400 + }, + { + "epoch": 11.16, + "learning_rate": 9.858278625939494e-06, + "loss": 0.231, + "step": 215500 + }, + { + "epoch": 11.16, + "learning_rate": 9.833306152907109e-06, + "loss": 0.2867, + "step": 215600 + }, + { + "epoch": 11.17, + "learning_rate": 9.808359148170003e-06, + "loss": 0.2353, + "step": 215700 + }, + { + "epoch": 11.17, + "learning_rate": 9.78343764323347e-06, + "loss": 0.2539, + "step": 215800 + }, + { + "epoch": 11.18, + "learning_rate": 9.758541669570612e-06, + "loss": 0.2395, + "step": 215900 + }, + { + "epoch": 11.18, + "learning_rate": 9.733671258622271e-06, + "loss": 0.2329, + "step": 216000 + }, + { + "epoch": 11.19, + "learning_rate": 9.708826441797017e-06, + "loss": 0.2812, + "step": 216100 + }, + { + "epoch": 11.19, + "learning_rate": 9.6840072504711e-06, + "loss": 0.2231, + "step": 216200 + }, + { + "epoch": 11.2, + "learning_rate": 9.659213715988395e-06, + "loss": 0.3159, + "step": 216300 + }, + { + "epoch": 11.2, + "learning_rate": 9.63444586966039e-06, + "loss": 0.2714, + "step": 216400 + }, + { + "epoch": 11.21, + "learning_rate": 9.609703742766123e-06, + "loss": 0.2682, + "step": 216500 + }, + { + "epoch": 11.22, + "learning_rate": 9.58498736655215e-06, + "loss": 0.2685, + "step": 216600 + }, + { + "epoch": 11.22, + "learning_rate": 9.560296772232516e-06, + "loss": 0.2445, + "step": 216700 + }, + { + "epoch": 11.23, + "learning_rate": 9.535631990988694e-06, + "loss": 0.3023, + "step": 216800 + }, + { + "epoch": 11.23, + "learning_rate": 9.510993053969568e-06, + "loss": 0.2387, + "step": 216900 + }, + { + "epoch": 11.24, + "learning_rate": 9.486379992291371e-06, + "loss": 0.2628, + "step": 217000 + }, + { + "epoch": 11.24, + "learning_rate": 9.461792837037692e-06, + "loss": 0.2273, + "step": 217100 + }, + { + "epoch": 11.25, + "learning_rate": 9.437231619259352e-06, + "loss": 0.2328, + "step": 217200 + }, + { + "epoch": 11.25, + "learning_rate": 9.412696369974443e-06, + "loss": 0.2542, + "step": 217300 + }, + { + "epoch": 11.26, + "learning_rate": 9.388187120168278e-06, + "loss": 0.2482, + "step": 217400 + }, + { + "epoch": 11.26, + "learning_rate": 9.363703900793322e-06, + "loss": 0.2567, + "step": 217500 + }, + { + "epoch": 11.27, + "learning_rate": 9.339246742769137e-06, + "loss": 0.2664, + "step": 217600 + }, + { + "epoch": 11.27, + "learning_rate": 9.314815676982405e-06, + "loss": 0.2786, + "step": 217700 + }, + { + "epoch": 11.28, + "learning_rate": 9.290410734286866e-06, + "loss": 0.2932, + "step": 217800 + }, + { + "epoch": 11.28, + "learning_rate": 9.266031945503252e-06, + "loss": 0.224, + "step": 217900 + }, + { + "epoch": 11.29, + "learning_rate": 9.241679341419238e-06, + "loss": 0.2889, + "step": 218000 + }, + { + "epoch": 11.29, + "learning_rate": 9.217352952789486e-06, + "loss": 0.2455, + "step": 218100 + }, + { + "epoch": 11.3, + "learning_rate": 9.193052810335521e-06, + "loss": 0.286, + "step": 218200 + }, + { + "epoch": 11.3, + "learning_rate": 9.168778944745729e-06, + "loss": 0.2461, + "step": 218300 + }, + { + "epoch": 11.31, + "learning_rate": 9.14453138667528e-06, + "loss": 0.268, + "step": 218400 + }, + { + "epoch": 11.31, + "learning_rate": 9.120310166746175e-06, + "loss": 0.2312, + "step": 218500 + }, + { + "epoch": 11.32, + "learning_rate": 9.096115315547119e-06, + "loss": 0.254, + "step": 218600 + }, + { + "epoch": 11.32, + "learning_rate": 9.07194686363352e-06, + "loss": 0.2669, + "step": 218700 + }, + { + "epoch": 11.33, + "learning_rate": 9.047804841527451e-06, + "loss": 0.2705, + "step": 218800 + }, + { + "epoch": 11.33, + "learning_rate": 9.023689279717606e-06, + "loss": 0.2648, + "step": 218900 + }, + { + "epoch": 11.34, + "learning_rate": 8.999600208659256e-06, + "loss": 0.2489, + "step": 219000 + }, + { + "epoch": 11.34, + "learning_rate": 8.975537658774234e-06, + "loss": 0.2556, + "step": 219100 + }, + { + "epoch": 11.35, + "learning_rate": 8.95150166045086e-06, + "loss": 0.2737, + "step": 219200 + }, + { + "epoch": 11.36, + "learning_rate": 8.927492244043936e-06, + "loss": 0.2878, + "step": 219300 + }, + { + "epoch": 11.36, + "learning_rate": 8.903509439874684e-06, + "loss": 0.2483, + "step": 219400 + }, + { + "epoch": 11.37, + "learning_rate": 8.879553278230721e-06, + "loss": 0.2211, + "step": 219500 + }, + { + "epoch": 11.37, + "learning_rate": 8.855623789366041e-06, + "loss": 0.2374, + "step": 219600 + }, + { + "epoch": 11.38, + "learning_rate": 8.83172100350091e-06, + "loss": 0.2482, + "step": 219700 + }, + { + "epoch": 11.38, + "learning_rate": 8.807844950821896e-06, + "loss": 0.2371, + "step": 219800 + }, + { + "epoch": 11.39, + "learning_rate": 8.783995661481794e-06, + "loss": 0.2041, + "step": 219900 + }, + { + "epoch": 11.39, + "learning_rate": 8.760173165599638e-06, + "loss": 0.241, + "step": 220000 + }, + { + "epoch": 11.4, + "learning_rate": 8.73637749326057e-06, + "loss": 0.2509, + "step": 220100 + }, + { + "epoch": 11.4, + "learning_rate": 8.712608674515875e-06, + "loss": 0.223, + "step": 220200 + }, + { + "epoch": 11.41, + "learning_rate": 8.688866739382962e-06, + "loss": 0.3093, + "step": 220300 + }, + { + "epoch": 11.41, + "learning_rate": 8.66515171784525e-06, + "loss": 0.2571, + "step": 220400 + }, + { + "epoch": 11.42, + "learning_rate": 8.641463639852158e-06, + "loss": 0.2676, + "step": 220500 + }, + { + "epoch": 11.42, + "learning_rate": 8.617802535319106e-06, + "loss": 0.3011, + "step": 220600 + }, + { + "epoch": 11.43, + "learning_rate": 8.594404641374807e-06, + "loss": 0.2658, + "step": 220700 + }, + { + "epoch": 11.43, + "learning_rate": 8.570797302892276e-06, + "loss": 0.2672, + "step": 220800 + }, + { + "epoch": 11.44, + "learning_rate": 8.547217027113531e-06, + "loss": 0.2925, + "step": 220900 + }, + { + "epoch": 11.44, + "learning_rate": 8.52366384381783e-06, + "loss": 0.282, + "step": 221000 + }, + { + "epoch": 11.45, + "learning_rate": 8.50013778275026e-06, + "loss": 0.2907, + "step": 221100 + }, + { + "epoch": 11.45, + "learning_rate": 8.476638873621588e-06, + "loss": 0.277, + "step": 221200 + }, + { + "epoch": 11.46, + "learning_rate": 8.453167146108342e-06, + "loss": 0.2971, + "step": 221300 + }, + { + "epoch": 11.46, + "learning_rate": 8.4297226298527e-06, + "loss": 0.2447, + "step": 221400 + }, + { + "epoch": 11.47, + "learning_rate": 8.406305354462509e-06, + "loss": 0.2095, + "step": 221500 + }, + { + "epoch": 11.47, + "learning_rate": 8.382915349511161e-06, + "loss": 0.2336, + "step": 221600 + }, + { + "epoch": 11.48, + "learning_rate": 8.359552644537631e-06, + "loss": 0.27, + "step": 221700 + }, + { + "epoch": 11.48, + "learning_rate": 8.336217269046446e-06, + "loss": 0.2828, + "step": 221800 + }, + { + "epoch": 11.49, + "learning_rate": 8.31290925250759e-06, + "loss": 0.3209, + "step": 221900 + }, + { + "epoch": 11.49, + "learning_rate": 8.289628624356475e-06, + "loss": 0.2422, + "step": 222000 + }, + { + "epoch": 11.5, + "learning_rate": 8.266375413993978e-06, + "loss": 0.2734, + "step": 222100 + }, + { + "epoch": 11.51, + "learning_rate": 8.243149650786308e-06, + "loss": 0.2832, + "step": 222200 + }, + { + "epoch": 11.51, + "learning_rate": 8.219951364065039e-06, + "loss": 0.2812, + "step": 222300 + }, + { + "epoch": 11.52, + "learning_rate": 8.196780583127003e-06, + "loss": 0.2581, + "step": 222400 + }, + { + "epoch": 11.52, + "learning_rate": 8.173637337234347e-06, + "loss": 0.2566, + "step": 222500 + }, + { + "epoch": 11.53, + "learning_rate": 8.15052165561442e-06, + "loss": 0.2238, + "step": 222600 + }, + { + "epoch": 11.53, + "learning_rate": 8.127433567459755e-06, + "loss": 0.2555, + "step": 222700 + }, + { + "epoch": 11.54, + "learning_rate": 8.104373101928046e-06, + "loss": 0.2473, + "step": 222800 + }, + { + "epoch": 11.54, + "learning_rate": 8.0813402881421e-06, + "loss": 0.2396, + "step": 222900 + }, + { + "epoch": 11.55, + "learning_rate": 8.058335155189803e-06, + "loss": 0.2593, + "step": 223000 + }, + { + "epoch": 11.55, + "learning_rate": 8.035357732124088e-06, + "loss": 0.2268, + "step": 223100 + }, + { + "epoch": 11.56, + "learning_rate": 8.012408047962883e-06, + "loss": 0.2451, + "step": 223200 + }, + { + "epoch": 11.56, + "learning_rate": 7.989486131689097e-06, + "loss": 0.2565, + "step": 223300 + }, + { + "epoch": 11.57, + "learning_rate": 7.966592012250557e-06, + "loss": 0.2213, + "step": 223400 + }, + { + "epoch": 11.57, + "learning_rate": 7.943725718559997e-06, + "loss": 0.2423, + "step": 223500 + }, + { + "epoch": 11.58, + "learning_rate": 7.920887279495023e-06, + "loss": 0.2418, + "step": 223600 + }, + { + "epoch": 11.58, + "learning_rate": 7.898076723898027e-06, + "loss": 0.2675, + "step": 223700 + }, + { + "epoch": 11.59, + "learning_rate": 7.875294080576216e-06, + "loss": 0.2394, + "step": 223800 + }, + { + "epoch": 11.59, + "learning_rate": 7.852539378301528e-06, + "loss": 0.2837, + "step": 223900 + }, + { + "epoch": 11.6, + "learning_rate": 7.829812645810654e-06, + "loss": 0.2402, + "step": 224000 + }, + { + "epoch": 11.6, + "learning_rate": 7.807113911804909e-06, + "loss": 0.2844, + "step": 224100 + }, + { + "epoch": 11.61, + "learning_rate": 7.78444320495027e-06, + "loss": 0.2573, + "step": 224200 + }, + { + "epoch": 11.61, + "learning_rate": 7.761800553877344e-06, + "loss": 0.2704, + "step": 224300 + }, + { + "epoch": 11.62, + "learning_rate": 7.739185987181283e-06, + "loss": 0.2575, + "step": 224400 + }, + { + "epoch": 11.62, + "learning_rate": 7.716599533421754e-06, + "loss": 0.2535, + "step": 224500 + }, + { + "epoch": 11.63, + "learning_rate": 7.694041221122947e-06, + "loss": 0.2395, + "step": 224600 + }, + { + "epoch": 11.63, + "learning_rate": 7.671736240662314e-06, + "loss": 0.2537, + "step": 224700 + }, + { + "epoch": 11.64, + "learning_rate": 7.649234014590572e-06, + "loss": 0.2477, + "step": 224800 + }, + { + "epoch": 11.65, + "learning_rate": 7.6267600150547335e-06, + "loss": 0.283, + "step": 224900 + }, + { + "epoch": 11.65, + "learning_rate": 7.604314270436946e-06, + "loss": 0.2581, + "step": 225000 + }, + { + "epoch": 11.66, + "learning_rate": 7.581896809083726e-06, + "loss": 0.2955, + "step": 225100 + }, + { + "epoch": 11.66, + "learning_rate": 7.5595076593058095e-06, + "loss": 0.2787, + "step": 225200 + }, + { + "epoch": 11.67, + "learning_rate": 7.537146849378217e-06, + "loss": 0.2479, + "step": 225300 + }, + { + "epoch": 11.67, + "learning_rate": 7.5148144075401545e-06, + "loss": 0.2581, + "step": 225400 + }, + { + "epoch": 11.68, + "learning_rate": 7.49251036199505e-06, + "loss": 0.2538, + "step": 225500 + }, + { + "epoch": 11.68, + "learning_rate": 7.4702347409104066e-06, + "loss": 0.2444, + "step": 225600 + }, + { + "epoch": 11.69, + "learning_rate": 7.4482099031701775e-06, + "loss": 0.2185, + "step": 225700 + }, + { + "epoch": 11.69, + "learning_rate": 7.425990930419618e-06, + "loss": 0.2238, + "step": 225800 + }, + { + "epoch": 11.7, + "learning_rate": 7.403800466136186e-06, + "loss": 0.2908, + "step": 225900 + }, + { + "epoch": 11.7, + "learning_rate": 7.381638538343976e-06, + "loss": 0.2673, + "step": 226000 + }, + { + "epoch": 11.71, + "learning_rate": 7.359505175031036e-06, + "loss": 0.2697, + "step": 226100 + }, + { + "epoch": 11.71, + "learning_rate": 7.337400404149354e-06, + "loss": 0.2572, + "step": 226200 + }, + { + "epoch": 11.72, + "learning_rate": 7.315324253614796e-06, + "loss": 0.2814, + "step": 226300 + }, + { + "epoch": 11.72, + "learning_rate": 7.2932767513070945e-06, + "loss": 0.2294, + "step": 226400 + }, + { + "epoch": 11.73, + "learning_rate": 7.271257925069781e-06, + "loss": 0.2272, + "step": 226500 + }, + { + "epoch": 11.73, + "learning_rate": 7.2492678027102186e-06, + "loss": 0.2418, + "step": 226600 + }, + { + "epoch": 11.74, + "learning_rate": 7.227306411999467e-06, + "loss": 0.2533, + "step": 226700 + }, + { + "epoch": 11.74, + "learning_rate": 7.205373780672326e-06, + "loss": 0.2619, + "step": 226800 + }, + { + "epoch": 11.75, + "learning_rate": 7.183469936427271e-06, + "loss": 0.301, + "step": 226900 + }, + { + "epoch": 11.75, + "learning_rate": 7.161594906926452e-06, + "loss": 0.2468, + "step": 227000 + }, + { + "epoch": 11.76, + "learning_rate": 7.139748719795572e-06, + "loss": 0.2682, + "step": 227100 + }, + { + "epoch": 11.76, + "learning_rate": 7.1179314026239425e-06, + "loss": 0.2376, + "step": 227200 + }, + { + "epoch": 11.77, + "learning_rate": 7.09614298296443e-06, + "loss": 0.2621, + "step": 227300 + }, + { + "epoch": 11.77, + "learning_rate": 7.074383488333379e-06, + "loss": 0.2643, + "step": 227400 + }, + { + "epoch": 11.78, + "learning_rate": 7.052652946210626e-06, + "loss": 0.2305, + "step": 227500 + }, + { + "epoch": 11.78, + "learning_rate": 7.030951384039405e-06, + "loss": 0.2726, + "step": 227600 + }, + { + "epoch": 11.79, + "learning_rate": 7.009278829226409e-06, + "loss": 0.259, + "step": 227700 + }, + { + "epoch": 11.8, + "learning_rate": 6.987635309141658e-06, + "loss": 0.2264, + "step": 227800 + }, + { + "epoch": 11.8, + "learning_rate": 6.966020851118511e-06, + "loss": 0.2432, + "step": 227900 + }, + { + "epoch": 11.81, + "learning_rate": 6.944435482453636e-06, + "loss": 0.2488, + "step": 228000 + }, + { + "epoch": 11.81, + "learning_rate": 6.922879230406951e-06, + "loss": 0.255, + "step": 228100 + }, + { + "epoch": 11.82, + "learning_rate": 6.901352122201613e-06, + "loss": 0.2249, + "step": 228200 + }, + { + "epoch": 11.82, + "learning_rate": 6.879854185023969e-06, + "loss": 0.2315, + "step": 228300 + }, + { + "epoch": 11.83, + "learning_rate": 6.858385446023523e-06, + "loss": 0.3001, + "step": 228400 + }, + { + "epoch": 11.83, + "learning_rate": 6.8369459323129125e-06, + "loss": 0.2821, + "step": 228500 + }, + { + "epoch": 11.84, + "learning_rate": 6.815535670967862e-06, + "loss": 0.231, + "step": 228600 + }, + { + "epoch": 11.84, + "learning_rate": 6.794154689027155e-06, + "loss": 0.2846, + "step": 228700 + }, + { + "epoch": 11.85, + "learning_rate": 6.7728030134925975e-06, + "loss": 0.2684, + "step": 228800 + }, + { + "epoch": 11.85, + "learning_rate": 6.751480671328985e-06, + "loss": 0.246, + "step": 228900 + }, + { + "epoch": 11.86, + "learning_rate": 6.730187689464066e-06, + "loss": 0.2754, + "step": 229000 + }, + { + "epoch": 11.86, + "learning_rate": 6.708924094788515e-06, + "loss": 0.2236, + "step": 229100 + }, + { + "epoch": 11.87, + "learning_rate": 6.687689914155891e-06, + "loss": 0.2472, + "step": 229200 + }, + { + "epoch": 11.87, + "learning_rate": 6.6664851743826084e-06, + "loss": 0.2579, + "step": 229300 + }, + { + "epoch": 11.88, + "learning_rate": 6.645309902247888e-06, + "loss": 0.2475, + "step": 229400 + }, + { + "epoch": 11.88, + "learning_rate": 6.6241641244937625e-06, + "loss": 0.2223, + "step": 229500 + }, + { + "epoch": 11.89, + "learning_rate": 6.603047867825006e-06, + "loss": 0.3127, + "step": 229600 + }, + { + "epoch": 11.89, + "learning_rate": 6.581961158909081e-06, + "loss": 0.2251, + "step": 229700 + }, + { + "epoch": 11.9, + "learning_rate": 6.561114449240968e-06, + "loss": 0.2524, + "step": 229800 + }, + { + "epoch": 11.9, + "learning_rate": 6.540086619542641e-06, + "loss": 0.2494, + "step": 229900 + }, + { + "epoch": 11.91, + "learning_rate": 6.519088417110225e-06, + "loss": 0.2206, + "step": 230000 + }, + { + "epoch": 11.91, + "learning_rate": 6.498119868462117e-06, + "loss": 0.2039, + "step": 230100 + }, + { + "epoch": 11.92, + "learning_rate": 6.4771810000792705e-06, + "loss": 0.226, + "step": 230200 + }, + { + "epoch": 11.92, + "learning_rate": 6.456271838405151e-06, + "loss": 0.2812, + "step": 230300 + }, + { + "epoch": 11.93, + "learning_rate": 6.435392409845708e-06, + "loss": 0.2378, + "step": 230400 + }, + { + "epoch": 11.93, + "learning_rate": 6.41454274076933e-06, + "loss": 0.2552, + "step": 230500 + }, + { + "epoch": 11.94, + "learning_rate": 6.393722857506854e-06, + "loss": 0.2308, + "step": 230600 + }, + { + "epoch": 11.95, + "learning_rate": 6.372932786351478e-06, + "loss": 0.2666, + "step": 230700 + }, + { + "epoch": 11.95, + "learning_rate": 6.352172553558742e-06, + "loss": 0.2604, + "step": 230800 + }, + { + "epoch": 11.96, + "learning_rate": 6.331442185346508e-06, + "loss": 0.2636, + "step": 230900 + }, + { + "epoch": 11.96, + "learning_rate": 6.310741707894954e-06, + "loss": 0.2349, + "step": 231000 + }, + { + "epoch": 11.97, + "learning_rate": 6.290071147346478e-06, + "loss": 0.2423, + "step": 231100 + }, + { + "epoch": 11.97, + "learning_rate": 6.269430529805682e-06, + "loss": 0.3277, + "step": 231200 + }, + { + "epoch": 11.98, + "learning_rate": 6.248819881339398e-06, + "loss": 0.263, + "step": 231300 + }, + { + "epoch": 11.98, + "learning_rate": 6.228239227976579e-06, + "loss": 0.2689, + "step": 231400 + }, + { + "epoch": 11.99, + "learning_rate": 6.207688595708309e-06, + "loss": 0.2696, + "step": 231500 + }, + { + "epoch": 11.99, + "learning_rate": 6.187168010487737e-06, + "loss": 0.2349, + "step": 231600 + }, + { + "epoch": 12.0, + "learning_rate": 6.166677498230108e-06, + "loss": 0.2666, + "step": 231700 + }, + { + "epoch": 12.0, + "eval_accuracy": 0.6238972943849022, + "eval_cer": 0.10657801243229763, + "eval_loss": 0.5999477505683899, + "eval_runtime": 3879.8418, + "eval_samples_per_second": 4.425, + "eval_steps_per_second": 0.277, + "eval_wer": 0.24282101052879243, + "step": 231756 + }, + { + "epoch": 12.0, + "learning_rate": 6.146217084812649e-06, + "loss": 0.2271, + "step": 231800 + }, + { + "epoch": 12.01, + "learning_rate": 6.125786796074597e-06, + "loss": 0.2502, + "step": 231900 + }, + { + "epoch": 12.01, + "learning_rate": 6.105590509870199e-06, + "loss": 0.2483, + "step": 232000 + }, + { + "epoch": 12.02, + "learning_rate": 6.0852202459666e-06, + "loss": 0.1985, + "step": 232100 + }, + { + "epoch": 12.02, + "learning_rate": 6.064880183774647e-06, + "loss": 0.2446, + "step": 232200 + }, + { + "epoch": 12.03, + "learning_rate": 6.044570348981567e-06, + "loss": 0.2481, + "step": 232300 + }, + { + "epoch": 12.03, + "learning_rate": 6.024290767236425e-06, + "loss": 0.2124, + "step": 232400 + }, + { + "epoch": 12.04, + "learning_rate": 6.0040414641500986e-06, + "loss": 0.2878, + "step": 232500 + }, + { + "epoch": 12.04, + "learning_rate": 5.983822465295207e-06, + "loss": 0.2494, + "step": 232600 + }, + { + "epoch": 12.05, + "learning_rate": 5.963633796206077e-06, + "loss": 0.2455, + "step": 232700 + }, + { + "epoch": 12.05, + "learning_rate": 5.943475482378782e-06, + "loss": 0.2168, + "step": 232800 + }, + { + "epoch": 12.06, + "learning_rate": 5.9233475492710295e-06, + "loss": 0.23, + "step": 232900 + }, + { + "epoch": 12.06, + "learning_rate": 5.903250022302165e-06, + "loss": 0.1967, + "step": 233000 + }, + { + "epoch": 12.07, + "learning_rate": 5.883182926853114e-06, + "loss": 0.2243, + "step": 233100 + }, + { + "epoch": 12.07, + "learning_rate": 5.863146288266411e-06, + "loss": 0.2265, + "step": 233200 + }, + { + "epoch": 12.08, + "learning_rate": 5.843140131846103e-06, + "loss": 0.257, + "step": 233300 + }, + { + "epoch": 12.09, + "learning_rate": 5.823164482857742e-06, + "loss": 0.2727, + "step": 233400 + }, + { + "epoch": 12.09, + "learning_rate": 5.803219366528353e-06, + "loss": 0.2121, + "step": 233500 + }, + { + "epoch": 12.1, + "learning_rate": 5.783304808046405e-06, + "loss": 0.2697, + "step": 233600 + }, + { + "epoch": 12.1, + "learning_rate": 5.763420832561773e-06, + "loss": 0.2609, + "step": 233700 + }, + { + "epoch": 12.11, + "learning_rate": 5.743567465185715e-06, + "loss": 0.201, + "step": 233800 + }, + { + "epoch": 12.11, + "learning_rate": 5.723744730990822e-06, + "loss": 0.239, + "step": 233900 + }, + { + "epoch": 12.12, + "learning_rate": 5.703952655011012e-06, + "loss": 0.231, + "step": 234000 + }, + { + "epoch": 12.12, + "learning_rate": 5.6841912622414785e-06, + "loss": 0.2141, + "step": 234100 + }, + { + "epoch": 12.13, + "learning_rate": 5.6644605776386605e-06, + "loss": 0.1999, + "step": 234200 + }, + { + "epoch": 12.13, + "learning_rate": 5.64476062612024e-06, + "loss": 0.2442, + "step": 234300 + }, + { + "epoch": 12.14, + "learning_rate": 5.62509143256505e-06, + "loss": 0.2318, + "step": 234400 + }, + { + "epoch": 12.14, + "learning_rate": 5.605453021813105e-06, + "loss": 0.2162, + "step": 234500 + }, + { + "epoch": 12.15, + "learning_rate": 5.585845418665528e-06, + "loss": 0.2591, + "step": 234600 + }, + { + "epoch": 12.15, + "learning_rate": 5.5664642628909475e-06, + "loss": 0.2173, + "step": 234700 + }, + { + "epoch": 12.16, + "learning_rate": 5.54691804050672e-06, + "loss": 0.217, + "step": 234800 + }, + { + "epoch": 12.16, + "learning_rate": 5.527402699650054e-06, + "loss": 0.2407, + "step": 234900 + }, + { + "epoch": 12.17, + "learning_rate": 5.507918264966651e-06, + "loss": 0.2257, + "step": 235000 + }, + { + "epoch": 12.17, + "learning_rate": 5.488464761063197e-06, + "loss": 0.2153, + "step": 235100 + }, + { + "epoch": 12.18, + "learning_rate": 5.469042212507304e-06, + "loss": 0.2329, + "step": 235200 + }, + { + "epoch": 12.18, + "learning_rate": 5.449650643827495e-06, + "loss": 0.2641, + "step": 235300 + }, + { + "epoch": 12.19, + "learning_rate": 5.430483531604381e-06, + "loss": 0.2711, + "step": 235400 + }, + { + "epoch": 12.19, + "learning_rate": 5.411153685696722e-06, + "loss": 0.2406, + "step": 235500 + }, + { + "epoch": 12.2, + "learning_rate": 5.391854892771936e-06, + "loss": 0.2288, + "step": 235600 + }, + { + "epoch": 12.2, + "learning_rate": 5.372587177202232e-06, + "loss": 0.2598, + "step": 235700 + }, + { + "epoch": 12.21, + "learning_rate": 5.3533505633206195e-06, + "loss": 0.2185, + "step": 235800 + }, + { + "epoch": 12.21, + "learning_rate": 5.334145075420799e-06, + "loss": 0.2253, + "step": 235900 + }, + { + "epoch": 12.22, + "learning_rate": 5.314970737757169e-06, + "loss": 0.2276, + "step": 236000 + }, + { + "epoch": 12.22, + "learning_rate": 5.295827574544789e-06, + "loss": 0.244, + "step": 236100 + }, + { + "epoch": 12.23, + "learning_rate": 5.276715609959352e-06, + "loss": 0.2316, + "step": 236200 + }, + { + "epoch": 12.24, + "learning_rate": 5.257634868137139e-06, + "loss": 0.2538, + "step": 236300 + }, + { + "epoch": 12.24, + "learning_rate": 5.238585373175015e-06, + "loss": 0.2449, + "step": 236400 + }, + { + "epoch": 12.25, + "learning_rate": 5.219567149130378e-06, + "loss": 0.17, + "step": 236500 + }, + { + "epoch": 12.25, + "learning_rate": 5.20058022002113e-06, + "loss": 0.2299, + "step": 236600 + }, + { + "epoch": 12.26, + "learning_rate": 5.181624609825657e-06, + "loss": 0.1946, + "step": 236700 + }, + { + "epoch": 12.26, + "learning_rate": 5.1627003424827845e-06, + "loss": 0.1867, + "step": 236800 + }, + { + "epoch": 12.27, + "learning_rate": 5.143807441891768e-06, + "loss": 0.2366, + "step": 236900 + }, + { + "epoch": 12.27, + "learning_rate": 5.1249459319122415e-06, + "loss": 0.2874, + "step": 237000 + }, + { + "epoch": 12.28, + "learning_rate": 5.106115836364195e-06, + "loss": 0.1966, + "step": 237100 + }, + { + "epoch": 12.28, + "learning_rate": 5.087317179027945e-06, + "loss": 0.2441, + "step": 237200 + }, + { + "epoch": 12.29, + "learning_rate": 5.068549983644125e-06, + "loss": 0.2245, + "step": 237300 + }, + { + "epoch": 12.29, + "learning_rate": 5.049814273913603e-06, + "loss": 0.206, + "step": 237400 + }, + { + "epoch": 12.3, + "learning_rate": 5.031110073497506e-06, + "loss": 0.2095, + "step": 237500 + }, + { + "epoch": 12.3, + "learning_rate": 5.012437406017154e-06, + "loss": 0.2532, + "step": 237600 + }, + { + "epoch": 12.31, + "learning_rate": 4.993796295054078e-06, + "loss": 0.1885, + "step": 237700 + }, + { + "epoch": 12.31, + "learning_rate": 4.975186764149904e-06, + "loss": 0.1967, + "step": 237800 + }, + { + "epoch": 12.32, + "learning_rate": 4.9566088368064046e-06, + "loss": 0.2278, + "step": 237900 + }, + { + "epoch": 12.32, + "learning_rate": 4.938062536485459e-06, + "loss": 0.2271, + "step": 238000 + }, + { + "epoch": 12.33, + "learning_rate": 4.919732876361232e-06, + "loss": 0.2435, + "step": 238100 + }, + { + "epoch": 12.33, + "learning_rate": 4.901249583457285e-06, + "loss": 0.1926, + "step": 238200 + }, + { + "epoch": 12.34, + "learning_rate": 4.882797987488467e-06, + "loss": 0.1929, + "step": 238300 + }, + { + "epoch": 12.34, + "learning_rate": 4.864378111757099e-06, + "loss": 0.2217, + "step": 238400 + }, + { + "epoch": 12.35, + "learning_rate": 4.8459899795254425e-06, + "loss": 0.2276, + "step": 238500 + }, + { + "epoch": 12.35, + "learning_rate": 4.827633614015663e-06, + "loss": 0.2688, + "step": 238600 + }, + { + "epoch": 12.36, + "learning_rate": 4.809309038409806e-06, + "loss": 0.2357, + "step": 238700 + }, + { + "epoch": 12.36, + "learning_rate": 4.791016275849797e-06, + "loss": 0.246, + "step": 238800 + }, + { + "epoch": 12.37, + "learning_rate": 4.772755349437345e-06, + "loss": 0.2571, + "step": 238900 + }, + { + "epoch": 12.38, + "learning_rate": 4.754526282233975e-06, + "loss": 0.2434, + "step": 239000 + }, + { + "epoch": 12.38, + "learning_rate": 4.736329097260974e-06, + "loss": 0.201, + "step": 239100 + }, + { + "epoch": 12.39, + "learning_rate": 4.718163817499382e-06, + "loss": 0.2916, + "step": 239200 + }, + { + "epoch": 12.39, + "learning_rate": 4.700030465889913e-06, + "loss": 0.2519, + "step": 239300 + }, + { + "epoch": 12.4, + "learning_rate": 4.681929065332974e-06, + "loss": 0.2057, + "step": 239400 + }, + { + "epoch": 12.4, + "learning_rate": 4.663859638688643e-06, + "loss": 0.2554, + "step": 239500 + }, + { + "epoch": 12.41, + "learning_rate": 4.645822208776584e-06, + "loss": 0.2243, + "step": 239600 + }, + { + "epoch": 12.41, + "learning_rate": 4.6278167983760785e-06, + "loss": 0.2449, + "step": 239700 + }, + { + "epoch": 12.42, + "learning_rate": 4.6098434302259525e-06, + "loss": 0.3108, + "step": 239800 + }, + { + "epoch": 12.42, + "learning_rate": 4.59190212702458e-06, + "loss": 0.2199, + "step": 239900 + }, + { + "epoch": 12.43, + "learning_rate": 4.573992911429832e-06, + "loss": 0.2357, + "step": 240000 + }, + { + "epoch": 12.43, + "learning_rate": 4.556115806059057e-06, + "loss": 0.2459, + "step": 240100 + }, + { + "epoch": 12.44, + "learning_rate": 4.538270833489062e-06, + "loss": 0.1773, + "step": 240200 + }, + { + "epoch": 12.44, + "learning_rate": 4.5204580162560576e-06, + "loss": 0.2448, + "step": 240300 + }, + { + "epoch": 12.45, + "learning_rate": 4.502677376855661e-06, + "loss": 0.2214, + "step": 240400 + }, + { + "epoch": 12.45, + "learning_rate": 4.4849289377428406e-06, + "loss": 0.2503, + "step": 240500 + }, + { + "epoch": 12.46, + "learning_rate": 4.4672127213319065e-06, + "loss": 0.1976, + "step": 240600 + }, + { + "epoch": 12.46, + "learning_rate": 4.449528749996476e-06, + "loss": 0.2059, + "step": 240700 + }, + { + "epoch": 12.47, + "learning_rate": 4.4318770460694345e-06, + "loss": 0.2481, + "step": 240800 + }, + { + "epoch": 12.47, + "learning_rate": 4.414257631842933e-06, + "loss": 0.1832, + "step": 240900 + }, + { + "epoch": 12.48, + "learning_rate": 4.3966705295683285e-06, + "loss": 0.2247, + "step": 241000 + }, + { + "epoch": 12.48, + "learning_rate": 4.379115761456178e-06, + "loss": 0.227, + "step": 241100 + }, + { + "epoch": 12.49, + "learning_rate": 4.361593349676205e-06, + "loss": 0.2111, + "step": 241200 + }, + { + "epoch": 12.49, + "learning_rate": 4.344103316357284e-06, + "loss": 0.215, + "step": 241300 + }, + { + "epoch": 12.5, + "learning_rate": 4.3266456835873665e-06, + "loss": 0.2162, + "step": 241400 + }, + { + "epoch": 12.5, + "learning_rate": 4.309220473413511e-06, + "loss": 0.2069, + "step": 241500 + }, + { + "epoch": 12.51, + "learning_rate": 4.29182770784182e-06, + "loss": 0.1974, + "step": 241600 + }, + { + "epoch": 12.51, + "learning_rate": 4.274467408837433e-06, + "loss": 0.2117, + "step": 241700 + }, + { + "epoch": 12.52, + "learning_rate": 4.257139598324484e-06, + "loss": 0.2173, + "step": 241800 + }, + { + "epoch": 12.53, + "learning_rate": 4.2400170901893364e-06, + "loss": 0.246, + "step": 241900 + }, + { + "epoch": 12.53, + "learning_rate": 4.222753996837338e-06, + "loss": 0.2541, + "step": 242000 + }, + { + "epoch": 12.54, + "learning_rate": 4.205523457285068e-06, + "loss": 0.2312, + "step": 242100 + }, + { + "epoch": 12.54, + "learning_rate": 4.188325493292787e-06, + "loss": 0.2094, + "step": 242200 + }, + { + "epoch": 12.55, + "learning_rate": 4.17116012657961e-06, + "loss": 0.2289, + "step": 242300 + }, + { + "epoch": 12.55, + "learning_rate": 4.1540273788234875e-06, + "loss": 0.2394, + "step": 242400 + }, + { + "epoch": 12.56, + "learning_rate": 4.136927271661186e-06, + "loss": 0.1952, + "step": 242500 + }, + { + "epoch": 12.56, + "learning_rate": 4.1198598266882345e-06, + "loss": 0.1871, + "step": 242600 + }, + { + "epoch": 12.57, + "learning_rate": 4.102825065458919e-06, + "loss": 0.2595, + "step": 242700 + }, + { + "epoch": 12.57, + "learning_rate": 4.0858230094862645e-06, + "loss": 0.2175, + "step": 242800 + }, + { + "epoch": 12.58, + "learning_rate": 4.068853680241975e-06, + "loss": 0.1934, + "step": 242900 + }, + { + "epoch": 12.58, + "learning_rate": 4.051917099156424e-06, + "loss": 0.247, + "step": 243000 + }, + { + "epoch": 12.59, + "learning_rate": 4.0350132876186245e-06, + "loss": 0.1963, + "step": 243100 + }, + { + "epoch": 12.59, + "learning_rate": 4.018142266976234e-06, + "loss": 0.185, + "step": 243200 + }, + { + "epoch": 12.6, + "learning_rate": 4.001304058535476e-06, + "loss": 0.2135, + "step": 243300 + }, + { + "epoch": 12.6, + "learning_rate": 3.984498683561116e-06, + "loss": 0.2037, + "step": 243400 + }, + { + "epoch": 12.61, + "learning_rate": 3.9677261632765e-06, + "loss": 0.2335, + "step": 243500 + }, + { + "epoch": 12.61, + "learning_rate": 3.9509865188634505e-06, + "loss": 0.2378, + "step": 243600 + }, + { + "epoch": 12.62, + "learning_rate": 3.934446676026776e-06, + "loss": 0.221, + "step": 243700 + }, + { + "epoch": 12.62, + "learning_rate": 3.917772517450844e-06, + "loss": 0.2195, + "step": 243800 + }, + { + "epoch": 12.63, + "learning_rate": 3.90113129783238e-06, + "loss": 0.2212, + "step": 243900 + }, + { + "epoch": 12.63, + "learning_rate": 3.884523038187417e-06, + "loss": 0.2332, + "step": 244000 + }, + { + "epoch": 12.64, + "learning_rate": 3.867947759490325e-06, + "loss": 0.241, + "step": 244100 + }, + { + "epoch": 12.64, + "learning_rate": 3.8514054826738396e-06, + "loss": 0.2467, + "step": 244200 + }, + { + "epoch": 12.65, + "learning_rate": 3.834896228629031e-06, + "loss": 0.215, + "step": 244300 + }, + { + "epoch": 12.65, + "learning_rate": 3.818420018205256e-06, + "loss": 0.2497, + "step": 244400 + }, + { + "epoch": 12.66, + "learning_rate": 3.801976872210128e-06, + "loss": 0.2113, + "step": 244500 + }, + { + "epoch": 12.67, + "learning_rate": 3.7855668114095076e-06, + "loss": 0.2122, + "step": 244600 + }, + { + "epoch": 12.67, + "learning_rate": 3.7691898565275007e-06, + "loss": 0.2222, + "step": 244700 + }, + { + "epoch": 12.68, + "learning_rate": 3.7528460282463794e-06, + "loss": 0.2258, + "step": 244800 + }, + { + "epoch": 12.68, + "learning_rate": 3.7365353472065665e-06, + "loss": 0.2086, + "step": 244900 + }, + { + "epoch": 12.69, + "learning_rate": 3.720257834006655e-06, + "loss": 0.2292, + "step": 245000 + }, + { + "epoch": 12.69, + "learning_rate": 3.7040135092033377e-06, + "loss": 0.2091, + "step": 245100 + }, + { + "epoch": 12.7, + "learning_rate": 3.687802393311398e-06, + "loss": 0.2069, + "step": 245200 + }, + { + "epoch": 12.7, + "learning_rate": 3.6716245068036525e-06, + "loss": 0.2037, + "step": 245300 + }, + { + "epoch": 12.71, + "learning_rate": 3.655479870110998e-06, + "loss": 0.1932, + "step": 245400 + }, + { + "epoch": 12.71, + "learning_rate": 3.6393685036223088e-06, + "loss": 0.2463, + "step": 245500 + }, + { + "epoch": 12.72, + "learning_rate": 3.6232904276844558e-06, + "loss": 0.2355, + "step": 245600 + }, + { + "epoch": 12.72, + "learning_rate": 3.607245662602263e-06, + "loss": 0.257, + "step": 245700 + }, + { + "epoch": 12.73, + "learning_rate": 3.591234228638486e-06, + "loss": 0.2577, + "step": 245800 + }, + { + "epoch": 12.73, + "learning_rate": 3.575256146013789e-06, + "loss": 0.249, + "step": 245900 + }, + { + "epoch": 12.74, + "learning_rate": 3.5593114349067146e-06, + "loss": 0.2327, + "step": 246000 + }, + { + "epoch": 12.74, + "learning_rate": 3.5434001154536657e-06, + "loss": 0.25, + "step": 246100 + }, + { + "epoch": 12.75, + "learning_rate": 3.5275222077488676e-06, + "loss": 0.2247, + "step": 246200 + }, + { + "epoch": 12.75, + "learning_rate": 3.5116777318443584e-06, + "loss": 0.186, + "step": 246300 + }, + { + "epoch": 12.76, + "learning_rate": 3.495866707749947e-06, + "loss": 0.2277, + "step": 246400 + }, + { + "epoch": 12.76, + "learning_rate": 3.480089155433216e-06, + "loss": 0.2546, + "step": 246500 + }, + { + "epoch": 12.77, + "learning_rate": 3.464345094819449e-06, + "loss": 0.2027, + "step": 246600 + }, + { + "epoch": 12.77, + "learning_rate": 3.4486345457916414e-06, + "loss": 0.2076, + "step": 246700 + }, + { + "epoch": 12.78, + "learning_rate": 3.4329575281904855e-06, + "loss": 0.2062, + "step": 246800 + }, + { + "epoch": 12.78, + "learning_rate": 3.417314061814315e-06, + "loss": 0.2068, + "step": 246900 + }, + { + "epoch": 12.79, + "learning_rate": 3.4017041664190793e-06, + "loss": 0.236, + "step": 247000 + }, + { + "epoch": 12.79, + "learning_rate": 3.3861278617183435e-06, + "loss": 0.208, + "step": 247100 + }, + { + "epoch": 12.8, + "learning_rate": 3.370585167383261e-06, + "loss": 0.2023, + "step": 247200 + }, + { + "epoch": 12.8, + "learning_rate": 3.3550761030425313e-06, + "loss": 0.208, + "step": 247300 + }, + { + "epoch": 12.81, + "learning_rate": 3.3396006882823636e-06, + "loss": 0.2157, + "step": 247400 + }, + { + "epoch": 12.82, + "learning_rate": 3.3241589426465015e-06, + "loss": 0.2134, + "step": 247500 + }, + { + "epoch": 12.82, + "learning_rate": 3.308750885636155e-06, + "loss": 0.2138, + "step": 247600 + }, + { + "epoch": 12.83, + "learning_rate": 3.293376536709992e-06, + "loss": 0.2644, + "step": 247700 + }, + { + "epoch": 12.83, + "learning_rate": 3.278035915284092e-06, + "loss": 0.2456, + "step": 247800 + }, + { + "epoch": 12.84, + "learning_rate": 3.262729040731971e-06, + "loss": 0.23, + "step": 247900 + }, + { + "epoch": 12.84, + "learning_rate": 3.247455932384512e-06, + "loss": 0.2436, + "step": 248000 + }, + { + "epoch": 12.85, + "learning_rate": 3.232216609529953e-06, + "loss": 0.2003, + "step": 248100 + }, + { + "epoch": 12.85, + "learning_rate": 3.217011091413863e-06, + "loss": 0.2682, + "step": 248200 + }, + { + "epoch": 12.86, + "learning_rate": 3.201839397239127e-06, + "loss": 0.1738, + "step": 248300 + }, + { + "epoch": 12.86, + "learning_rate": 3.186701546165909e-06, + "loss": 0.22, + "step": 248400 + }, + { + "epoch": 12.87, + "learning_rate": 3.171597557311633e-06, + "loss": 0.2403, + "step": 248500 + }, + { + "epoch": 12.87, + "learning_rate": 3.1565274497509643e-06, + "loss": 0.2024, + "step": 248600 + }, + { + "epoch": 12.88, + "learning_rate": 3.141491242515773e-06, + "loss": 0.2273, + "step": 248700 + }, + { + "epoch": 12.88, + "learning_rate": 3.1264889545951148e-06, + "loss": 0.2268, + "step": 248800 + }, + { + "epoch": 12.89, + "learning_rate": 3.111520604935215e-06, + "loss": 0.2191, + "step": 248900 + }, + { + "epoch": 12.89, + "learning_rate": 3.0965862124394526e-06, + "loss": 0.1795, + "step": 249000 + }, + { + "epoch": 12.9, + "learning_rate": 3.0816857959682877e-06, + "loss": 0.1815, + "step": 249100 + }, + { + "epoch": 12.9, + "learning_rate": 3.0668193743393004e-06, + "loss": 0.2217, + "step": 249200 + }, + { + "epoch": 12.91, + "learning_rate": 3.0519869663271225e-06, + "loss": 0.2072, + "step": 249300 + }, + { + "epoch": 12.91, + "learning_rate": 3.037188590663458e-06, + "loss": 0.201, + "step": 249400 + }, + { + "epoch": 12.92, + "learning_rate": 3.0224242660369927e-06, + "loss": 0.2279, + "step": 249500 + }, + { + "epoch": 12.92, + "learning_rate": 3.0076940110934324e-06, + "loss": 0.2043, + "step": 249600 + }, + { + "epoch": 12.93, + "learning_rate": 2.9929978444354632e-06, + "loss": 0.2019, + "step": 249700 + }, + { + "epoch": 12.93, + "learning_rate": 2.9783357846227087e-06, + "loss": 0.1932, + "step": 249800 + }, + { + "epoch": 12.94, + "learning_rate": 2.9637078501717173e-06, + "loss": 0.2277, + "step": 249900 + }, + { + "epoch": 12.94, + "learning_rate": 2.949114059555945e-06, + "loss": 0.196, + "step": 250000 + }, + { + "epoch": 12.95, + "learning_rate": 2.934554431205736e-06, + "loss": 0.2446, + "step": 250100 + }, + { + "epoch": 12.96, + "learning_rate": 2.920028983508288e-06, + "loss": 0.2238, + "step": 250200 + }, + { + "epoch": 12.96, + "learning_rate": 2.905537734807612e-06, + "loss": 0.2225, + "step": 250300 + }, + { + "epoch": 12.97, + "learning_rate": 2.8910807034045604e-06, + "loss": 0.2603, + "step": 250400 + }, + { + "epoch": 12.97, + "learning_rate": 2.8766579075567533e-06, + "loss": 0.2387, + "step": 250500 + }, + { + "epoch": 12.98, + "learning_rate": 2.8622693654785904e-06, + "loss": 0.2337, + "step": 250600 + }, + { + "epoch": 12.98, + "learning_rate": 2.8479150953411824e-06, + "loss": 0.2107, + "step": 250700 + }, + { + "epoch": 12.99, + "learning_rate": 2.833595115272396e-06, + "loss": 0.2049, + "step": 250800 + }, + { + "epoch": 12.99, + "learning_rate": 2.819309443356771e-06, + "loss": 0.1853, + "step": 250900 + }, + { + "epoch": 13.0, + "learning_rate": 2.8050580976355233e-06, + "loss": 0.2546, + "step": 251000 + }, + { + "epoch": 13.0, + "eval_accuracy": 0.6238590691985089, + "eval_cer": 0.10245587287246308, + "eval_loss": 0.5943225622177124, + "eval_runtime": 3891.4893, + "eval_samples_per_second": 4.412, + "eval_steps_per_second": 0.276, + "eval_wer": 0.23677430739368271, + "step": 251069 + }, + { + "epoch": 13.0, + "learning_rate": 2.7908410961065254e-06, + "loss": 0.1901, + "step": 251100 + }, + { + "epoch": 13.01, + "learning_rate": 2.7766584567242658e-06, + "loss": 0.2272, + "step": 251200 + }, + { + "epoch": 13.01, + "learning_rate": 2.7625101973998434e-06, + "loss": 0.2346, + "step": 251300 + }, + { + "epoch": 13.02, + "learning_rate": 2.7483963360009458e-06, + "loss": 0.2241, + "step": 251400 + }, + { + "epoch": 13.02, + "learning_rate": 2.7343168903518044e-06, + "loss": 0.243, + "step": 251500 + }, + { + "epoch": 13.03, + "learning_rate": 2.7202718782332037e-06, + "loss": 0.2267, + "step": 251600 + }, + { + "epoch": 13.03, + "learning_rate": 2.706261317382428e-06, + "loss": 0.1972, + "step": 251700 + }, + { + "epoch": 13.04, + "learning_rate": 2.6922852254932575e-06, + "loss": 0.2277, + "step": 251800 + }, + { + "epoch": 13.04, + "learning_rate": 2.6783436202159596e-06, + "loss": 0.1726, + "step": 251900 + }, + { + "epoch": 13.05, + "learning_rate": 2.6644365191572206e-06, + "loss": 0.1883, + "step": 252000 + }, + { + "epoch": 13.05, + "learning_rate": 2.6505639398801683e-06, + "loss": 0.1965, + "step": 252100 + }, + { + "epoch": 13.06, + "learning_rate": 2.6367258999043255e-06, + "loss": 0.2154, + "step": 252200 + }, + { + "epoch": 13.06, + "learning_rate": 2.6230602804242765e-06, + "loss": 0.2194, + "step": 252300 + }, + { + "epoch": 13.07, + "learning_rate": 2.6092910256067095e-06, + "loss": 0.2131, + "step": 252400 + }, + { + "epoch": 13.07, + "learning_rate": 2.595556362213467e-06, + "loss": 0.2395, + "step": 252500 + }, + { + "epoch": 13.08, + "learning_rate": 2.581856307589898e-06, + "loss": 0.216, + "step": 252600 + }, + { + "epoch": 13.08, + "learning_rate": 2.5681908790376594e-06, + "loss": 0.2232, + "step": 252700 + }, + { + "epoch": 13.09, + "learning_rate": 2.5545600938146628e-06, + "loss": 0.2044, + "step": 252800 + }, + { + "epoch": 13.09, + "learning_rate": 2.5409639691350784e-06, + "loss": 0.2019, + "step": 252900 + }, + { + "epoch": 13.1, + "learning_rate": 2.5274025221693043e-06, + "loss": 0.1565, + "step": 253000 + }, + { + "epoch": 13.11, + "learning_rate": 2.514010865769604e-06, + "loss": 0.1796, + "step": 253100 + }, + { + "epoch": 13.11, + "learning_rate": 2.500518478363787e-06, + "loss": 0.227, + "step": 253200 + }, + { + "epoch": 13.12, + "learning_rate": 2.4870608197499458e-06, + "loss": 0.2244, + "step": 253300 + }, + { + "epoch": 13.12, + "learning_rate": 2.4736379069236047e-06, + "loss": 0.206, + "step": 253400 + }, + { + "epoch": 13.13, + "learning_rate": 2.4602497568364178e-06, + "loss": 0.2234, + "step": 253500 + }, + { + "epoch": 13.13, + "learning_rate": 2.4468963863961235e-06, + "loss": 0.2469, + "step": 253600 + }, + { + "epoch": 13.14, + "learning_rate": 2.433577812466552e-06, + "loss": 0.2079, + "step": 253700 + }, + { + "epoch": 13.14, + "learning_rate": 2.4202940518675854e-06, + "loss": 0.1648, + "step": 253800 + }, + { + "epoch": 13.15, + "learning_rate": 2.4070451213751345e-06, + "loss": 0.2031, + "step": 253900 + }, + { + "epoch": 13.15, + "learning_rate": 2.3938310377211246e-06, + "loss": 0.2399, + "step": 254000 + }, + { + "epoch": 13.16, + "learning_rate": 2.3806518175934846e-06, + "loss": 0.2116, + "step": 254100 + }, + { + "epoch": 13.16, + "learning_rate": 2.3675074776360994e-06, + "loss": 0.2334, + "step": 254200 + }, + { + "epoch": 13.17, + "learning_rate": 2.354398034448815e-06, + "loss": 0.1876, + "step": 254300 + }, + { + "epoch": 13.17, + "learning_rate": 2.341323504587397e-06, + "loss": 0.1919, + "step": 254400 + }, + { + "epoch": 13.18, + "learning_rate": 2.3282839045635385e-06, + "loss": 0.2057, + "step": 254500 + }, + { + "epoch": 13.18, + "learning_rate": 2.3152792508447896e-06, + "loss": 0.2304, + "step": 254600 + }, + { + "epoch": 13.19, + "learning_rate": 2.3023095598545927e-06, + "loss": 0.1968, + "step": 254700 + }, + { + "epoch": 13.19, + "learning_rate": 2.289374847972223e-06, + "loss": 0.1984, + "step": 254800 + }, + { + "epoch": 13.2, + "learning_rate": 2.276475131532797e-06, + "loss": 0.1979, + "step": 254900 + }, + { + "epoch": 13.2, + "learning_rate": 2.263610426827213e-06, + "loss": 0.1996, + "step": 255000 + }, + { + "epoch": 13.21, + "learning_rate": 2.2507807501021614e-06, + "loss": 0.1607, + "step": 255100 + }, + { + "epoch": 13.21, + "learning_rate": 2.2379861175601123e-06, + "loss": 0.194, + "step": 255200 + }, + { + "epoch": 13.22, + "learning_rate": 2.22522654535926e-06, + "loss": 0.2109, + "step": 255300 + }, + { + "epoch": 13.22, + "learning_rate": 2.212502049613532e-06, + "loss": 0.2232, + "step": 255400 + }, + { + "epoch": 13.23, + "learning_rate": 2.1998126463925392e-06, + "loss": 0.2082, + "step": 255500 + }, + { + "epoch": 13.23, + "learning_rate": 2.187158351721601e-06, + "loss": 0.2148, + "step": 255600 + }, + { + "epoch": 13.24, + "learning_rate": 2.174539181581686e-06, + "loss": 0.2345, + "step": 255700 + }, + { + "epoch": 13.24, + "learning_rate": 2.161955151909407e-06, + "loss": 0.2133, + "step": 255800 + }, + { + "epoch": 13.25, + "learning_rate": 2.1494062785969882e-06, + "loss": 0.2452, + "step": 255900 + }, + { + "epoch": 13.26, + "learning_rate": 2.1368925774922688e-06, + "loss": 0.2269, + "step": 256000 + }, + { + "epoch": 13.26, + "learning_rate": 2.1244140643986642e-06, + "loss": 0.245, + "step": 256100 + }, + { + "epoch": 13.27, + "learning_rate": 2.111970755075149e-06, + "loss": 0.1928, + "step": 256200 + }, + { + "epoch": 13.27, + "learning_rate": 2.0995626652362453e-06, + "loss": 0.2141, + "step": 256300 + }, + { + "epoch": 13.28, + "learning_rate": 2.087313364633465e-06, + "loss": 0.2157, + "step": 256400 + }, + { + "epoch": 13.28, + "learning_rate": 2.0749754081443994e-06, + "loss": 0.1806, + "step": 256500 + }, + { + "epoch": 13.29, + "learning_rate": 2.0626727178609495e-06, + "loss": 0.2415, + "step": 256600 + }, + { + "epoch": 13.29, + "learning_rate": 2.0505278087099387e-06, + "loss": 0.1997, + "step": 256700 + }, + { + "epoch": 13.3, + "learning_rate": 2.0382953443550877e-06, + "loss": 0.2335, + "step": 256800 + }, + { + "epoch": 13.3, + "learning_rate": 2.026098192528708e-06, + "loss": 0.2069, + "step": 256900 + }, + { + "epoch": 13.31, + "learning_rate": 2.0139363686344515e-06, + "loss": 0.2589, + "step": 257000 + }, + { + "epoch": 13.31, + "learning_rate": 2.0018098880313486e-06, + "loss": 0.1888, + "step": 257100 + }, + { + "epoch": 13.32, + "learning_rate": 1.989718766033799e-06, + "loss": 0.2144, + "step": 257200 + }, + { + "epoch": 13.32, + "learning_rate": 1.9776630179115452e-06, + "loss": 0.271, + "step": 257300 + }, + { + "epoch": 13.33, + "learning_rate": 1.9656426588896546e-06, + "loss": 0.2044, + "step": 257400 + }, + { + "epoch": 13.33, + "learning_rate": 1.953657704148515e-06, + "loss": 0.203, + "step": 257500 + }, + { + "epoch": 13.34, + "learning_rate": 1.941708168823798e-06, + "loss": 0.2069, + "step": 257600 + }, + { + "epoch": 13.34, + "learning_rate": 1.9297940680064262e-06, + "loss": 0.2128, + "step": 257700 + }, + { + "epoch": 13.35, + "learning_rate": 1.917915416742584e-06, + "loss": 0.2205, + "step": 257800 + }, + { + "epoch": 13.35, + "learning_rate": 1.9060722300337074e-06, + "loss": 0.1819, + "step": 257900 + }, + { + "epoch": 13.36, + "learning_rate": 1.8942645228364163e-06, + "loss": 0.1558, + "step": 258000 + }, + { + "epoch": 13.36, + "learning_rate": 1.8824923100625257e-06, + "loss": 0.1759, + "step": 258100 + }, + { + "epoch": 13.37, + "learning_rate": 1.8707556065790466e-06, + "loss": 0.1813, + "step": 258200 + }, + { + "epoch": 13.37, + "learning_rate": 1.8590544272081256e-06, + "loss": 0.1885, + "step": 258300 + }, + { + "epoch": 13.38, + "learning_rate": 1.8473887867270588e-06, + "loss": 0.2448, + "step": 258400 + }, + { + "epoch": 13.38, + "learning_rate": 1.8357586998682419e-06, + "loss": 0.1618, + "step": 258500 + }, + { + "epoch": 13.39, + "learning_rate": 1.8241641813191955e-06, + "loss": 0.2219, + "step": 258600 + }, + { + "epoch": 13.4, + "learning_rate": 1.812720658894893e-06, + "loss": 0.2087, + "step": 258700 + }, + { + "epoch": 13.4, + "learning_rate": 1.8011969648006043e-06, + "loss": 0.1823, + "step": 258800 + }, + { + "epoch": 13.41, + "learning_rate": 1.7897088826637088e-06, + "loss": 0.2372, + "step": 258900 + }, + { + "epoch": 13.41, + "learning_rate": 1.778256426992394e-06, + "loss": 0.213, + "step": 259000 + }, + { + "epoch": 13.42, + "learning_rate": 1.7668396122498344e-06, + "loss": 0.1751, + "step": 259100 + }, + { + "epoch": 13.42, + "learning_rate": 1.7554584528541927e-06, + "loss": 0.2055, + "step": 259200 + }, + { + "epoch": 13.43, + "learning_rate": 1.7441129631786124e-06, + "loss": 0.2269, + "step": 259300 + }, + { + "epoch": 13.43, + "learning_rate": 1.732803157551195e-06, + "loss": 0.193, + "step": 259400 + }, + { + "epoch": 13.44, + "learning_rate": 1.7215290502549653e-06, + "loss": 0.2059, + "step": 259500 + }, + { + "epoch": 13.44, + "learning_rate": 1.7102906555278608e-06, + "loss": 0.1976, + "step": 259600 + }, + { + "epoch": 13.45, + "learning_rate": 1.6990879875627351e-06, + "loss": 0.1935, + "step": 259700 + }, + { + "epoch": 13.45, + "learning_rate": 1.6879210605073115e-06, + "loss": 0.1569, + "step": 259800 + }, + { + "epoch": 13.46, + "learning_rate": 1.6767898884641852e-06, + "loss": 0.2007, + "step": 259900 + }, + { + "epoch": 13.46, + "learning_rate": 1.6656944854907785e-06, + "loss": 0.1785, + "step": 260000 + }, + { + "epoch": 13.47, + "learning_rate": 1.6546348655993592e-06, + "loss": 0.2157, + "step": 260100 + }, + { + "epoch": 13.47, + "learning_rate": 1.643611042757005e-06, + "loss": 0.1904, + "step": 260200 + }, + { + "epoch": 13.48, + "learning_rate": 1.6326230308855727e-06, + "loss": 0.1947, + "step": 260300 + }, + { + "epoch": 13.48, + "learning_rate": 1.6216708438617024e-06, + "loss": 0.1832, + "step": 260400 + }, + { + "epoch": 13.49, + "learning_rate": 1.610754495516793e-06, + "loss": 0.2235, + "step": 260500 + }, + { + "epoch": 13.49, + "learning_rate": 1.5998739996369804e-06, + "loss": 0.2028, + "step": 260600 + }, + { + "epoch": 13.5, + "learning_rate": 1.5890293699631197e-06, + "loss": 0.1836, + "step": 260700 + }, + { + "epoch": 13.5, + "learning_rate": 1.5782206201907756e-06, + "loss": 0.2324, + "step": 260800 + }, + { + "epoch": 13.51, + "learning_rate": 1.567447763970199e-06, + "loss": 0.2012, + "step": 260900 + }, + { + "epoch": 13.51, + "learning_rate": 1.5567108149063137e-06, + "loss": 0.2082, + "step": 261000 + }, + { + "epoch": 13.52, + "learning_rate": 1.5460097865586898e-06, + "loss": 0.2373, + "step": 261100 + }, + { + "epoch": 13.52, + "learning_rate": 1.5353446924415437e-06, + "loss": 0.198, + "step": 261200 + }, + { + "epoch": 13.53, + "learning_rate": 1.5247155460237017e-06, + "loss": 0.2033, + "step": 261300 + }, + { + "epoch": 13.53, + "learning_rate": 1.514122360728596e-06, + "loss": 0.2054, + "step": 261400 + }, + { + "epoch": 13.54, + "learning_rate": 1.5035651499342352e-06, + "loss": 0.2196, + "step": 261500 + }, + { + "epoch": 13.55, + "learning_rate": 1.4930439269732244e-06, + "loss": 0.2013, + "step": 261600 + }, + { + "epoch": 13.55, + "learning_rate": 1.4825587051326816e-06, + "loss": 0.1868, + "step": 261700 + }, + { + "epoch": 13.56, + "learning_rate": 1.4721094976542816e-06, + "loss": 0.1995, + "step": 261800 + }, + { + "epoch": 13.56, + "learning_rate": 1.4616963177342213e-06, + "loss": 0.1938, + "step": 261900 + }, + { + "epoch": 13.57, + "learning_rate": 1.4513191785231882e-06, + "loss": 0.2416, + "step": 262000 + }, + { + "epoch": 13.57, + "learning_rate": 1.4409780931263495e-06, + "loss": 0.1653, + "step": 262100 + }, + { + "epoch": 13.58, + "learning_rate": 1.430673074603348e-06, + "loss": 0.2609, + "step": 262200 + }, + { + "epoch": 13.58, + "learning_rate": 1.4204041359682906e-06, + "loss": 0.1971, + "step": 262300 + }, + { + "epoch": 13.59, + "learning_rate": 1.4101712901897001e-06, + "loss": 0.2155, + "step": 262400 + }, + { + "epoch": 13.59, + "learning_rate": 1.3999745501905159e-06, + "loss": 0.189, + "step": 262500 + }, + { + "epoch": 13.6, + "learning_rate": 1.3898139288481004e-06, + "loss": 0.1847, + "step": 262600 + }, + { + "epoch": 13.6, + "learning_rate": 1.3796894389941828e-06, + "loss": 0.1737, + "step": 262700 + }, + { + "epoch": 13.61, + "learning_rate": 1.369601093414875e-06, + "loss": 0.2339, + "step": 262800 + }, + { + "epoch": 13.61, + "learning_rate": 1.359548904850636e-06, + "loss": 0.2135, + "step": 262900 + }, + { + "epoch": 13.62, + "learning_rate": 1.3495328859962608e-06, + "loss": 0.1782, + "step": 263000 + }, + { + "epoch": 13.62, + "learning_rate": 1.3395530495008712e-06, + "loss": 0.1911, + "step": 263100 + }, + { + "epoch": 13.63, + "learning_rate": 1.3296094079678955e-06, + "loss": 0.2013, + "step": 263200 + }, + { + "epoch": 13.63, + "learning_rate": 1.3197019739550454e-06, + "loss": 0.183, + "step": 263300 + }, + { + "epoch": 13.64, + "learning_rate": 1.3099292927839835e-06, + "loss": 0.2456, + "step": 263400 + }, + { + "epoch": 13.64, + "learning_rate": 1.3000939489150742e-06, + "loss": 0.2004, + "step": 263500 + }, + { + "epoch": 13.65, + "learning_rate": 1.2902948498410305e-06, + "loss": 0.2296, + "step": 263600 + }, + { + "epoch": 13.65, + "learning_rate": 1.2805320079370397e-06, + "loss": 0.2282, + "step": 263700 + }, + { + "epoch": 13.66, + "learning_rate": 1.2708054355324793e-06, + "loss": 0.1687, + "step": 263800 + }, + { + "epoch": 13.66, + "learning_rate": 1.2611151449109403e-06, + "loss": 0.2553, + "step": 263900 + }, + { + "epoch": 13.67, + "learning_rate": 1.25146114831017e-06, + "loss": 0.2202, + "step": 264000 + }, + { + "epoch": 13.67, + "learning_rate": 1.2418434579221028e-06, + "loss": 0.1805, + "step": 264100 + }, + { + "epoch": 13.68, + "learning_rate": 1.2322620858928158e-06, + "loss": 0.2224, + "step": 264200 + }, + { + "epoch": 13.69, + "learning_rate": 1.2227170443225133e-06, + "loss": 0.208, + "step": 264300 + }, + { + "epoch": 13.69, + "learning_rate": 1.213208345265523e-06, + "loss": 0.2012, + "step": 264400 + }, + { + "epoch": 13.7, + "learning_rate": 1.203736000730279e-06, + "loss": 0.2031, + "step": 264500 + }, + { + "epoch": 13.7, + "learning_rate": 1.1943000226792988e-06, + "loss": 0.199, + "step": 264600 + }, + { + "epoch": 13.71, + "learning_rate": 1.1849004230291771e-06, + "loss": 0.2308, + "step": 264700 + }, + { + "epoch": 13.71, + "learning_rate": 1.1756306655736382e-06, + "loss": 0.1884, + "step": 264800 + }, + { + "epoch": 13.72, + "learning_rate": 1.16630349421188e-06, + "loss": 0.1962, + "step": 264900 + }, + { + "epoch": 13.72, + "learning_rate": 1.1570127366074911e-06, + "loss": 0.2593, + "step": 265000 + }, + { + "epoch": 13.73, + "learning_rate": 1.1477584044936528e-06, + "loss": 0.1999, + "step": 265100 + }, + { + "epoch": 13.73, + "learning_rate": 1.1385405095575729e-06, + "loss": 0.1882, + "step": 265200 + }, + { + "epoch": 13.74, + "learning_rate": 1.129359063440426e-06, + "loss": 0.2056, + "step": 265300 + }, + { + "epoch": 13.74, + "learning_rate": 1.1202140777373536e-06, + "loss": 0.2369, + "step": 265400 + }, + { + "epoch": 13.75, + "learning_rate": 1.1111055639974643e-06, + "loss": 0.2084, + "step": 265500 + }, + { + "epoch": 13.75, + "learning_rate": 1.102033533723793e-06, + "loss": 0.1779, + "step": 265600 + }, + { + "epoch": 13.76, + "learning_rate": 1.0929979983733119e-06, + "loss": 0.212, + "step": 265700 + }, + { + "epoch": 13.76, + "learning_rate": 1.0839989693568998e-06, + "loss": 0.2058, + "step": 265800 + }, + { + "epoch": 13.77, + "learning_rate": 1.0750364580393256e-06, + "loss": 0.2006, + "step": 265900 + }, + { + "epoch": 13.77, + "learning_rate": 1.0661104757392493e-06, + "loss": 0.1696, + "step": 266000 + }, + { + "epoch": 13.78, + "learning_rate": 1.0572210337291965e-06, + "loss": 0.206, + "step": 266100 + }, + { + "epoch": 13.78, + "learning_rate": 1.0483681432355407e-06, + "loss": 0.2058, + "step": 266200 + }, + { + "epoch": 13.79, + "learning_rate": 1.0395518154385087e-06, + "loss": 0.1829, + "step": 266300 + }, + { + "epoch": 13.79, + "learning_rate": 1.030772061472134e-06, + "loss": 0.1756, + "step": 266400 + }, + { + "epoch": 13.8, + "learning_rate": 1.022028892424277e-06, + "loss": 0.202, + "step": 266500 + }, + { + "epoch": 13.8, + "learning_rate": 1.0133223193365826e-06, + "loss": 0.2341, + "step": 266600 + }, + { + "epoch": 13.81, + "learning_rate": 1.0046523532044983e-06, + "loss": 0.1396, + "step": 266700 + }, + { + "epoch": 13.81, + "learning_rate": 9.96019004977219e-07, + "loss": 0.2712, + "step": 266800 + }, + { + "epoch": 13.82, + "learning_rate": 9.874222855577097e-07, + "loss": 0.2108, + "step": 266900 + }, + { + "epoch": 13.82, + "learning_rate": 9.788622058026631e-07, + "loss": 0.1792, + "step": 267000 + }, + { + "epoch": 13.83, + "learning_rate": 9.703387765225248e-07, + "loss": 0.1709, + "step": 267100 + }, + { + "epoch": 13.84, + "learning_rate": 9.618520084814275e-07, + "loss": 0.1931, + "step": 267200 + }, + { + "epoch": 13.84, + "learning_rate": 9.534019123972182e-07, + "loss": 0.2147, + "step": 267300 + }, + { + "epoch": 13.85, + "learning_rate": 9.44988498941437e-07, + "loss": 0.2211, + "step": 267400 + }, + { + "epoch": 13.85, + "learning_rate": 9.36611778739288e-07, + "loss": 0.1945, + "step": 267500 + }, + { + "epoch": 13.86, + "learning_rate": 9.282717623696391e-07, + "loss": 0.215, + "step": 267600 + }, + { + "epoch": 13.86, + "learning_rate": 9.199684603649983e-07, + "loss": 0.2223, + "step": 267700 + }, + { + "epoch": 13.87, + "learning_rate": 9.117843671607285e-07, + "loss": 0.2026, + "step": 267800 + }, + { + "epoch": 13.87, + "learning_rate": 9.035541578937468e-07, + "loss": 0.1997, + "step": 267900 + }, + { + "epoch": 13.88, + "learning_rate": 8.953606942073733e-07, + "loss": 0.2075, + "step": 268000 + }, + { + "epoch": 13.88, + "learning_rate": 8.872039864490311e-07, + "loss": 0.2017, + "step": 268100 + }, + { + "epoch": 13.89, + "learning_rate": 8.790840449197535e-07, + "loss": 0.1734, + "step": 268200 + }, + { + "epoch": 13.89, + "learning_rate": 8.710008798741076e-07, + "loss": 0.2188, + "step": 268300 + }, + { + "epoch": 13.9, + "learning_rate": 8.629545015202445e-07, + "loss": 0.2032, + "step": 268400 + }, + { + "epoch": 13.9, + "learning_rate": 8.54944920019839e-07, + "loss": 0.1782, + "step": 268500 + }, + { + "epoch": 13.91, + "learning_rate": 8.46972145488113e-07, + "loss": 0.1845, + "step": 268600 + }, + { + "epoch": 13.91, + "learning_rate": 8.390361879937891e-07, + "loss": 0.2174, + "step": 268700 + }, + { + "epoch": 13.92, + "learning_rate": 8.31137057559097e-07, + "loss": 0.1775, + "step": 268800 + }, + { + "epoch": 13.92, + "learning_rate": 8.232747641597704e-07, + "loss": 0.24, + "step": 268900 + }, + { + "epoch": 13.93, + "learning_rate": 8.154493177250067e-07, + "loss": 0.1645, + "step": 269000 + }, + { + "epoch": 13.93, + "learning_rate": 8.076607281374837e-07, + "loss": 0.1661, + "step": 269100 + }, + { + "epoch": 13.94, + "learning_rate": 7.999090052333103e-07, + "loss": 0.2008, + "step": 269200 + }, + { + "epoch": 13.94, + "learning_rate": 7.921941588020621e-07, + "loss": 0.2065, + "step": 269300 + }, + { + "epoch": 13.95, + "learning_rate": 7.845161985867356e-07, + "loss": 0.2162, + "step": 269400 + }, + { + "epoch": 13.95, + "learning_rate": 7.768751342837377e-07, + "loss": 0.1849, + "step": 269500 + }, + { + "epoch": 13.96, + "learning_rate": 7.692709755428861e-07, + "loss": 0.243, + "step": 269600 + }, + { + "epoch": 13.96, + "learning_rate": 7.617037319673859e-07, + "loss": 0.1959, + "step": 269700 + }, + { + "epoch": 13.97, + "learning_rate": 7.54173413113829e-07, + "loss": 0.2472, + "step": 269800 + }, + { + "epoch": 13.98, + "learning_rate": 7.466800284921715e-07, + "loss": 0.1853, + "step": 269900 + }, + { + "epoch": 13.98, + "learning_rate": 7.392235875657271e-07, + "loss": 0.1843, + "step": 270000 + }, + { + "epoch": 13.99, + "learning_rate": 7.3180409975115e-07, + "loss": 0.2055, + "step": 270100 + }, + { + "epoch": 13.99, + "learning_rate": 7.244215744184312e-07, + "loss": 0.2196, + "step": 270200 + }, + { + "epoch": 14.0, + "learning_rate": 7.1707602089088e-07, + "loss": 0.2078, + "step": 270300 + }, + { + "epoch": 14.0, + "eval_accuracy": 0.6238605253960857, + "eval_cer": 0.09958260984137292, + "eval_loss": 0.5843430161476135, + "eval_runtime": 3896.094, + "eval_samples_per_second": 4.406, + "eval_steps_per_second": 0.275, + "eval_wer": 0.2318393035703782, + "step": 270382 + }, + { + "epoch": 14.0, + "learning_rate": 7.097674484451155e-07, + "loss": 0.1998, + "step": 270400 + }, + { + "epoch": 14.01, + "learning_rate": 7.024958663110514e-07, + "loss": 0.1953, + "step": 270500 + }, + { + "epoch": 14.01, + "learning_rate": 6.952612836718919e-07, + "loss": 0.2291, + "step": 270600 + }, + { + "epoch": 14.02, + "learning_rate": 6.880637096641052e-07, + "loss": 0.2005, + "step": 270700 + }, + { + "epoch": 14.02, + "learning_rate": 6.809031533774401e-07, + "loss": 0.194, + "step": 270800 + }, + { + "epoch": 14.03, + "learning_rate": 6.737796238548732e-07, + "loss": 0.1717, + "step": 270900 + }, + { + "epoch": 14.03, + "learning_rate": 6.666931300926316e-07, + "loss": 0.2115, + "step": 271000 + }, + { + "epoch": 14.04, + "learning_rate": 6.596436810401796e-07, + "loss": 0.2235, + "step": 271100 + }, + { + "epoch": 14.04, + "learning_rate": 6.526312856001825e-07, + "loss": 0.2813, + "step": 271200 + }, + { + "epoch": 14.05, + "learning_rate": 6.456559526285133e-07, + "loss": 0.1728, + "step": 271300 + }, + { + "epoch": 14.05, + "learning_rate": 6.387176909342485e-07, + "loss": 0.1821, + "step": 271400 + }, + { + "epoch": 14.06, + "learning_rate": 6.318165092796424e-07, + "loss": 0.1847, + "step": 271500 + }, + { + "epoch": 14.06, + "learning_rate": 6.249524163801234e-07, + "loss": 0.1752, + "step": 271600 + }, + { + "epoch": 14.07, + "learning_rate": 6.181254209042674e-07, + "loss": 0.1396, + "step": 271700 + }, + { + "epoch": 14.07, + "learning_rate": 6.113355314738245e-07, + "loss": 0.1949, + "step": 271800 + }, + { + "epoch": 14.08, + "learning_rate": 6.045827566636619e-07, + "loss": 0.1896, + "step": 271900 + }, + { + "epoch": 14.08, + "learning_rate": 5.978671050017914e-07, + "loss": 0.1931, + "step": 272000 + }, + { + "epoch": 14.09, + "learning_rate": 5.911885849693322e-07, + "loss": 0.1753, + "step": 272100 + }, + { + "epoch": 14.09, + "learning_rate": 5.845472050005174e-07, + "loss": 0.1683, + "step": 272200 + }, + { + "epoch": 14.1, + "learning_rate": 5.779429734826647e-07, + "loss": 0.22, + "step": 272300 + }, + { + "epoch": 14.1, + "learning_rate": 5.713758987561923e-07, + "loss": 0.2127, + "step": 272400 + }, + { + "epoch": 14.11, + "learning_rate": 5.649111042167099e-07, + "loss": 0.2293, + "step": 272500 + }, + { + "epoch": 14.11, + "learning_rate": 5.584179961325353e-07, + "loss": 0.1585, + "step": 272600 + }, + { + "epoch": 14.12, + "learning_rate": 5.519620694976202e-07, + "loss": 0.1669, + "step": 272700 + }, + { + "epoch": 14.13, + "learning_rate": 5.455433324650727e-07, + "loss": 0.1638, + "step": 272800 + }, + { + "epoch": 14.13, + "learning_rate": 5.391617931410553e-07, + "loss": 0.2319, + "step": 272900 + }, + { + "epoch": 14.14, + "learning_rate": 5.328174595847413e-07, + "loss": 0.1694, + "step": 273000 + }, + { + "epoch": 14.14, + "learning_rate": 5.265103398083215e-07, + "loss": 0.2226, + "step": 273100 + }, + { + "epoch": 14.15, + "learning_rate": 5.202404417769813e-07, + "loss": 0.1842, + "step": 273200 + }, + { + "epoch": 14.15, + "learning_rate": 5.140077734089099e-07, + "loss": 0.1718, + "step": 273300 + }, + { + "epoch": 14.16, + "learning_rate": 5.078741125320907e-07, + "loss": 0.1985, + "step": 273400 + }, + { + "epoch": 14.16, + "learning_rate": 5.017155545648755e-07, + "loss": 0.2015, + "step": 273500 + }, + { + "epoch": 14.17, + "learning_rate": 4.955942496558019e-07, + "loss": 0.2013, + "step": 273600 + }, + { + "epoch": 14.17, + "learning_rate": 4.895102055354029e-07, + "loss": 0.1712, + "step": 273700 + }, + { + "epoch": 14.18, + "learning_rate": 4.83463429887152e-07, + "loss": 0.1952, + "step": 273800 + }, + { + "epoch": 14.18, + "learning_rate": 4.774539303474513e-07, + "loss": 0.2058, + "step": 273900 + }, + { + "epoch": 14.19, + "learning_rate": 4.714817145056294e-07, + "loss": 0.2194, + "step": 274000 + }, + { + "epoch": 14.19, + "learning_rate": 4.6554678990394004e-07, + "loss": 0.2556, + "step": 274100 + }, + { + "epoch": 14.2, + "learning_rate": 4.5964916403752774e-07, + "loss": 0.1886, + "step": 274200 + }, + { + "epoch": 14.2, + "learning_rate": 4.53788844354438e-07, + "loss": 0.2216, + "step": 274300 + }, + { + "epoch": 14.21, + "learning_rate": 4.4796583825561067e-07, + "loss": 0.1937, + "step": 274400 + }, + { + "epoch": 14.21, + "learning_rate": 4.4218015309484993e-07, + "loss": 0.2076, + "step": 274500 + }, + { + "epoch": 14.22, + "learning_rate": 4.3643179617883777e-07, + "loss": 0.1722, + "step": 274600 + }, + { + "epoch": 14.22, + "learning_rate": 4.3072077476710383e-07, + "loss": 0.21, + "step": 274700 + }, + { + "epoch": 14.23, + "learning_rate": 4.2504709607204207e-07, + "loss": 0.2138, + "step": 274800 + }, + { + "epoch": 14.23, + "learning_rate": 4.194107672588743e-07, + "loss": 0.2108, + "step": 274900 + }, + { + "epoch": 14.24, + "learning_rate": 4.138117954456633e-07, + "loss": 0.228, + "step": 275000 + }, + { + "epoch": 14.24, + "learning_rate": 4.082501877032796e-07, + "loss": 0.2217, + "step": 275100 + }, + { + "epoch": 14.25, + "learning_rate": 4.0272595105542484e-07, + "loss": 0.2087, + "step": 275200 + }, + { + "epoch": 14.25, + "learning_rate": 3.972390924785918e-07, + "loss": 0.2112, + "step": 275300 + }, + { + "epoch": 14.26, + "learning_rate": 3.917896189020775e-07, + "loss": 0.2122, + "step": 275400 + }, + { + "epoch": 14.27, + "learning_rate": 3.8637753720795697e-07, + "loss": 0.1684, + "step": 275500 + }, + { + "epoch": 14.27, + "learning_rate": 3.8100285423109284e-07, + "loss": 0.1985, + "step": 275600 + }, + { + "epoch": 14.28, + "learning_rate": 3.7566557675911217e-07, + "loss": 0.2142, + "step": 275700 + }, + { + "epoch": 14.28, + "learning_rate": 3.7036571153239997e-07, + "loss": 0.176, + "step": 275800 + }, + { + "epoch": 14.29, + "learning_rate": 3.651032652441022e-07, + "loss": 0.1658, + "step": 275900 + }, + { + "epoch": 14.29, + "learning_rate": 3.598782445401061e-07, + "loss": 0.2165, + "step": 276000 + }, + { + "epoch": 14.3, + "learning_rate": 3.546906560190233e-07, + "loss": 0.1821, + "step": 276100 + }, + { + "epoch": 14.3, + "learning_rate": 3.495405062322099e-07, + "loss": 0.2044, + "step": 276200 + }, + { + "epoch": 14.31, + "learning_rate": 3.444278016837366e-07, + "loss": 0.1928, + "step": 276300 + }, + { + "epoch": 14.31, + "learning_rate": 3.393525488303717e-07, + "loss": 0.1964, + "step": 276400 + }, + { + "epoch": 14.32, + "learning_rate": 3.343147540815983e-07, + "loss": 0.2014, + "step": 276500 + }, + { + "epoch": 14.32, + "learning_rate": 3.293144237996004e-07, + "loss": 0.1695, + "step": 276600 + }, + { + "epoch": 14.33, + "learning_rate": 3.243515642992334e-07, + "loss": 0.1918, + "step": 276700 + }, + { + "epoch": 14.33, + "learning_rate": 3.1942618184803373e-07, + "loss": 0.1939, + "step": 276800 + }, + { + "epoch": 14.34, + "learning_rate": 3.1453828266621907e-07, + "loss": 0.2032, + "step": 276900 + }, + { + "epoch": 14.34, + "learning_rate": 3.096878729266617e-07, + "loss": 0.1947, + "step": 277000 + }, + { + "epoch": 14.35, + "learning_rate": 3.048749587548949e-07, + "loss": 0.1716, + "step": 277100 + }, + { + "epoch": 14.35, + "learning_rate": 3.0009954622908344e-07, + "loss": 0.2202, + "step": 277200 + }, + { + "epoch": 14.36, + "learning_rate": 2.9536164138005637e-07, + "loss": 0.2217, + "step": 277300 + }, + { + "epoch": 14.36, + "learning_rate": 2.907080683909913e-07, + "loss": 0.1725, + "step": 277400 + }, + { + "epoch": 14.37, + "learning_rate": 2.8609126830038577e-07, + "loss": 0.2308, + "step": 277500 + }, + { + "epoch": 14.37, + "learning_rate": 2.8146517162576433e-07, + "loss": 0.2133, + "step": 277600 + }, + { + "epoch": 14.38, + "learning_rate": 2.7687660616106945e-07, + "loss": 0.2203, + "step": 277700 + }, + { + "epoch": 14.38, + "learning_rate": 2.7232557770114576e-07, + "loss": 0.2402, + "step": 277800 + }, + { + "epoch": 14.39, + "learning_rate": 2.67812091993439e-07, + "loss": 0.2206, + "step": 277900 + }, + { + "epoch": 14.39, + "learning_rate": 2.633361547379798e-07, + "loss": 0.2143, + "step": 278000 + }, + { + "epoch": 14.4, + "learning_rate": 2.5889777158738303e-07, + "loss": 0.2061, + "step": 278100 + }, + { + "epoch": 14.4, + "learning_rate": 2.545407704423808e-07, + "loss": 0.1924, + "step": 278200 + }, + { + "epoch": 14.41, + "learning_rate": 2.501771365895922e-07, + "loss": 0.1929, + "step": 278300 + }, + { + "epoch": 14.42, + "learning_rate": 2.458510734600428e-07, + "loss": 0.1861, + "step": 278400 + }, + { + "epoch": 14.42, + "learning_rate": 2.4156258651706566e-07, + "loss": 0.1819, + "step": 278500 + }, + { + "epoch": 14.43, + "learning_rate": 2.3731168117655188e-07, + "loss": 0.1687, + "step": 278600 + }, + { + "epoch": 14.43, + "learning_rate": 2.3309836280691387e-07, + "loss": 0.1915, + "step": 278700 + }, + { + "epoch": 14.44, + "learning_rate": 2.289226367291153e-07, + "loss": 0.1725, + "step": 278800 + }, + { + "epoch": 14.44, + "learning_rate": 2.2478450821662444e-07, + "loss": 0.2405, + "step": 278900 + }, + { + "epoch": 14.45, + "learning_rate": 2.2068398249544763e-07, + "loss": 0.2308, + "step": 279000 + }, + { + "epoch": 14.45, + "learning_rate": 2.1662106474408582e-07, + "loss": 0.1945, + "step": 279100 + }, + { + "epoch": 14.46, + "learning_rate": 2.1259576009355464e-07, + "loss": 0.2328, + "step": 279200 + }, + { + "epoch": 14.46, + "learning_rate": 2.08608073627371e-07, + "loss": 0.198, + "step": 279300 + }, + { + "epoch": 14.47, + "learning_rate": 2.0465801038153653e-07, + "loss": 0.1651, + "step": 279400 + }, + { + "epoch": 14.47, + "learning_rate": 2.0074557534454085e-07, + "loss": 0.2009, + "step": 279500 + }, + { + "epoch": 14.48, + "learning_rate": 1.968707734573616e-07, + "loss": 0.1968, + "step": 279600 + }, + { + "epoch": 14.48, + "learning_rate": 1.9303360961343774e-07, + "loss": 0.1836, + "step": 279700 + }, + { + "epoch": 14.49, + "learning_rate": 1.8923408865868296e-07, + "loss": 0.2042, + "step": 279800 + }, + { + "epoch": 14.49, + "learning_rate": 1.8547221539146898e-07, + "loss": 0.1982, + "step": 279900 + }, + { + "epoch": 14.5, + "learning_rate": 1.817479945626288e-07, + "loss": 0.2118, + "step": 280000 + }, + { + "epoch": 14.5, + "learning_rate": 1.7806143087543358e-07, + "loss": 0.2169, + "step": 280100 + }, + { + "epoch": 14.51, + "learning_rate": 1.744125289856058e-07, + "loss": 0.1846, + "step": 280200 + }, + { + "epoch": 14.51, + "learning_rate": 1.7080129350130591e-07, + "loss": 0.1802, + "step": 280300 + }, + { + "epoch": 14.52, + "learning_rate": 1.6722772898312254e-07, + "loss": 0.2135, + "step": 280400 + }, + { + "epoch": 14.52, + "learning_rate": 1.63691839944069e-07, + "loss": 0.1818, + "step": 280500 + }, + { + "epoch": 14.53, + "learning_rate": 1.6019363084957994e-07, + "loss": 0.255, + "step": 280600 + }, + { + "epoch": 14.53, + "learning_rate": 1.5673310611750813e-07, + "loss": 0.1475, + "step": 280700 + }, + { + "epoch": 14.54, + "learning_rate": 1.5331027011811106e-07, + "loss": 0.2059, + "step": 280800 + }, + { + "epoch": 14.54, + "learning_rate": 1.4992512717405426e-07, + "loss": 0.2332, + "step": 280900 + }, + { + "epoch": 14.55, + "learning_rate": 1.465776815603881e-07, + "loss": 0.1957, + "step": 281000 + }, + { + "epoch": 14.55, + "learning_rate": 1.432679375045709e-07, + "loss": 0.2232, + "step": 281100 + }, + { + "epoch": 14.56, + "learning_rate": 1.3999589918644252e-07, + "loss": 0.1849, + "step": 281200 + }, + { + "epoch": 14.57, + "learning_rate": 1.3676157073822415e-07, + "loss": 0.2131, + "step": 281300 + }, + { + "epoch": 14.57, + "learning_rate": 1.335649562445085e-07, + "loss": 0.2122, + "step": 281400 + }, + { + "epoch": 14.58, + "learning_rate": 1.304060597422696e-07, + "loss": 0.1763, + "step": 281500 + }, + { + "epoch": 14.58, + "learning_rate": 1.2728488522084303e-07, + "loss": 0.2014, + "step": 281600 + }, + { + "epoch": 14.59, + "learning_rate": 1.2420143662192574e-07, + "loss": 0.1878, + "step": 281700 + }, + { + "epoch": 14.59, + "learning_rate": 1.2115571783956615e-07, + "loss": 0.2029, + "step": 281800 + }, + { + "epoch": 14.6, + "learning_rate": 1.181477327201741e-07, + "loss": 0.1873, + "step": 281900 + }, + { + "epoch": 14.6, + "learning_rate": 1.1517748506250092e-07, + "loss": 0.1952, + "step": 282000 + }, + { + "epoch": 14.61, + "learning_rate": 1.1224497861763605e-07, + "loss": 0.2329, + "step": 282100 + }, + { + "epoch": 14.61, + "learning_rate": 1.0935021708901038e-07, + "loss": 0.1942, + "step": 282200 + }, + { + "epoch": 14.62, + "learning_rate": 1.0649320413238628e-07, + "loss": 0.2553, + "step": 282300 + }, + { + "epoch": 14.62, + "learning_rate": 1.0367394335585756e-07, + "loss": 0.1781, + "step": 282400 + }, + { + "epoch": 14.63, + "learning_rate": 1.0089243831983619e-07, + "loss": 0.2335, + "step": 282500 + }, + { + "epoch": 14.63, + "learning_rate": 9.814869253704894e-08, + "loss": 0.2154, + "step": 282600 + }, + { + "epoch": 14.64, + "learning_rate": 9.54427094725474e-08, + "loss": 0.2059, + "step": 282700 + }, + { + "epoch": 14.64, + "learning_rate": 9.277449254368797e-08, + "loss": 0.2259, + "step": 282800 + }, + { + "epoch": 14.65, + "learning_rate": 9.014404512012852e-08, + "loss": 0.1848, + "step": 282900 + }, + { + "epoch": 14.65, + "learning_rate": 8.755137052383844e-08, + "loss": 0.1772, + "step": 283000 + }, + { + "epoch": 14.66, + "learning_rate": 8.499647202906858e-08, + "loss": 0.1926, + "step": 283100 + }, + { + "epoch": 14.66, + "learning_rate": 8.247935286238129e-08, + "loss": 0.1812, + "step": 283200 + }, + { + "epoch": 14.67, + "learning_rate": 8.000001620261377e-08, + "loss": 0.2053, + "step": 283300 + }, + { + "epoch": 14.67, + "learning_rate": 7.755846518089472e-08, + "loss": 0.203, + "step": 283400 + }, + { + "epoch": 14.68, + "learning_rate": 7.515470288062764e-08, + "loss": 0.2046, + "step": 283500 + }, + { + "epoch": 14.68, + "learning_rate": 7.278873233750427e-08, + "loss": 0.196, + "step": 283600 + }, + { + "epoch": 14.69, + "learning_rate": 7.048365120377542e-08, + "loss": 0.1941, + "step": 283700 + }, + { + "epoch": 14.69, + "learning_rate": 6.819289509982562e-08, + "loss": 0.1811, + "step": 283800 + }, + { + "epoch": 14.7, + "learning_rate": 6.593993954500666e-08, + "loss": 0.2013, + "step": 283900 + }, + { + "epoch": 14.71, + "learning_rate": 6.372478738454923e-08, + "loss": 0.2085, + "step": 284000 + }, + { + "epoch": 14.71, + "learning_rate": 6.154744141594559e-08, + "loss": 0.2065, + "step": 284100 + }, + { + "epoch": 14.72, + "learning_rate": 5.940790438894617e-08, + "loss": 0.1885, + "step": 284200 + }, + { + "epoch": 14.72, + "learning_rate": 5.7306179005542915e-08, + "loss": 0.217, + "step": 284300 + }, + { + "epoch": 14.73, + "learning_rate": 5.5242267919982656e-08, + "loss": 0.1885, + "step": 284400 + }, + { + "epoch": 14.73, + "learning_rate": 5.321617373876042e-08, + "loss": 0.1921, + "step": 284500 + }, + { + "epoch": 14.74, + "learning_rate": 5.122789902060609e-08, + "loss": 0.1889, + "step": 284600 + }, + { + "epoch": 14.74, + "learning_rate": 4.927744627648445e-08, + "loss": 0.2025, + "step": 284700 + }, + { + "epoch": 14.75, + "learning_rate": 4.7364817969608454e-08, + "loss": 0.2209, + "step": 284800 + }, + { + "epoch": 14.75, + "learning_rate": 4.5490016515412624e-08, + "loss": 0.202, + "step": 284900 + }, + { + "epoch": 14.76, + "learning_rate": 4.3653044281559695e-08, + "loss": 0.1713, + "step": 285000 + }, + { + "epoch": 14.76, + "learning_rate": 4.185390358794727e-08, + "loss": 0.2358, + "step": 285100 + }, + { + "epoch": 14.77, + "learning_rate": 4.009259670668453e-08, + "loss": 0.2237, + "step": 285200 + }, + { + "epoch": 14.77, + "learning_rate": 3.8369125862112166e-08, + "loss": 0.1778, + "step": 285300 + }, + { + "epoch": 14.78, + "learning_rate": 3.66834932307758e-08, + "loss": 0.1806, + "step": 285400 + }, + { + "epoch": 14.78, + "learning_rate": 3.5035700941449255e-08, + "loss": 0.184, + "step": 285500 + }, + { + "epoch": 14.79, + "learning_rate": 3.342575107510792e-08, + "loss": 0.2171, + "step": 285600 + }, + { + "epoch": 14.79, + "learning_rate": 3.185364566494209e-08, + "loss": 0.2058, + "step": 285700 + }, + { + "epoch": 14.8, + "learning_rate": 3.0319386696340266e-08, + "loss": 0.1896, + "step": 285800 + }, + { + "epoch": 14.8, + "learning_rate": 2.8822976106909205e-08, + "loss": 0.2239, + "step": 285900 + }, + { + "epoch": 14.81, + "learning_rate": 2.7364415786440554e-08, + "loss": 0.2104, + "step": 286000 + }, + { + "epoch": 14.81, + "learning_rate": 2.5943707576944197e-08, + "loss": 0.161, + "step": 286100 + }, + { + "epoch": 14.82, + "learning_rate": 2.4560853272608263e-08, + "loss": 0.1693, + "step": 286200 + }, + { + "epoch": 14.82, + "learning_rate": 2.321585461982911e-08, + "loss": 0.2261, + "step": 286300 + }, + { + "epoch": 14.83, + "learning_rate": 2.1908713317188023e-08, + "loss": 0.1788, + "step": 286400 + }, + { + "epoch": 14.83, + "learning_rate": 2.0639431015457844e-08, + "loss": 0.1851, + "step": 286500 + }, + { + "epoch": 14.84, + "learning_rate": 1.9408009317606333e-08, + "loss": 0.2152, + "step": 286600 + }, + { + "epoch": 14.84, + "learning_rate": 1.821444977878284e-08, + "loss": 0.2341, + "step": 286700 + }, + { + "epoch": 14.85, + "learning_rate": 1.705875390631162e-08, + "loss": 0.2293, + "step": 286800 + }, + { + "epoch": 14.86, + "learning_rate": 1.5940923159718513e-08, + "loss": 0.249, + "step": 286900 + }, + { + "epoch": 14.86, + "learning_rate": 1.4860958950694282e-08, + "loss": 0.2155, + "step": 287000 + }, + { + "epoch": 14.87, + "learning_rate": 1.3818862643114604e-08, + "loss": 0.1737, + "step": 287100 + }, + { + "epoch": 14.87, + "learning_rate": 1.2814635553030085e-08, + "loss": 0.1897, + "step": 287200 + }, + { + "epoch": 14.88, + "learning_rate": 1.1848278948669578e-08, + "loss": 0.181, + "step": 287300 + }, + { + "epoch": 14.88, + "learning_rate": 1.091979405043686e-08, + "loss": 0.2013, + "step": 287400 + }, + { + "epoch": 14.89, + "learning_rate": 1.002918203090064e-08, + "loss": 0.1797, + "step": 287500 + }, + { + "epoch": 14.89, + "learning_rate": 9.176444014804553e-09, + "loss": 0.1855, + "step": 287600 + }, + { + "epoch": 14.9, + "learning_rate": 8.361581079067149e-09, + "loss": 0.2017, + "step": 287700 + }, + { + "epoch": 14.9, + "learning_rate": 7.584594252768584e-09, + "loss": 0.1972, + "step": 287800 + }, + { + "epoch": 14.91, + "learning_rate": 6.845484517153943e-09, + "loss": 0.2001, + "step": 287900 + }, + { + "epoch": 14.91, + "learning_rate": 6.144252805636574e-09, + "loss": 0.1866, + "step": 288000 + }, + { + "epoch": 14.92, + "learning_rate": 5.480900003798084e-09, + "loss": 0.1659, + "step": 288100 + }, + { + "epoch": 14.92, + "learning_rate": 4.85542694937835e-09, + "loss": 0.1714, + "step": 288200 + }, + { + "epoch": 14.93, + "learning_rate": 4.2678344322755195e-09, + "loss": 0.1893, + "step": 288300 + }, + { + "epoch": 14.93, + "learning_rate": 3.718123194559331e-09, + "loss": 0.2, + "step": 288400 + }, + { + "epoch": 14.94, + "learning_rate": 3.2062939304544626e-09, + "loss": 0.1652, + "step": 288500 + }, + { + "epoch": 14.94, + "learning_rate": 2.7323472863405307e-09, + "loss": 0.189, + "step": 288600 + }, + { + "epoch": 14.95, + "learning_rate": 2.296283860762083e-09, + "loss": 0.1614, + "step": 288700 + }, + { + "epoch": 14.95, + "learning_rate": 1.898104204415274e-09, + "loss": 0.1776, + "step": 288800 + }, + { + "epoch": 14.96, + "learning_rate": 1.5378088201611906e-09, + "loss": 0.1713, + "step": 288900 + }, + { + "epoch": 14.96, + "learning_rate": 1.2153981630125267e-09, + "loss": 0.1751, + "step": 289000 + }, + { + "epoch": 14.97, + "learning_rate": 9.30872640136915e-10, + "loss": 0.1546, + "step": 289100 + }, + { + "epoch": 14.97, + "learning_rate": 6.842326108569274e-10, + "loss": 0.2107, + "step": 289200 + }, + { + "epoch": 14.98, + "learning_rate": 4.754783866534051e-10, + "loss": 0.1943, + "step": 289300 + }, + { + "epoch": 14.98, + "learning_rate": 3.0461023115879725e-10, + "loss": 0.2321, + "step": 289400 + }, + { + "epoch": 14.99, + "learning_rate": 1.7162836016049177e-10, + "loss": 0.1605, + "step": 289500 + }, + { + "epoch": 15.0, + "learning_rate": 7.653294160414603e-11, + "loss": 0.1868, + "step": 289600 + }, + { + "epoch": 15.0, + "eval_accuracy": 0.6237545870223672, + "eval_cer": 0.10093501042298987, + "eval_loss": 0.5886313915252686, + "eval_runtime": 3881.629, + "eval_samples_per_second": 4.423, + "eval_steps_per_second": 0.276, + "eval_wer": 0.23375095582612787, + "step": 289695 + } + ], + "logging_steps": 100, + "max_steps": 289695, + "num_train_epochs": 15, + "save_steps": 500, + "total_flos": 3.113937730070863e+21, + "trial_name": null, + "trial_params": null +}