diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,36043 @@ +{ + "best_metric": 0.12089719269034979, + "best_model_checkpoint": "./wav2vec2-base-german-cv9/checkpoint-177850", + "epoch": 49.999859451862264, + "global_step": 177850, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.01, + "learning_rate": 1.6305875737981447e-07, + "loss": 12.2032, + "step": 30 + }, + { + "epoch": 0.02, + "learning_rate": 3.3174023053134664e-07, + "loss": 12.7588, + "step": 60 + }, + { + "epoch": 0.03, + "learning_rate": 5.004217036828789e-07, + "loss": 11.4436, + "step": 90 + }, + { + "epoch": 0.03, + "learning_rate": 6.691031768344111e-07, + "loss": 12.2914, + "step": 120 + }, + { + "epoch": 0.04, + "learning_rate": 8.377846499859433e-07, + "loss": 11.2155, + "step": 150 + }, + { + "epoch": 0.05, + "learning_rate": 1.0064661231374754e-06, + "loss": 10.696, + "step": 180 + }, + { + "epoch": 0.06, + "learning_rate": 1.1751475962890077e-06, + "loss": 10.2185, + "step": 210 + }, + { + "epoch": 0.07, + "learning_rate": 1.3438290694405398e-06, + "loss": 7.9571, + "step": 240 + }, + { + "epoch": 0.08, + "learning_rate": 1.512510542592072e-06, + "loss": 6.4243, + "step": 270 + }, + { + "epoch": 0.08, + "learning_rate": 1.6811920157436041e-06, + "loss": 4.8724, + "step": 300 + }, + { + "epoch": 0.09, + "learning_rate": 1.8498734888951364e-06, + "loss": 3.9775, + "step": 330 + }, + { + "epoch": 0.1, + "learning_rate": 2.0185549620466685e-06, + "loss": 3.7284, + "step": 360 + }, + { + "epoch": 0.11, + "learning_rate": 2.1872364351982008e-06, + "loss": 3.5572, + "step": 390 + }, + { + "epoch": 0.12, + "learning_rate": 2.355917908349733e-06, + "loss": 3.4845, + "step": 420 + }, + { + "epoch": 0.13, + "learning_rate": 2.5245993815012653e-06, + "loss": 3.5107, + "step": 450 + }, + { + "epoch": 0.13, + "learning_rate": 2.6932808546527976e-06, + "loss": 3.3341, + "step": 480 + }, + { + "epoch": 0.14, + "learning_rate": 2.8619623278043295e-06, + "loss": 3.3489, + "step": 510 + }, + { + "epoch": 0.15, + "learning_rate": 3.0306438009558618e-06, + "loss": 3.2479, + "step": 540 + }, + { + "epoch": 0.16, + "learning_rate": 3.199325274107394e-06, + "loss": 3.2032, + "step": 570 + }, + { + "epoch": 0.17, + "learning_rate": 3.3680067472589263e-06, + "loss": 3.1983, + "step": 600 + }, + { + "epoch": 0.18, + "learning_rate": 3.5366882204104586e-06, + "loss": 3.1298, + "step": 630 + }, + { + "epoch": 0.19, + "learning_rate": 3.7053696935619905e-06, + "loss": 3.1466, + "step": 660 + }, + { + "epoch": 0.19, + "learning_rate": 3.874051166713523e-06, + "loss": 3.1242, + "step": 690 + }, + { + "epoch": 0.2, + "learning_rate": 4.042732639865055e-06, + "loss": 3.11, + "step": 720 + }, + { + "epoch": 0.21, + "learning_rate": 4.211414113016587e-06, + "loss": 3.0988, + "step": 750 + }, + { + "epoch": 0.22, + "learning_rate": 4.38009558616812e-06, + "loss": 3.0706, + "step": 780 + }, + { + "epoch": 0.23, + "learning_rate": 4.548777059319652e-06, + "loss": 3.0548, + "step": 810 + }, + { + "epoch": 0.24, + "learning_rate": 4.717458532471184e-06, + "loss": 3.024, + "step": 840 + }, + { + "epoch": 0.24, + "learning_rate": 4.8861400056227165e-06, + "loss": 3.0499, + "step": 870 + }, + { + "epoch": 0.25, + "learning_rate": 5.054821478774248e-06, + "loss": 3.0314, + "step": 900 + }, + { + "epoch": 0.26, + "learning_rate": 5.22350295192578e-06, + "loss": 3.0053, + "step": 930 + }, + { + "epoch": 0.27, + "learning_rate": 5.3921844250773125e-06, + "loss": 3.0105, + "step": 960 + }, + { + "epoch": 0.28, + "learning_rate": 5.560865898228845e-06, + "loss": 2.9906, + "step": 990 + }, + { + "epoch": 0.29, + "learning_rate": 5.729547371380377e-06, + "loss": 2.9944, + "step": 1020 + }, + { + "epoch": 0.3, + "learning_rate": 5.898228844531909e-06, + "loss": 2.9826, + "step": 1050 + }, + { + "epoch": 0.3, + "learning_rate": 6.066910317683442e-06, + "loss": 2.9734, + "step": 1080 + }, + { + "epoch": 0.31, + "learning_rate": 6.235591790834974e-06, + "loss": 2.9778, + "step": 1110 + }, + { + "epoch": 0.32, + "learning_rate": 6.404273263986506e-06, + "loss": 2.9687, + "step": 1140 + }, + { + "epoch": 0.33, + "learning_rate": 6.572954737138038e-06, + "loss": 2.9713, + "step": 1170 + }, + { + "epoch": 0.34, + "learning_rate": 6.74163621028957e-06, + "loss": 2.974, + "step": 1200 + }, + { + "epoch": 0.35, + "learning_rate": 6.910317683441102e-06, + "loss": 2.9678, + "step": 1230 + }, + { + "epoch": 0.35, + "learning_rate": 7.0789991565926345e-06, + "loss": 2.9642, + "step": 1260 + }, + { + "epoch": 0.36, + "learning_rate": 7.247680629744166e-06, + "loss": 2.9497, + "step": 1290 + }, + { + "epoch": 0.37, + "learning_rate": 7.416362102895699e-06, + "loss": 2.9682, + "step": 1320 + }, + { + "epoch": 0.38, + "learning_rate": 7.5850435760472305e-06, + "loss": 2.9605, + "step": 1350 + }, + { + "epoch": 0.39, + "learning_rate": 7.753725049198764e-06, + "loss": 2.9447, + "step": 1380 + }, + { + "epoch": 0.4, + "learning_rate": 7.922406522350296e-06, + "loss": 2.9573, + "step": 1410 + }, + { + "epoch": 0.4, + "learning_rate": 8.091087995501828e-06, + "loss": 2.9415, + "step": 1440 + }, + { + "epoch": 0.41, + "learning_rate": 8.25976946865336e-06, + "loss": 2.9516, + "step": 1470 + }, + { + "epoch": 0.42, + "learning_rate": 8.428450941804893e-06, + "loss": 2.95, + "step": 1500 + }, + { + "epoch": 0.43, + "learning_rate": 8.597132414956425e-06, + "loss": 2.9408, + "step": 1530 + }, + { + "epoch": 0.44, + "learning_rate": 8.765813888107957e-06, + "loss": 2.9465, + "step": 1560 + }, + { + "epoch": 0.45, + "learning_rate": 8.934495361259488e-06, + "loss": 2.9343, + "step": 1590 + }, + { + "epoch": 0.46, + "learning_rate": 9.103176834411022e-06, + "loss": 2.9493, + "step": 1620 + }, + { + "epoch": 0.46, + "learning_rate": 9.271858307562552e-06, + "loss": 2.9469, + "step": 1650 + }, + { + "epoch": 0.47, + "learning_rate": 9.440539780714085e-06, + "loss": 2.9335, + "step": 1680 + }, + { + "epoch": 0.48, + "learning_rate": 9.609221253865617e-06, + "loss": 2.9465, + "step": 1710 + }, + { + "epoch": 0.49, + "learning_rate": 9.77790272701715e-06, + "loss": 2.9322, + "step": 1740 + }, + { + "epoch": 0.5, + "learning_rate": 9.946584200168682e-06, + "loss": 2.9458, + "step": 1770 + }, + { + "epoch": 0.51, + "learning_rate": 1.0115265673320214e-05, + "loss": 2.9356, + "step": 1800 + }, + { + "epoch": 0.51, + "learning_rate": 1.0283947146471746e-05, + "loss": 2.9323, + "step": 1830 + }, + { + "epoch": 0.52, + "learning_rate": 1.0452628619623278e-05, + "loss": 2.9469, + "step": 1860 + }, + { + "epoch": 0.53, + "learning_rate": 1.062131009277481e-05, + "loss": 2.9314, + "step": 1890 + }, + { + "epoch": 0.54, + "learning_rate": 1.0789991565926343e-05, + "loss": 2.938, + "step": 1920 + }, + { + "epoch": 0.55, + "learning_rate": 1.0958673039077875e-05, + "loss": 2.9337, + "step": 1950 + }, + { + "epoch": 0.56, + "learning_rate": 1.1127354512229408e-05, + "loss": 2.9256, + "step": 1980 + }, + { + "epoch": 0.57, + "learning_rate": 1.129603598538094e-05, + "loss": 2.932, + "step": 2010 + }, + { + "epoch": 0.57, + "learning_rate": 1.1464717458532472e-05, + "loss": 2.9211, + "step": 2040 + }, + { + "epoch": 0.58, + "learning_rate": 1.1633398931684004e-05, + "loss": 2.9309, + "step": 2070 + }, + { + "epoch": 0.59, + "learning_rate": 1.1802080404835537e-05, + "loss": 2.9275, + "step": 2100 + }, + { + "epoch": 0.6, + "learning_rate": 1.1970761877987069e-05, + "loss": 2.9213, + "step": 2130 + }, + { + "epoch": 0.61, + "learning_rate": 1.2139443351138601e-05, + "loss": 2.9525, + "step": 2160 + }, + { + "epoch": 0.62, + "learning_rate": 1.2308124824290134e-05, + "loss": 2.9197, + "step": 2190 + }, + { + "epoch": 0.62, + "learning_rate": 1.2476806297441664e-05, + "loss": 2.9257, + "step": 2220 + }, + { + "epoch": 0.63, + "learning_rate": 1.2645487770593198e-05, + "loss": 2.9156, + "step": 2250 + }, + { + "epoch": 0.64, + "learning_rate": 1.2814169243744729e-05, + "loss": 2.9045, + "step": 2280 + }, + { + "epoch": 0.65, + "learning_rate": 1.2982850716896261e-05, + "loss": 2.858, + "step": 2310 + }, + { + "epoch": 0.66, + "learning_rate": 1.3151532190047793e-05, + "loss": 2.7263, + "step": 2340 + }, + { + "epoch": 0.67, + "learning_rate": 1.3320213663199327e-05, + "loss": 2.6023, + "step": 2370 + }, + { + "epoch": 0.67, + "learning_rate": 1.3488895136350856e-05, + "loss": 2.412, + "step": 2400 + }, + { + "epoch": 0.68, + "learning_rate": 1.365757660950239e-05, + "loss": 2.2819, + "step": 2430 + }, + { + "epoch": 0.69, + "learning_rate": 1.3826258082653922e-05, + "loss": 2.1276, + "step": 2460 + }, + { + "epoch": 0.7, + "learning_rate": 1.3994939555805456e-05, + "loss": 1.9495, + "step": 2490 + }, + { + "epoch": 0.71, + "learning_rate": 1.4163621028956985e-05, + "loss": 1.7862, + "step": 2520 + }, + { + "epoch": 0.72, + "learning_rate": 1.433230250210852e-05, + "loss": 1.6618, + "step": 2550 + }, + { + "epoch": 0.73, + "learning_rate": 1.4500983975260052e-05, + "loss": 1.5095, + "step": 2580 + }, + { + "epoch": 0.73, + "learning_rate": 1.4669665448411586e-05, + "loss": 1.4625, + "step": 2610 + }, + { + "epoch": 0.74, + "learning_rate": 1.4838346921563114e-05, + "loss": 1.3446, + "step": 2640 + }, + { + "epoch": 0.75, + "learning_rate": 1.5007028394714648e-05, + "loss": 1.2631, + "step": 2670 + }, + { + "epoch": 0.76, + "learning_rate": 1.517570986786618e-05, + "loss": 1.2598, + "step": 2700 + }, + { + "epoch": 0.77, + "learning_rate": 1.534439134101771e-05, + "loss": 1.1956, + "step": 2730 + }, + { + "epoch": 0.78, + "learning_rate": 1.5513072814169244e-05, + "loss": 1.1249, + "step": 2760 + }, + { + "epoch": 0.78, + "learning_rate": 1.5681754287320776e-05, + "loss": 1.1259, + "step": 2790 + }, + { + "epoch": 0.79, + "learning_rate": 1.5850435760472308e-05, + "loss": 1.0686, + "step": 2820 + }, + { + "epoch": 0.8, + "learning_rate": 1.601911723362384e-05, + "loss": 1.0721, + "step": 2850 + }, + { + "epoch": 0.81, + "learning_rate": 1.6187798706775373e-05, + "loss": 1.0029, + "step": 2880 + }, + { + "epoch": 0.82, + "learning_rate": 1.6356480179926905e-05, + "loss": 1.0331, + "step": 2910 + }, + { + "epoch": 0.83, + "learning_rate": 1.6525161653078437e-05, + "loss": 0.9962, + "step": 2940 + }, + { + "epoch": 0.83, + "learning_rate": 1.669384312622997e-05, + "loss": 0.9536, + "step": 2970 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862524599381502e-05, + "loss": 0.9659, + "step": 3000 + }, + { + "epoch": 0.85, + "learning_rate": 1.7031206072533034e-05, + "loss": 0.8696, + "step": 3030 + }, + { + "epoch": 0.86, + "learning_rate": 1.7199887545684566e-05, + "loss": 0.9237, + "step": 3060 + }, + { + "epoch": 0.87, + "learning_rate": 1.73685690188361e-05, + "loss": 0.8709, + "step": 3090 + }, + { + "epoch": 0.88, + "learning_rate": 1.753725049198763e-05, + "loss": 0.8687, + "step": 3120 + }, + { + "epoch": 0.89, + "learning_rate": 1.7705931965139163e-05, + "loss": 0.8936, + "step": 3150 + }, + { + "epoch": 0.89, + "learning_rate": 1.7874613438290696e-05, + "loss": 0.8026, + "step": 3180 + }, + { + "epoch": 0.9, + "learning_rate": 1.8043294911442228e-05, + "loss": 0.8476, + "step": 3210 + }, + { + "epoch": 0.91, + "learning_rate": 1.821197638459376e-05, + "loss": 0.7849, + "step": 3240 + }, + { + "epoch": 0.92, + "learning_rate": 1.8380657857745292e-05, + "loss": 0.7881, + "step": 3270 + }, + { + "epoch": 0.93, + "learning_rate": 1.854933933089682e-05, + "loss": 0.8008, + "step": 3300 + }, + { + "epoch": 0.94, + "learning_rate": 1.8718020804048357e-05, + "loss": 0.7813, + "step": 3330 + }, + { + "epoch": 0.94, + "learning_rate": 1.888670227719989e-05, + "loss": 0.7709, + "step": 3360 + }, + { + "epoch": 0.95, + "learning_rate": 1.905538375035142e-05, + "loss": 0.7513, + "step": 3390 + }, + { + "epoch": 0.96, + "learning_rate": 1.922406522350295e-05, + "loss": 0.7527, + "step": 3420 + }, + { + "epoch": 0.97, + "learning_rate": 1.9392746696654486e-05, + "loss": 0.7578, + "step": 3450 + }, + { + "epoch": 0.98, + "learning_rate": 1.956142816980602e-05, + "loss": 0.692, + "step": 3480 + }, + { + "epoch": 0.99, + "learning_rate": 1.973010964295755e-05, + "loss": 0.7196, + "step": 3510 + }, + { + "epoch": 1.0, + "learning_rate": 1.989879111610908e-05, + "loss": 0.6827, + "step": 3540 + }, + { + "epoch": 1.0, + "eval_loss": 0.6694612503051758, + "eval_runtime": 479.6772, + "eval_samples_per_second": 33.425, + "eval_steps_per_second": 1.047, + "eval_wer": 0.6247048708255428, + "step": 3557 + }, + { + "epoch": 1.0, + "learning_rate": 2.0067472589260615e-05, + "loss": 0.7322, + "step": 3570 + }, + { + "epoch": 1.01, + "learning_rate": 2.0236154062412148e-05, + "loss": 0.6911, + "step": 3600 + }, + { + "epoch": 1.02, + "learning_rate": 2.040483553556368e-05, + "loss": 0.6838, + "step": 3630 + }, + { + "epoch": 1.03, + "learning_rate": 2.057351700871521e-05, + "loss": 0.7403, + "step": 3660 + }, + { + "epoch": 1.04, + "learning_rate": 2.074219848186674e-05, + "loss": 0.6329, + "step": 3690 + }, + { + "epoch": 1.05, + "learning_rate": 2.0910879955018277e-05, + "loss": 0.7176, + "step": 3720 + }, + { + "epoch": 1.05, + "learning_rate": 2.107956142816981e-05, + "loss": 0.6629, + "step": 3750 + }, + { + "epoch": 1.06, + "learning_rate": 2.1248242901321338e-05, + "loss": 0.6463, + "step": 3780 + }, + { + "epoch": 1.07, + "learning_rate": 2.141692437447287e-05, + "loss": 0.6654, + "step": 3810 + }, + { + "epoch": 1.08, + "learning_rate": 2.1585605847624406e-05, + "loss": 0.6117, + "step": 3840 + }, + { + "epoch": 1.09, + "learning_rate": 2.1754287320775935e-05, + "loss": 0.6467, + "step": 3870 + }, + { + "epoch": 1.1, + "learning_rate": 2.1922968793927467e-05, + "loss": 0.6177, + "step": 3900 + }, + { + "epoch": 1.1, + "learning_rate": 2.2091650267079e-05, + "loss": 0.6371, + "step": 3930 + }, + { + "epoch": 1.11, + "learning_rate": 2.2260331740230535e-05, + "loss": 0.6435, + "step": 3960 + }, + { + "epoch": 1.12, + "learning_rate": 2.2429013213382064e-05, + "loss": 0.5747, + "step": 3990 + }, + { + "epoch": 1.13, + "learning_rate": 2.2597694686533596e-05, + "loss": 0.6323, + "step": 4020 + }, + { + "epoch": 1.14, + "learning_rate": 2.276637615968513e-05, + "loss": 0.5872, + "step": 4050 + }, + { + "epoch": 1.15, + "learning_rate": 2.293505763283666e-05, + "loss": 0.6117, + "step": 4080 + }, + { + "epoch": 1.16, + "learning_rate": 2.3103739105988193e-05, + "loss": 0.6378, + "step": 4110 + }, + { + "epoch": 1.16, + "learning_rate": 2.3272420579139725e-05, + "loss": 0.5582, + "step": 4140 + }, + { + "epoch": 1.17, + "learning_rate": 2.3441102052291258e-05, + "loss": 0.5966, + "step": 4170 + }, + { + "epoch": 1.18, + "learning_rate": 2.360978352544279e-05, + "loss": 0.5798, + "step": 4200 + }, + { + "epoch": 1.19, + "learning_rate": 2.3778464998594322e-05, + "loss": 0.5712, + "step": 4230 + }, + { + "epoch": 1.2, + "learning_rate": 2.3947146471745854e-05, + "loss": 0.6294, + "step": 4260 + }, + { + "epoch": 1.21, + "learning_rate": 2.4115827944897387e-05, + "loss": 0.5199, + "step": 4290 + }, + { + "epoch": 1.21, + "learning_rate": 2.428450941804892e-05, + "loss": 0.5899, + "step": 4320 + }, + { + "epoch": 1.22, + "learning_rate": 2.445319089120045e-05, + "loss": 0.5548, + "step": 4350 + }, + { + "epoch": 1.23, + "learning_rate": 2.4621872364351984e-05, + "loss": 0.5549, + "step": 4380 + }, + { + "epoch": 1.24, + "learning_rate": 2.4790553837503516e-05, + "loss": 0.5868, + "step": 4410 + }, + { + "epoch": 1.25, + "learning_rate": 2.4959235310655048e-05, + "loss": 0.5235, + "step": 4440 + }, + { + "epoch": 1.26, + "learning_rate": 2.5127916783806584e-05, + "loss": 0.554, + "step": 4470 + }, + { + "epoch": 1.27, + "learning_rate": 2.529659825695811e-05, + "loss": 0.5417, + "step": 4500 + }, + { + "epoch": 1.27, + "learning_rate": 2.546527973010964e-05, + "loss": 0.5507, + "step": 4530 + }, + { + "epoch": 1.28, + "learning_rate": 2.5633961203261174e-05, + "loss": 0.553, + "step": 4560 + }, + { + "epoch": 1.29, + "learning_rate": 2.580264267641271e-05, + "loss": 0.5236, + "step": 4590 + }, + { + "epoch": 1.3, + "learning_rate": 2.5971324149564242e-05, + "loss": 0.539, + "step": 4620 + }, + { + "epoch": 1.31, + "learning_rate": 2.6140005622715774e-05, + "loss": 0.5365, + "step": 4650 + }, + { + "epoch": 1.32, + "learning_rate": 2.6308687095867306e-05, + "loss": 0.5051, + "step": 4680 + }, + { + "epoch": 1.32, + "learning_rate": 2.647736856901884e-05, + "loss": 0.5507, + "step": 4710 + }, + { + "epoch": 1.33, + "learning_rate": 2.6646050042170368e-05, + "loss": 0.4849, + "step": 4740 + }, + { + "epoch": 1.34, + "learning_rate": 2.68147315153219e-05, + "loss": 0.5283, + "step": 4770 + }, + { + "epoch": 1.35, + "learning_rate": 2.6983412988473432e-05, + "loss": 0.5033, + "step": 4800 + }, + { + "epoch": 1.36, + "learning_rate": 2.7152094461624968e-05, + "loss": 0.4936, + "step": 4830 + }, + { + "epoch": 1.37, + "learning_rate": 2.73207759347765e-05, + "loss": 0.5279, + "step": 4860 + }, + { + "epoch": 1.37, + "learning_rate": 2.7489457407928032e-05, + "loss": 0.4744, + "step": 4890 + }, + { + "epoch": 1.38, + "learning_rate": 2.7658138881079565e-05, + "loss": 0.5037, + "step": 4920 + }, + { + "epoch": 1.39, + "learning_rate": 2.7826820354231094e-05, + "loss": 0.4915, + "step": 4950 + }, + { + "epoch": 1.4, + "learning_rate": 2.7995501827382626e-05, + "loss": 0.4876, + "step": 4980 + }, + { + "epoch": 1.41, + "learning_rate": 2.8164183300534158e-05, + "loss": 0.5335, + "step": 5010 + }, + { + "epoch": 1.42, + "learning_rate": 2.833286477368569e-05, + "loss": 0.4636, + "step": 5040 + }, + { + "epoch": 1.43, + "learning_rate": 2.8501546246837223e-05, + "loss": 0.5002, + "step": 5070 + }, + { + "epoch": 1.43, + "learning_rate": 2.867022771998876e-05, + "loss": 0.4758, + "step": 5100 + }, + { + "epoch": 1.44, + "learning_rate": 2.883890919314029e-05, + "loss": 0.4738, + "step": 5130 + }, + { + "epoch": 1.45, + "learning_rate": 2.9007590666291823e-05, + "loss": 0.5203, + "step": 5160 + }, + { + "epoch": 1.46, + "learning_rate": 2.9176272139443352e-05, + "loss": 0.443, + "step": 5190 + }, + { + "epoch": 1.47, + "learning_rate": 2.9344953612594884e-05, + "loss": 0.4962, + "step": 5220 + }, + { + "epoch": 1.48, + "learning_rate": 2.9513635085746416e-05, + "loss": 0.4682, + "step": 5250 + }, + { + "epoch": 1.48, + "learning_rate": 2.968231655889795e-05, + "loss": 0.457, + "step": 5280 + }, + { + "epoch": 1.49, + "learning_rate": 2.985099803204948e-05, + "loss": 0.5142, + "step": 5310 + }, + { + "epoch": 1.5, + "learning_rate": 3.0019679505201017e-05, + "loss": 0.4314, + "step": 5340 + }, + { + "epoch": 1.51, + "learning_rate": 3.018836097835255e-05, + "loss": 0.4743, + "step": 5370 + }, + { + "epoch": 1.52, + "learning_rate": 3.0357042451504074e-05, + "loss": 0.4578, + "step": 5400 + }, + { + "epoch": 1.53, + "learning_rate": 3.052572392465561e-05, + "loss": 0.4509, + "step": 5430 + }, + { + "epoch": 1.53, + "learning_rate": 3.069440539780714e-05, + "loss": 0.4864, + "step": 5460 + }, + { + "epoch": 1.54, + "learning_rate": 3.0863086870958675e-05, + "loss": 0.4256, + "step": 5490 + }, + { + "epoch": 1.55, + "learning_rate": 3.103176834411021e-05, + "loss": 0.4903, + "step": 5520 + }, + { + "epoch": 1.56, + "learning_rate": 3.120044981726174e-05, + "loss": 0.4521, + "step": 5550 + }, + { + "epoch": 1.57, + "learning_rate": 3.136913129041327e-05, + "loss": 0.4468, + "step": 5580 + }, + { + "epoch": 1.58, + "learning_rate": 3.1537812763564804e-05, + "loss": 0.4822, + "step": 5610 + }, + { + "epoch": 1.59, + "learning_rate": 3.1706494236716336e-05, + "loss": 0.4293, + "step": 5640 + }, + { + "epoch": 1.59, + "learning_rate": 3.187517570986787e-05, + "loss": 0.4591, + "step": 5670 + }, + { + "epoch": 1.6, + "learning_rate": 3.20438571830194e-05, + "loss": 0.4288, + "step": 5700 + }, + { + "epoch": 1.61, + "learning_rate": 3.221253865617093e-05, + "loss": 0.4464, + "step": 5730 + }, + { + "epoch": 1.62, + "learning_rate": 3.2381220129322465e-05, + "loss": 0.4698, + "step": 5760 + }, + { + "epoch": 1.63, + "learning_rate": 3.2549901602474e-05, + "loss": 0.4046, + "step": 5790 + }, + { + "epoch": 1.64, + "learning_rate": 3.271858307562553e-05, + "loss": 0.4578, + "step": 5820 + }, + { + "epoch": 1.64, + "learning_rate": 3.288726454877706e-05, + "loss": 0.4225, + "step": 5850 + }, + { + "epoch": 1.65, + "learning_rate": 3.3055946021928594e-05, + "loss": 0.4364, + "step": 5880 + }, + { + "epoch": 1.66, + "learning_rate": 3.3224627495080127e-05, + "loss": 0.4601, + "step": 5910 + }, + { + "epoch": 1.67, + "learning_rate": 3.339330896823166e-05, + "loss": 0.4043, + "step": 5940 + }, + { + "epoch": 1.68, + "learning_rate": 3.356199044138319e-05, + "loss": 0.4533, + "step": 5970 + }, + { + "epoch": 1.69, + "learning_rate": 3.3730671914534723e-05, + "loss": 0.4269, + "step": 6000 + }, + { + "epoch": 1.7, + "learning_rate": 3.3899353387686256e-05, + "loss": 0.4232, + "step": 6030 + }, + { + "epoch": 1.7, + "learning_rate": 3.406803486083779e-05, + "loss": 0.4536, + "step": 6060 + }, + { + "epoch": 1.71, + "learning_rate": 3.4236716333989314e-05, + "loss": 0.3908, + "step": 6090 + }, + { + "epoch": 1.72, + "learning_rate": 3.4405397807140846e-05, + "loss": 0.4204, + "step": 6120 + }, + { + "epoch": 1.73, + "learning_rate": 3.4574079280292385e-05, + "loss": 0.4227, + "step": 6150 + }, + { + "epoch": 1.74, + "learning_rate": 3.474276075344392e-05, + "loss": 0.4017, + "step": 6180 + }, + { + "epoch": 1.75, + "learning_rate": 3.491144222659545e-05, + "loss": 0.4394, + "step": 6210 + }, + { + "epoch": 1.75, + "learning_rate": 3.508012369974698e-05, + "loss": 0.3858, + "step": 6240 + }, + { + "epoch": 1.76, + "learning_rate": 3.5248805172898514e-05, + "loss": 0.4235, + "step": 6270 + }, + { + "epoch": 1.77, + "learning_rate": 3.5417486646050046e-05, + "loss": 0.4025, + "step": 6300 + }, + { + "epoch": 1.78, + "learning_rate": 3.558616811920157e-05, + "loss": 0.4115, + "step": 6330 + }, + { + "epoch": 1.79, + "learning_rate": 3.5754849592353104e-05, + "loss": 0.4366, + "step": 6360 + }, + { + "epoch": 1.8, + "learning_rate": 3.592353106550464e-05, + "loss": 0.3796, + "step": 6390 + }, + { + "epoch": 1.8, + "learning_rate": 3.6092212538656175e-05, + "loss": 0.4116, + "step": 6420 + }, + { + "epoch": 1.81, + "learning_rate": 3.625527129603599e-05, + "loss": 0.3995, + "step": 6450 + }, + { + "epoch": 1.82, + "learning_rate": 3.642395276918752e-05, + "loss": 0.3909, + "step": 6480 + }, + { + "epoch": 1.83, + "learning_rate": 3.659263424233905e-05, + "loss": 0.4251, + "step": 6510 + }, + { + "epoch": 1.84, + "learning_rate": 3.6761315715490585e-05, + "loss": 0.378, + "step": 6540 + }, + { + "epoch": 1.85, + "learning_rate": 3.692999718864212e-05, + "loss": 0.4189, + "step": 6570 + }, + { + "epoch": 1.86, + "learning_rate": 3.709867866179364e-05, + "loss": 0.3978, + "step": 6600 + }, + { + "epoch": 1.86, + "learning_rate": 3.726736013494518e-05, + "loss": 0.3937, + "step": 6630 + }, + { + "epoch": 1.87, + "learning_rate": 3.7436041608096714e-05, + "loss": 0.4173, + "step": 6660 + }, + { + "epoch": 1.88, + "learning_rate": 3.7604723081248246e-05, + "loss": 0.3611, + "step": 6690 + }, + { + "epoch": 1.89, + "learning_rate": 3.777340455439978e-05, + "loss": 0.415, + "step": 6720 + }, + { + "epoch": 1.9, + "learning_rate": 3.794208602755131e-05, + "loss": 0.3909, + "step": 6750 + }, + { + "epoch": 1.91, + "learning_rate": 3.811076750070284e-05, + "loss": 0.398, + "step": 6780 + }, + { + "epoch": 1.91, + "learning_rate": 3.8279448973854375e-05, + "loss": 0.4173, + "step": 6810 + }, + { + "epoch": 1.92, + "learning_rate": 3.84481304470059e-05, + "loss": 0.3814, + "step": 6840 + }, + { + "epoch": 1.93, + "learning_rate": 3.861681192015743e-05, + "loss": 0.4008, + "step": 6870 + }, + { + "epoch": 1.94, + "learning_rate": 3.878549339330897e-05, + "loss": 0.3793, + "step": 6900 + }, + { + "epoch": 1.95, + "learning_rate": 3.8954174866460504e-05, + "loss": 0.3828, + "step": 6930 + }, + { + "epoch": 1.96, + "learning_rate": 3.912285633961204e-05, + "loss": 0.4004, + "step": 6960 + }, + { + "epoch": 1.97, + "learning_rate": 3.929153781276357e-05, + "loss": 0.3492, + "step": 6990 + }, + { + "epoch": 1.97, + "learning_rate": 3.94602192859151e-05, + "loss": 0.4091, + "step": 7020 + }, + { + "epoch": 1.98, + "learning_rate": 3.962890075906663e-05, + "loss": 0.3959, + "step": 7050 + }, + { + "epoch": 1.99, + "learning_rate": 3.979758223221816e-05, + "loss": 0.3989, + "step": 7080 + }, + { + "epoch": 2.0, + "learning_rate": 3.996626370536969e-05, + "loss": 0.3992, + "step": 7110 + }, + { + "epoch": 2.0, + "eval_loss": 0.3737587332725525, + "eval_runtime": 480.2975, + "eval_samples_per_second": 33.381, + "eval_steps_per_second": 1.045, + "eval_wer": 0.39358972609283094, + "step": 7114 + }, + { + "epoch": 2.01, + "learning_rate": 4.013494517852123e-05, + "loss": 0.3616, + "step": 7140 + }, + { + "epoch": 2.02, + "learning_rate": 4.030362665167276e-05, + "loss": 0.3869, + "step": 7170 + }, + { + "epoch": 2.02, + "learning_rate": 4.0472308124824295e-05, + "loss": 0.344, + "step": 7200 + }, + { + "epoch": 2.03, + "learning_rate": 4.064098959797583e-05, + "loss": 0.3751, + "step": 7230 + }, + { + "epoch": 2.04, + "learning_rate": 4.080967107112736e-05, + "loss": 0.3755, + "step": 7260 + }, + { + "epoch": 2.05, + "learning_rate": 4.0978352544278885e-05, + "loss": 0.3529, + "step": 7290 + }, + { + "epoch": 2.06, + "learning_rate": 4.114703401743042e-05, + "loss": 0.3805, + "step": 7320 + }, + { + "epoch": 2.07, + "learning_rate": 4.131571549058195e-05, + "loss": 0.3421, + "step": 7350 + }, + { + "epoch": 2.07, + "learning_rate": 4.148439696373348e-05, + "loss": 0.3584, + "step": 7380 + }, + { + "epoch": 2.08, + "learning_rate": 4.165307843688502e-05, + "loss": 0.3639, + "step": 7410 + }, + { + "epoch": 2.09, + "learning_rate": 4.182175991003655e-05, + "loss": 0.3447, + "step": 7440 + }, + { + "epoch": 2.1, + "learning_rate": 4.1990441383188086e-05, + "loss": 0.3812, + "step": 7470 + }, + { + "epoch": 2.11, + "learning_rate": 4.215912285633962e-05, + "loss": 0.342, + "step": 7500 + }, + { + "epoch": 2.12, + "learning_rate": 4.232780432949114e-05, + "loss": 0.3811, + "step": 7530 + }, + { + "epoch": 2.13, + "learning_rate": 4.2496485802642676e-05, + "loss": 0.3631, + "step": 7560 + }, + { + "epoch": 2.13, + "learning_rate": 4.266516727579421e-05, + "loss": 0.338, + "step": 7590 + }, + { + "epoch": 2.14, + "learning_rate": 4.283384874894574e-05, + "loss": 0.3733, + "step": 7620 + }, + { + "epoch": 2.15, + "learning_rate": 4.300253022209727e-05, + "loss": 0.3247, + "step": 7650 + }, + { + "epoch": 2.16, + "learning_rate": 4.317121169524881e-05, + "loss": 0.3573, + "step": 7680 + }, + { + "epoch": 2.17, + "learning_rate": 4.3339893168400344e-05, + "loss": 0.3536, + "step": 7710 + }, + { + "epoch": 2.18, + "learning_rate": 4.350857464155187e-05, + "loss": 0.336, + "step": 7740 + }, + { + "epoch": 2.18, + "learning_rate": 4.36772561147034e-05, + "loss": 0.3805, + "step": 7770 + }, + { + "epoch": 2.19, + "learning_rate": 4.3845937587854934e-05, + "loss": 0.3219, + "step": 7800 + }, + { + "epoch": 2.2, + "learning_rate": 4.4014619061006466e-05, + "loss": 0.3488, + "step": 7830 + }, + { + "epoch": 2.21, + "learning_rate": 4.4183300534158e-05, + "loss": 0.3505, + "step": 7860 + }, + { + "epoch": 2.22, + "learning_rate": 4.435198200730953e-05, + "loss": 0.3363, + "step": 7890 + }, + { + "epoch": 2.23, + "learning_rate": 4.452066348046107e-05, + "loss": 0.3674, + "step": 7920 + }, + { + "epoch": 2.23, + "learning_rate": 4.46893449536126e-05, + "loss": 0.3187, + "step": 7950 + }, + { + "epoch": 2.24, + "learning_rate": 4.485802642676413e-05, + "loss": 0.342, + "step": 7980 + }, + { + "epoch": 2.25, + "learning_rate": 4.502670789991566e-05, + "loss": 0.3452, + "step": 8010 + }, + { + "epoch": 2.26, + "learning_rate": 4.519538937306719e-05, + "loss": 0.3259, + "step": 8040 + }, + { + "epoch": 2.27, + "learning_rate": 4.5364070846218724e-05, + "loss": 0.365, + "step": 8070 + }, + { + "epoch": 2.28, + "learning_rate": 4.553275231937026e-05, + "loss": 0.3086, + "step": 8100 + }, + { + "epoch": 2.29, + "learning_rate": 4.570143379252179e-05, + "loss": 0.347, + "step": 8130 + }, + { + "epoch": 2.29, + "learning_rate": 4.587011526567332e-05, + "loss": 0.3502, + "step": 8160 + }, + { + "epoch": 2.3, + "learning_rate": 4.6038796738824854e-05, + "loss": 0.3292, + "step": 8190 + }, + { + "epoch": 2.31, + "learning_rate": 4.6207478211976386e-05, + "loss": 0.3591, + "step": 8220 + }, + { + "epoch": 2.32, + "learning_rate": 4.637615968512792e-05, + "loss": 0.3107, + "step": 8250 + }, + { + "epoch": 2.33, + "learning_rate": 4.654484115827945e-05, + "loss": 0.3472, + "step": 8280 + }, + { + "epoch": 2.34, + "learning_rate": 4.671352263143098e-05, + "loss": 0.3508, + "step": 8310 + }, + { + "epoch": 2.34, + "learning_rate": 4.6882204104582515e-05, + "loss": 0.3302, + "step": 8340 + }, + { + "epoch": 2.35, + "learning_rate": 4.705088557773405e-05, + "loss": 0.3546, + "step": 8370 + }, + { + "epoch": 2.36, + "learning_rate": 4.721956705088558e-05, + "loss": 0.3139, + "step": 8400 + }, + { + "epoch": 2.37, + "learning_rate": 4.738824852403711e-05, + "loss": 0.3369, + "step": 8430 + }, + { + "epoch": 2.38, + "learning_rate": 4.7556929997188644e-05, + "loss": 0.3388, + "step": 8460 + }, + { + "epoch": 2.39, + "learning_rate": 4.7725611470340176e-05, + "loss": 0.3249, + "step": 8490 + }, + { + "epoch": 2.4, + "learning_rate": 4.789429294349171e-05, + "loss": 0.3521, + "step": 8520 + }, + { + "epoch": 2.4, + "learning_rate": 4.806297441664324e-05, + "loss": 0.3098, + "step": 8550 + }, + { + "epoch": 2.41, + "learning_rate": 4.823165588979477e-05, + "loss": 0.3394, + "step": 8580 + }, + { + "epoch": 2.42, + "learning_rate": 4.8400337362946306e-05, + "loss": 0.3332, + "step": 8610 + }, + { + "epoch": 2.43, + "learning_rate": 4.856901883609784e-05, + "loss": 0.3176, + "step": 8640 + }, + { + "epoch": 2.44, + "learning_rate": 4.873770030924937e-05, + "loss": 0.3477, + "step": 8670 + }, + { + "epoch": 2.45, + "learning_rate": 4.89063817824009e-05, + "loss": 0.2996, + "step": 8700 + }, + { + "epoch": 2.45, + "learning_rate": 4.9075063255552435e-05, + "loss": 0.3392, + "step": 8730 + }, + { + "epoch": 2.46, + "learning_rate": 4.924374472870397e-05, + "loss": 0.3182, + "step": 8760 + }, + { + "epoch": 2.47, + "learning_rate": 4.94124262018555e-05, + "loss": 0.3102, + "step": 8790 + }, + { + "epoch": 2.48, + "learning_rate": 4.958110767500703e-05, + "loss": 0.3393, + "step": 8820 + }, + { + "epoch": 2.49, + "learning_rate": 4.9749789148158564e-05, + "loss": 0.3018, + "step": 8850 + }, + { + "epoch": 2.5, + "learning_rate": 4.9918470621310096e-05, + "loss": 0.3248, + "step": 8880 + }, + { + "epoch": 2.5, + "learning_rate": 5.008715209446163e-05, + "loss": 0.3333, + "step": 8910 + }, + { + "epoch": 2.51, + "learning_rate": 5.025021085184144e-05, + "loss": 0.3293, + "step": 8940 + }, + { + "epoch": 2.52, + "learning_rate": 5.041889232499297e-05, + "loss": 0.3295, + "step": 8970 + }, + { + "epoch": 2.53, + "learning_rate": 5.0587573798144506e-05, + "loss": 0.305, + "step": 9000 + }, + { + "epoch": 2.54, + "learning_rate": 5.075625527129604e-05, + "loss": 0.3299, + "step": 9030 + }, + { + "epoch": 2.55, + "learning_rate": 5.092493674444757e-05, + "loss": 0.3191, + "step": 9060 + }, + { + "epoch": 2.56, + "learning_rate": 5.10936182175991e-05, + "loss": 0.3088, + "step": 9090 + }, + { + "epoch": 2.56, + "learning_rate": 5.1262299690750635e-05, + "loss": 0.3358, + "step": 9120 + }, + { + "epoch": 2.57, + "learning_rate": 5.143098116390217e-05, + "loss": 0.2975, + "step": 9150 + }, + { + "epoch": 2.58, + "learning_rate": 5.1599662637053706e-05, + "loss": 0.3194, + "step": 9180 + }, + { + "epoch": 2.59, + "learning_rate": 5.176834411020524e-05, + "loss": 0.315, + "step": 9210 + }, + { + "epoch": 2.6, + "learning_rate": 5.193702558335677e-05, + "loss": 0.3019, + "step": 9240 + }, + { + "epoch": 2.61, + "learning_rate": 5.210570705650829e-05, + "loss": 0.341, + "step": 9270 + }, + { + "epoch": 2.61, + "learning_rate": 5.227438852965982e-05, + "loss": 0.2915, + "step": 9300 + }, + { + "epoch": 2.62, + "learning_rate": 5.2443070002811354e-05, + "loss": 0.3036, + "step": 9330 + }, + { + "epoch": 2.63, + "learning_rate": 5.2611751475962886e-05, + "loss": 0.3123, + "step": 9360 + }, + { + "epoch": 2.64, + "learning_rate": 5.2780432949114425e-05, + "loss": 0.2926, + "step": 9390 + }, + { + "epoch": 2.65, + "learning_rate": 5.294911442226596e-05, + "loss": 0.3263, + "step": 9420 + }, + { + "epoch": 2.66, + "learning_rate": 5.311779589541749e-05, + "loss": 0.2841, + "step": 9450 + }, + { + "epoch": 2.67, + "learning_rate": 5.328647736856902e-05, + "loss": 0.3243, + "step": 9480 + }, + { + "epoch": 2.67, + "learning_rate": 5.3455158841720554e-05, + "loss": 0.3091, + "step": 9510 + }, + { + "epoch": 2.68, + "learning_rate": 5.3623840314872087e-05, + "loss": 0.3011, + "step": 9540 + }, + { + "epoch": 2.69, + "learning_rate": 5.379252178802362e-05, + "loss": 0.3216, + "step": 9570 + }, + { + "epoch": 2.7, + "learning_rate": 5.396120326117515e-05, + "loss": 0.2834, + "step": 9600 + }, + { + "epoch": 2.71, + "learning_rate": 5.4129884734326683e-05, + "loss": 0.3174, + "step": 9630 + }, + { + "epoch": 2.72, + "learning_rate": 5.4298566207478216e-05, + "loss": 0.2969, + "step": 9660 + }, + { + "epoch": 2.72, + "learning_rate": 5.4467247680629755e-05, + "loss": 0.2896, + "step": 9690 + }, + { + "epoch": 2.73, + "learning_rate": 5.463592915378129e-05, + "loss": 0.3153, + "step": 9720 + }, + { + "epoch": 2.74, + "learning_rate": 5.4804610626932806e-05, + "loss": 0.2767, + "step": 9750 + }, + { + "epoch": 2.75, + "learning_rate": 5.497329210008434e-05, + "loss": 0.3188, + "step": 9780 + }, + { + "epoch": 2.76, + "learning_rate": 5.514197357323587e-05, + "loss": 0.3092, + "step": 9810 + }, + { + "epoch": 2.77, + "learning_rate": 5.53106550463874e-05, + "loss": 0.2959, + "step": 9840 + }, + { + "epoch": 2.77, + "learning_rate": 5.5479336519538935e-05, + "loss": 0.3283, + "step": 9870 + }, + { + "epoch": 2.78, + "learning_rate": 5.5648017992690474e-05, + "loss": 0.2868, + "step": 9900 + }, + { + "epoch": 2.79, + "learning_rate": 5.5816699465842006e-05, + "loss": 0.3149, + "step": 9930 + }, + { + "epoch": 2.8, + "learning_rate": 5.598538093899354e-05, + "loss": 0.304, + "step": 9960 + }, + { + "epoch": 2.81, + "learning_rate": 5.615406241214507e-05, + "loss": 0.2867, + "step": 9990 + }, + { + "epoch": 2.82, + "learning_rate": 5.63227438852966e-05, + "loss": 0.321, + "step": 10020 + }, + { + "epoch": 2.83, + "learning_rate": 5.6491425358448135e-05, + "loss": 0.2739, + "step": 10050 + }, + { + "epoch": 2.83, + "learning_rate": 5.666010683159967e-05, + "loss": 0.3268, + "step": 10080 + }, + { + "epoch": 2.84, + "learning_rate": 5.68287883047512e-05, + "loss": 0.3024, + "step": 10110 + }, + { + "epoch": 2.85, + "learning_rate": 5.699746977790273e-05, + "loss": 0.2842, + "step": 10140 + }, + { + "epoch": 2.86, + "learning_rate": 5.7166151251054265e-05, + "loss": 0.3249, + "step": 10170 + }, + { + "epoch": 2.87, + "learning_rate": 5.733483272420579e-05, + "loss": 0.2767, + "step": 10200 + }, + { + "epoch": 2.88, + "learning_rate": 5.750351419735732e-05, + "loss": 0.3021, + "step": 10230 + }, + { + "epoch": 2.88, + "learning_rate": 5.7672195670508855e-05, + "loss": 0.3049, + "step": 10260 + }, + { + "epoch": 2.89, + "learning_rate": 5.784087714366039e-05, + "loss": 0.2757, + "step": 10290 + }, + { + "epoch": 2.9, + "learning_rate": 5.800955861681192e-05, + "loss": 0.3065, + "step": 10320 + }, + { + "epoch": 2.91, + "learning_rate": 5.817824008996345e-05, + "loss": 0.2667, + "step": 10350 + }, + { + "epoch": 2.92, + "learning_rate": 5.8346921563114984e-05, + "loss": 0.3008, + "step": 10380 + }, + { + "epoch": 2.93, + "learning_rate": 5.851560303626652e-05, + "loss": 0.2879, + "step": 10410 + }, + { + "epoch": 2.93, + "learning_rate": 5.8684284509418055e-05, + "loss": 0.2768, + "step": 10440 + }, + { + "epoch": 2.94, + "learning_rate": 5.885296598256959e-05, + "loss": 0.3082, + "step": 10470 + }, + { + "epoch": 2.95, + "learning_rate": 5.902164745572112e-05, + "loss": 0.2627, + "step": 10500 + }, + { + "epoch": 2.96, + "learning_rate": 5.919032892887265e-05, + "loss": 0.3004, + "step": 10530 + }, + { + "epoch": 2.97, + "learning_rate": 5.9359010402024184e-05, + "loss": 0.2858, + "step": 10560 + }, + { + "epoch": 2.98, + "learning_rate": 5.9527691875175717e-05, + "loss": 0.2808, + "step": 10590 + }, + { + "epoch": 2.99, + "learning_rate": 5.969637334832725e-05, + "loss": 0.299, + "step": 10620 + }, + { + "epoch": 2.99, + "learning_rate": 5.9865054821478774e-05, + "loss": 0.2611, + "step": 10650 + }, + { + "epoch": 3.0, + "eval_loss": 0.30112308263778687, + "eval_runtime": 481.9568, + "eval_samples_per_second": 33.266, + "eval_steps_per_second": 1.042, + "eval_wer": 0.3177432342063243, + "step": 10671 + }, + { + "epoch": 3.0, + "learning_rate": 6.003373629463031e-05, + "loss": 0.3151, + "step": 10680 + }, + { + "epoch": 3.01, + "learning_rate": 6.020241776778184e-05, + "loss": 0.2666, + "step": 10710 + }, + { + "epoch": 3.02, + "learning_rate": 6.037109924093337e-05, + "loss": 0.278, + "step": 10740 + }, + { + "epoch": 3.03, + "learning_rate": 6.0539780714084903e-05, + "loss": 0.2873, + "step": 10770 + }, + { + "epoch": 3.04, + "learning_rate": 6.0708462187236436e-05, + "loss": 0.2838, + "step": 10800 + }, + { + "epoch": 3.04, + "learning_rate": 6.087714366038797e-05, + "loss": 0.2901, + "step": 10830 + }, + { + "epoch": 3.05, + "learning_rate": 6.104582513353951e-05, + "loss": 0.2606, + "step": 10860 + }, + { + "epoch": 3.06, + "learning_rate": 6.121450660669103e-05, + "loss": 0.2811, + "step": 10890 + }, + { + "epoch": 3.07, + "learning_rate": 6.138318807984257e-05, + "loss": 0.2904, + "step": 10920 + }, + { + "epoch": 3.08, + "learning_rate": 6.15518695529941e-05, + "loss": 0.2569, + "step": 10950 + }, + { + "epoch": 3.09, + "learning_rate": 6.172055102614564e-05, + "loss": 0.2859, + "step": 10980 + }, + { + "epoch": 3.1, + "learning_rate": 6.188923249929716e-05, + "loss": 0.2584, + "step": 11010 + }, + { + "epoch": 3.1, + "learning_rate": 6.20579139724487e-05, + "loss": 0.2834, + "step": 11040 + }, + { + "epoch": 3.11, + "learning_rate": 6.222659544560024e-05, + "loss": 0.2814, + "step": 11070 + }, + { + "epoch": 3.12, + "learning_rate": 6.239527691875175e-05, + "loss": 0.2533, + "step": 11100 + }, + { + "epoch": 3.13, + "learning_rate": 6.256395839190329e-05, + "loss": 0.2884, + "step": 11130 + }, + { + "epoch": 3.14, + "learning_rate": 6.273263986505482e-05, + "loss": 0.2633, + "step": 11160 + }, + { + "epoch": 3.15, + "learning_rate": 6.290132133820636e-05, + "loss": 0.2737, + "step": 11190 + }, + { + "epoch": 3.15, + "learning_rate": 6.307000281135788e-05, + "loss": 0.2805, + "step": 11220 + }, + { + "epoch": 3.16, + "learning_rate": 6.323868428450942e-05, + "loss": 0.2478, + "step": 11250 + }, + { + "epoch": 3.17, + "learning_rate": 6.340736575766096e-05, + "loss": 0.2918, + "step": 11280 + }, + { + "epoch": 3.18, + "learning_rate": 6.357604723081248e-05, + "loss": 0.2566, + "step": 11310 + }, + { + "epoch": 3.19, + "learning_rate": 6.374472870396402e-05, + "loss": 0.2685, + "step": 11340 + }, + { + "epoch": 3.2, + "learning_rate": 6.391341017711555e-05, + "loss": 0.2871, + "step": 11370 + }, + { + "epoch": 3.2, + "learning_rate": 6.408209165026709e-05, + "loss": 0.2461, + "step": 11400 + }, + { + "epoch": 3.21, + "learning_rate": 6.425077312341861e-05, + "loss": 0.2769, + "step": 11430 + }, + { + "epoch": 3.22, + "learning_rate": 6.441945459657015e-05, + "loss": 0.2561, + "step": 11460 + }, + { + "epoch": 3.23, + "learning_rate": 6.458813606972168e-05, + "loss": 0.2703, + "step": 11490 + }, + { + "epoch": 3.24, + "learning_rate": 6.475681754287322e-05, + "loss": 0.28, + "step": 11520 + }, + { + "epoch": 3.25, + "learning_rate": 6.492549901602474e-05, + "loss": 0.2409, + "step": 11550 + }, + { + "epoch": 3.26, + "learning_rate": 6.509418048917627e-05, + "loss": 0.2825, + "step": 11580 + }, + { + "epoch": 3.26, + "learning_rate": 6.526286196232781e-05, + "loss": 0.255, + "step": 11610 + }, + { + "epoch": 3.27, + "learning_rate": 6.543154343547933e-05, + "loss": 0.2633, + "step": 11640 + }, + { + "epoch": 3.28, + "learning_rate": 6.560022490863087e-05, + "loss": 0.2806, + "step": 11670 + }, + { + "epoch": 3.29, + "learning_rate": 6.57689063817824e-05, + "loss": 0.2471, + "step": 11700 + }, + { + "epoch": 3.3, + "learning_rate": 6.593758785493394e-05, + "loss": 0.2886, + "step": 11730 + }, + { + "epoch": 3.31, + "learning_rate": 6.610626932808546e-05, + "loss": 0.2501, + "step": 11760 + }, + { + "epoch": 3.31, + "learning_rate": 6.626932808546529e-05, + "loss": 0.2899, + "step": 11790 + }, + { + "epoch": 3.32, + "learning_rate": 6.643800955861683e-05, + "loss": 0.2852, + "step": 11820 + }, + { + "epoch": 3.33, + "learning_rate": 6.660669103176834e-05, + "loss": 0.2445, + "step": 11850 + }, + { + "epoch": 3.34, + "learning_rate": 6.677537250491988e-05, + "loss": 0.2772, + "step": 11880 + }, + { + "epoch": 3.35, + "learning_rate": 6.69440539780714e-05, + "loss": 0.2438, + "step": 11910 + }, + { + "epoch": 3.36, + "learning_rate": 6.711273545122294e-05, + "loss": 0.2682, + "step": 11940 + }, + { + "epoch": 3.37, + "learning_rate": 6.728141692437447e-05, + "loss": 0.2745, + "step": 11970 + }, + { + "epoch": 3.37, + "learning_rate": 6.745009839752601e-05, + "loss": 0.2412, + "step": 12000 + }, + { + "epoch": 3.38, + "learning_rate": 6.761877987067755e-05, + "loss": 0.2704, + "step": 12030 + }, + { + "epoch": 3.39, + "learning_rate": 6.778746134382907e-05, + "loss": 0.2515, + "step": 12060 + }, + { + "epoch": 3.4, + "learning_rate": 6.795614281698061e-05, + "loss": 0.2614, + "step": 12090 + }, + { + "epoch": 3.41, + "learning_rate": 6.812482429013214e-05, + "loss": 0.2673, + "step": 12120 + }, + { + "epoch": 3.42, + "learning_rate": 6.829350576328368e-05, + "loss": 0.2377, + "step": 12150 + }, + { + "epoch": 3.42, + "learning_rate": 6.84621872364352e-05, + "loss": 0.2801, + "step": 12180 + }, + { + "epoch": 3.43, + "learning_rate": 6.863086870958674e-05, + "loss": 0.2468, + "step": 12210 + }, + { + "epoch": 3.44, + "learning_rate": 6.879955018273827e-05, + "loss": 0.263, + "step": 12240 + }, + { + "epoch": 3.45, + "learning_rate": 6.89682316558898e-05, + "loss": 0.2722, + "step": 12270 + }, + { + "epoch": 3.46, + "learning_rate": 6.913691312904133e-05, + "loss": 0.2458, + "step": 12300 + }, + { + "epoch": 3.47, + "learning_rate": 6.930559460219286e-05, + "loss": 0.2719, + "step": 12330 + }, + { + "epoch": 3.47, + "learning_rate": 6.94742760753444e-05, + "loss": 0.2646, + "step": 12360 + }, + { + "epoch": 3.48, + "learning_rate": 6.964295754849592e-05, + "loss": 0.2577, + "step": 12390 + }, + { + "epoch": 3.49, + "learning_rate": 6.981163902164746e-05, + "loss": 0.2693, + "step": 12420 + }, + { + "epoch": 3.5, + "learning_rate": 6.998032049479898e-05, + "loss": 0.2399, + "step": 12450 + }, + { + "epoch": 3.51, + "learning_rate": 7.014900196795052e-05, + "loss": 0.2699, + "step": 12480 + }, + { + "epoch": 3.52, + "learning_rate": 7.031768344110205e-05, + "loss": 0.2454, + "step": 12510 + }, + { + "epoch": 3.53, + "learning_rate": 7.048636491425359e-05, + "loss": 0.2598, + "step": 12540 + }, + { + "epoch": 3.53, + "learning_rate": 7.065504638740513e-05, + "loss": 0.2643, + "step": 12570 + }, + { + "epoch": 3.54, + "learning_rate": 7.082372786055665e-05, + "loss": 0.2328, + "step": 12600 + }, + { + "epoch": 3.55, + "learning_rate": 7.099240933370819e-05, + "loss": 0.2691, + "step": 12630 + }, + { + "epoch": 3.56, + "learning_rate": 7.116109080685972e-05, + "loss": 0.233, + "step": 12660 + }, + { + "epoch": 3.57, + "learning_rate": 7.132977228001126e-05, + "loss": 0.2597, + "step": 12690 + }, + { + "epoch": 3.58, + "learning_rate": 7.149845375316278e-05, + "loss": 0.2666, + "step": 12720 + }, + { + "epoch": 3.58, + "learning_rate": 7.166713522631431e-05, + "loss": 0.2254, + "step": 12750 + }, + { + "epoch": 3.59, + "learning_rate": 7.183581669946585e-05, + "loss": 0.2699, + "step": 12780 + }, + { + "epoch": 3.6, + "learning_rate": 7.200449817261737e-05, + "loss": 0.2374, + "step": 12810 + }, + { + "epoch": 3.61, + "learning_rate": 7.217317964576891e-05, + "loss": 0.2505, + "step": 12840 + }, + { + "epoch": 3.62, + "learning_rate": 7.234186111892044e-05, + "loss": 0.2685, + "step": 12870 + }, + { + "epoch": 3.63, + "learning_rate": 7.251054259207198e-05, + "loss": 0.2371, + "step": 12900 + }, + { + "epoch": 3.63, + "learning_rate": 7.26792240652235e-05, + "loss": 0.2573, + "step": 12930 + }, + { + "epoch": 3.64, + "learning_rate": 7.284790553837504e-05, + "loss": 0.2376, + "step": 12960 + }, + { + "epoch": 3.65, + "learning_rate": 7.301658701152657e-05, + "loss": 0.2575, + "step": 12990 + }, + { + "epoch": 3.66, + "learning_rate": 7.31852684846781e-05, + "loss": 0.2615, + "step": 13020 + }, + { + "epoch": 3.67, + "learning_rate": 7.335394995782964e-05, + "loss": 0.2391, + "step": 13050 + }, + { + "epoch": 3.68, + "learning_rate": 7.352263143098117e-05, + "loss": 0.2535, + "step": 13080 + }, + { + "epoch": 3.69, + "learning_rate": 7.369131290413271e-05, + "loss": 0.237, + "step": 13110 + }, + { + "epoch": 3.69, + "learning_rate": 7.385999437728423e-05, + "loss": 0.2592, + "step": 13140 + }, + { + "epoch": 3.7, + "learning_rate": 7.402867585043577e-05, + "loss": 0.2529, + "step": 13170 + }, + { + "epoch": 3.71, + "learning_rate": 7.419735732358729e-05, + "loss": 0.2341, + "step": 13200 + }, + { + "epoch": 3.72, + "learning_rate": 7.436603879673882e-05, + "loss": 0.2643, + "step": 13230 + }, + { + "epoch": 3.73, + "learning_rate": 7.453472026989036e-05, + "loss": 0.2348, + "step": 13260 + }, + { + "epoch": 3.74, + "learning_rate": 7.470340174304189e-05, + "loss": 0.2549, + "step": 13290 + }, + { + "epoch": 3.74, + "learning_rate": 7.487208321619343e-05, + "loss": 0.2583, + "step": 13320 + }, + { + "epoch": 3.75, + "learning_rate": 7.504076468934495e-05, + "loss": 0.2319, + "step": 13350 + }, + { + "epoch": 3.76, + "learning_rate": 7.520944616249649e-05, + "loss": 0.2575, + "step": 13380 + }, + { + "epoch": 3.77, + "learning_rate": 7.537812763564802e-05, + "loss": 0.2378, + "step": 13410 + }, + { + "epoch": 3.78, + "learning_rate": 7.554680910879956e-05, + "loss": 0.2515, + "step": 13440 + }, + { + "epoch": 3.79, + "learning_rate": 7.571549058195108e-05, + "loss": 0.2695, + "step": 13470 + }, + { + "epoch": 3.8, + "learning_rate": 7.588417205510262e-05, + "loss": 0.2304, + "step": 13500 + }, + { + "epoch": 3.8, + "learning_rate": 7.605285352825415e-05, + "loss": 0.2562, + "step": 13530 + }, + { + "epoch": 3.81, + "learning_rate": 7.622153500140569e-05, + "loss": 0.2263, + "step": 13560 + }, + { + "epoch": 3.82, + "learning_rate": 7.639021647455723e-05, + "loss": 0.2499, + "step": 13590 + }, + { + "epoch": 3.83, + "learning_rate": 7.655889794770875e-05, + "loss": 0.2728, + "step": 13620 + }, + { + "epoch": 3.84, + "learning_rate": 7.672757942086028e-05, + "loss": 0.2294, + "step": 13650 + }, + { + "epoch": 3.85, + "learning_rate": 7.68962608940118e-05, + "loss": 0.2573, + "step": 13680 + }, + { + "epoch": 3.85, + "learning_rate": 7.706494236716334e-05, + "loss": 0.2317, + "step": 13710 + }, + { + "epoch": 3.86, + "learning_rate": 7.723362384031487e-05, + "loss": 0.251, + "step": 13740 + }, + { + "epoch": 3.87, + "learning_rate": 7.74023053134664e-05, + "loss": 0.2668, + "step": 13770 + }, + { + "epoch": 3.88, + "learning_rate": 7.757098678661794e-05, + "loss": 0.2297, + "step": 13800 + }, + { + "epoch": 3.89, + "learning_rate": 7.773966825976947e-05, + "loss": 0.2567, + "step": 13830 + }, + { + "epoch": 3.9, + "learning_rate": 7.790834973292101e-05, + "loss": 0.2354, + "step": 13860 + }, + { + "epoch": 3.9, + "learning_rate": 7.807703120607253e-05, + "loss": 0.2504, + "step": 13890 + }, + { + "epoch": 3.91, + "learning_rate": 7.824571267922407e-05, + "loss": 0.256, + "step": 13920 + }, + { + "epoch": 3.92, + "learning_rate": 7.84143941523756e-05, + "loss": 0.256, + "step": 13950 + }, + { + "epoch": 3.93, + "learning_rate": 7.858307562552714e-05, + "loss": 0.2575, + "step": 13980 + }, + { + "epoch": 3.94, + "learning_rate": 7.875175709867866e-05, + "loss": 0.2254, + "step": 14010 + }, + { + "epoch": 3.95, + "learning_rate": 7.89204385718302e-05, + "loss": 0.2451, + "step": 14040 + }, + { + "epoch": 3.96, + "learning_rate": 7.908912004498173e-05, + "loss": 0.258, + "step": 14070 + }, + { + "epoch": 3.96, + "learning_rate": 7.925780151813325e-05, + "loss": 0.2254, + "step": 14100 + }, + { + "epoch": 3.97, + "learning_rate": 7.942648299128479e-05, + "loss": 0.2545, + "step": 14130 + }, + { + "epoch": 3.98, + "learning_rate": 7.959516446443632e-05, + "loss": 0.2294, + "step": 14160 + }, + { + "epoch": 3.99, + "learning_rate": 7.976384593758786e-05, + "loss": 0.2423, + "step": 14190 + }, + { + "epoch": 4.0, + "learning_rate": 7.993252741073938e-05, + "loss": 0.2536, + "step": 14220 + }, + { + "epoch": 4.0, + "eval_loss": 0.2671508193016052, + "eval_runtime": 482.3902, + "eval_samples_per_second": 33.237, + "eval_steps_per_second": 1.041, + "eval_wer": 0.27493073847119676, + "step": 14228 + }, + { + "epoch": 4.01, + "learning_rate": 8.010120888389092e-05, + "loss": 0.2218, + "step": 14250 + }, + { + "epoch": 4.01, + "learning_rate": 8.026989035704246e-05, + "loss": 0.2506, + "step": 14280 + }, + { + "epoch": 4.02, + "learning_rate": 8.043857183019399e-05, + "loss": 0.2084, + "step": 14310 + }, + { + "epoch": 4.03, + "learning_rate": 8.060725330334553e-05, + "loss": 0.2442, + "step": 14340 + }, + { + "epoch": 4.04, + "learning_rate": 8.077593477649705e-05, + "loss": 0.2309, + "step": 14370 + }, + { + "epoch": 4.05, + "learning_rate": 8.094461624964859e-05, + "loss": 0.235, + "step": 14400 + }, + { + "epoch": 4.06, + "learning_rate": 8.111329772280012e-05, + "loss": 0.2574, + "step": 14430 + }, + { + "epoch": 4.07, + "learning_rate": 8.128197919595165e-05, + "loss": 0.2079, + "step": 14460 + }, + { + "epoch": 4.07, + "learning_rate": 8.145066066910318e-05, + "loss": 0.2396, + "step": 14490 + }, + { + "epoch": 4.08, + "learning_rate": 8.161934214225472e-05, + "loss": 0.2266, + "step": 14520 + }, + { + "epoch": 4.09, + "learning_rate": 8.178802361540624e-05, + "loss": 0.2359, + "step": 14550 + }, + { + "epoch": 4.1, + "learning_rate": 8.195670508855777e-05, + "loss": 0.2542, + "step": 14580 + }, + { + "epoch": 4.11, + "learning_rate": 8.212538656170931e-05, + "loss": 0.2034, + "step": 14610 + }, + { + "epoch": 4.12, + "learning_rate": 8.229406803486083e-05, + "loss": 0.2437, + "step": 14640 + }, + { + "epoch": 4.12, + "learning_rate": 8.246274950801237e-05, + "loss": 0.2173, + "step": 14670 + }, + { + "epoch": 4.13, + "learning_rate": 8.26314309811639e-05, + "loss": 0.2339, + "step": 14700 + }, + { + "epoch": 4.14, + "learning_rate": 8.280011245431544e-05, + "loss": 0.2409, + "step": 14730 + }, + { + "epoch": 4.15, + "learning_rate": 8.296879392746696e-05, + "loss": 0.2086, + "step": 14760 + }, + { + "epoch": 4.16, + "learning_rate": 8.31374754006185e-05, + "loss": 0.2382, + "step": 14790 + }, + { + "epoch": 4.17, + "learning_rate": 8.330615687377004e-05, + "loss": 0.2231, + "step": 14820 + }, + { + "epoch": 4.17, + "learning_rate": 8.347483834692157e-05, + "loss": 0.2237, + "step": 14850 + }, + { + "epoch": 4.18, + "learning_rate": 8.36435198200731e-05, + "loss": 0.2468, + "step": 14880 + }, + { + "epoch": 4.19, + "learning_rate": 8.381220129322463e-05, + "loss": 0.2035, + "step": 14910 + }, + { + "epoch": 4.2, + "learning_rate": 8.398088276637617e-05, + "loss": 0.2326, + "step": 14940 + }, + { + "epoch": 4.21, + "learning_rate": 8.41495642395277e-05, + "loss": 0.2307, + "step": 14970 + }, + { + "epoch": 4.22, + "learning_rate": 8.431824571267924e-05, + "loss": 0.2215, + "step": 15000 + }, + { + "epoch": 4.23, + "learning_rate": 8.448692718583076e-05, + "loss": 0.2467, + "step": 15030 + }, + { + "epoch": 4.23, + "learning_rate": 8.465560865898229e-05, + "loss": 0.2137, + "step": 15060 + }, + { + "epoch": 4.24, + "learning_rate": 8.482429013213383e-05, + "loss": 0.2265, + "step": 15090 + }, + { + "epoch": 4.25, + "learning_rate": 8.499297160528535e-05, + "loss": 0.2221, + "step": 15120 + }, + { + "epoch": 4.26, + "learning_rate": 8.516165307843689e-05, + "loss": 0.2279, + "step": 15150 + }, + { + "epoch": 4.27, + "learning_rate": 8.533033455158842e-05, + "loss": 0.2438, + "step": 15180 + }, + { + "epoch": 4.28, + "learning_rate": 8.549901602473995e-05, + "loss": 0.2015, + "step": 15210 + }, + { + "epoch": 4.28, + "learning_rate": 8.566769749789148e-05, + "loss": 0.2331, + "step": 15240 + }, + { + "epoch": 4.29, + "learning_rate": 8.583637897104302e-05, + "loss": 0.2249, + "step": 15270 + }, + { + "epoch": 4.3, + "learning_rate": 8.600506044419455e-05, + "loss": 0.2211, + "step": 15300 + }, + { + "epoch": 4.31, + "learning_rate": 8.617374191734608e-05, + "loss": 0.2383, + "step": 15330 + }, + { + "epoch": 4.32, + "learning_rate": 8.634242339049762e-05, + "loss": 0.2055, + "step": 15360 + }, + { + "epoch": 4.33, + "learning_rate": 8.651110486364915e-05, + "loss": 0.2317, + "step": 15390 + }, + { + "epoch": 4.34, + "learning_rate": 8.667978633680069e-05, + "loss": 0.2153, + "step": 15420 + }, + { + "epoch": 4.34, + "learning_rate": 8.684846780995221e-05, + "loss": 0.2264, + "step": 15450 + }, + { + "epoch": 4.35, + "learning_rate": 8.701714928310374e-05, + "loss": 0.2393, + "step": 15480 + }, + { + "epoch": 4.36, + "learning_rate": 8.718583075625528e-05, + "loss": 0.2047, + "step": 15510 + }, + { + "epoch": 4.37, + "learning_rate": 8.73545122294068e-05, + "loss": 0.2277, + "step": 15540 + }, + { + "epoch": 4.38, + "learning_rate": 8.752319370255834e-05, + "loss": 0.2107, + "step": 15570 + }, + { + "epoch": 4.39, + "learning_rate": 8.769187517570987e-05, + "loss": 0.2283, + "step": 15600 + }, + { + "epoch": 4.39, + "learning_rate": 8.786055664886141e-05, + "loss": 0.2457, + "step": 15630 + }, + { + "epoch": 4.4, + "learning_rate": 8.802923812201293e-05, + "loss": 0.1963, + "step": 15660 + }, + { + "epoch": 4.41, + "learning_rate": 8.819791959516447e-05, + "loss": 0.2371, + "step": 15690 + }, + { + "epoch": 4.42, + "learning_rate": 8.8366601068316e-05, + "loss": 0.2193, + "step": 15720 + }, + { + "epoch": 4.43, + "learning_rate": 8.853528254146754e-05, + "loss": 0.2212, + "step": 15750 + }, + { + "epoch": 4.44, + "learning_rate": 8.870396401461906e-05, + "loss": 0.2679, + "step": 15780 + }, + { + "epoch": 4.44, + "learning_rate": 8.88726454877706e-05, + "loss": 0.2074, + "step": 15810 + }, + { + "epoch": 4.45, + "learning_rate": 8.903570424515041e-05, + "loss": 0.2531, + "step": 15840 + }, + { + "epoch": 4.46, + "learning_rate": 8.920438571830194e-05, + "loss": 0.2107, + "step": 15870 + }, + { + "epoch": 4.47, + "learning_rate": 8.937306719145348e-05, + "loss": 0.2273, + "step": 15900 + }, + { + "epoch": 4.48, + "learning_rate": 8.9541748664605e-05, + "loss": 0.237, + "step": 15930 + }, + { + "epoch": 4.49, + "learning_rate": 8.971043013775654e-05, + "loss": 0.2008, + "step": 15960 + }, + { + "epoch": 4.5, + "learning_rate": 8.987911161090807e-05, + "loss": 0.2249, + "step": 15990 + }, + { + "epoch": 4.5, + "learning_rate": 9.004779308405961e-05, + "loss": 0.2184, + "step": 16020 + }, + { + "epoch": 4.51, + "learning_rate": 9.021647455721115e-05, + "loss": 0.2237, + "step": 16050 + }, + { + "epoch": 4.52, + "learning_rate": 9.038515603036267e-05, + "loss": 0.2461, + "step": 16080 + }, + { + "epoch": 4.53, + "learning_rate": 9.055383750351421e-05, + "loss": 0.2031, + "step": 16110 + }, + { + "epoch": 4.54, + "learning_rate": 9.072251897666574e-05, + "loss": 0.2328, + "step": 16140 + }, + { + "epoch": 4.55, + "learning_rate": 9.089120044981728e-05, + "loss": 0.2092, + "step": 16170 + }, + { + "epoch": 4.55, + "learning_rate": 9.10598819229688e-05, + "loss": 0.2176, + "step": 16200 + }, + { + "epoch": 4.56, + "learning_rate": 9.122856339612033e-05, + "loss": 0.2333, + "step": 16230 + }, + { + "epoch": 4.57, + "learning_rate": 9.139724486927187e-05, + "loss": 0.1933, + "step": 16260 + }, + { + "epoch": 4.58, + "learning_rate": 9.156592634242339e-05, + "loss": 0.2253, + "step": 16290 + }, + { + "epoch": 4.59, + "learning_rate": 9.173460781557493e-05, + "loss": 0.2157, + "step": 16320 + }, + { + "epoch": 4.6, + "learning_rate": 9.190328928872646e-05, + "loss": 0.2216, + "step": 16350 + }, + { + "epoch": 4.6, + "learning_rate": 9.2071970761878e-05, + "loss": 0.2463, + "step": 16380 + }, + { + "epoch": 4.61, + "learning_rate": 9.224065223502952e-05, + "loss": 0.1942, + "step": 16410 + }, + { + "epoch": 4.62, + "learning_rate": 9.240933370818106e-05, + "loss": 0.2332, + "step": 16440 + }, + { + "epoch": 4.63, + "learning_rate": 9.257801518133258e-05, + "loss": 0.2105, + "step": 16470 + }, + { + "epoch": 4.64, + "learning_rate": 9.274669665448412e-05, + "loss": 0.2198, + "step": 16500 + }, + { + "epoch": 4.65, + "learning_rate": 9.291537812763565e-05, + "loss": 0.2386, + "step": 16530 + }, + { + "epoch": 4.66, + "learning_rate": 9.308405960078719e-05, + "loss": 0.2008, + "step": 16560 + }, + { + "epoch": 4.66, + "learning_rate": 9.325274107393873e-05, + "loss": 0.2357, + "step": 16590 + }, + { + "epoch": 4.67, + "learning_rate": 9.342142254709025e-05, + "loss": 0.2182, + "step": 16620 + }, + { + "epoch": 4.68, + "learning_rate": 9.359010402024179e-05, + "loss": 0.2139, + "step": 16650 + }, + { + "epoch": 4.69, + "learning_rate": 9.375316277762159e-05, + "loss": 0.2395, + "step": 16680 + }, + { + "epoch": 4.7, + "learning_rate": 9.392184425077313e-05, + "loss": 0.1978, + "step": 16710 + }, + { + "epoch": 4.71, + "learning_rate": 9.408490300815294e-05, + "loss": 0.238, + "step": 16740 + }, + { + "epoch": 4.71, + "learning_rate": 9.425358448130448e-05, + "loss": 0.2058, + "step": 16770 + }, + { + "epoch": 4.72, + "learning_rate": 9.4422265954456e-05, + "loss": 0.2152, + "step": 16800 + }, + { + "epoch": 4.73, + "learning_rate": 9.459094742760753e-05, + "loss": 0.2404, + "step": 16830 + }, + { + "epoch": 4.74, + "learning_rate": 9.475962890075907e-05, + "loss": 0.1975, + "step": 16860 + }, + { + "epoch": 4.75, + "learning_rate": 9.49283103739106e-05, + "loss": 0.2275, + "step": 16890 + }, + { + "epoch": 4.76, + "learning_rate": 9.509699184706214e-05, + "loss": 0.2064, + "step": 16920 + }, + { + "epoch": 4.77, + "learning_rate": 9.526567332021366e-05, + "loss": 0.2191, + "step": 16950 + }, + { + "epoch": 4.77, + "learning_rate": 9.54343547933652e-05, + "loss": 0.2312, + "step": 16980 + }, + { + "epoch": 4.78, + "learning_rate": 9.560303626651673e-05, + "loss": 0.1969, + "step": 17010 + }, + { + "epoch": 4.79, + "learning_rate": 9.577171773966826e-05, + "loss": 0.2319, + "step": 17040 + }, + { + "epoch": 4.8, + "learning_rate": 9.59403992128198e-05, + "loss": 0.2196, + "step": 17070 + }, + { + "epoch": 4.81, + "learning_rate": 9.610908068597133e-05, + "loss": 0.2149, + "step": 17100 + }, + { + "epoch": 4.82, + "learning_rate": 9.627776215912287e-05, + "loss": 0.238, + "step": 17130 + }, + { + "epoch": 4.82, + "learning_rate": 9.64464436322744e-05, + "loss": 0.1979, + "step": 17160 + }, + { + "epoch": 4.83, + "learning_rate": 9.661512510542593e-05, + "loss": 0.2254, + "step": 17190 + }, + { + "epoch": 4.84, + "learning_rate": 9.678380657857746e-05, + "loss": 0.2059, + "step": 17220 + }, + { + "epoch": 4.85, + "learning_rate": 9.695248805172898e-05, + "loss": 0.2144, + "step": 17250 + }, + { + "epoch": 4.86, + "learning_rate": 9.712116952488052e-05, + "loss": 0.2367, + "step": 17280 + }, + { + "epoch": 4.87, + "learning_rate": 9.728985099803205e-05, + "loss": 0.1976, + "step": 17310 + }, + { + "epoch": 4.87, + "learning_rate": 9.745853247118359e-05, + "loss": 0.2329, + "step": 17340 + }, + { + "epoch": 4.88, + "learning_rate": 9.762721394433511e-05, + "loss": 0.2366, + "step": 17370 + }, + { + "epoch": 4.89, + "learning_rate": 9.779589541748665e-05, + "loss": 0.2181, + "step": 17400 + }, + { + "epoch": 4.9, + "learning_rate": 9.796457689063818e-05, + "loss": 0.2285, + "step": 17430 + }, + { + "epoch": 4.91, + "learning_rate": 9.813325836378972e-05, + "loss": 0.188, + "step": 17460 + }, + { + "epoch": 4.92, + "learning_rate": 9.830193983694124e-05, + "loss": 0.2252, + "step": 17490 + }, + { + "epoch": 4.93, + "learning_rate": 9.847062131009278e-05, + "loss": 0.2112, + "step": 17520 + }, + { + "epoch": 4.93, + "learning_rate": 9.863930278324432e-05, + "loss": 0.216, + "step": 17550 + }, + { + "epoch": 4.94, + "learning_rate": 9.880798425639585e-05, + "loss": 0.2321, + "step": 17580 + }, + { + "epoch": 4.95, + "learning_rate": 9.897666572954739e-05, + "loss": 0.1984, + "step": 17610 + }, + { + "epoch": 4.96, + "learning_rate": 9.914534720269891e-05, + "loss": 0.2293, + "step": 17640 + }, + { + "epoch": 4.97, + "learning_rate": 9.931402867585045e-05, + "loss": 0.2077, + "step": 17670 + }, + { + "epoch": 4.98, + "learning_rate": 9.948271014900196e-05, + "loss": 0.2105, + "step": 17700 + }, + { + "epoch": 4.98, + "learning_rate": 9.96513916221535e-05, + "loss": 0.2451, + "step": 17730 + }, + { + "epoch": 4.99, + "learning_rate": 9.982007309530504e-05, + "loss": 0.1943, + "step": 17760 + }, + { + "epoch": 5.0, + "eval_loss": 0.24867025017738342, + "eval_runtime": 481.4061, + "eval_samples_per_second": 33.305, + "eval_steps_per_second": 1.043, + "eval_wer": 0.24798356829937357, + "step": 17785 + }, + { + "epoch": 5.0, + "learning_rate": 9.998875456845657e-05, + "loss": 0.2282, + "step": 17790 + }, + { + "epoch": 5.01, + "learning_rate": 9.9982507106488e-05, + "loss": 0.1934, + "step": 17820 + }, + { + "epoch": 5.02, + "learning_rate": 9.996376472058226e-05, + "loss": 0.2085, + "step": 17850 + }, + { + "epoch": 5.03, + "learning_rate": 9.994502233467654e-05, + "loss": 0.1973, + "step": 17880 + }, + { + "epoch": 5.04, + "learning_rate": 9.992627994877082e-05, + "loss": 0.1986, + "step": 17910 + }, + { + "epoch": 5.04, + "learning_rate": 9.990753756286509e-05, + "loss": 0.2231, + "step": 17940 + }, + { + "epoch": 5.05, + "learning_rate": 9.988879517695936e-05, + "loss": 0.187, + "step": 17970 + }, + { + "epoch": 5.06, + "learning_rate": 9.987005279105364e-05, + "loss": 0.2081, + "step": 18000 + }, + { + "epoch": 5.07, + "learning_rate": 9.985131040514792e-05, + "loss": 0.2039, + "step": 18030 + }, + { + "epoch": 5.08, + "learning_rate": 9.983256801924219e-05, + "loss": 0.1983, + "step": 18060 + }, + { + "epoch": 5.09, + "learning_rate": 9.981382563333647e-05, + "loss": 0.2192, + "step": 18090 + }, + { + "epoch": 5.09, + "learning_rate": 9.979508324743073e-05, + "loss": 0.1883, + "step": 18120 + }, + { + "epoch": 5.1, + "learning_rate": 9.977634086152502e-05, + "loss": 0.2088, + "step": 18150 + }, + { + "epoch": 5.11, + "learning_rate": 9.975759847561928e-05, + "loss": 0.2058, + "step": 18180 + }, + { + "epoch": 5.12, + "learning_rate": 9.973885608971356e-05, + "loss": 0.1956, + "step": 18210 + }, + { + "epoch": 5.13, + "learning_rate": 9.972011370380784e-05, + "loss": 0.23, + "step": 18240 + }, + { + "epoch": 5.14, + "learning_rate": 9.97013713179021e-05, + "loss": 0.1872, + "step": 18270 + }, + { + "epoch": 5.14, + "learning_rate": 9.968262893199638e-05, + "loss": 0.2122, + "step": 18300 + }, + { + "epoch": 5.15, + "learning_rate": 9.966388654609066e-05, + "loss": 0.2017, + "step": 18330 + }, + { + "epoch": 5.16, + "learning_rate": 9.964514416018493e-05, + "loss": 0.1956, + "step": 18360 + }, + { + "epoch": 5.17, + "learning_rate": 9.96264017742792e-05, + "loss": 0.2146, + "step": 18390 + }, + { + "epoch": 5.18, + "learning_rate": 9.960765938837348e-05, + "loss": 0.1876, + "step": 18420 + }, + { + "epoch": 5.19, + "learning_rate": 9.958891700246776e-05, + "loss": 0.2131, + "step": 18450 + }, + { + "epoch": 5.2, + "learning_rate": 9.957017461656202e-05, + "loss": 0.1991, + "step": 18480 + }, + { + "epoch": 5.2, + "learning_rate": 9.95514322306563e-05, + "loss": 0.2035, + "step": 18510 + }, + { + "epoch": 5.21, + "learning_rate": 9.953268984475057e-05, + "loss": 0.2284, + "step": 18540 + }, + { + "epoch": 5.22, + "learning_rate": 9.951394745884485e-05, + "loss": 0.1843, + "step": 18570 + }, + { + "epoch": 5.23, + "learning_rate": 9.949520507293912e-05, + "loss": 0.206, + "step": 18600 + }, + { + "epoch": 5.24, + "learning_rate": 9.94764626870334e-05, + "loss": 0.1995, + "step": 18630 + }, + { + "epoch": 5.25, + "learning_rate": 9.945772030112768e-05, + "loss": 0.1975, + "step": 18660 + }, + { + "epoch": 5.25, + "learning_rate": 9.943897791522194e-05, + "loss": 0.2307, + "step": 18690 + }, + { + "epoch": 5.26, + "learning_rate": 9.942023552931622e-05, + "loss": 0.184, + "step": 18720 + }, + { + "epoch": 5.27, + "learning_rate": 9.94014931434105e-05, + "loss": 0.1995, + "step": 18750 + }, + { + "epoch": 5.28, + "learning_rate": 9.938275075750477e-05, + "loss": 0.1945, + "step": 18780 + }, + { + "epoch": 5.29, + "learning_rate": 9.936400837159903e-05, + "loss": 0.1972, + "step": 18810 + }, + { + "epoch": 5.3, + "learning_rate": 9.934526598569331e-05, + "loss": 0.2212, + "step": 18840 + }, + { + "epoch": 5.3, + "learning_rate": 9.93265235997876e-05, + "loss": 0.1812, + "step": 18870 + }, + { + "epoch": 5.31, + "learning_rate": 9.930778121388186e-05, + "loss": 0.2027, + "step": 18900 + }, + { + "epoch": 5.32, + "learning_rate": 9.928903882797614e-05, + "loss": 0.2014, + "step": 18930 + }, + { + "epoch": 5.33, + "learning_rate": 9.927029644207041e-05, + "loss": 0.2044, + "step": 18960 + }, + { + "epoch": 5.34, + "learning_rate": 9.925155405616469e-05, + "loss": 0.2154, + "step": 18990 + }, + { + "epoch": 5.35, + "learning_rate": 9.923281167025896e-05, + "loss": 0.1867, + "step": 19020 + }, + { + "epoch": 5.36, + "learning_rate": 9.921406928435324e-05, + "loss": 0.2095, + "step": 19050 + }, + { + "epoch": 5.36, + "learning_rate": 9.919532689844752e-05, + "loss": 0.2086, + "step": 19080 + }, + { + "epoch": 5.37, + "learning_rate": 9.917658451254178e-05, + "loss": 0.1861, + "step": 19110 + }, + { + "epoch": 5.38, + "learning_rate": 9.915784212663606e-05, + "loss": 0.2321, + "step": 19140 + }, + { + "epoch": 5.39, + "learning_rate": 9.913909974073034e-05, + "loss": 0.1855, + "step": 19170 + }, + { + "epoch": 5.4, + "learning_rate": 9.91203573548246e-05, + "loss": 0.208, + "step": 19200 + }, + { + "epoch": 5.41, + "learning_rate": 9.910161496891887e-05, + "loss": 0.1986, + "step": 19230 + }, + { + "epoch": 5.41, + "learning_rate": 9.908287258301315e-05, + "loss": 0.1984, + "step": 19260 + }, + { + "epoch": 5.42, + "learning_rate": 9.906413019710743e-05, + "loss": 0.2198, + "step": 19290 + }, + { + "epoch": 5.43, + "learning_rate": 9.90453878112017e-05, + "loss": 0.1778, + "step": 19320 + }, + { + "epoch": 5.44, + "learning_rate": 9.902664542529598e-05, + "loss": 0.2127, + "step": 19350 + }, + { + "epoch": 5.45, + "learning_rate": 9.900790303939025e-05, + "loss": 0.1995, + "step": 19380 + }, + { + "epoch": 5.46, + "learning_rate": 9.898916065348453e-05, + "loss": 0.194, + "step": 19410 + }, + { + "epoch": 5.47, + "learning_rate": 9.89704182675788e-05, + "loss": 0.2109, + "step": 19440 + }, + { + "epoch": 5.47, + "learning_rate": 9.895167588167308e-05, + "loss": 0.1722, + "step": 19470 + }, + { + "epoch": 5.48, + "learning_rate": 9.893293349576735e-05, + "loss": 0.2064, + "step": 19500 + }, + { + "epoch": 5.49, + "learning_rate": 9.891419110986161e-05, + "loss": 0.1981, + "step": 19530 + }, + { + "epoch": 5.5, + "learning_rate": 9.88954487239559e-05, + "loss": 0.19, + "step": 19560 + }, + { + "epoch": 5.51, + "learning_rate": 9.887670633805018e-05, + "loss": 0.219, + "step": 19590 + }, + { + "epoch": 5.52, + "learning_rate": 9.885796395214444e-05, + "loss": 0.176, + "step": 19620 + }, + { + "epoch": 5.52, + "learning_rate": 9.883922156623871e-05, + "loss": 0.2065, + "step": 19650 + }, + { + "epoch": 5.53, + "learning_rate": 9.882047918033299e-05, + "loss": 0.195, + "step": 19680 + }, + { + "epoch": 5.54, + "learning_rate": 9.880173679442727e-05, + "loss": 0.1915, + "step": 19710 + }, + { + "epoch": 5.55, + "learning_rate": 9.878299440852154e-05, + "loss": 0.2066, + "step": 19740 + }, + { + "epoch": 5.56, + "learning_rate": 9.876425202261582e-05, + "loss": 0.1802, + "step": 19770 + }, + { + "epoch": 5.57, + "learning_rate": 9.874550963671009e-05, + "loss": 0.2033, + "step": 19800 + }, + { + "epoch": 5.57, + "learning_rate": 9.872676725080437e-05, + "loss": 0.1952, + "step": 19830 + }, + { + "epoch": 5.58, + "learning_rate": 9.870802486489864e-05, + "loss": 0.195, + "step": 19860 + }, + { + "epoch": 5.59, + "learning_rate": 9.868928247899292e-05, + "loss": 0.2103, + "step": 19890 + }, + { + "epoch": 5.6, + "learning_rate": 9.867054009308719e-05, + "loss": 0.1803, + "step": 19920 + }, + { + "epoch": 5.61, + "learning_rate": 9.865179770718145e-05, + "loss": 0.2008, + "step": 19950 + }, + { + "epoch": 5.62, + "learning_rate": 9.863305532127573e-05, + "loss": 0.2135, + "step": 19980 + }, + { + "epoch": 5.63, + "learning_rate": 9.861431293537001e-05, + "loss": 0.1886, + "step": 20010 + }, + { + "epoch": 5.63, + "learning_rate": 9.859557054946428e-05, + "loss": 0.2032, + "step": 20040 + }, + { + "epoch": 5.64, + "learning_rate": 9.857682816355855e-05, + "loss": 0.182, + "step": 20070 + }, + { + "epoch": 5.65, + "learning_rate": 9.855808577765283e-05, + "loss": 0.2084, + "step": 20100 + }, + { + "epoch": 5.66, + "learning_rate": 9.853934339174711e-05, + "loss": 0.2042, + "step": 20130 + }, + { + "epoch": 5.67, + "learning_rate": 9.852060100584138e-05, + "loss": 0.1928, + "step": 20160 + }, + { + "epoch": 5.68, + "learning_rate": 9.850185861993566e-05, + "loss": 0.2089, + "step": 20190 + }, + { + "epoch": 5.68, + "learning_rate": 9.848311623402993e-05, + "loss": 0.1816, + "step": 20220 + }, + { + "epoch": 5.69, + "learning_rate": 9.846437384812421e-05, + "loss": 0.2145, + "step": 20250 + }, + { + "epoch": 5.7, + "learning_rate": 9.844563146221848e-05, + "loss": 0.1957, + "step": 20280 + }, + { + "epoch": 5.71, + "learning_rate": 9.842688907631276e-05, + "loss": 0.1906, + "step": 20310 + }, + { + "epoch": 5.72, + "learning_rate": 9.840814669040702e-05, + "loss": 0.2095, + "step": 20340 + }, + { + "epoch": 5.73, + "learning_rate": 9.838940430450129e-05, + "loss": 0.1812, + "step": 20370 + }, + { + "epoch": 5.74, + "learning_rate": 9.837066191859557e-05, + "loss": 0.2028, + "step": 20400 + }, + { + "epoch": 5.74, + "learning_rate": 9.835191953268985e-05, + "loss": 0.1893, + "step": 20430 + }, + { + "epoch": 5.75, + "learning_rate": 9.833317714678413e-05, + "loss": 0.1979, + "step": 20460 + }, + { + "epoch": 5.76, + "learning_rate": 9.831443476087839e-05, + "loss": 0.2088, + "step": 20490 + }, + { + "epoch": 5.77, + "learning_rate": 9.829569237497267e-05, + "loss": 0.1761, + "step": 20520 + }, + { + "epoch": 5.78, + "learning_rate": 9.827694998906695e-05, + "loss": 0.1947, + "step": 20550 + }, + { + "epoch": 5.79, + "learning_rate": 9.825820760316122e-05, + "loss": 0.2022, + "step": 20580 + }, + { + "epoch": 5.79, + "learning_rate": 9.82394652172555e-05, + "loss": 0.1878, + "step": 20610 + }, + { + "epoch": 5.8, + "learning_rate": 9.822072283134977e-05, + "loss": 0.209, + "step": 20640 + }, + { + "epoch": 5.81, + "learning_rate": 9.820198044544405e-05, + "loss": 0.1745, + "step": 20670 + }, + { + "epoch": 5.82, + "learning_rate": 9.818323805953831e-05, + "loss": 0.2038, + "step": 20700 + }, + { + "epoch": 5.83, + "learning_rate": 9.81644956736326e-05, + "loss": 0.1929, + "step": 20730 + }, + { + "epoch": 5.84, + "learning_rate": 9.814575328772686e-05, + "loss": 0.1853, + "step": 20760 + }, + { + "epoch": 5.84, + "learning_rate": 9.812701090182113e-05, + "loss": 0.209, + "step": 20790 + }, + { + "epoch": 5.85, + "learning_rate": 9.810826851591541e-05, + "loss": 0.1737, + "step": 20820 + }, + { + "epoch": 5.86, + "learning_rate": 9.808952613000969e-05, + "loss": 0.1993, + "step": 20850 + }, + { + "epoch": 5.87, + "learning_rate": 9.807078374410397e-05, + "loss": 0.1926, + "step": 20880 + }, + { + "epoch": 5.88, + "learning_rate": 9.805204135819823e-05, + "loss": 0.184, + "step": 20910 + }, + { + "epoch": 5.89, + "learning_rate": 9.803329897229251e-05, + "loss": 0.2172, + "step": 20940 + }, + { + "epoch": 5.9, + "learning_rate": 9.801455658638679e-05, + "loss": 0.1867, + "step": 20970 + }, + { + "epoch": 5.9, + "learning_rate": 9.799581420048106e-05, + "loss": 0.1985, + "step": 21000 + }, + { + "epoch": 5.91, + "learning_rate": 9.797707181457534e-05, + "loss": 0.1884, + "step": 21030 + }, + { + "epoch": 5.92, + "learning_rate": 9.79583294286696e-05, + "loss": 0.1902, + "step": 21060 + }, + { + "epoch": 5.93, + "learning_rate": 9.793958704276389e-05, + "loss": 0.2094, + "step": 21090 + }, + { + "epoch": 5.94, + "learning_rate": 9.792084465685815e-05, + "loss": 0.1748, + "step": 21120 + }, + { + "epoch": 5.95, + "learning_rate": 9.790210227095243e-05, + "loss": 0.2104, + "step": 21150 + }, + { + "epoch": 5.95, + "learning_rate": 9.78833598850467e-05, + "loss": 0.1953, + "step": 21180 + }, + { + "epoch": 5.96, + "learning_rate": 9.786461749914098e-05, + "loss": 0.1853, + "step": 21210 + }, + { + "epoch": 5.97, + "learning_rate": 9.784587511323525e-05, + "loss": 0.1937, + "step": 21240 + }, + { + "epoch": 5.98, + "learning_rate": 9.782713272732953e-05, + "loss": 0.1741, + "step": 21270 + }, + { + "epoch": 5.99, + "learning_rate": 9.780839034142381e-05, + "loss": 0.2014, + "step": 21300 + }, + { + "epoch": 6.0, + "learning_rate": 9.778964795551807e-05, + "loss": 0.2004, + "step": 21330 + }, + { + "epoch": 6.0, + "eval_loss": 0.22455841302871704, + "eval_runtime": 479.6485, + "eval_samples_per_second": 33.427, + "eval_steps_per_second": 1.047, + "eval_wer": 0.2267956819019284, + "step": 21342 + }, + { + "epoch": 6.01, + "learning_rate": 9.777090556961235e-05, + "loss": 0.189, + "step": 21360 + }, + { + "epoch": 6.01, + "learning_rate": 9.775216318370663e-05, + "loss": 0.1862, + "step": 21390 + }, + { + "epoch": 6.02, + "learning_rate": 9.77334207978009e-05, + "loss": 0.178, + "step": 21420 + }, + { + "epoch": 6.03, + "learning_rate": 9.771467841189518e-05, + "loss": 0.1925, + "step": 21450 + }, + { + "epoch": 6.04, + "learning_rate": 9.769593602598944e-05, + "loss": 0.171, + "step": 21480 + }, + { + "epoch": 6.05, + "learning_rate": 9.767719364008372e-05, + "loss": 0.1871, + "step": 21510 + }, + { + "epoch": 6.06, + "learning_rate": 9.765845125417799e-05, + "loss": 0.186, + "step": 21540 + }, + { + "epoch": 6.06, + "learning_rate": 9.763970886827227e-05, + "loss": 0.1691, + "step": 21570 + }, + { + "epoch": 6.07, + "learning_rate": 9.762096648236654e-05, + "loss": 0.1968, + "step": 21600 + }, + { + "epoch": 6.08, + "learning_rate": 9.760222409646082e-05, + "loss": 0.1729, + "step": 21630 + }, + { + "epoch": 6.09, + "learning_rate": 9.758348171055509e-05, + "loss": 0.1882, + "step": 21660 + }, + { + "epoch": 6.1, + "learning_rate": 9.756473932464937e-05, + "loss": 0.1836, + "step": 21690 + }, + { + "epoch": 6.11, + "learning_rate": 9.754599693874365e-05, + "loss": 0.1704, + "step": 21720 + }, + { + "epoch": 6.11, + "learning_rate": 9.75272545528379e-05, + "loss": 0.1932, + "step": 21750 + }, + { + "epoch": 6.12, + "learning_rate": 9.750851216693219e-05, + "loss": 0.1824, + "step": 21780 + }, + { + "epoch": 6.13, + "learning_rate": 9.748976978102647e-05, + "loss": 0.1855, + "step": 21810 + }, + { + "epoch": 6.14, + "learning_rate": 9.747102739512073e-05, + "loss": 0.1903, + "step": 21840 + }, + { + "epoch": 6.15, + "learning_rate": 9.745290975541187e-05, + "loss": 0.1735, + "step": 21870 + }, + { + "epoch": 6.16, + "learning_rate": 9.743416736950614e-05, + "loss": 0.1922, + "step": 21900 + }, + { + "epoch": 6.17, + "learning_rate": 9.741542498360041e-05, + "loss": 0.168, + "step": 21930 + }, + { + "epoch": 6.17, + "learning_rate": 9.739668259769469e-05, + "loss": 0.1856, + "step": 21960 + }, + { + "epoch": 6.18, + "learning_rate": 9.737794021178897e-05, + "loss": 0.1876, + "step": 21990 + }, + { + "epoch": 6.19, + "learning_rate": 9.735919782588324e-05, + "loss": 0.1738, + "step": 22020 + }, + { + "epoch": 6.2, + "learning_rate": 9.734045543997752e-05, + "loss": 0.196, + "step": 22050 + }, + { + "epoch": 6.21, + "learning_rate": 9.732171305407179e-05, + "loss": 0.1711, + "step": 22080 + }, + { + "epoch": 6.22, + "learning_rate": 9.730297066816605e-05, + "loss": 0.1895, + "step": 22110 + }, + { + "epoch": 6.22, + "learning_rate": 9.728422828226034e-05, + "loss": 0.1879, + "step": 22140 + }, + { + "epoch": 6.23, + "learning_rate": 9.726548589635462e-05, + "loss": 0.1935, + "step": 22170 + }, + { + "epoch": 6.24, + "learning_rate": 9.724674351044888e-05, + "loss": 0.1967, + "step": 22200 + }, + { + "epoch": 6.25, + "learning_rate": 9.722800112454315e-05, + "loss": 0.1687, + "step": 22230 + }, + { + "epoch": 6.26, + "learning_rate": 9.720925873863743e-05, + "loss": 0.1852, + "step": 22260 + }, + { + "epoch": 6.27, + "learning_rate": 9.719051635273171e-05, + "loss": 0.1916, + "step": 22290 + }, + { + "epoch": 6.27, + "learning_rate": 9.717177396682598e-05, + "loss": 0.1701, + "step": 22320 + }, + { + "epoch": 6.28, + "learning_rate": 9.715303158092025e-05, + "loss": 0.2169, + "step": 22350 + }, + { + "epoch": 6.29, + "learning_rate": 9.713428919501453e-05, + "loss": 0.1695, + "step": 22380 + }, + { + "epoch": 6.3, + "learning_rate": 9.711554680910881e-05, + "loss": 0.1891, + "step": 22410 + }, + { + "epoch": 6.31, + "learning_rate": 9.709680442320308e-05, + "loss": 0.1845, + "step": 22440 + }, + { + "epoch": 6.32, + "learning_rate": 9.707806203729736e-05, + "loss": 0.1811, + "step": 22470 + }, + { + "epoch": 6.33, + "learning_rate": 9.705931965139163e-05, + "loss": 0.1991, + "step": 22500 + }, + { + "epoch": 6.33, + "learning_rate": 9.70405772654859e-05, + "loss": 0.1663, + "step": 22530 + }, + { + "epoch": 6.34, + "learning_rate": 9.702183487958017e-05, + "loss": 0.1848, + "step": 22560 + }, + { + "epoch": 6.35, + "learning_rate": 9.700309249367446e-05, + "loss": 0.188, + "step": 22590 + }, + { + "epoch": 6.36, + "learning_rate": 9.698435010776872e-05, + "loss": 0.1712, + "step": 22620 + }, + { + "epoch": 6.37, + "learning_rate": 9.696560772186299e-05, + "loss": 0.1949, + "step": 22650 + }, + { + "epoch": 6.38, + "learning_rate": 9.694686533595727e-05, + "loss": 0.1711, + "step": 22680 + }, + { + "epoch": 6.38, + "learning_rate": 9.692812295005155e-05, + "loss": 0.1781, + "step": 22710 + }, + { + "epoch": 6.39, + "learning_rate": 9.690938056414582e-05, + "loss": 0.1853, + "step": 22740 + }, + { + "epoch": 6.4, + "learning_rate": 9.689063817824009e-05, + "loss": 0.1683, + "step": 22770 + }, + { + "epoch": 6.41, + "learning_rate": 9.687189579233437e-05, + "loss": 0.2022, + "step": 22800 + }, + { + "epoch": 6.42, + "learning_rate": 9.685315340642865e-05, + "loss": 0.1749, + "step": 22830 + }, + { + "epoch": 6.43, + "learning_rate": 9.683441102052292e-05, + "loss": 0.1827, + "step": 22860 + }, + { + "epoch": 6.44, + "learning_rate": 9.68156686346172e-05, + "loss": 0.196, + "step": 22890 + }, + { + "epoch": 6.44, + "learning_rate": 9.679692624871146e-05, + "loss": 0.1645, + "step": 22920 + }, + { + "epoch": 6.45, + "learning_rate": 9.677818386280573e-05, + "loss": 0.1914, + "step": 22950 + }, + { + "epoch": 6.46, + "learning_rate": 9.675944147690001e-05, + "loss": 0.1651, + "step": 22980 + }, + { + "epoch": 6.47, + "learning_rate": 9.67406990909943e-05, + "loss": 0.1829, + "step": 23010 + }, + { + "epoch": 6.48, + "learning_rate": 9.672195670508856e-05, + "loss": 0.1873, + "step": 23040 + }, + { + "epoch": 6.49, + "learning_rate": 9.670321431918283e-05, + "loss": 0.1705, + "step": 23070 + }, + { + "epoch": 6.49, + "learning_rate": 9.668447193327711e-05, + "loss": 0.1941, + "step": 23100 + }, + { + "epoch": 6.5, + "learning_rate": 9.666635429356824e-05, + "loss": 0.1662, + "step": 23130 + }, + { + "epoch": 6.51, + "learning_rate": 9.664761190766252e-05, + "loss": 0.1801, + "step": 23160 + }, + { + "epoch": 6.52, + "learning_rate": 9.66288695217568e-05, + "loss": 0.1801, + "step": 23190 + }, + { + "epoch": 6.53, + "learning_rate": 9.661012713585107e-05, + "loss": 0.1699, + "step": 23220 + }, + { + "epoch": 6.54, + "learning_rate": 9.659138474994533e-05, + "loss": 0.1854, + "step": 23250 + }, + { + "epoch": 6.54, + "learning_rate": 9.657264236403961e-05, + "loss": 0.1731, + "step": 23280 + }, + { + "epoch": 6.55, + "learning_rate": 9.655389997813388e-05, + "loss": 0.1813, + "step": 23310 + }, + { + "epoch": 6.56, + "learning_rate": 9.653515759222816e-05, + "loss": 0.1832, + "step": 23340 + }, + { + "epoch": 6.57, + "learning_rate": 9.651641520632244e-05, + "loss": 0.1711, + "step": 23370 + }, + { + "epoch": 6.58, + "learning_rate": 9.649767282041671e-05, + "loss": 0.1868, + "step": 23400 + }, + { + "epoch": 6.59, + "learning_rate": 9.647893043451098e-05, + "loss": 0.1687, + "step": 23430 + }, + { + "epoch": 6.6, + "learning_rate": 9.646018804860526e-05, + "loss": 0.1852, + "step": 23460 + }, + { + "epoch": 6.6, + "learning_rate": 9.644144566269954e-05, + "loss": 0.1929, + "step": 23490 + }, + { + "epoch": 6.61, + "learning_rate": 9.642270327679381e-05, + "loss": 0.1647, + "step": 23520 + }, + { + "epoch": 6.62, + "learning_rate": 9.640396089088808e-05, + "loss": 0.1908, + "step": 23550 + }, + { + "epoch": 6.63, + "learning_rate": 9.638521850498236e-05, + "loss": 0.1694, + "step": 23580 + }, + { + "epoch": 6.64, + "learning_rate": 9.636647611907664e-05, + "loss": 0.1826, + "step": 23610 + }, + { + "epoch": 6.65, + "learning_rate": 9.63477337331709e-05, + "loss": 0.1811, + "step": 23640 + }, + { + "epoch": 6.65, + "learning_rate": 9.632899134726517e-05, + "loss": 0.1694, + "step": 23670 + }, + { + "epoch": 6.66, + "learning_rate": 9.631024896135945e-05, + "loss": 0.1822, + "step": 23700 + }, + { + "epoch": 6.67, + "learning_rate": 9.629150657545372e-05, + "loss": 0.1716, + "step": 23730 + }, + { + "epoch": 6.68, + "learning_rate": 9.6272764189548e-05, + "loss": 0.1766, + "step": 23760 + }, + { + "epoch": 6.69, + "learning_rate": 9.625402180364228e-05, + "loss": 0.1839, + "step": 23790 + }, + { + "epoch": 6.7, + "learning_rate": 9.623527941773655e-05, + "loss": 0.1729, + "step": 23820 + }, + { + "epoch": 6.7, + "learning_rate": 9.621653703183082e-05, + "loss": 0.185, + "step": 23850 + }, + { + "epoch": 6.71, + "learning_rate": 9.61977946459251e-05, + "loss": 0.167, + "step": 23880 + }, + { + "epoch": 6.72, + "learning_rate": 9.617905226001938e-05, + "loss": 0.1695, + "step": 23910 + }, + { + "epoch": 6.73, + "learning_rate": 9.616030987411365e-05, + "loss": 0.1803, + "step": 23940 + }, + { + "epoch": 6.74, + "learning_rate": 9.614156748820791e-05, + "loss": 0.1726, + "step": 23970 + }, + { + "epoch": 6.75, + "learning_rate": 9.61228251023022e-05, + "loss": 0.1836, + "step": 24000 + }, + { + "epoch": 6.76, + "learning_rate": 9.610408271639648e-05, + "loss": 0.1595, + "step": 24030 + }, + { + "epoch": 6.76, + "learning_rate": 9.608534033049074e-05, + "loss": 0.1787, + "step": 24060 + }, + { + "epoch": 6.77, + "learning_rate": 9.606659794458501e-05, + "loss": 0.1775, + "step": 24090 + }, + { + "epoch": 6.78, + "learning_rate": 9.604785555867929e-05, + "loss": 0.1698, + "step": 24120 + }, + { + "epoch": 6.79, + "learning_rate": 9.602911317277356e-05, + "loss": 0.1858, + "step": 24150 + }, + { + "epoch": 6.8, + "learning_rate": 9.601037078686784e-05, + "loss": 0.1682, + "step": 24180 + }, + { + "epoch": 6.81, + "learning_rate": 9.599162840096212e-05, + "loss": 0.181, + "step": 24210 + }, + { + "epoch": 6.81, + "learning_rate": 9.597288601505639e-05, + "loss": 0.1774, + "step": 24240 + }, + { + "epoch": 6.82, + "learning_rate": 9.595414362915066e-05, + "loss": 0.1743, + "step": 24270 + }, + { + "epoch": 6.83, + "learning_rate": 9.593540124324494e-05, + "loss": 0.1867, + "step": 24300 + }, + { + "epoch": 6.84, + "learning_rate": 9.591665885733922e-05, + "loss": 0.1672, + "step": 24330 + }, + { + "epoch": 6.85, + "learning_rate": 9.589791647143349e-05, + "loss": 0.1817, + "step": 24360 + }, + { + "epoch": 6.86, + "learning_rate": 9.587917408552775e-05, + "loss": 0.1774, + "step": 24390 + }, + { + "epoch": 6.87, + "learning_rate": 9.586043169962203e-05, + "loss": 0.1679, + "step": 24420 + }, + { + "epoch": 6.87, + "learning_rate": 9.584168931371632e-05, + "loss": 0.1908, + "step": 24450 + }, + { + "epoch": 6.88, + "learning_rate": 9.582294692781058e-05, + "loss": 0.1584, + "step": 24480 + }, + { + "epoch": 6.89, + "learning_rate": 9.580420454190485e-05, + "loss": 0.1763, + "step": 24510 + }, + { + "epoch": 6.9, + "learning_rate": 9.578546215599913e-05, + "loss": 0.184, + "step": 24540 + }, + { + "epoch": 6.91, + "learning_rate": 9.57667197700934e-05, + "loss": 0.1639, + "step": 24570 + }, + { + "epoch": 6.92, + "learning_rate": 9.574797738418768e-05, + "loss": 0.1887, + "step": 24600 + }, + { + "epoch": 6.92, + "learning_rate": 9.572923499828196e-05, + "loss": 0.1645, + "step": 24630 + }, + { + "epoch": 6.93, + "learning_rate": 9.571049261237623e-05, + "loss": 0.1768, + "step": 24660 + }, + { + "epoch": 6.94, + "learning_rate": 9.56917502264705e-05, + "loss": 0.1916, + "step": 24690 + }, + { + "epoch": 6.95, + "learning_rate": 9.567300784056478e-05, + "loss": 0.1623, + "step": 24720 + }, + { + "epoch": 6.96, + "learning_rate": 9.565426545465906e-05, + "loss": 0.2004, + "step": 24750 + }, + { + "epoch": 6.97, + "learning_rate": 9.563552306875332e-05, + "loss": 0.1615, + "step": 24780 + }, + { + "epoch": 6.97, + "learning_rate": 9.561678068284759e-05, + "loss": 0.1826, + "step": 24810 + }, + { + "epoch": 6.98, + "learning_rate": 9.559803829694187e-05, + "loss": 0.1842, + "step": 24840 + }, + { + "epoch": 6.99, + "learning_rate": 9.557929591103615e-05, + "loss": 0.1605, + "step": 24870 + }, + { + "epoch": 7.0, + "eval_loss": 0.2175769805908203, + "eval_runtime": 478.6384, + "eval_samples_per_second": 33.497, + "eval_steps_per_second": 1.049, + "eval_wer": 0.21197439711762858, + "step": 24899 + }, + { + "epoch": 7.0, + "learning_rate": 9.556055352513042e-05, + "loss": 0.1973, + "step": 24900 + }, + { + "epoch": 7.01, + "learning_rate": 9.554181113922469e-05, + "loss": 0.1446, + "step": 24930 + }, + { + "epoch": 7.02, + "learning_rate": 9.552306875331897e-05, + "loss": 0.172, + "step": 24960 + }, + { + "epoch": 7.03, + "learning_rate": 9.550432636741324e-05, + "loss": 0.1592, + "step": 24990 + }, + { + "epoch": 7.03, + "learning_rate": 9.548558398150752e-05, + "loss": 0.1663, + "step": 25020 + }, + { + "epoch": 7.04, + "learning_rate": 9.546684159560179e-05, + "loss": 0.194, + "step": 25050 + }, + { + "epoch": 7.05, + "learning_rate": 9.544809920969607e-05, + "loss": 0.1514, + "step": 25080 + }, + { + "epoch": 7.06, + "learning_rate": 9.542935682379033e-05, + "loss": 0.1735, + "step": 25110 + }, + { + "epoch": 7.07, + "learning_rate": 9.541061443788461e-05, + "loss": 0.1586, + "step": 25140 + }, + { + "epoch": 7.08, + "learning_rate": 9.53918720519789e-05, + "loss": 0.1807, + "step": 25170 + }, + { + "epoch": 7.08, + "learning_rate": 9.537312966607316e-05, + "loss": 0.1757, + "step": 25200 + }, + { + "epoch": 7.09, + "learning_rate": 9.535438728016743e-05, + "loss": 0.145, + "step": 25230 + }, + { + "epoch": 7.1, + "learning_rate": 9.533564489426171e-05, + "loss": 0.1695, + "step": 25260 + }, + { + "epoch": 7.11, + "learning_rate": 9.531690250835599e-05, + "loss": 0.1631, + "step": 25290 + }, + { + "epoch": 7.12, + "learning_rate": 9.529816012245026e-05, + "loss": 0.1638, + "step": 25320 + }, + { + "epoch": 7.13, + "learning_rate": 9.527941773654453e-05, + "loss": 0.1766, + "step": 25350 + }, + { + "epoch": 7.14, + "learning_rate": 9.526067535063881e-05, + "loss": 0.1464, + "step": 25380 + }, + { + "epoch": 7.14, + "learning_rate": 9.524193296473309e-05, + "loss": 0.1746, + "step": 25410 + }, + { + "epoch": 7.15, + "learning_rate": 9.522319057882736e-05, + "loss": 0.1564, + "step": 25440 + }, + { + "epoch": 7.16, + "learning_rate": 9.520444819292162e-05, + "loss": 0.1598, + "step": 25470 + }, + { + "epoch": 7.17, + "learning_rate": 9.51857058070159e-05, + "loss": 0.1798, + "step": 25500 + }, + { + "epoch": 7.18, + "learning_rate": 9.516696342111017e-05, + "loss": 0.1506, + "step": 25530 + }, + { + "epoch": 7.19, + "learning_rate": 9.514822103520445e-05, + "loss": 0.1717, + "step": 25560 + }, + { + "epoch": 7.19, + "learning_rate": 9.512947864929873e-05, + "loss": 0.1586, + "step": 25590 + }, + { + "epoch": 7.2, + "learning_rate": 9.5110736263393e-05, + "loss": 0.1695, + "step": 25620 + }, + { + "epoch": 7.21, + "learning_rate": 9.509199387748727e-05, + "loss": 0.173, + "step": 25650 + }, + { + "epoch": 7.22, + "learning_rate": 9.507325149158155e-05, + "loss": 0.1468, + "step": 25680 + }, + { + "epoch": 7.23, + "learning_rate": 9.505450910567583e-05, + "loss": 0.1749, + "step": 25710 + }, + { + "epoch": 7.24, + "learning_rate": 9.50357667197701e-05, + "loss": 0.1609, + "step": 25740 + }, + { + "epoch": 7.24, + "learning_rate": 9.501702433386437e-05, + "loss": 0.1712, + "step": 25770 + }, + { + "epoch": 7.25, + "learning_rate": 9.499828194795865e-05, + "loss": 0.1844, + "step": 25800 + }, + { + "epoch": 7.26, + "learning_rate": 9.497953956205293e-05, + "loss": 0.1508, + "step": 25830 + }, + { + "epoch": 7.27, + "learning_rate": 9.49607971761472e-05, + "loss": 0.1767, + "step": 25860 + }, + { + "epoch": 7.28, + "learning_rate": 9.494205479024146e-05, + "loss": 0.1609, + "step": 25890 + }, + { + "epoch": 7.29, + "learning_rate": 9.492331240433574e-05, + "loss": 0.1644, + "step": 25920 + }, + { + "epoch": 7.3, + "learning_rate": 9.490457001843001e-05, + "loss": 0.1788, + "step": 25950 + }, + { + "epoch": 7.3, + "learning_rate": 9.488582763252429e-05, + "loss": 0.1519, + "step": 25980 + }, + { + "epoch": 7.31, + "learning_rate": 9.486708524661857e-05, + "loss": 0.1708, + "step": 26010 + }, + { + "epoch": 7.32, + "learning_rate": 9.484834286071284e-05, + "loss": 0.1571, + "step": 26040 + }, + { + "epoch": 7.33, + "learning_rate": 9.482960047480711e-05, + "loss": 0.1727, + "step": 26070 + }, + { + "epoch": 7.34, + "learning_rate": 9.481085808890139e-05, + "loss": 0.1843, + "step": 26100 + }, + { + "epoch": 7.35, + "learning_rate": 9.479211570299567e-05, + "loss": 0.1489, + "step": 26130 + }, + { + "epoch": 7.35, + "learning_rate": 9.477337331708994e-05, + "loss": 0.1675, + "step": 26160 + }, + { + "epoch": 7.36, + "learning_rate": 9.47546309311842e-05, + "loss": 0.1596, + "step": 26190 + }, + { + "epoch": 7.37, + "learning_rate": 9.473588854527849e-05, + "loss": 0.1626, + "step": 26220 + }, + { + "epoch": 7.38, + "learning_rate": 9.471714615937277e-05, + "loss": 0.1838, + "step": 26250 + }, + { + "epoch": 7.39, + "learning_rate": 9.469840377346703e-05, + "loss": 0.1511, + "step": 26280 + }, + { + "epoch": 7.4, + "learning_rate": 9.46796613875613e-05, + "loss": 0.183, + "step": 26310 + }, + { + "epoch": 7.41, + "learning_rate": 9.466091900165558e-05, + "loss": 0.1619, + "step": 26340 + }, + { + "epoch": 7.41, + "learning_rate": 9.464217661574985e-05, + "loss": 0.1685, + "step": 26370 + }, + { + "epoch": 7.42, + "learning_rate": 9.462343422984413e-05, + "loss": 0.1724, + "step": 26400 + }, + { + "epoch": 7.43, + "learning_rate": 9.460469184393841e-05, + "loss": 0.1478, + "step": 26430 + }, + { + "epoch": 7.44, + "learning_rate": 9.458594945803268e-05, + "loss": 0.1795, + "step": 26460 + }, + { + "epoch": 7.45, + "learning_rate": 9.456720707212695e-05, + "loss": 0.157, + "step": 26490 + }, + { + "epoch": 7.46, + "learning_rate": 9.454846468622123e-05, + "loss": 0.1705, + "step": 26520 + }, + { + "epoch": 7.46, + "learning_rate": 9.452972230031551e-05, + "loss": 0.1815, + "step": 26550 + }, + { + "epoch": 7.47, + "learning_rate": 9.451097991440978e-05, + "loss": 0.1459, + "step": 26580 + }, + { + "epoch": 7.48, + "learning_rate": 9.449223752850404e-05, + "loss": 0.1747, + "step": 26610 + }, + { + "epoch": 7.49, + "learning_rate": 9.447349514259832e-05, + "loss": 0.1625, + "step": 26640 + }, + { + "epoch": 7.5, + "learning_rate": 9.44547527566926e-05, + "loss": 0.1675, + "step": 26670 + }, + { + "epoch": 7.51, + "learning_rate": 9.443601037078687e-05, + "loss": 0.1816, + "step": 26700 + }, + { + "epoch": 7.51, + "learning_rate": 9.441726798488114e-05, + "loss": 0.1526, + "step": 26730 + }, + { + "epoch": 7.52, + "learning_rate": 9.439852559897542e-05, + "loss": 0.1826, + "step": 26760 + }, + { + "epoch": 7.53, + "learning_rate": 9.437978321306969e-05, + "loss": 0.1595, + "step": 26790 + }, + { + "epoch": 7.54, + "learning_rate": 9.436104082716397e-05, + "loss": 0.1705, + "step": 26820 + }, + { + "epoch": 7.55, + "learning_rate": 9.434229844125825e-05, + "loss": 0.1778, + "step": 26850 + }, + { + "epoch": 7.56, + "learning_rate": 9.432355605535252e-05, + "loss": 0.1514, + "step": 26880 + }, + { + "epoch": 7.57, + "learning_rate": 9.430481366944679e-05, + "loss": 0.1749, + "step": 26910 + }, + { + "epoch": 7.57, + "learning_rate": 9.428607128354107e-05, + "loss": 0.159, + "step": 26940 + }, + { + "epoch": 7.58, + "learning_rate": 9.426732889763535e-05, + "loss": 0.167, + "step": 26970 + }, + { + "epoch": 7.59, + "learning_rate": 9.424858651172961e-05, + "loss": 0.1819, + "step": 27000 + }, + { + "epoch": 7.6, + "learning_rate": 9.422984412582388e-05, + "loss": 0.1506, + "step": 27030 + }, + { + "epoch": 7.61, + "learning_rate": 9.421110173991816e-05, + "loss": 0.1736, + "step": 27060 + }, + { + "epoch": 7.62, + "learning_rate": 9.419235935401244e-05, + "loss": 0.1546, + "step": 27090 + }, + { + "epoch": 7.62, + "learning_rate": 9.417361696810671e-05, + "loss": 0.1667, + "step": 27120 + }, + { + "epoch": 7.63, + "learning_rate": 9.415487458220098e-05, + "loss": 0.1817, + "step": 27150 + }, + { + "epoch": 7.64, + "learning_rate": 9.413613219629526e-05, + "loss": 0.1571, + "step": 27180 + }, + { + "epoch": 7.65, + "learning_rate": 9.411738981038953e-05, + "loss": 0.1728, + "step": 27210 + }, + { + "epoch": 7.66, + "learning_rate": 9.409864742448381e-05, + "loss": 0.1586, + "step": 27240 + }, + { + "epoch": 7.67, + "learning_rate": 9.407990503857809e-05, + "loss": 0.1627, + "step": 27270 + }, + { + "epoch": 7.67, + "learning_rate": 9.406116265267236e-05, + "loss": 0.1711, + "step": 27300 + }, + { + "epoch": 7.68, + "learning_rate": 9.404242026676662e-05, + "loss": 0.149, + "step": 27330 + }, + { + "epoch": 7.69, + "learning_rate": 9.40236778808609e-05, + "loss": 0.1698, + "step": 27360 + }, + { + "epoch": 7.7, + "learning_rate": 9.400493549495519e-05, + "loss": 0.1562, + "step": 27390 + }, + { + "epoch": 7.71, + "learning_rate": 9.398619310904945e-05, + "loss": 0.1595, + "step": 27420 + }, + { + "epoch": 7.72, + "learning_rate": 9.396745072314372e-05, + "loss": 0.1754, + "step": 27450 + }, + { + "epoch": 7.73, + "learning_rate": 9.3948708337238e-05, + "loss": 0.1469, + "step": 27480 + }, + { + "epoch": 7.73, + "learning_rate": 9.392996595133228e-05, + "loss": 0.1762, + "step": 27510 + }, + { + "epoch": 7.74, + "learning_rate": 9.391122356542655e-05, + "loss": 0.1586, + "step": 27540 + }, + { + "epoch": 7.75, + "learning_rate": 9.389248117952082e-05, + "loss": 0.1669, + "step": 27570 + }, + { + "epoch": 7.76, + "learning_rate": 9.38737387936151e-05, + "loss": 0.1792, + "step": 27600 + }, + { + "epoch": 7.77, + "learning_rate": 9.385499640770937e-05, + "loss": 0.1467, + "step": 27630 + }, + { + "epoch": 7.78, + "learning_rate": 9.383625402180365e-05, + "loss": 0.1749, + "step": 27660 + }, + { + "epoch": 7.78, + "learning_rate": 9.381751163589793e-05, + "loss": 0.1577, + "step": 27690 + }, + { + "epoch": 7.79, + "learning_rate": 9.37987692499922e-05, + "loss": 0.1676, + "step": 27720 + }, + { + "epoch": 7.8, + "learning_rate": 9.378002686408646e-05, + "loss": 0.1791, + "step": 27750 + }, + { + "epoch": 7.81, + "learning_rate": 9.376128447818074e-05, + "loss": 0.1508, + "step": 27780 + }, + { + "epoch": 7.82, + "learning_rate": 9.374254209227502e-05, + "loss": 0.1746, + "step": 27810 + }, + { + "epoch": 7.83, + "learning_rate": 9.372379970636929e-05, + "loss": 0.1564, + "step": 27840 + }, + { + "epoch": 7.84, + "learning_rate": 9.370505732046356e-05, + "loss": 0.1633, + "step": 27870 + }, + { + "epoch": 7.84, + "learning_rate": 9.368631493455784e-05, + "loss": 0.1766, + "step": 27900 + }, + { + "epoch": 7.85, + "learning_rate": 9.366757254865212e-05, + "loss": 0.147, + "step": 27930 + }, + { + "epoch": 7.86, + "learning_rate": 9.364883016274639e-05, + "loss": 0.1762, + "step": 27960 + }, + { + "epoch": 7.87, + "learning_rate": 9.363008777684066e-05, + "loss": 0.1618, + "step": 27990 + }, + { + "epoch": 7.88, + "learning_rate": 9.361134539093494e-05, + "loss": 0.1721, + "step": 28020 + }, + { + "epoch": 7.89, + "learning_rate": 9.359260300502922e-05, + "loss": 0.1843, + "step": 28050 + }, + { + "epoch": 7.89, + "learning_rate": 9.357386061912349e-05, + "loss": 0.151, + "step": 28080 + }, + { + "epoch": 7.9, + "learning_rate": 9.355511823321777e-05, + "loss": 0.1718, + "step": 28110 + }, + { + "epoch": 7.91, + "learning_rate": 9.353637584731203e-05, + "loss": 0.1575, + "step": 28140 + }, + { + "epoch": 7.92, + "learning_rate": 9.35176334614063e-05, + "loss": 0.1578, + "step": 28170 + }, + { + "epoch": 7.93, + "learning_rate": 9.349889107550058e-05, + "loss": 0.1781, + "step": 28200 + }, + { + "epoch": 7.94, + "learning_rate": 9.348014868959486e-05, + "loss": 0.1412, + "step": 28230 + }, + { + "epoch": 7.94, + "learning_rate": 9.346140630368913e-05, + "loss": 0.1711, + "step": 28260 + }, + { + "epoch": 7.95, + "learning_rate": 9.34426639177834e-05, + "loss": 0.1557, + "step": 28290 + }, + { + "epoch": 7.96, + "learning_rate": 9.342392153187768e-05, + "loss": 0.1607, + "step": 28320 + }, + { + "epoch": 7.97, + "learning_rate": 9.340517914597196e-05, + "loss": 0.1763, + "step": 28350 + }, + { + "epoch": 7.98, + "learning_rate": 9.338643676006623e-05, + "loss": 0.1441, + "step": 28380 + }, + { + "epoch": 7.99, + "learning_rate": 9.33676943741605e-05, + "loss": 0.1739, + "step": 28410 + }, + { + "epoch": 8.0, + "learning_rate": 9.334895198825478e-05, + "loss": 0.1579, + "step": 28440 + }, + { + "epoch": 8.0, + "eval_loss": 0.20457884669303894, + "eval_runtime": 477.673, + "eval_samples_per_second": 33.565, + "eval_steps_per_second": 1.051, + "eval_wer": 0.20240743520805754, + "step": 28456 + }, + { + "epoch": 8.0, + "learning_rate": 9.333020960234906e-05, + "loss": 0.1691, + "step": 28470 + }, + { + "epoch": 8.01, + "learning_rate": 9.331146721644332e-05, + "loss": 0.1501, + "step": 28500 + }, + { + "epoch": 8.02, + "learning_rate": 9.32927248305376e-05, + "loss": 0.1653, + "step": 28530 + }, + { + "epoch": 8.03, + "learning_rate": 9.327398244463187e-05, + "loss": 0.1736, + "step": 28560 + }, + { + "epoch": 8.04, + "learning_rate": 9.325524005872614e-05, + "loss": 0.1407, + "step": 28590 + }, + { + "epoch": 8.05, + "learning_rate": 9.323649767282042e-05, + "loss": 0.1634, + "step": 28620 + }, + { + "epoch": 8.05, + "learning_rate": 9.32177552869147e-05, + "loss": 0.151, + "step": 28650 + }, + { + "epoch": 8.06, + "learning_rate": 9.319901290100897e-05, + "loss": 0.1583, + "step": 28680 + }, + { + "epoch": 8.07, + "learning_rate": 9.318027051510324e-05, + "loss": 0.1657, + "step": 28710 + }, + { + "epoch": 8.08, + "learning_rate": 9.316152812919752e-05, + "loss": 0.1443, + "step": 28740 + }, + { + "epoch": 8.09, + "learning_rate": 9.31427857432918e-05, + "loss": 0.1535, + "step": 28770 + }, + { + "epoch": 8.1, + "learning_rate": 9.312404335738607e-05, + "loss": 0.1491, + "step": 28800 + }, + { + "epoch": 8.11, + "learning_rate": 9.310530097148033e-05, + "loss": 0.1525, + "step": 28830 + }, + { + "epoch": 8.11, + "learning_rate": 9.308655858557461e-05, + "loss": 0.1651, + "step": 28860 + }, + { + "epoch": 8.12, + "learning_rate": 9.30678161996689e-05, + "loss": 0.1411, + "step": 28890 + }, + { + "epoch": 8.13, + "learning_rate": 9.304907381376316e-05, + "loss": 0.1585, + "step": 28920 + }, + { + "epoch": 8.14, + "learning_rate": 9.303033142785744e-05, + "loss": 0.1506, + "step": 28950 + }, + { + "epoch": 8.15, + "learning_rate": 9.301158904195171e-05, + "loss": 0.1455, + "step": 28980 + }, + { + "epoch": 8.16, + "learning_rate": 9.299284665604598e-05, + "loss": 0.1692, + "step": 29010 + }, + { + "epoch": 8.16, + "learning_rate": 9.297410427014026e-05, + "loss": 0.1419, + "step": 29040 + }, + { + "epoch": 8.17, + "learning_rate": 9.295536188423454e-05, + "loss": 0.16, + "step": 29070 + }, + { + "epoch": 8.18, + "learning_rate": 9.293661949832881e-05, + "loss": 0.1529, + "step": 29100 + }, + { + "epoch": 8.19, + "learning_rate": 9.291787711242308e-05, + "loss": 0.16, + "step": 29130 + }, + { + "epoch": 8.2, + "learning_rate": 9.289913472651736e-05, + "loss": 0.1715, + "step": 29160 + }, + { + "epoch": 8.21, + "learning_rate": 9.288039234061164e-05, + "loss": 0.1412, + "step": 29190 + }, + { + "epoch": 8.21, + "learning_rate": 9.28616499547059e-05, + "loss": 0.1558, + "step": 29220 + }, + { + "epoch": 8.22, + "learning_rate": 9.284290756880017e-05, + "loss": 0.1502, + "step": 29250 + }, + { + "epoch": 8.23, + "learning_rate": 9.282416518289445e-05, + "loss": 0.1461, + "step": 29280 + }, + { + "epoch": 8.24, + "learning_rate": 9.280542279698873e-05, + "loss": 0.1623, + "step": 29310 + }, + { + "epoch": 8.25, + "learning_rate": 9.2786680411083e-05, + "loss": 0.1414, + "step": 29340 + }, + { + "epoch": 8.26, + "learning_rate": 9.276793802517728e-05, + "loss": 0.1583, + "step": 29370 + }, + { + "epoch": 8.27, + "learning_rate": 9.274919563927155e-05, + "loss": 0.1536, + "step": 29400 + }, + { + "epoch": 8.27, + "learning_rate": 9.273045325336582e-05, + "loss": 0.1542, + "step": 29430 + }, + { + "epoch": 8.28, + "learning_rate": 9.27117108674601e-05, + "loss": 0.1768, + "step": 29460 + }, + { + "epoch": 8.29, + "learning_rate": 9.269296848155438e-05, + "loss": 0.138, + "step": 29490 + }, + { + "epoch": 8.3, + "learning_rate": 9.267422609564865e-05, + "loss": 0.1596, + "step": 29520 + }, + { + "epoch": 8.31, + "learning_rate": 9.265548370974291e-05, + "loss": 0.1612, + "step": 29550 + }, + { + "epoch": 8.32, + "learning_rate": 9.263736607003406e-05, + "loss": 0.1545, + "step": 29580 + }, + { + "epoch": 8.32, + "learning_rate": 9.261862368412832e-05, + "loss": 0.1678, + "step": 29610 + }, + { + "epoch": 8.33, + "learning_rate": 9.25998812982226e-05, + "loss": 0.1419, + "step": 29640 + }, + { + "epoch": 8.34, + "learning_rate": 9.258113891231688e-05, + "loss": 0.1613, + "step": 29670 + }, + { + "epoch": 8.35, + "learning_rate": 9.256239652641115e-05, + "loss": 0.1547, + "step": 29700 + }, + { + "epoch": 8.36, + "learning_rate": 9.254365414050542e-05, + "loss": 0.1518, + "step": 29730 + }, + { + "epoch": 8.37, + "learning_rate": 9.25249117545997e-05, + "loss": 0.1679, + "step": 29760 + }, + { + "epoch": 8.37, + "learning_rate": 9.250616936869397e-05, + "loss": 0.1399, + "step": 29790 + }, + { + "epoch": 8.38, + "learning_rate": 9.248742698278825e-05, + "loss": 0.1626, + "step": 29820 + }, + { + "epoch": 8.39, + "learning_rate": 9.246868459688252e-05, + "loss": 0.1491, + "step": 29850 + }, + { + "epoch": 8.4, + "learning_rate": 9.24499422109768e-05, + "loss": 0.1552, + "step": 29880 + }, + { + "epoch": 8.41, + "learning_rate": 9.243119982507106e-05, + "loss": 0.167, + "step": 29910 + }, + { + "epoch": 8.42, + "learning_rate": 9.241245743916535e-05, + "loss": 0.1427, + "step": 29940 + }, + { + "epoch": 8.43, + "learning_rate": 9.239371505325963e-05, + "loss": 0.1594, + "step": 29970 + }, + { + "epoch": 8.43, + "learning_rate": 9.23749726673539e-05, + "loss": 0.1584, + "step": 30000 + }, + { + "epoch": 8.44, + "learning_rate": 9.235623028144816e-05, + "loss": 0.163, + "step": 30030 + }, + { + "epoch": 8.45, + "learning_rate": 9.233748789554244e-05, + "loss": 0.1628, + "step": 30060 + }, + { + "epoch": 8.46, + "learning_rate": 9.231874550963672e-05, + "loss": 0.1366, + "step": 30090 + }, + { + "epoch": 8.47, + "learning_rate": 9.230000312373099e-05, + "loss": 0.1564, + "step": 30120 + }, + { + "epoch": 8.48, + "learning_rate": 9.228126073782526e-05, + "loss": 0.1532, + "step": 30150 + }, + { + "epoch": 8.48, + "learning_rate": 9.226251835191954e-05, + "loss": 0.1561, + "step": 30180 + }, + { + "epoch": 8.49, + "learning_rate": 9.22437759660138e-05, + "loss": 0.1672, + "step": 30210 + }, + { + "epoch": 8.5, + "learning_rate": 9.222503358010809e-05, + "loss": 0.1394, + "step": 30240 + }, + { + "epoch": 8.51, + "learning_rate": 9.220629119420235e-05, + "loss": 0.154, + "step": 30270 + }, + { + "epoch": 8.52, + "learning_rate": 9.218754880829664e-05, + "loss": 0.1488, + "step": 30300 + }, + { + "epoch": 8.53, + "learning_rate": 9.21688064223909e-05, + "loss": 0.1608, + "step": 30330 + }, + { + "epoch": 8.54, + "learning_rate": 9.215006403648518e-05, + "loss": 0.1753, + "step": 30360 + }, + { + "epoch": 8.54, + "learning_rate": 9.213132165057946e-05, + "loss": 0.1395, + "step": 30390 + }, + { + "epoch": 8.55, + "learning_rate": 9.211257926467373e-05, + "loss": 0.1618, + "step": 30420 + }, + { + "epoch": 8.56, + "learning_rate": 9.2093836878768e-05, + "loss": 0.1517, + "step": 30450 + }, + { + "epoch": 8.57, + "learning_rate": 9.207509449286228e-05, + "loss": 0.1575, + "step": 30480 + }, + { + "epoch": 8.58, + "learning_rate": 9.205635210695656e-05, + "loss": 0.1733, + "step": 30510 + }, + { + "epoch": 8.59, + "learning_rate": 9.203760972105083e-05, + "loss": 0.1354, + "step": 30540 + }, + { + "epoch": 8.59, + "learning_rate": 9.20188673351451e-05, + "loss": 0.1627, + "step": 30570 + }, + { + "epoch": 8.6, + "learning_rate": 9.200012494923938e-05, + "loss": 0.1507, + "step": 30600 + }, + { + "epoch": 8.61, + "learning_rate": 9.198138256333364e-05, + "loss": 0.1558, + "step": 30630 + }, + { + "epoch": 8.62, + "learning_rate": 9.196264017742793e-05, + "loss": 0.1705, + "step": 30660 + }, + { + "epoch": 8.63, + "learning_rate": 9.19438977915222e-05, + "loss": 0.145, + "step": 30690 + }, + { + "epoch": 8.64, + "learning_rate": 9.192515540561647e-05, + "loss": 0.1545, + "step": 30720 + }, + { + "epoch": 8.64, + "learning_rate": 9.190641301971074e-05, + "loss": 0.1529, + "step": 30750 + }, + { + "epoch": 8.65, + "learning_rate": 9.188767063380502e-05, + "loss": 0.1532, + "step": 30780 + }, + { + "epoch": 8.66, + "learning_rate": 9.18689282478993e-05, + "loss": 0.1758, + "step": 30810 + }, + { + "epoch": 8.67, + "learning_rate": 9.185018586199357e-05, + "loss": 0.1431, + "step": 30840 + }, + { + "epoch": 8.68, + "learning_rate": 9.183144347608784e-05, + "loss": 0.1601, + "step": 30870 + }, + { + "epoch": 8.69, + "learning_rate": 9.181270109018212e-05, + "loss": 0.1566, + "step": 30900 + }, + { + "epoch": 8.7, + "learning_rate": 9.17939587042764e-05, + "loss": 0.1508, + "step": 30930 + }, + { + "epoch": 8.7, + "learning_rate": 9.177521631837067e-05, + "loss": 0.1649, + "step": 30960 + }, + { + "epoch": 8.71, + "learning_rate": 9.175647393246494e-05, + "loss": 0.1384, + "step": 30990 + }, + { + "epoch": 8.72, + "learning_rate": 9.173773154655922e-05, + "loss": 0.1627, + "step": 31020 + }, + { + "epoch": 8.73, + "learning_rate": 9.171898916065348e-05, + "loss": 0.1521, + "step": 31050 + }, + { + "epoch": 8.74, + "learning_rate": 9.170024677474776e-05, + "loss": 0.1704, + "step": 31080 + }, + { + "epoch": 8.75, + "learning_rate": 9.168150438884203e-05, + "loss": 0.1703, + "step": 31110 + }, + { + "epoch": 8.75, + "learning_rate": 9.166276200293631e-05, + "loss": 0.1414, + "step": 31140 + }, + { + "epoch": 8.76, + "learning_rate": 9.164401961703058e-05, + "loss": 0.1608, + "step": 31170 + }, + { + "epoch": 8.77, + "learning_rate": 9.162527723112486e-05, + "loss": 0.1476, + "step": 31200 + }, + { + "epoch": 8.78, + "learning_rate": 9.160653484521914e-05, + "loss": 0.1512, + "step": 31230 + }, + { + "epoch": 8.79, + "learning_rate": 9.158779245931341e-05, + "loss": 0.163, + "step": 31260 + }, + { + "epoch": 8.8, + "learning_rate": 9.156905007340768e-05, + "loss": 0.138, + "step": 31290 + }, + { + "epoch": 8.81, + "learning_rate": 9.155030768750196e-05, + "loss": 0.1663, + "step": 31320 + }, + { + "epoch": 8.81, + "learning_rate": 9.153156530159624e-05, + "loss": 0.1562, + "step": 31350 + }, + { + "epoch": 8.82, + "learning_rate": 9.15128229156905e-05, + "loss": 0.1519, + "step": 31380 + }, + { + "epoch": 8.83, + "learning_rate": 9.149408052978477e-05, + "loss": 0.1659, + "step": 31410 + }, + { + "epoch": 8.84, + "learning_rate": 9.147533814387905e-05, + "loss": 0.1398, + "step": 31440 + }, + { + "epoch": 8.85, + "learning_rate": 9.145659575797332e-05, + "loss": 0.1624, + "step": 31470 + }, + { + "epoch": 8.86, + "learning_rate": 9.14378533720676e-05, + "loss": 0.1481, + "step": 31500 + }, + { + "epoch": 8.86, + "learning_rate": 9.141911098616187e-05, + "loss": 0.1516, + "step": 31530 + }, + { + "epoch": 8.87, + "learning_rate": 9.140036860025615e-05, + "loss": 0.1661, + "step": 31560 + }, + { + "epoch": 8.88, + "learning_rate": 9.138162621435042e-05, + "loss": 0.133, + "step": 31590 + }, + { + "epoch": 8.89, + "learning_rate": 9.13628838284447e-05, + "loss": 0.1653, + "step": 31620 + }, + { + "epoch": 8.9, + "learning_rate": 9.134414144253898e-05, + "loss": 0.1572, + "step": 31650 + }, + { + "epoch": 8.91, + "learning_rate": 9.132539905663325e-05, + "loss": 0.1493, + "step": 31680 + }, + { + "epoch": 8.91, + "learning_rate": 9.130665667072752e-05, + "loss": 0.1715, + "step": 31710 + }, + { + "epoch": 8.92, + "learning_rate": 9.12879142848218e-05, + "loss": 0.1434, + "step": 31740 + }, + { + "epoch": 8.93, + "learning_rate": 9.126917189891608e-05, + "loss": 0.165, + "step": 31770 + }, + { + "epoch": 8.94, + "learning_rate": 9.125042951301035e-05, + "loss": 0.1505, + "step": 31800 + }, + { + "epoch": 8.95, + "learning_rate": 9.123168712710461e-05, + "loss": 0.1466, + "step": 31830 + }, + { + "epoch": 8.96, + "learning_rate": 9.12129447411989e-05, + "loss": 0.1676, + "step": 31860 + }, + { + "epoch": 8.97, + "learning_rate": 9.119420235529317e-05, + "loss": 0.143, + "step": 31890 + }, + { + "epoch": 8.97, + "learning_rate": 9.117545996938744e-05, + "loss": 0.1589, + "step": 31920 + }, + { + "epoch": 8.98, + "learning_rate": 9.115671758348171e-05, + "loss": 0.1529, + "step": 31950 + }, + { + "epoch": 8.99, + "learning_rate": 9.113797519757599e-05, + "loss": 0.1491, + "step": 31980 + }, + { + "epoch": 9.0, + "learning_rate": 9.111923281167026e-05, + "loss": 0.1668, + "step": 32010 + }, + { + "epoch": 9.0, + "eval_loss": 0.20271660387516022, + "eval_runtime": 480.4264, + "eval_samples_per_second": 33.372, + "eval_steps_per_second": 1.045, + "eval_wer": 0.19443724154872874, + "step": 32013 + }, + { + "epoch": 9.01, + "learning_rate": 9.110049042576454e-05, + "loss": 0.1419, + "step": 32040 + }, + { + "epoch": 9.02, + "learning_rate": 9.108174803985882e-05, + "loss": 0.1552, + "step": 32070 + }, + { + "epoch": 9.02, + "learning_rate": 9.106300565395309e-05, + "loss": 0.1401, + "step": 32100 + }, + { + "epoch": 9.03, + "learning_rate": 9.104426326804735e-05, + "loss": 0.1473, + "step": 32130 + }, + { + "epoch": 9.04, + "learning_rate": 9.102552088214164e-05, + "loss": 0.1431, + "step": 32160 + }, + { + "epoch": 9.05, + "learning_rate": 9.100740324243276e-05, + "loss": 0.1363, + "step": 32190 + }, + { + "epoch": 9.06, + "learning_rate": 9.098866085652704e-05, + "loss": 0.1572, + "step": 32220 + }, + { + "epoch": 9.07, + "learning_rate": 9.096991847062132e-05, + "loss": 0.1328, + "step": 32250 + }, + { + "epoch": 9.08, + "learning_rate": 9.095117608471558e-05, + "loss": 0.1498, + "step": 32280 + }, + { + "epoch": 9.08, + "learning_rate": 9.093243369880986e-05, + "loss": 0.1395, + "step": 32310 + }, + { + "epoch": 9.09, + "learning_rate": 9.091369131290414e-05, + "loss": 0.1405, + "step": 32340 + }, + { + "epoch": 9.1, + "learning_rate": 9.089494892699841e-05, + "loss": 0.1531, + "step": 32370 + }, + { + "epoch": 9.11, + "learning_rate": 9.087620654109269e-05, + "loss": 0.143, + "step": 32400 + }, + { + "epoch": 9.12, + "learning_rate": 9.085746415518696e-05, + "loss": 0.1493, + "step": 32430 + }, + { + "epoch": 9.13, + "learning_rate": 9.083872176928124e-05, + "loss": 0.1452, + "step": 32460 + }, + { + "epoch": 9.13, + "learning_rate": 9.08199793833755e-05, + "loss": 0.1398, + "step": 32490 + }, + { + "epoch": 9.14, + "learning_rate": 9.080123699746979e-05, + "loss": 0.1479, + "step": 32520 + }, + { + "epoch": 9.15, + "learning_rate": 9.078249461156407e-05, + "loss": 0.1371, + "step": 32550 + }, + { + "epoch": 9.16, + "learning_rate": 9.076375222565832e-05, + "loss": 0.1589, + "step": 32580 + }, + { + "epoch": 9.17, + "learning_rate": 9.07450098397526e-05, + "loss": 0.1518, + "step": 32610 + }, + { + "epoch": 9.18, + "learning_rate": 9.072626745384688e-05, + "loss": 0.1395, + "step": 32640 + }, + { + "epoch": 9.18, + "learning_rate": 9.070752506794116e-05, + "loss": 0.1503, + "step": 32670 + }, + { + "epoch": 9.19, + "learning_rate": 9.068878268203542e-05, + "loss": 0.1312, + "step": 32700 + }, + { + "epoch": 9.2, + "learning_rate": 9.06700402961297e-05, + "loss": 0.1455, + "step": 32730 + }, + { + "epoch": 9.21, + "learning_rate": 9.065129791022398e-05, + "loss": 0.154, + "step": 32760 + }, + { + "epoch": 9.22, + "learning_rate": 9.063255552431825e-05, + "loss": 0.1488, + "step": 32790 + }, + { + "epoch": 9.23, + "learning_rate": 9.061381313841253e-05, + "loss": 0.1592, + "step": 32820 + }, + { + "epoch": 9.24, + "learning_rate": 9.05950707525068e-05, + "loss": 0.1328, + "step": 32850 + }, + { + "epoch": 9.24, + "learning_rate": 9.057632836660108e-05, + "loss": 0.1484, + "step": 32880 + }, + { + "epoch": 9.25, + "learning_rate": 9.055758598069534e-05, + "loss": 0.15, + "step": 32910 + }, + { + "epoch": 9.26, + "learning_rate": 9.053884359478962e-05, + "loss": 0.1398, + "step": 32940 + }, + { + "epoch": 9.27, + "learning_rate": 9.05201012088839e-05, + "loss": 0.1523, + "step": 32970 + }, + { + "epoch": 9.28, + "learning_rate": 9.050135882297817e-05, + "loss": 0.1337, + "step": 33000 + }, + { + "epoch": 9.29, + "learning_rate": 9.048261643707244e-05, + "loss": 0.1517, + "step": 33030 + }, + { + "epoch": 9.29, + "learning_rate": 9.046449879736357e-05, + "loss": 0.1507, + "step": 33060 + }, + { + "epoch": 9.3, + "learning_rate": 9.044575641145785e-05, + "loss": 0.1424, + "step": 33090 + }, + { + "epoch": 9.31, + "learning_rate": 9.042701402555213e-05, + "loss": 0.1612, + "step": 33120 + }, + { + "epoch": 9.32, + "learning_rate": 9.04082716396464e-05, + "loss": 0.1389, + "step": 33150 + }, + { + "epoch": 9.33, + "learning_rate": 9.038952925374066e-05, + "loss": 0.1519, + "step": 33180 + }, + { + "epoch": 9.34, + "learning_rate": 9.037078686783495e-05, + "loss": 0.1426, + "step": 33210 + }, + { + "epoch": 9.34, + "learning_rate": 9.035204448192923e-05, + "loss": 0.1386, + "step": 33240 + }, + { + "epoch": 9.35, + "learning_rate": 9.03333020960235e-05, + "loss": 0.1566, + "step": 33270 + }, + { + "epoch": 9.36, + "learning_rate": 9.031455971011777e-05, + "loss": 0.1354, + "step": 33300 + }, + { + "epoch": 9.37, + "learning_rate": 9.029581732421204e-05, + "loss": 0.1502, + "step": 33330 + }, + { + "epoch": 9.38, + "learning_rate": 9.027707493830632e-05, + "loss": 0.1536, + "step": 33360 + }, + { + "epoch": 9.39, + "learning_rate": 9.025833255240059e-05, + "loss": 0.1453, + "step": 33390 + }, + { + "epoch": 9.4, + "learning_rate": 9.023959016649487e-05, + "loss": 0.1602, + "step": 33420 + }, + { + "epoch": 9.4, + "learning_rate": 9.022084778058914e-05, + "loss": 0.1344, + "step": 33450 + }, + { + "epoch": 9.41, + "learning_rate": 9.02021053946834e-05, + "loss": 0.152, + "step": 33480 + }, + { + "epoch": 9.42, + "learning_rate": 9.018336300877769e-05, + "loss": 0.1545, + "step": 33510 + }, + { + "epoch": 9.43, + "learning_rate": 9.016462062287197e-05, + "loss": 0.1418, + "step": 33540 + }, + { + "epoch": 9.44, + "learning_rate": 9.014587823696624e-05, + "loss": 0.1589, + "step": 33570 + }, + { + "epoch": 9.45, + "learning_rate": 9.01271358510605e-05, + "loss": 0.1331, + "step": 33600 + }, + { + "epoch": 9.45, + "learning_rate": 9.010839346515478e-05, + "loss": 0.1476, + "step": 33630 + }, + { + "epoch": 9.46, + "learning_rate": 9.008965107924906e-05, + "loss": 0.1456, + "step": 33660 + }, + { + "epoch": 9.47, + "learning_rate": 9.007090869334333e-05, + "loss": 0.1427, + "step": 33690 + }, + { + "epoch": 9.48, + "learning_rate": 9.005216630743761e-05, + "loss": 0.1528, + "step": 33720 + }, + { + "epoch": 9.49, + "learning_rate": 9.003342392153188e-05, + "loss": 0.1328, + "step": 33750 + }, + { + "epoch": 9.5, + "learning_rate": 9.001468153562616e-05, + "loss": 0.147, + "step": 33780 + }, + { + "epoch": 9.51, + "learning_rate": 8.999593914972043e-05, + "loss": 0.1503, + "step": 33810 + }, + { + "epoch": 9.51, + "learning_rate": 8.997719676381471e-05, + "loss": 0.1416, + "step": 33840 + }, + { + "epoch": 9.52, + "learning_rate": 8.995845437790898e-05, + "loss": 0.1699, + "step": 33870 + }, + { + "epoch": 9.53, + "learning_rate": 8.993971199200324e-05, + "loss": 0.1438, + "step": 33900 + }, + { + "epoch": 9.54, + "learning_rate": 8.992096960609753e-05, + "loss": 0.1845, + "step": 33930 + }, + { + "epoch": 9.55, + "learning_rate": 8.990222722019181e-05, + "loss": 0.1453, + "step": 33960 + }, + { + "epoch": 9.56, + "learning_rate": 8.988348483428607e-05, + "loss": 0.1379, + "step": 33990 + }, + { + "epoch": 9.56, + "learning_rate": 8.986474244838034e-05, + "loss": 0.1605, + "step": 34020 + }, + { + "epoch": 9.57, + "learning_rate": 8.984600006247462e-05, + "loss": 0.1322, + "step": 34050 + }, + { + "epoch": 9.58, + "learning_rate": 8.98272576765689e-05, + "loss": 0.1483, + "step": 34080 + }, + { + "epoch": 9.59, + "learning_rate": 8.980851529066317e-05, + "loss": 0.1529, + "step": 34110 + }, + { + "epoch": 9.6, + "learning_rate": 8.978977290475745e-05, + "loss": 0.1424, + "step": 34140 + }, + { + "epoch": 9.61, + "learning_rate": 8.977103051885172e-05, + "loss": 0.1585, + "step": 34170 + }, + { + "epoch": 9.61, + "learning_rate": 8.9752288132946e-05, + "loss": 0.1332, + "step": 34200 + }, + { + "epoch": 9.62, + "learning_rate": 8.973354574704027e-05, + "loss": 0.1488, + "step": 34230 + }, + { + "epoch": 9.63, + "learning_rate": 8.971480336113455e-05, + "loss": 0.1484, + "step": 34260 + }, + { + "epoch": 9.64, + "learning_rate": 8.969606097522882e-05, + "loss": 0.1382, + "step": 34290 + }, + { + "epoch": 9.65, + "learning_rate": 8.967731858932308e-05, + "loss": 0.1565, + "step": 34320 + }, + { + "epoch": 9.66, + "learning_rate": 8.965857620341736e-05, + "loss": 0.1494, + "step": 34350 + }, + { + "epoch": 9.67, + "learning_rate": 8.963983381751165e-05, + "loss": 0.1682, + "step": 34380 + }, + { + "epoch": 9.67, + "learning_rate": 8.962109143160591e-05, + "loss": 0.1465, + "step": 34410 + }, + { + "epoch": 9.68, + "learning_rate": 8.960234904570018e-05, + "loss": 0.1334, + "step": 34440 + }, + { + "epoch": 9.69, + "learning_rate": 8.958360665979446e-05, + "loss": 0.154, + "step": 34470 + }, + { + "epoch": 9.7, + "learning_rate": 8.956486427388874e-05, + "loss": 0.1351, + "step": 34500 + }, + { + "epoch": 9.71, + "learning_rate": 8.954612188798301e-05, + "loss": 0.1512, + "step": 34530 + }, + { + "epoch": 9.72, + "learning_rate": 8.952737950207728e-05, + "loss": 0.1509, + "step": 34560 + }, + { + "epoch": 9.72, + "learning_rate": 8.950863711617156e-05, + "loss": 0.1423, + "step": 34590 + }, + { + "epoch": 9.73, + "learning_rate": 8.948989473026584e-05, + "loss": 0.1546, + "step": 34620 + }, + { + "epoch": 9.74, + "learning_rate": 8.94711523443601e-05, + "loss": 0.1358, + "step": 34650 + }, + { + "epoch": 9.75, + "learning_rate": 8.945240995845439e-05, + "loss": 0.1512, + "step": 34680 + }, + { + "epoch": 9.76, + "learning_rate": 8.943366757254865e-05, + "loss": 0.1478, + "step": 34710 + }, + { + "epoch": 9.77, + "learning_rate": 8.941492518664292e-05, + "loss": 0.1393, + "step": 34740 + }, + { + "epoch": 9.77, + "learning_rate": 8.93961828007372e-05, + "loss": 0.1501, + "step": 34770 + }, + { + "epoch": 9.78, + "learning_rate": 8.937744041483148e-05, + "loss": 0.1328, + "step": 34800 + }, + { + "epoch": 9.79, + "learning_rate": 8.935869802892575e-05, + "loss": 0.1516, + "step": 34830 + }, + { + "epoch": 9.8, + "learning_rate": 8.933995564302002e-05, + "loss": 0.148, + "step": 34860 + }, + { + "epoch": 9.81, + "learning_rate": 8.93212132571143e-05, + "loss": 0.1357, + "step": 34890 + }, + { + "epoch": 9.82, + "learning_rate": 8.930247087120858e-05, + "loss": 0.161, + "step": 34920 + }, + { + "epoch": 9.83, + "learning_rate": 8.928372848530285e-05, + "loss": 0.1379, + "step": 34950 + }, + { + "epoch": 9.83, + "learning_rate": 8.926498609939712e-05, + "loss": 0.1554, + "step": 34980 + }, + { + "epoch": 9.84, + "learning_rate": 8.92462437134914e-05, + "loss": 0.1519, + "step": 35010 + }, + { + "epoch": 9.85, + "learning_rate": 8.922750132758568e-05, + "loss": 0.1393, + "step": 35040 + }, + { + "epoch": 9.86, + "learning_rate": 8.920875894167995e-05, + "loss": 0.1578, + "step": 35070 + }, + { + "epoch": 9.87, + "learning_rate": 8.919001655577423e-05, + "loss": 0.1331, + "step": 35100 + }, + { + "epoch": 9.88, + "learning_rate": 8.91712741698685e-05, + "loss": 0.1481, + "step": 35130 + }, + { + "epoch": 9.88, + "learning_rate": 8.915253178396276e-05, + "loss": 0.1467, + "step": 35160 + }, + { + "epoch": 9.89, + "learning_rate": 8.913378939805704e-05, + "loss": 0.1447, + "step": 35190 + }, + { + "epoch": 9.9, + "learning_rate": 8.911504701215132e-05, + "loss": 0.1507, + "step": 35220 + }, + { + "epoch": 9.91, + "learning_rate": 8.909630462624559e-05, + "loss": 0.1358, + "step": 35250 + }, + { + "epoch": 9.92, + "learning_rate": 8.907756224033986e-05, + "loss": 0.1411, + "step": 35280 + }, + { + "epoch": 9.93, + "learning_rate": 8.905881985443414e-05, + "loss": 0.145, + "step": 35310 + }, + { + "epoch": 9.94, + "learning_rate": 8.904007746852842e-05, + "loss": 0.14, + "step": 35340 + }, + { + "epoch": 9.94, + "learning_rate": 8.902133508262269e-05, + "loss": 0.1562, + "step": 35370 + }, + { + "epoch": 9.95, + "learning_rate": 8.900259269671695e-05, + "loss": 0.1337, + "step": 35400 + }, + { + "epoch": 9.96, + "learning_rate": 8.898385031081124e-05, + "loss": 0.1455, + "step": 35430 + }, + { + "epoch": 9.97, + "learning_rate": 8.896510792490552e-05, + "loss": 0.1489, + "step": 35460 + }, + { + "epoch": 9.98, + "learning_rate": 8.894636553899978e-05, + "loss": 0.1385, + "step": 35490 + }, + { + "epoch": 9.99, + "learning_rate": 8.892762315309406e-05, + "loss": 0.1525, + "step": 35520 + }, + { + "epoch": 9.99, + "learning_rate": 8.890888076718833e-05, + "loss": 0.1338, + "step": 35550 + }, + { + "epoch": 10.0, + "eval_loss": 0.19677478075027466, + "eval_runtime": 480.2192, + "eval_samples_per_second": 33.387, + "eval_steps_per_second": 1.045, + "eval_wer": 0.18540253572257176, + "step": 35570 + }, + { + "epoch": 10.0, + "learning_rate": 8.88901383812826e-05, + "loss": 0.1577, + "step": 35580 + }, + { + "epoch": 10.01, + "learning_rate": 8.887139599537688e-05, + "loss": 0.126, + "step": 35610 + }, + { + "epoch": 10.02, + "learning_rate": 8.885265360947116e-05, + "loss": 0.1397, + "step": 35640 + }, + { + "epoch": 10.03, + "learning_rate": 8.883391122356544e-05, + "loss": 0.1469, + "step": 35670 + }, + { + "epoch": 10.04, + "learning_rate": 8.88151688376597e-05, + "loss": 0.1223, + "step": 35700 + }, + { + "epoch": 10.04, + "learning_rate": 8.879642645175398e-05, + "loss": 0.1476, + "step": 35730 + }, + { + "epoch": 10.05, + "learning_rate": 8.877768406584826e-05, + "loss": 0.1295, + "step": 35760 + }, + { + "epoch": 10.06, + "learning_rate": 8.875894167994253e-05, + "loss": 0.1416, + "step": 35790 + }, + { + "epoch": 10.07, + "learning_rate": 8.874019929403679e-05, + "loss": 0.1501, + "step": 35820 + }, + { + "epoch": 10.08, + "learning_rate": 8.872145690813107e-05, + "loss": 0.1268, + "step": 35850 + }, + { + "epoch": 10.09, + "learning_rate": 8.870271452222536e-05, + "loss": 0.1408, + "step": 35880 + }, + { + "epoch": 10.1, + "learning_rate": 8.868397213631962e-05, + "loss": 0.1251, + "step": 35910 + }, + { + "epoch": 10.1, + "learning_rate": 8.86652297504139e-05, + "loss": 0.1372, + "step": 35940 + }, + { + "epoch": 10.11, + "learning_rate": 8.864648736450817e-05, + "loss": 0.1599, + "step": 35970 + }, + { + "epoch": 10.12, + "learning_rate": 8.862774497860244e-05, + "loss": 0.1254, + "step": 36000 + }, + { + "epoch": 10.13, + "learning_rate": 8.860900259269672e-05, + "loss": 0.1437, + "step": 36030 + }, + { + "epoch": 10.14, + "learning_rate": 8.8590260206791e-05, + "loss": 0.1295, + "step": 36060 + }, + { + "epoch": 10.15, + "learning_rate": 8.857214256708213e-05, + "loss": 0.1405, + "step": 36090 + }, + { + "epoch": 10.15, + "learning_rate": 8.855340018117641e-05, + "loss": 0.1457, + "step": 36120 + }, + { + "epoch": 10.16, + "learning_rate": 8.853465779527068e-05, + "loss": 0.1312, + "step": 36150 + }, + { + "epoch": 10.17, + "learning_rate": 8.851591540936494e-05, + "loss": 0.1476, + "step": 36180 + }, + { + "epoch": 10.18, + "learning_rate": 8.849717302345922e-05, + "loss": 0.1384, + "step": 36210 + }, + { + "epoch": 10.19, + "learning_rate": 8.84784306375535e-05, + "loss": 0.1427, + "step": 36240 + }, + { + "epoch": 10.2, + "learning_rate": 8.845968825164777e-05, + "loss": 0.1544, + "step": 36270 + }, + { + "epoch": 10.21, + "learning_rate": 8.844094586574204e-05, + "loss": 0.1251, + "step": 36300 + }, + { + "epoch": 10.21, + "learning_rate": 8.842220347983632e-05, + "loss": 0.1529, + "step": 36330 + }, + { + "epoch": 10.22, + "learning_rate": 8.840346109393059e-05, + "loss": 0.1352, + "step": 36360 + }, + { + "epoch": 10.23, + "learning_rate": 8.838471870802487e-05, + "loss": 0.1373, + "step": 36390 + }, + { + "epoch": 10.24, + "learning_rate": 8.836597632211915e-05, + "loss": 0.1523, + "step": 36420 + }, + { + "epoch": 10.25, + "learning_rate": 8.834723393621342e-05, + "loss": 0.125, + "step": 36450 + }, + { + "epoch": 10.26, + "learning_rate": 8.832849155030769e-05, + "loss": 0.1466, + "step": 36480 + }, + { + "epoch": 10.26, + "learning_rate": 8.830974916440197e-05, + "loss": 0.1257, + "step": 36510 + }, + { + "epoch": 10.27, + "learning_rate": 8.829100677849625e-05, + "loss": 0.1424, + "step": 36540 + }, + { + "epoch": 10.28, + "learning_rate": 8.827226439259051e-05, + "loss": 0.1519, + "step": 36570 + }, + { + "epoch": 10.29, + "learning_rate": 8.825352200668478e-05, + "loss": 0.1251, + "step": 36600 + }, + { + "epoch": 10.3, + "learning_rate": 8.823477962077906e-05, + "loss": 0.1453, + "step": 36630 + }, + { + "epoch": 10.31, + "learning_rate": 8.821603723487334e-05, + "loss": 0.1313, + "step": 36660 + }, + { + "epoch": 10.31, + "learning_rate": 8.819729484896761e-05, + "loss": 0.1441, + "step": 36690 + }, + { + "epoch": 10.32, + "learning_rate": 8.817855246306188e-05, + "loss": 0.1528, + "step": 36720 + }, + { + "epoch": 10.33, + "learning_rate": 8.815981007715616e-05, + "loss": 0.1278, + "step": 36750 + }, + { + "epoch": 10.34, + "learning_rate": 8.814106769125044e-05, + "loss": 0.1456, + "step": 36780 + }, + { + "epoch": 10.35, + "learning_rate": 8.812232530534471e-05, + "loss": 0.1373, + "step": 36810 + }, + { + "epoch": 10.36, + "learning_rate": 8.810358291943899e-05, + "loss": 0.146, + "step": 36840 + }, + { + "epoch": 10.37, + "learning_rate": 8.808484053353326e-05, + "loss": 0.1453, + "step": 36870 + }, + { + "epoch": 10.37, + "learning_rate": 8.806609814762752e-05, + "loss": 0.1258, + "step": 36900 + }, + { + "epoch": 10.38, + "learning_rate": 8.80473557617218e-05, + "loss": 0.1607, + "step": 36930 + }, + { + "epoch": 10.39, + "learning_rate": 8.802861337581609e-05, + "loss": 0.1325, + "step": 36960 + }, + { + "epoch": 10.4, + "learning_rate": 8.800987098991035e-05, + "loss": 0.1382, + "step": 36990 + }, + { + "epoch": 10.41, + "learning_rate": 8.799112860400462e-05, + "loss": 0.1456, + "step": 37020 + }, + { + "epoch": 10.42, + "learning_rate": 8.79723862180989e-05, + "loss": 0.1236, + "step": 37050 + }, + { + "epoch": 10.42, + "learning_rate": 8.795364383219318e-05, + "loss": 0.1515, + "step": 37080 + }, + { + "epoch": 10.43, + "learning_rate": 8.793490144628745e-05, + "loss": 0.1295, + "step": 37110 + }, + { + "epoch": 10.44, + "learning_rate": 8.791615906038172e-05, + "loss": 0.1371, + "step": 37140 + }, + { + "epoch": 10.45, + "learning_rate": 8.7897416674476e-05, + "loss": 0.151, + "step": 37170 + }, + { + "epoch": 10.46, + "learning_rate": 8.787867428857028e-05, + "loss": 0.122, + "step": 37200 + }, + { + "epoch": 10.47, + "learning_rate": 8.785993190266455e-05, + "loss": 0.1449, + "step": 37230 + }, + { + "epoch": 10.48, + "learning_rate": 8.784118951675883e-05, + "loss": 0.1325, + "step": 37260 + }, + { + "epoch": 10.48, + "learning_rate": 8.78224471308531e-05, + "loss": 0.1402, + "step": 37290 + }, + { + "epoch": 10.49, + "learning_rate": 8.780370474494736e-05, + "loss": 0.1541, + "step": 37320 + }, + { + "epoch": 10.5, + "learning_rate": 8.778496235904164e-05, + "loss": 0.1226, + "step": 37350 + }, + { + "epoch": 10.51, + "learning_rate": 8.776621997313592e-05, + "loss": 0.1441, + "step": 37380 + }, + { + "epoch": 10.52, + "learning_rate": 8.774747758723019e-05, + "loss": 0.1264, + "step": 37410 + }, + { + "epoch": 10.53, + "learning_rate": 8.772873520132446e-05, + "loss": 0.1375, + "step": 37440 + }, + { + "epoch": 10.53, + "learning_rate": 8.770999281541874e-05, + "loss": 0.1486, + "step": 37470 + }, + { + "epoch": 10.54, + "learning_rate": 8.769125042951302e-05, + "loss": 0.1249, + "step": 37500 + }, + { + "epoch": 10.55, + "learning_rate": 8.767250804360729e-05, + "loss": 0.1508, + "step": 37530 + }, + { + "epoch": 10.56, + "learning_rate": 8.765376565770156e-05, + "loss": 0.1286, + "step": 37560 + }, + { + "epoch": 10.57, + "learning_rate": 8.763502327179584e-05, + "loss": 0.1402, + "step": 37590 + }, + { + "epoch": 10.58, + "learning_rate": 8.761628088589012e-05, + "loss": 0.1529, + "step": 37620 + }, + { + "epoch": 10.58, + "learning_rate": 8.759753849998439e-05, + "loss": 0.1225, + "step": 37650 + }, + { + "epoch": 10.59, + "learning_rate": 8.757879611407867e-05, + "loss": 0.1485, + "step": 37680 + }, + { + "epoch": 10.6, + "learning_rate": 8.756005372817293e-05, + "loss": 0.1306, + "step": 37710 + }, + { + "epoch": 10.61, + "learning_rate": 8.75413113422672e-05, + "loss": 0.1424, + "step": 37740 + }, + { + "epoch": 10.62, + "learning_rate": 8.752256895636148e-05, + "loss": 0.1507, + "step": 37770 + }, + { + "epoch": 10.63, + "learning_rate": 8.750382657045576e-05, + "loss": 0.1254, + "step": 37800 + }, + { + "epoch": 10.64, + "learning_rate": 8.748508418455003e-05, + "loss": 0.1455, + "step": 37830 + }, + { + "epoch": 10.64, + "learning_rate": 8.74663417986443e-05, + "loss": 0.134, + "step": 37860 + }, + { + "epoch": 10.65, + "learning_rate": 8.744759941273858e-05, + "loss": 0.1381, + "step": 37890 + }, + { + "epoch": 10.66, + "learning_rate": 8.742885702683286e-05, + "loss": 0.149, + "step": 37920 + }, + { + "epoch": 10.67, + "learning_rate": 8.741011464092713e-05, + "loss": 0.1205, + "step": 37950 + }, + { + "epoch": 10.68, + "learning_rate": 8.73913722550214e-05, + "loss": 0.1481, + "step": 37980 + }, + { + "epoch": 10.69, + "learning_rate": 8.737262986911568e-05, + "loss": 0.1385, + "step": 38010 + }, + { + "epoch": 10.69, + "learning_rate": 8.735388748320996e-05, + "loss": 0.1368, + "step": 38040 + }, + { + "epoch": 10.7, + "learning_rate": 8.733514509730422e-05, + "loss": 0.151, + "step": 38070 + }, + { + "epoch": 10.71, + "learning_rate": 8.73164027113985e-05, + "loss": 0.1279, + "step": 38100 + }, + { + "epoch": 10.72, + "learning_rate": 8.729766032549277e-05, + "loss": 0.1501, + "step": 38130 + }, + { + "epoch": 10.73, + "learning_rate": 8.727891793958704e-05, + "loss": 0.142, + "step": 38160 + }, + { + "epoch": 10.74, + "learning_rate": 8.726017555368132e-05, + "loss": 0.1391, + "step": 38190 + }, + { + "epoch": 10.74, + "learning_rate": 8.72414331677756e-05, + "loss": 0.1548, + "step": 38220 + }, + { + "epoch": 10.75, + "learning_rate": 8.722269078186987e-05, + "loss": 0.1266, + "step": 38250 + }, + { + "epoch": 10.76, + "learning_rate": 8.720394839596414e-05, + "loss": 0.1479, + "step": 38280 + }, + { + "epoch": 10.77, + "learning_rate": 8.718520601005842e-05, + "loss": 0.1385, + "step": 38310 + }, + { + "epoch": 10.78, + "learning_rate": 8.71664636241527e-05, + "loss": 0.1431, + "step": 38340 + }, + { + "epoch": 10.79, + "learning_rate": 8.714772123824697e-05, + "loss": 0.1527, + "step": 38370 + }, + { + "epoch": 10.8, + "learning_rate": 8.712897885234123e-05, + "loss": 0.1253, + "step": 38400 + }, + { + "epoch": 10.8, + "learning_rate": 8.711023646643551e-05, + "loss": 0.1533, + "step": 38430 + }, + { + "epoch": 10.81, + "learning_rate": 8.70914940805298e-05, + "loss": 0.1286, + "step": 38460 + }, + { + "epoch": 10.82, + "learning_rate": 8.707275169462406e-05, + "loss": 0.1318, + "step": 38490 + }, + { + "epoch": 10.83, + "learning_rate": 8.705463405491519e-05, + "loss": 0.1631, + "step": 38520 + }, + { + "epoch": 10.84, + "learning_rate": 8.703589166900947e-05, + "loss": 0.1207, + "step": 38550 + }, + { + "epoch": 10.85, + "learning_rate": 8.701714928310374e-05, + "loss": 0.1482, + "step": 38580 + }, + { + "epoch": 10.85, + "learning_rate": 8.699840689719802e-05, + "loss": 0.1333, + "step": 38610 + }, + { + "epoch": 10.86, + "learning_rate": 8.697966451129229e-05, + "loss": 0.144, + "step": 38640 + }, + { + "epoch": 10.87, + "learning_rate": 8.696092212538657e-05, + "loss": 0.1588, + "step": 38670 + }, + { + "epoch": 10.88, + "learning_rate": 8.694217973948085e-05, + "loss": 0.1212, + "step": 38700 + }, + { + "epoch": 10.89, + "learning_rate": 8.692343735357512e-05, + "loss": 0.1465, + "step": 38730 + }, + { + "epoch": 10.9, + "learning_rate": 8.690469496766938e-05, + "loss": 0.1286, + "step": 38760 + }, + { + "epoch": 10.91, + "learning_rate": 8.688595258176366e-05, + "loss": 0.146, + "step": 38790 + }, + { + "epoch": 10.91, + "learning_rate": 8.686721019585795e-05, + "loss": 0.1503, + "step": 38820 + }, + { + "epoch": 10.92, + "learning_rate": 8.684846780995221e-05, + "loss": 0.1341, + "step": 38850 + }, + { + "epoch": 10.93, + "learning_rate": 8.682972542404648e-05, + "loss": 0.1495, + "step": 38880 + }, + { + "epoch": 10.94, + "learning_rate": 8.681098303814076e-05, + "loss": 0.1285, + "step": 38910 + }, + { + "epoch": 10.95, + "learning_rate": 8.679224065223503e-05, + "loss": 0.1437, + "step": 38940 + }, + { + "epoch": 10.96, + "learning_rate": 8.677349826632931e-05, + "loss": 0.1519, + "step": 38970 + }, + { + "epoch": 10.96, + "learning_rate": 8.675475588042358e-05, + "loss": 0.1245, + "step": 39000 + }, + { + "epoch": 10.97, + "learning_rate": 8.673601349451786e-05, + "loss": 0.1472, + "step": 39030 + }, + { + "epoch": 10.98, + "learning_rate": 8.671727110861213e-05, + "loss": 0.1323, + "step": 39060 + }, + { + "epoch": 10.99, + "learning_rate": 8.66985287227064e-05, + "loss": 0.1388, + "step": 39090 + }, + { + "epoch": 11.0, + "learning_rate": 8.667978633680069e-05, + "loss": 0.1478, + "step": 39120 + }, + { + "epoch": 11.0, + "eval_loss": 0.1963042914867401, + "eval_runtime": 479.3311, + "eval_samples_per_second": 33.449, + "eval_steps_per_second": 1.047, + "eval_wer": 0.18230453236526414, + "step": 39127 + }, + { + "epoch": 11.01, + "learning_rate": 8.666104395089496e-05, + "loss": 0.1225, + "step": 39150 + }, + { + "epoch": 11.01, + "learning_rate": 8.664230156498922e-05, + "loss": 0.1408, + "step": 39180 + }, + { + "epoch": 11.02, + "learning_rate": 8.66235591790835e-05, + "loss": 0.1196, + "step": 39210 + }, + { + "epoch": 11.03, + "learning_rate": 8.660481679317778e-05, + "loss": 0.135, + "step": 39240 + }, + { + "epoch": 11.04, + "learning_rate": 8.658607440727205e-05, + "loss": 0.1295, + "step": 39270 + }, + { + "epoch": 11.05, + "learning_rate": 8.656733202136632e-05, + "loss": 0.1283, + "step": 39300 + }, + { + "epoch": 11.06, + "learning_rate": 8.65485896354606e-05, + "loss": 0.1426, + "step": 39330 + }, + { + "epoch": 11.07, + "learning_rate": 8.652984724955487e-05, + "loss": 0.1163, + "step": 39360 + }, + { + "epoch": 11.07, + "learning_rate": 8.651110486364915e-05, + "loss": 0.1324, + "step": 39390 + }, + { + "epoch": 11.08, + "learning_rate": 8.649236247774342e-05, + "loss": 0.1245, + "step": 39420 + }, + { + "epoch": 11.09, + "learning_rate": 8.64736200918377e-05, + "loss": 0.1335, + "step": 39450 + }, + { + "epoch": 11.1, + "learning_rate": 8.645487770593196e-05, + "loss": 0.1421, + "step": 39480 + }, + { + "epoch": 11.11, + "learning_rate": 8.643613532002625e-05, + "loss": 0.119, + "step": 39510 + }, + { + "epoch": 11.12, + "learning_rate": 8.641739293412053e-05, + "loss": 0.1411, + "step": 39540 + }, + { + "epoch": 11.12, + "learning_rate": 8.63986505482148e-05, + "loss": 0.1278, + "step": 39570 + }, + { + "epoch": 11.13, + "learning_rate": 8.637990816230906e-05, + "loss": 0.1336, + "step": 39600 + }, + { + "epoch": 11.14, + "learning_rate": 8.636116577640334e-05, + "loss": 0.143, + "step": 39630 + }, + { + "epoch": 11.15, + "learning_rate": 8.634242339049762e-05, + "loss": 0.1256, + "step": 39660 + }, + { + "epoch": 11.16, + "learning_rate": 8.632368100459189e-05, + "loss": 0.1332, + "step": 39690 + }, + { + "epoch": 11.17, + "learning_rate": 8.630493861868616e-05, + "loss": 0.1258, + "step": 39720 + }, + { + "epoch": 11.18, + "learning_rate": 8.628619623278044e-05, + "loss": 0.1286, + "step": 39750 + }, + { + "epoch": 11.18, + "learning_rate": 8.62674538468747e-05, + "loss": 0.1467, + "step": 39780 + }, + { + "epoch": 11.19, + "learning_rate": 8.624871146096899e-05, + "loss": 0.1143, + "step": 39810 + }, + { + "epoch": 11.2, + "learning_rate": 8.622996907506325e-05, + "loss": 0.1353, + "step": 39840 + }, + { + "epoch": 11.21, + "learning_rate": 8.621122668915754e-05, + "loss": 0.1315, + "step": 39870 + }, + { + "epoch": 11.22, + "learning_rate": 8.61924843032518e-05, + "loss": 0.1311, + "step": 39900 + }, + { + "epoch": 11.23, + "learning_rate": 8.617374191734608e-05, + "loss": 0.1403, + "step": 39930 + }, + { + "epoch": 11.23, + "learning_rate": 8.615499953144037e-05, + "loss": 0.1215, + "step": 39960 + }, + { + "epoch": 11.24, + "learning_rate": 8.613625714553463e-05, + "loss": 0.1423, + "step": 39990 + }, + { + "epoch": 11.25, + "learning_rate": 8.61175147596289e-05, + "loss": 0.1286, + "step": 40020 + }, + { + "epoch": 11.26, + "learning_rate": 8.609877237372318e-05, + "loss": 0.1436, + "step": 40050 + }, + { + "epoch": 11.27, + "learning_rate": 8.608002998781746e-05, + "loss": 0.1448, + "step": 40080 + }, + { + "epoch": 11.28, + "learning_rate": 8.606128760191172e-05, + "loss": 0.1137, + "step": 40110 + }, + { + "epoch": 11.28, + "learning_rate": 8.6042545216006e-05, + "loss": 0.1395, + "step": 40140 + }, + { + "epoch": 11.29, + "learning_rate": 8.602380283010028e-05, + "loss": 0.129, + "step": 40170 + }, + { + "epoch": 11.3, + "learning_rate": 8.600506044419455e-05, + "loss": 0.1381, + "step": 40200 + }, + { + "epoch": 11.31, + "learning_rate": 8.598631805828883e-05, + "loss": 0.1547, + "step": 40230 + }, + { + "epoch": 11.32, + "learning_rate": 8.59675756723831e-05, + "loss": 0.1182, + "step": 40260 + }, + { + "epoch": 11.33, + "learning_rate": 8.594883328647737e-05, + "loss": 0.1422, + "step": 40290 + }, + { + "epoch": 11.34, + "learning_rate": 8.593009090057164e-05, + "loss": 0.1323, + "step": 40320 + }, + { + "epoch": 11.34, + "learning_rate": 8.591134851466592e-05, + "loss": 0.1241, + "step": 40350 + }, + { + "epoch": 11.35, + "learning_rate": 8.58926061287602e-05, + "loss": 0.1451, + "step": 40380 + }, + { + "epoch": 11.36, + "learning_rate": 8.587386374285447e-05, + "loss": 0.1225, + "step": 40410 + }, + { + "epoch": 11.37, + "learning_rate": 8.585512135694874e-05, + "loss": 0.1381, + "step": 40440 + }, + { + "epoch": 11.38, + "learning_rate": 8.583637897104302e-05, + "loss": 0.1275, + "step": 40470 + }, + { + "epoch": 11.39, + "learning_rate": 8.58176365851373e-05, + "loss": 0.1301, + "step": 40500 + }, + { + "epoch": 11.39, + "learning_rate": 8.579889419923155e-05, + "loss": 0.1473, + "step": 40530 + }, + { + "epoch": 11.4, + "learning_rate": 8.578015181332584e-05, + "loss": 0.1212, + "step": 40560 + }, + { + "epoch": 11.41, + "learning_rate": 8.576140942742012e-05, + "loss": 0.1399, + "step": 40590 + }, + { + "epoch": 11.42, + "learning_rate": 8.57426670415144e-05, + "loss": 0.1206, + "step": 40620 + }, + { + "epoch": 11.43, + "learning_rate": 8.572392465560866e-05, + "loss": 0.1391, + "step": 40650 + }, + { + "epoch": 11.44, + "learning_rate": 8.570518226970293e-05, + "loss": 0.1464, + "step": 40680 + }, + { + "epoch": 11.44, + "learning_rate": 8.568643988379721e-05, + "loss": 0.1203, + "step": 40710 + }, + { + "epoch": 11.45, + "learning_rate": 8.566769749789148e-05, + "loss": 0.1393, + "step": 40740 + }, + { + "epoch": 11.46, + "learning_rate": 8.564895511198576e-05, + "loss": 0.1302, + "step": 40770 + }, + { + "epoch": 11.47, + "learning_rate": 8.563021272608004e-05, + "loss": 0.1356, + "step": 40800 + }, + { + "epoch": 11.48, + "learning_rate": 8.561147034017431e-05, + "loss": 0.1402, + "step": 40830 + }, + { + "epoch": 11.49, + "learning_rate": 8.559272795426858e-05, + "loss": 0.1223, + "step": 40860 + }, + { + "epoch": 11.5, + "learning_rate": 8.557398556836286e-05, + "loss": 0.1409, + "step": 40890 + }, + { + "epoch": 11.5, + "learning_rate": 8.555524318245714e-05, + "loss": 0.1258, + "step": 40920 + }, + { + "epoch": 11.51, + "learning_rate": 8.55365007965514e-05, + "loss": 0.1279, + "step": 40950 + }, + { + "epoch": 11.52, + "learning_rate": 8.551775841064567e-05, + "loss": 0.1434, + "step": 40980 + }, + { + "epoch": 11.53, + "learning_rate": 8.549901602473995e-05, + "loss": 0.1148, + "step": 41010 + }, + { + "epoch": 11.54, + "learning_rate": 8.548027363883424e-05, + "loss": 0.1429, + "step": 41040 + }, + { + "epoch": 11.55, + "learning_rate": 8.54615312529285e-05, + "loss": 0.1257, + "step": 41070 + }, + { + "epoch": 11.55, + "learning_rate": 8.544278886702277e-05, + "loss": 0.1344, + "step": 41100 + }, + { + "epoch": 11.56, + "learning_rate": 8.542404648111705e-05, + "loss": 0.1427, + "step": 41130 + }, + { + "epoch": 11.57, + "learning_rate": 8.540530409521132e-05, + "loss": 0.1237, + "step": 41160 + }, + { + "epoch": 11.58, + "learning_rate": 8.53865617093056e-05, + "loss": 0.1369, + "step": 41190 + }, + { + "epoch": 11.59, + "learning_rate": 8.536781932339988e-05, + "loss": 0.129, + "step": 41220 + }, + { + "epoch": 11.6, + "learning_rate": 8.534907693749415e-05, + "loss": 0.1385, + "step": 41250 + }, + { + "epoch": 11.61, + "learning_rate": 8.533033455158842e-05, + "loss": 0.1428, + "step": 41280 + }, + { + "epoch": 11.61, + "learning_rate": 8.53115921656827e-05, + "loss": 0.1188, + "step": 41310 + }, + { + "epoch": 11.62, + "learning_rate": 8.529284977977698e-05, + "loss": 0.1442, + "step": 41340 + }, + { + "epoch": 11.63, + "learning_rate": 8.527410739387125e-05, + "loss": 0.132, + "step": 41370 + }, + { + "epoch": 11.64, + "learning_rate": 8.525536500796551e-05, + "loss": 0.137, + "step": 41400 + }, + { + "epoch": 11.65, + "learning_rate": 8.52366226220598e-05, + "loss": 0.1439, + "step": 41430 + }, + { + "epoch": 11.66, + "learning_rate": 8.521788023615407e-05, + "loss": 0.1165, + "step": 41460 + }, + { + "epoch": 11.66, + "learning_rate": 8.519913785024834e-05, + "loss": 0.1331, + "step": 41490 + }, + { + "epoch": 11.67, + "learning_rate": 8.518039546434261e-05, + "loss": 0.1333, + "step": 41520 + }, + { + "epoch": 11.68, + "learning_rate": 8.516165307843689e-05, + "loss": 0.1305, + "step": 41550 + }, + { + "epoch": 11.69, + "learning_rate": 8.514291069253116e-05, + "loss": 0.1469, + "step": 41580 + }, + { + "epoch": 11.7, + "learning_rate": 8.512416830662544e-05, + "loss": 0.1196, + "step": 41610 + }, + { + "epoch": 11.71, + "learning_rate": 8.510542592071972e-05, + "loss": 0.1409, + "step": 41640 + }, + { + "epoch": 11.71, + "learning_rate": 8.508668353481399e-05, + "loss": 0.1287, + "step": 41670 + }, + { + "epoch": 11.72, + "learning_rate": 8.506794114890825e-05, + "loss": 0.1311, + "step": 41700 + }, + { + "epoch": 11.73, + "learning_rate": 8.504919876300254e-05, + "loss": 0.1521, + "step": 41730 + }, + { + "epoch": 11.74, + "learning_rate": 8.503045637709682e-05, + "loss": 0.1193, + "step": 41760 + }, + { + "epoch": 11.75, + "learning_rate": 8.501171399119108e-05, + "loss": 0.1292, + "step": 41790 + }, + { + "epoch": 11.76, + "learning_rate": 8.499297160528535e-05, + "loss": 0.1316, + "step": 41820 + }, + { + "epoch": 11.77, + "learning_rate": 8.497422921937963e-05, + "loss": 0.1282, + "step": 41850 + }, + { + "epoch": 11.77, + "learning_rate": 8.495548683347391e-05, + "loss": 0.1428, + "step": 41880 + }, + { + "epoch": 11.78, + "learning_rate": 8.493674444756818e-05, + "loss": 0.1231, + "step": 41910 + }, + { + "epoch": 11.79, + "learning_rate": 8.491800206166245e-05, + "loss": 0.1375, + "step": 41940 + }, + { + "epoch": 11.8, + "learning_rate": 8.489925967575673e-05, + "loss": 0.1259, + "step": 41970 + }, + { + "epoch": 11.81, + "learning_rate": 8.4880517289851e-05, + "loss": 0.1291, + "step": 42000 + }, + { + "epoch": 11.82, + "learning_rate": 8.486177490394528e-05, + "loss": 0.1446, + "step": 42030 + }, + { + "epoch": 11.82, + "learning_rate": 8.484303251803956e-05, + "loss": 0.12, + "step": 42060 + }, + { + "epoch": 11.83, + "learning_rate": 8.482429013213383e-05, + "loss": 0.1332, + "step": 42090 + }, + { + "epoch": 11.84, + "learning_rate": 8.480617249242495e-05, + "loss": 0.1232, + "step": 42120 + }, + { + "epoch": 11.85, + "learning_rate": 8.478743010651923e-05, + "loss": 0.1266, + "step": 42150 + }, + { + "epoch": 11.86, + "learning_rate": 8.47686877206135e-05, + "loss": 0.1501, + "step": 42180 + }, + { + "epoch": 11.87, + "learning_rate": 8.474994533470778e-05, + "loss": 0.1221, + "step": 42210 + }, + { + "epoch": 11.88, + "learning_rate": 8.473120294880206e-05, + "loss": 0.1365, + "step": 42240 + }, + { + "epoch": 11.88, + "learning_rate": 8.471246056289632e-05, + "loss": 0.1262, + "step": 42270 + }, + { + "epoch": 11.89, + "learning_rate": 8.46937181769906e-05, + "loss": 0.1313, + "step": 42300 + }, + { + "epoch": 11.9, + "learning_rate": 8.467497579108488e-05, + "loss": 0.1452, + "step": 42330 + }, + { + "epoch": 11.91, + "learning_rate": 8.465623340517915e-05, + "loss": 0.1246, + "step": 42360 + }, + { + "epoch": 11.92, + "learning_rate": 8.463749101927343e-05, + "loss": 0.1378, + "step": 42390 + }, + { + "epoch": 11.93, + "learning_rate": 8.46187486333677e-05, + "loss": 0.1265, + "step": 42420 + }, + { + "epoch": 11.93, + "learning_rate": 8.460000624746198e-05, + "loss": 0.1343, + "step": 42450 + }, + { + "epoch": 11.94, + "learning_rate": 8.458126386155624e-05, + "loss": 0.1391, + "step": 42480 + }, + { + "epoch": 11.95, + "learning_rate": 8.456252147565052e-05, + "loss": 0.1157, + "step": 42510 + }, + { + "epoch": 11.96, + "learning_rate": 8.454377908974479e-05, + "loss": 0.1359, + "step": 42540 + }, + { + "epoch": 11.97, + "learning_rate": 8.452503670383907e-05, + "loss": 0.1298, + "step": 42570 + }, + { + "epoch": 11.98, + "learning_rate": 8.450629431793334e-05, + "loss": 0.1291, + "step": 42600 + }, + { + "epoch": 11.98, + "learning_rate": 8.448755193202762e-05, + "loss": 0.1352, + "step": 42630 + }, + { + "epoch": 11.99, + "learning_rate": 8.44688095461219e-05, + "loss": 0.1177, + "step": 42660 + }, + { + "epoch": 12.0, + "eval_loss": 0.19564659893512726, + "eval_runtime": 478.632, + "eval_samples_per_second": 33.498, + "eval_steps_per_second": 1.049, + "eval_wer": 0.17997079415337164, + "step": 42684 + }, + { + "epoch": 12.0, + "learning_rate": 8.445006716021616e-05, + "loss": 0.1475, + "step": 42690 + }, + { + "epoch": 12.01, + "learning_rate": 8.443132477431044e-05, + "loss": 0.1208, + "step": 42720 + }, + { + "epoch": 12.02, + "learning_rate": 8.441258238840472e-05, + "loss": 0.1224, + "step": 42750 + }, + { + "epoch": 12.03, + "learning_rate": 8.439384000249899e-05, + "loss": 0.1231, + "step": 42780 + }, + { + "epoch": 12.04, + "learning_rate": 8.437509761659327e-05, + "loss": 0.1231, + "step": 42810 + }, + { + "epoch": 12.04, + "learning_rate": 8.435635523068753e-05, + "loss": 0.1325, + "step": 42840 + }, + { + "epoch": 12.05, + "learning_rate": 8.433761284478181e-05, + "loss": 0.1167, + "step": 42870 + }, + { + "epoch": 12.06, + "learning_rate": 8.431887045887608e-05, + "loss": 0.1336, + "step": 42900 + }, + { + "epoch": 12.07, + "learning_rate": 8.430012807297036e-05, + "loss": 0.1248, + "step": 42930 + }, + { + "epoch": 12.08, + "learning_rate": 8.428138568706463e-05, + "loss": 0.1246, + "step": 42960 + }, + { + "epoch": 12.09, + "learning_rate": 8.426264330115891e-05, + "loss": 0.1269, + "step": 42990 + }, + { + "epoch": 12.09, + "learning_rate": 8.424390091525318e-05, + "loss": 0.1137, + "step": 43020 + }, + { + "epoch": 12.1, + "learning_rate": 8.422515852934746e-05, + "loss": 0.1239, + "step": 43050 + }, + { + "epoch": 12.11, + "learning_rate": 8.420641614344174e-05, + "loss": 0.1295, + "step": 43080 + }, + { + "epoch": 12.12, + "learning_rate": 8.4187673757536e-05, + "loss": 0.1244, + "step": 43110 + }, + { + "epoch": 12.13, + "learning_rate": 8.416893137163028e-05, + "loss": 0.136, + "step": 43140 + }, + { + "epoch": 12.14, + "learning_rate": 8.415018898572456e-05, + "loss": 0.1142, + "step": 43170 + }, + { + "epoch": 12.15, + "learning_rate": 8.413144659981882e-05, + "loss": 0.1349, + "step": 43200 + }, + { + "epoch": 12.15, + "learning_rate": 8.41127042139131e-05, + "loss": 0.1246, + "step": 43230 + }, + { + "epoch": 12.16, + "learning_rate": 8.409396182800737e-05, + "loss": 0.1244, + "step": 43260 + }, + { + "epoch": 12.17, + "learning_rate": 8.407521944210165e-05, + "loss": 0.1357, + "step": 43290 + }, + { + "epoch": 12.18, + "learning_rate": 8.405647705619592e-05, + "loss": 0.1175, + "step": 43320 + }, + { + "epoch": 12.19, + "learning_rate": 8.40377346702902e-05, + "loss": 0.1322, + "step": 43350 + }, + { + "epoch": 12.2, + "learning_rate": 8.401899228438447e-05, + "loss": 0.1274, + "step": 43380 + }, + { + "epoch": 12.2, + "learning_rate": 8.400024989847875e-05, + "loss": 0.1226, + "step": 43410 + }, + { + "epoch": 12.21, + "learning_rate": 8.398150751257302e-05, + "loss": 0.1399, + "step": 43440 + }, + { + "epoch": 12.22, + "learning_rate": 8.39627651266673e-05, + "loss": 0.1195, + "step": 43470 + }, + { + "epoch": 12.23, + "learning_rate": 8.394402274076158e-05, + "loss": 0.13, + "step": 43500 + }, + { + "epoch": 12.24, + "learning_rate": 8.392528035485583e-05, + "loss": 0.1324, + "step": 43530 + }, + { + "epoch": 12.25, + "learning_rate": 8.390653796895011e-05, + "loss": 0.1257, + "step": 43560 + }, + { + "epoch": 12.25, + "learning_rate": 8.38877955830444e-05, + "loss": 0.1363, + "step": 43590 + }, + { + "epoch": 12.26, + "learning_rate": 8.386905319713866e-05, + "loss": 0.1137, + "step": 43620 + }, + { + "epoch": 12.27, + "learning_rate": 8.385031081123294e-05, + "loss": 0.1262, + "step": 43650 + }, + { + "epoch": 12.28, + "learning_rate": 8.383156842532721e-05, + "loss": 0.1309, + "step": 43680 + }, + { + "epoch": 12.29, + "learning_rate": 8.381282603942149e-05, + "loss": 0.1266, + "step": 43710 + }, + { + "epoch": 12.3, + "learning_rate": 8.379408365351576e-05, + "loss": 0.1372, + "step": 43740 + }, + { + "epoch": 12.31, + "learning_rate": 8.377534126761004e-05, + "loss": 0.1164, + "step": 43770 + }, + { + "epoch": 12.31, + "learning_rate": 8.375659888170431e-05, + "loss": 0.1326, + "step": 43800 + }, + { + "epoch": 12.32, + "learning_rate": 8.373785649579859e-05, + "loss": 0.1297, + "step": 43830 + }, + { + "epoch": 12.33, + "learning_rate": 8.371911410989286e-05, + "loss": 0.1234, + "step": 43860 + }, + { + "epoch": 12.34, + "learning_rate": 8.370037172398714e-05, + "loss": 0.1377, + "step": 43890 + }, + { + "epoch": 12.35, + "learning_rate": 8.368162933808142e-05, + "loss": 0.1154, + "step": 43920 + }, + { + "epoch": 12.36, + "learning_rate": 8.366288695217567e-05, + "loss": 0.1382, + "step": 43950 + }, + { + "epoch": 12.36, + "learning_rate": 8.364414456626995e-05, + "loss": 0.1308, + "step": 43980 + }, + { + "epoch": 12.37, + "learning_rate": 8.362540218036423e-05, + "loss": 0.1279, + "step": 44010 + }, + { + "epoch": 12.38, + "learning_rate": 8.360665979445851e-05, + "loss": 0.1345, + "step": 44040 + }, + { + "epoch": 12.39, + "learning_rate": 8.358791740855278e-05, + "loss": 0.1167, + "step": 44070 + }, + { + "epoch": 12.4, + "learning_rate": 8.356917502264705e-05, + "loss": 0.1296, + "step": 44100 + }, + { + "epoch": 12.41, + "learning_rate": 8.355043263674133e-05, + "loss": 0.1288, + "step": 44130 + }, + { + "epoch": 12.41, + "learning_rate": 8.35316902508356e-05, + "loss": 0.121, + "step": 44160 + }, + { + "epoch": 12.42, + "learning_rate": 8.351294786492988e-05, + "loss": 0.1304, + "step": 44190 + }, + { + "epoch": 12.43, + "learning_rate": 8.349420547902415e-05, + "loss": 0.1198, + "step": 44220 + }, + { + "epoch": 12.44, + "learning_rate": 8.347546309311843e-05, + "loss": 0.1348, + "step": 44250 + }, + { + "epoch": 12.45, + "learning_rate": 8.34567207072127e-05, + "loss": 0.1269, + "step": 44280 + }, + { + "epoch": 12.46, + "learning_rate": 8.343797832130698e-05, + "loss": 0.1216, + "step": 44310 + }, + { + "epoch": 12.47, + "learning_rate": 8.341923593540126e-05, + "loss": 0.1321, + "step": 44340 + }, + { + "epoch": 12.47, + "learning_rate": 8.340049354949551e-05, + "loss": 0.1204, + "step": 44370 + }, + { + "epoch": 12.48, + "learning_rate": 8.338175116358979e-05, + "loss": 0.1322, + "step": 44400 + }, + { + "epoch": 12.49, + "learning_rate": 8.336300877768407e-05, + "loss": 0.1259, + "step": 44430 + }, + { + "epoch": 12.5, + "learning_rate": 8.334426639177835e-05, + "loss": 0.1233, + "step": 44460 + }, + { + "epoch": 12.51, + "learning_rate": 8.332552400587261e-05, + "loss": 0.1342, + "step": 44490 + }, + { + "epoch": 12.52, + "learning_rate": 8.330678161996689e-05, + "loss": 0.1143, + "step": 44520 + }, + { + "epoch": 12.52, + "learning_rate": 8.328803923406117e-05, + "loss": 0.1335, + "step": 44550 + }, + { + "epoch": 12.53, + "learning_rate": 8.326929684815544e-05, + "loss": 0.1285, + "step": 44580 + }, + { + "epoch": 12.54, + "learning_rate": 8.325055446224972e-05, + "loss": 0.1218, + "step": 44610 + }, + { + "epoch": 12.55, + "learning_rate": 8.323181207634399e-05, + "loss": 0.1364, + "step": 44640 + }, + { + "epoch": 12.56, + "learning_rate": 8.321306969043827e-05, + "loss": 0.1171, + "step": 44670 + }, + { + "epoch": 12.57, + "learning_rate": 8.319432730453253e-05, + "loss": 0.1374, + "step": 44700 + }, + { + "epoch": 12.58, + "learning_rate": 8.317558491862681e-05, + "loss": 0.1288, + "step": 44730 + }, + { + "epoch": 12.58, + "learning_rate": 8.31568425327211e-05, + "loss": 0.126, + "step": 44760 + }, + { + "epoch": 12.59, + "learning_rate": 8.313810014681536e-05, + "loss": 0.1404, + "step": 44790 + }, + { + "epoch": 12.6, + "learning_rate": 8.311935776090963e-05, + "loss": 0.1171, + "step": 44820 + }, + { + "epoch": 12.61, + "learning_rate": 8.310061537500391e-05, + "loss": 0.1304, + "step": 44850 + }, + { + "epoch": 12.62, + "learning_rate": 8.308187298909819e-05, + "loss": 0.1322, + "step": 44880 + }, + { + "epoch": 12.63, + "learning_rate": 8.306313060319245e-05, + "loss": 0.1237, + "step": 44910 + }, + { + "epoch": 12.63, + "learning_rate": 8.304438821728673e-05, + "loss": 0.1353, + "step": 44940 + }, + { + "epoch": 12.64, + "learning_rate": 8.302564583138101e-05, + "loss": 0.1161, + "step": 44970 + }, + { + "epoch": 12.65, + "learning_rate": 8.300690344547528e-05, + "loss": 0.1297, + "step": 45000 + }, + { + "epoch": 12.66, + "learning_rate": 8.298816105956956e-05, + "loss": 0.1286, + "step": 45030 + }, + { + "epoch": 12.67, + "learning_rate": 8.296941867366382e-05, + "loss": 0.1245, + "step": 45060 + }, + { + "epoch": 12.68, + "learning_rate": 8.29506762877581e-05, + "loss": 0.1329, + "step": 45090 + }, + { + "epoch": 12.68, + "learning_rate": 8.293193390185237e-05, + "loss": 0.1151, + "step": 45120 + }, + { + "epoch": 12.69, + "learning_rate": 8.291319151594665e-05, + "loss": 0.1302, + "step": 45150 + }, + { + "epoch": 12.7, + "learning_rate": 8.289444913004093e-05, + "loss": 0.1284, + "step": 45180 + }, + { + "epoch": 12.71, + "learning_rate": 8.28757067441352e-05, + "loss": 0.1236, + "step": 45210 + }, + { + "epoch": 12.72, + "learning_rate": 8.285696435822947e-05, + "loss": 0.1403, + "step": 45240 + }, + { + "epoch": 12.73, + "learning_rate": 8.283822197232375e-05, + "loss": 0.112, + "step": 45270 + }, + { + "epoch": 12.74, + "learning_rate": 8.281947958641803e-05, + "loss": 0.1292, + "step": 45300 + }, + { + "epoch": 12.74, + "learning_rate": 8.280073720051228e-05, + "loss": 0.1273, + "step": 45330 + }, + { + "epoch": 12.75, + "learning_rate": 8.278199481460657e-05, + "loss": 0.1233, + "step": 45360 + }, + { + "epoch": 12.76, + "learning_rate": 8.276325242870085e-05, + "loss": 0.1404, + "step": 45390 + }, + { + "epoch": 12.77, + "learning_rate": 8.274451004279511e-05, + "loss": 0.1222, + "step": 45420 + }, + { + "epoch": 12.78, + "learning_rate": 8.27257676568894e-05, + "loss": 0.1301, + "step": 45450 + }, + { + "epoch": 12.79, + "learning_rate": 8.270702527098366e-05, + "loss": 0.1326, + "step": 45480 + }, + { + "epoch": 12.79, + "learning_rate": 8.268828288507794e-05, + "loss": 0.1243, + "step": 45510 + }, + { + "epoch": 12.8, + "learning_rate": 8.266954049917221e-05, + "loss": 0.1403, + "step": 45540 + }, + { + "epoch": 12.81, + "learning_rate": 8.265079811326649e-05, + "loss": 0.1198, + "step": 45570 + }, + { + "epoch": 12.82, + "learning_rate": 8.263205572736077e-05, + "loss": 0.1254, + "step": 45600 + }, + { + "epoch": 12.83, + "learning_rate": 8.261331334145504e-05, + "loss": 0.1306, + "step": 45630 + }, + { + "epoch": 12.84, + "learning_rate": 8.259457095554931e-05, + "loss": 0.1267, + "step": 45660 + }, + { + "epoch": 12.84, + "learning_rate": 8.257582856964359e-05, + "loss": 0.139, + "step": 45690 + }, + { + "epoch": 12.85, + "learning_rate": 8.255708618373787e-05, + "loss": 0.1106, + "step": 45720 + }, + { + "epoch": 12.86, + "learning_rate": 8.2538968544029e-05, + "loss": 0.1351, + "step": 45750 + }, + { + "epoch": 12.87, + "learning_rate": 8.252022615812326e-05, + "loss": 0.1265, + "step": 45780 + }, + { + "epoch": 12.88, + "learning_rate": 8.250148377221753e-05, + "loss": 0.1185, + "step": 45810 + }, + { + "epoch": 12.89, + "learning_rate": 8.248274138631181e-05, + "loss": 0.1317, + "step": 45840 + }, + { + "epoch": 12.9, + "learning_rate": 8.24639990004061e-05, + "loss": 0.1265, + "step": 45870 + }, + { + "epoch": 12.9, + "learning_rate": 8.244525661450036e-05, + "loss": 0.1248, + "step": 45900 + }, + { + "epoch": 12.91, + "learning_rate": 8.242651422859464e-05, + "loss": 0.1273, + "step": 45930 + }, + { + "epoch": 12.92, + "learning_rate": 8.240777184268891e-05, + "loss": 0.1254, + "step": 45960 + }, + { + "epoch": 12.93, + "learning_rate": 8.238902945678319e-05, + "loss": 0.1422, + "step": 45990 + }, + { + "epoch": 12.94, + "learning_rate": 8.237028707087746e-05, + "loss": 0.1225, + "step": 46020 + }, + { + "epoch": 12.95, + "learning_rate": 8.235154468497174e-05, + "loss": 0.1304, + "step": 46050 + }, + { + "epoch": 12.95, + "learning_rate": 8.2332802299066e-05, + "loss": 0.1287, + "step": 46080 + }, + { + "epoch": 12.96, + "learning_rate": 8.231405991316027e-05, + "loss": 0.1254, + "step": 46110 + }, + { + "epoch": 12.97, + "learning_rate": 8.229531752725455e-05, + "loss": 0.1448, + "step": 46140 + }, + { + "epoch": 12.98, + "learning_rate": 8.227657514134884e-05, + "loss": 0.117, + "step": 46170 + }, + { + "epoch": 12.99, + "learning_rate": 8.22578327554431e-05, + "loss": 0.1298, + "step": 46200 + }, + { + "epoch": 13.0, + "learning_rate": 8.223909036953737e-05, + "loss": 0.1245, + "step": 46230 + }, + { + "epoch": 13.0, + "eval_loss": 0.1889359951019287, + "eval_runtime": 478.3965, + "eval_samples_per_second": 33.514, + "eval_steps_per_second": 1.049, + "eval_wer": 0.17316746959998908, + "step": 46241 + }, + { + "epoch": 13.01, + "learning_rate": 8.222034798363165e-05, + "loss": 0.1197, + "step": 46260 + }, + { + "epoch": 13.01, + "learning_rate": 8.220160559772593e-05, + "loss": 0.1297, + "step": 46290 + }, + { + "epoch": 13.02, + "learning_rate": 8.21828632118202e-05, + "loss": 0.1108, + "step": 46320 + }, + { + "epoch": 13.03, + "learning_rate": 8.216412082591448e-05, + "loss": 0.1317, + "step": 46350 + }, + { + "epoch": 13.04, + "learning_rate": 8.214537844000875e-05, + "loss": 0.1133, + "step": 46380 + }, + { + "epoch": 13.05, + "learning_rate": 8.212663605410303e-05, + "loss": 0.1236, + "step": 46410 + }, + { + "epoch": 13.06, + "learning_rate": 8.21078936681973e-05, + "loss": 0.1254, + "step": 46440 + }, + { + "epoch": 13.06, + "learning_rate": 8.208915128229158e-05, + "loss": 0.1126, + "step": 46470 + }, + { + "epoch": 13.07, + "learning_rate": 8.207040889638585e-05, + "loss": 0.1321, + "step": 46500 + }, + { + "epoch": 13.08, + "learning_rate": 8.205166651048011e-05, + "loss": 0.1185, + "step": 46530 + }, + { + "epoch": 13.09, + "learning_rate": 8.20329241245744e-05, + "loss": 0.1262, + "step": 46560 + }, + { + "epoch": 13.1, + "learning_rate": 8.201418173866867e-05, + "loss": 0.1228, + "step": 46590 + }, + { + "epoch": 13.11, + "learning_rate": 8.199543935276294e-05, + "loss": 0.1105, + "step": 46620 + }, + { + "epoch": 13.11, + "learning_rate": 8.197669696685721e-05, + "loss": 0.1295, + "step": 46650 + }, + { + "epoch": 13.12, + "learning_rate": 8.195795458095149e-05, + "loss": 0.1089, + "step": 46680 + }, + { + "epoch": 13.13, + "learning_rate": 8.193921219504577e-05, + "loss": 0.1168, + "step": 46710 + }, + { + "epoch": 13.14, + "learning_rate": 8.192046980914004e-05, + "loss": 0.1319, + "step": 46740 + }, + { + "epoch": 13.15, + "learning_rate": 8.190172742323432e-05, + "loss": 0.1141, + "step": 46770 + }, + { + "epoch": 13.16, + "learning_rate": 8.188298503732859e-05, + "loss": 0.1327, + "step": 46800 + }, + { + "epoch": 13.17, + "learning_rate": 8.186424265142287e-05, + "loss": 0.1142, + "step": 46830 + }, + { + "epoch": 13.17, + "learning_rate": 8.184550026551714e-05, + "loss": 0.1268, + "step": 46860 + }, + { + "epoch": 13.18, + "learning_rate": 8.182675787961142e-05, + "loss": 0.1296, + "step": 46890 + }, + { + "epoch": 13.19, + "learning_rate": 8.180801549370568e-05, + "loss": 0.1103, + "step": 46920 + }, + { + "epoch": 13.2, + "learning_rate": 8.178927310779995e-05, + "loss": 0.1404, + "step": 46950 + }, + { + "epoch": 13.21, + "learning_rate": 8.177053072189423e-05, + "loss": 0.1145, + "step": 46980 + }, + { + "epoch": 13.22, + "learning_rate": 8.175178833598851e-05, + "loss": 0.1248, + "step": 47010 + }, + { + "epoch": 13.22, + "learning_rate": 8.173304595008278e-05, + "loss": 0.123, + "step": 47040 + }, + { + "epoch": 13.23, + "learning_rate": 8.171430356417705e-05, + "loss": 0.11, + "step": 47070 + }, + { + "epoch": 13.24, + "learning_rate": 8.169556117827133e-05, + "loss": 0.1269, + "step": 47100 + }, + { + "epoch": 13.25, + "learning_rate": 8.167681879236561e-05, + "loss": 0.118, + "step": 47130 + }, + { + "epoch": 13.26, + "learning_rate": 8.165807640645988e-05, + "loss": 0.1306, + "step": 47160 + }, + { + "epoch": 13.27, + "learning_rate": 8.163933402055416e-05, + "loss": 0.1242, + "step": 47190 + }, + { + "epoch": 13.28, + "learning_rate": 8.162059163464843e-05, + "loss": 0.1105, + "step": 47220 + }, + { + "epoch": 13.28, + "learning_rate": 8.16018492487427e-05, + "loss": 0.1311, + "step": 47250 + }, + { + "epoch": 13.29, + "learning_rate": 8.158310686283697e-05, + "loss": 0.1116, + "step": 47280 + }, + { + "epoch": 13.3, + "learning_rate": 8.156436447693125e-05, + "loss": 0.1219, + "step": 47310 + }, + { + "epoch": 13.31, + "learning_rate": 8.154562209102552e-05, + "loss": 0.1371, + "step": 47340 + }, + { + "epoch": 13.32, + "learning_rate": 8.152687970511979e-05, + "loss": 0.1145, + "step": 47370 + }, + { + "epoch": 13.33, + "learning_rate": 8.150813731921407e-05, + "loss": 0.1321, + "step": 47400 + }, + { + "epoch": 13.33, + "learning_rate": 8.148939493330835e-05, + "loss": 0.1164, + "step": 47430 + }, + { + "epoch": 13.34, + "learning_rate": 8.147065254740263e-05, + "loss": 0.1286, + "step": 47460 + }, + { + "epoch": 13.35, + "learning_rate": 8.145191016149689e-05, + "loss": 0.1307, + "step": 47490 + }, + { + "epoch": 13.36, + "learning_rate": 8.143316777559117e-05, + "loss": 0.1099, + "step": 47520 + }, + { + "epoch": 13.37, + "learning_rate": 8.141442538968545e-05, + "loss": 0.1275, + "step": 47550 + }, + { + "epoch": 13.38, + "learning_rate": 8.139568300377972e-05, + "loss": 0.1101, + "step": 47580 + }, + { + "epoch": 13.38, + "learning_rate": 8.1376940617874e-05, + "loss": 0.1284, + "step": 47610 + }, + { + "epoch": 13.39, + "learning_rate": 8.135819823196826e-05, + "loss": 0.1295, + "step": 47640 + }, + { + "epoch": 13.4, + "learning_rate": 8.133945584606255e-05, + "loss": 0.1114, + "step": 47670 + }, + { + "epoch": 13.41, + "learning_rate": 8.132071346015681e-05, + "loss": 0.1311, + "step": 47700 + }, + { + "epoch": 13.42, + "learning_rate": 8.13019710742511e-05, + "loss": 0.1133, + "step": 47730 + }, + { + "epoch": 13.43, + "learning_rate": 8.128322868834536e-05, + "loss": 0.1211, + "step": 47760 + }, + { + "epoch": 13.44, + "learning_rate": 8.126448630243963e-05, + "loss": 0.1273, + "step": 47790 + }, + { + "epoch": 13.44, + "learning_rate": 8.124574391653391e-05, + "loss": 0.1107, + "step": 47820 + }, + { + "epoch": 13.45, + "learning_rate": 8.122700153062819e-05, + "loss": 0.1235, + "step": 47850 + }, + { + "epoch": 13.46, + "learning_rate": 8.120825914472247e-05, + "loss": 0.1126, + "step": 47880 + }, + { + "epoch": 13.47, + "learning_rate": 8.118951675881673e-05, + "loss": 0.1345, + "step": 47910 + }, + { + "epoch": 13.48, + "learning_rate": 8.1170774372911e-05, + "loss": 0.1258, + "step": 47940 + }, + { + "epoch": 13.49, + "learning_rate": 8.115203198700529e-05, + "loss": 0.1151, + "step": 47970 + }, + { + "epoch": 13.49, + "learning_rate": 8.113328960109955e-05, + "loss": 0.1267, + "step": 48000 + }, + { + "epoch": 13.5, + "learning_rate": 8.111454721519384e-05, + "loss": 0.115, + "step": 48030 + }, + { + "epoch": 13.51, + "learning_rate": 8.10958048292881e-05, + "loss": 0.1229, + "step": 48060 + }, + { + "epoch": 13.52, + "learning_rate": 8.107706244338238e-05, + "loss": 0.1356, + "step": 48090 + }, + { + "epoch": 13.53, + "learning_rate": 8.105832005747665e-05, + "loss": 0.1159, + "step": 48120 + }, + { + "epoch": 13.54, + "learning_rate": 8.103957767157093e-05, + "loss": 0.1342, + "step": 48150 + }, + { + "epoch": 13.55, + "learning_rate": 8.10208352856652e-05, + "loss": 0.1118, + "step": 48180 + }, + { + "epoch": 13.55, + "learning_rate": 8.100209289975948e-05, + "loss": 0.1213, + "step": 48210 + }, + { + "epoch": 13.56, + "learning_rate": 8.098335051385375e-05, + "loss": 0.1283, + "step": 48240 + }, + { + "epoch": 13.57, + "learning_rate": 8.096460812794803e-05, + "loss": 0.1207, + "step": 48270 + }, + { + "epoch": 13.58, + "learning_rate": 8.094649048823916e-05, + "loss": 0.1269, + "step": 48300 + }, + { + "epoch": 13.59, + "learning_rate": 8.092774810233344e-05, + "loss": 0.1162, + "step": 48330 + }, + { + "epoch": 13.6, + "learning_rate": 8.09090057164277e-05, + "loss": 0.1253, + "step": 48360 + }, + { + "epoch": 13.6, + "learning_rate": 8.089026333052197e-05, + "loss": 0.1266, + "step": 48390 + }, + { + "epoch": 13.61, + "learning_rate": 8.087152094461625e-05, + "loss": 0.1125, + "step": 48420 + }, + { + "epoch": 13.62, + "learning_rate": 8.085277855871053e-05, + "loss": 0.125, + "step": 48450 + }, + { + "epoch": 13.63, + "learning_rate": 8.08340361728048e-05, + "loss": 0.1151, + "step": 48480 + }, + { + "epoch": 13.64, + "learning_rate": 8.081529378689907e-05, + "loss": 0.1226, + "step": 48510 + }, + { + "epoch": 13.65, + "learning_rate": 8.079655140099335e-05, + "loss": 0.1302, + "step": 48540 + }, + { + "epoch": 13.65, + "learning_rate": 8.077780901508763e-05, + "loss": 0.115, + "step": 48570 + }, + { + "epoch": 13.66, + "learning_rate": 8.07590666291819e-05, + "loss": 0.1313, + "step": 48600 + }, + { + "epoch": 13.67, + "learning_rate": 8.074032424327618e-05, + "loss": 0.1105, + "step": 48630 + }, + { + "epoch": 13.68, + "learning_rate": 8.072158185737045e-05, + "loss": 0.125, + "step": 48660 + }, + { + "epoch": 13.69, + "learning_rate": 8.070283947146471e-05, + "loss": 0.1268, + "step": 48690 + }, + { + "epoch": 13.7, + "learning_rate": 8.0684097085559e-05, + "loss": 0.1144, + "step": 48720 + }, + { + "epoch": 13.71, + "learning_rate": 8.066535469965328e-05, + "loss": 0.128, + "step": 48750 + }, + { + "epoch": 13.71, + "learning_rate": 8.064661231374754e-05, + "loss": 0.1158, + "step": 48780 + }, + { + "epoch": 13.72, + "learning_rate": 8.062786992784181e-05, + "loss": 0.1235, + "step": 48810 + }, + { + "epoch": 13.73, + "learning_rate": 8.060912754193609e-05, + "loss": 0.1263, + "step": 48840 + }, + { + "epoch": 13.74, + "learning_rate": 8.059038515603037e-05, + "loss": 0.1115, + "step": 48870 + }, + { + "epoch": 13.75, + "learning_rate": 8.057164277012464e-05, + "loss": 0.1304, + "step": 48900 + }, + { + "epoch": 13.76, + "learning_rate": 8.055290038421891e-05, + "loss": 0.1208, + "step": 48930 + }, + { + "epoch": 13.76, + "learning_rate": 8.053415799831319e-05, + "loss": 0.117, + "step": 48960 + }, + { + "epoch": 13.77, + "learning_rate": 8.051541561240747e-05, + "loss": 0.1305, + "step": 48990 + }, + { + "epoch": 13.78, + "learning_rate": 8.049667322650174e-05, + "loss": 0.1103, + "step": 49020 + }, + { + "epoch": 13.79, + "learning_rate": 8.047793084059602e-05, + "loss": 0.1299, + "step": 49050 + }, + { + "epoch": 13.8, + "learning_rate": 8.045918845469029e-05, + "loss": 0.1135, + "step": 49080 + }, + { + "epoch": 13.81, + "learning_rate": 8.044044606878455e-05, + "loss": 0.1247, + "step": 49110 + }, + { + "epoch": 13.81, + "learning_rate": 8.042170368287883e-05, + "loss": 0.1263, + "step": 49140 + }, + { + "epoch": 13.82, + "learning_rate": 8.040296129697311e-05, + "loss": 0.1101, + "step": 49170 + }, + { + "epoch": 13.83, + "learning_rate": 8.038421891106738e-05, + "loss": 0.1288, + "step": 49200 + }, + { + "epoch": 13.84, + "learning_rate": 8.036547652516165e-05, + "loss": 0.1181, + "step": 49230 + }, + { + "epoch": 13.85, + "learning_rate": 8.034673413925593e-05, + "loss": 0.1241, + "step": 49260 + }, + { + "epoch": 13.86, + "learning_rate": 8.032799175335021e-05, + "loss": 0.1287, + "step": 49290 + }, + { + "epoch": 13.87, + "learning_rate": 8.030924936744448e-05, + "loss": 0.1149, + "step": 49320 + }, + { + "epoch": 13.87, + "learning_rate": 8.029050698153875e-05, + "loss": 0.1251, + "step": 49350 + }, + { + "epoch": 13.88, + "learning_rate": 8.027176459563303e-05, + "loss": 0.1163, + "step": 49380 + }, + { + "epoch": 13.89, + "learning_rate": 8.025302220972731e-05, + "loss": 0.1359, + "step": 49410 + }, + { + "epoch": 13.9, + "learning_rate": 8.023427982382158e-05, + "loss": 0.1242, + "step": 49440 + }, + { + "epoch": 13.91, + "learning_rate": 8.021553743791586e-05, + "loss": 0.1106, + "step": 49470 + }, + { + "epoch": 13.92, + "learning_rate": 8.019679505201012e-05, + "loss": 0.1297, + "step": 49500 + }, + { + "epoch": 13.92, + "learning_rate": 8.017805266610439e-05, + "loss": 0.1153, + "step": 49530 + }, + { + "epoch": 13.93, + "learning_rate": 8.015931028019867e-05, + "loss": 0.1262, + "step": 49560 + }, + { + "epoch": 13.94, + "learning_rate": 8.014056789429295e-05, + "loss": 0.124, + "step": 49590 + }, + { + "epoch": 13.95, + "learning_rate": 8.012182550838722e-05, + "loss": 0.1129, + "step": 49620 + }, + { + "epoch": 13.96, + "learning_rate": 8.010308312248149e-05, + "loss": 0.1315, + "step": 49650 + }, + { + "epoch": 13.97, + "learning_rate": 8.008434073657577e-05, + "loss": 0.1142, + "step": 49680 + }, + { + "epoch": 13.98, + "learning_rate": 8.006559835067005e-05, + "loss": 0.1238, + "step": 49710 + }, + { + "epoch": 13.98, + "learning_rate": 8.004685596476432e-05, + "loss": 0.1246, + "step": 49740 + }, + { + "epoch": 13.99, + "learning_rate": 8.002811357885859e-05, + "loss": 0.1124, + "step": 49770 + }, + { + "epoch": 14.0, + "eval_loss": 0.18678802251815796, + "eval_runtime": 477.9923, + "eval_samples_per_second": 33.542, + "eval_steps_per_second": 1.05, + "eval_wer": 0.17144104922686393, + "step": 49798 + }, + { + "epoch": 14.0, + "learning_rate": 8.000937119295287e-05, + "loss": 0.1446, + "step": 49800 + }, + { + "epoch": 14.01, + "learning_rate": 7.999062880704715e-05, + "loss": 0.1044, + "step": 49830 + }, + { + "epoch": 14.02, + "learning_rate": 7.997188642114141e-05, + "loss": 0.1248, + "step": 49860 + }, + { + "epoch": 14.03, + "learning_rate": 7.99531440352357e-05, + "loss": 0.1121, + "step": 49890 + }, + { + "epoch": 14.03, + "learning_rate": 7.993440164932996e-05, + "loss": 0.1138, + "step": 49920 + }, + { + "epoch": 14.04, + "learning_rate": 7.991565926342423e-05, + "loss": 0.1254, + "step": 49950 + }, + { + "epoch": 14.05, + "learning_rate": 7.989691687751851e-05, + "loss": 0.1065, + "step": 49980 + }, + { + "epoch": 14.06, + "learning_rate": 7.987817449161279e-05, + "loss": 0.121, + "step": 50010 + }, + { + "epoch": 14.07, + "learning_rate": 7.985943210570706e-05, + "loss": 0.1147, + "step": 50040 + }, + { + "epoch": 14.08, + "learning_rate": 7.984068971980133e-05, + "loss": 0.1176, + "step": 50070 + }, + { + "epoch": 14.08, + "learning_rate": 7.982194733389561e-05, + "loss": 0.1235, + "step": 50100 + }, + { + "epoch": 14.09, + "learning_rate": 7.980320494798989e-05, + "loss": 0.1075, + "step": 50130 + }, + { + "epoch": 14.1, + "learning_rate": 7.978446256208416e-05, + "loss": 0.1209, + "step": 50160 + }, + { + "epoch": 14.11, + "learning_rate": 7.976572017617842e-05, + "loss": 0.1125, + "step": 50190 + }, + { + "epoch": 14.12, + "learning_rate": 7.97469777902727e-05, + "loss": 0.116, + "step": 50220 + }, + { + "epoch": 14.13, + "learning_rate": 7.972823540436699e-05, + "loss": 0.1269, + "step": 50250 + }, + { + "epoch": 14.14, + "learning_rate": 7.970949301846125e-05, + "loss": 0.1052, + "step": 50280 + }, + { + "epoch": 14.14, + "learning_rate": 7.969075063255553e-05, + "loss": 0.1191, + "step": 50310 + }, + { + "epoch": 14.15, + "learning_rate": 7.96720082466498e-05, + "loss": 0.1106, + "step": 50340 + }, + { + "epoch": 14.16, + "learning_rate": 7.965326586074407e-05, + "loss": 0.1185, + "step": 50370 + }, + { + "epoch": 14.17, + "learning_rate": 7.963452347483835e-05, + "loss": 0.1263, + "step": 50400 + }, + { + "epoch": 14.18, + "learning_rate": 7.961578108893263e-05, + "loss": 0.102, + "step": 50430 + }, + { + "epoch": 14.19, + "learning_rate": 7.95970387030269e-05, + "loss": 0.1217, + "step": 50460 + }, + { + "epoch": 14.19, + "learning_rate": 7.957829631712117e-05, + "loss": 0.1099, + "step": 50490 + }, + { + "epoch": 14.2, + "learning_rate": 7.955955393121545e-05, + "loss": 0.1166, + "step": 50520 + }, + { + "epoch": 14.21, + "learning_rate": 7.954081154530973e-05, + "loss": 0.1237, + "step": 50550 + }, + { + "epoch": 14.22, + "learning_rate": 7.9522069159404e-05, + "loss": 0.1172, + "step": 50580 + }, + { + "epoch": 14.23, + "learning_rate": 7.950332677349826e-05, + "loss": 0.134, + "step": 50610 + }, + { + "epoch": 14.24, + "learning_rate": 7.948458438759254e-05, + "loss": 0.1155, + "step": 50640 + }, + { + "epoch": 14.25, + "learning_rate": 7.946584200168682e-05, + "loss": 0.1188, + "step": 50670 + }, + { + "epoch": 14.25, + "learning_rate": 7.944709961578109e-05, + "loss": 0.1204, + "step": 50700 + }, + { + "epoch": 14.26, + "learning_rate": 7.942835722987537e-05, + "loss": 0.1074, + "step": 50730 + }, + { + "epoch": 14.27, + "learning_rate": 7.940961484396964e-05, + "loss": 0.1268, + "step": 50760 + }, + { + "epoch": 14.28, + "learning_rate": 7.939087245806391e-05, + "loss": 0.1134, + "step": 50790 + }, + { + "epoch": 14.29, + "learning_rate": 7.937213007215819e-05, + "loss": 0.1181, + "step": 50820 + }, + { + "epoch": 14.3, + "learning_rate": 7.935338768625247e-05, + "loss": 0.1254, + "step": 50850 + }, + { + "epoch": 14.3, + "learning_rate": 7.933464530034674e-05, + "loss": 0.1021, + "step": 50880 + }, + { + "epoch": 14.31, + "learning_rate": 7.9315902914441e-05, + "loss": 0.1252, + "step": 50910 + }, + { + "epoch": 14.32, + "learning_rate": 7.929716052853529e-05, + "loss": 0.1114, + "step": 50940 + }, + { + "epoch": 14.33, + "learning_rate": 7.927904288882641e-05, + "loss": 0.1214, + "step": 50970 + }, + { + "epoch": 14.34, + "learning_rate": 7.92603005029207e-05, + "loss": 0.1237, + "step": 51000 + }, + { + "epoch": 14.35, + "learning_rate": 7.924155811701497e-05, + "loss": 0.1001, + "step": 51030 + }, + { + "epoch": 14.35, + "learning_rate": 7.922281573110924e-05, + "loss": 0.1224, + "step": 51060 + }, + { + "epoch": 14.36, + "learning_rate": 7.920407334520351e-05, + "loss": 0.1115, + "step": 51090 + }, + { + "epoch": 14.37, + "learning_rate": 7.918533095929779e-05, + "loss": 0.1233, + "step": 51120 + }, + { + "epoch": 14.38, + "learning_rate": 7.916658857339206e-05, + "loss": 0.1283, + "step": 51150 + }, + { + "epoch": 14.39, + "learning_rate": 7.914784618748634e-05, + "loss": 0.1084, + "step": 51180 + }, + { + "epoch": 14.4, + "learning_rate": 7.91291038015806e-05, + "loss": 0.1236, + "step": 51210 + }, + { + "epoch": 14.41, + "learning_rate": 7.911036141567489e-05, + "loss": 0.1153, + "step": 51240 + }, + { + "epoch": 14.41, + "learning_rate": 7.909161902976915e-05, + "loss": 0.1201, + "step": 51270 + }, + { + "epoch": 14.42, + "learning_rate": 7.907287664386344e-05, + "loss": 0.1267, + "step": 51300 + }, + { + "epoch": 14.43, + "learning_rate": 7.905413425795772e-05, + "loss": 0.1054, + "step": 51330 + }, + { + "epoch": 14.44, + "learning_rate": 7.903539187205198e-05, + "loss": 0.1218, + "step": 51360 + }, + { + "epoch": 14.45, + "learning_rate": 7.901664948614625e-05, + "loss": 0.1168, + "step": 51390 + }, + { + "epoch": 14.46, + "learning_rate": 7.899790710024053e-05, + "loss": 0.1181, + "step": 51420 + }, + { + "epoch": 14.46, + "learning_rate": 7.897916471433481e-05, + "loss": 0.1348, + "step": 51450 + }, + { + "epoch": 14.47, + "learning_rate": 7.896042232842908e-05, + "loss": 0.108, + "step": 51480 + }, + { + "epoch": 14.48, + "learning_rate": 7.894167994252335e-05, + "loss": 0.128, + "step": 51510 + }, + { + "epoch": 14.49, + "learning_rate": 7.892293755661763e-05, + "loss": 0.1127, + "step": 51540 + }, + { + "epoch": 14.5, + "learning_rate": 7.89041951707119e-05, + "loss": 0.1173, + "step": 51570 + }, + { + "epoch": 14.51, + "learning_rate": 7.888545278480618e-05, + "loss": 0.1281, + "step": 51600 + }, + { + "epoch": 14.51, + "learning_rate": 7.886671039890044e-05, + "loss": 0.105, + "step": 51630 + }, + { + "epoch": 14.52, + "learning_rate": 7.884796801299473e-05, + "loss": 0.1245, + "step": 51660 + }, + { + "epoch": 14.53, + "learning_rate": 7.8829225627089e-05, + "loss": 0.1153, + "step": 51690 + }, + { + "epoch": 14.54, + "learning_rate": 7.881048324118327e-05, + "loss": 0.1195, + "step": 51720 + }, + { + "epoch": 14.55, + "learning_rate": 7.879174085527756e-05, + "loss": 0.1238, + "step": 51750 + }, + { + "epoch": 14.56, + "learning_rate": 7.877299846937182e-05, + "loss": 0.1054, + "step": 51780 + }, + { + "epoch": 14.57, + "learning_rate": 7.875425608346609e-05, + "loss": 0.1259, + "step": 51810 + }, + { + "epoch": 14.57, + "learning_rate": 7.873551369756037e-05, + "loss": 0.1233, + "step": 51840 + }, + { + "epoch": 14.58, + "learning_rate": 7.871677131165465e-05, + "loss": 0.1216, + "step": 51870 + }, + { + "epoch": 14.59, + "learning_rate": 7.869802892574892e-05, + "loss": 0.1265, + "step": 51900 + }, + { + "epoch": 14.6, + "learning_rate": 7.867928653984319e-05, + "loss": 0.1006, + "step": 51930 + }, + { + "epoch": 14.61, + "learning_rate": 7.866054415393747e-05, + "loss": 0.1201, + "step": 51960 + }, + { + "epoch": 14.62, + "learning_rate": 7.864180176803175e-05, + "loss": 0.11, + "step": 51990 + }, + { + "epoch": 14.62, + "learning_rate": 7.862305938212602e-05, + "loss": 0.1239, + "step": 52020 + }, + { + "epoch": 14.63, + "learning_rate": 7.860431699622028e-05, + "loss": 0.1289, + "step": 52050 + }, + { + "epoch": 14.64, + "learning_rate": 7.858557461031456e-05, + "loss": 0.1077, + "step": 52080 + }, + { + "epoch": 14.65, + "learning_rate": 7.856683222440883e-05, + "loss": 0.1233, + "step": 52110 + }, + { + "epoch": 14.66, + "learning_rate": 7.854808983850311e-05, + "loss": 0.1114, + "step": 52140 + }, + { + "epoch": 14.67, + "learning_rate": 7.85293474525974e-05, + "loss": 0.1144, + "step": 52170 + }, + { + "epoch": 14.68, + "learning_rate": 7.851060506669166e-05, + "loss": 0.1286, + "step": 52200 + }, + { + "epoch": 14.68, + "learning_rate": 7.849186268078593e-05, + "loss": 0.107, + "step": 52230 + }, + { + "epoch": 14.69, + "learning_rate": 7.847312029488021e-05, + "loss": 0.1249, + "step": 52260 + }, + { + "epoch": 14.7, + "learning_rate": 7.845437790897449e-05, + "loss": 0.1106, + "step": 52290 + }, + { + "epoch": 14.71, + "learning_rate": 7.843563552306876e-05, + "loss": 0.1197, + "step": 52320 + }, + { + "epoch": 14.72, + "learning_rate": 7.841689313716303e-05, + "loss": 0.1247, + "step": 52350 + }, + { + "epoch": 14.73, + "learning_rate": 7.83981507512573e-05, + "loss": 0.1042, + "step": 52380 + }, + { + "epoch": 14.73, + "learning_rate": 7.837940836535159e-05, + "loss": 0.1233, + "step": 52410 + }, + { + "epoch": 14.74, + "learning_rate": 7.836066597944585e-05, + "loss": 0.1105, + "step": 52440 + }, + { + "epoch": 14.75, + "learning_rate": 7.834192359354012e-05, + "loss": 0.1189, + "step": 52470 + }, + { + "epoch": 14.76, + "learning_rate": 7.83231812076344e-05, + "loss": 0.1251, + "step": 52500 + }, + { + "epoch": 14.77, + "learning_rate": 7.830443882172867e-05, + "loss": 0.1052, + "step": 52530 + }, + { + "epoch": 14.78, + "learning_rate": 7.828569643582295e-05, + "loss": 0.1214, + "step": 52560 + }, + { + "epoch": 14.78, + "learning_rate": 7.826695404991723e-05, + "loss": 0.1133, + "step": 52590 + }, + { + "epoch": 14.79, + "learning_rate": 7.82482116640115e-05, + "loss": 0.1126, + "step": 52620 + }, + { + "epoch": 14.8, + "learning_rate": 7.822946927810577e-05, + "loss": 0.1238, + "step": 52650 + }, + { + "epoch": 14.81, + "learning_rate": 7.821072689220005e-05, + "loss": 0.1031, + "step": 52680 + }, + { + "epoch": 14.82, + "learning_rate": 7.819198450629433e-05, + "loss": 0.1207, + "step": 52710 + }, + { + "epoch": 14.83, + "learning_rate": 7.81732421203886e-05, + "loss": 0.1115, + "step": 52740 + }, + { + "epoch": 14.84, + "learning_rate": 7.815449973448286e-05, + "loss": 0.1096, + "step": 52770 + }, + { + "epoch": 14.84, + "learning_rate": 7.813575734857715e-05, + "loss": 0.1262, + "step": 52800 + }, + { + "epoch": 14.85, + "learning_rate": 7.811701496267143e-05, + "loss": 0.1025, + "step": 52830 + }, + { + "epoch": 14.86, + "learning_rate": 7.80982725767657e-05, + "loss": 0.1263, + "step": 52860 + }, + { + "epoch": 14.87, + "learning_rate": 7.807953019085996e-05, + "loss": 0.1144, + "step": 52890 + }, + { + "epoch": 14.88, + "learning_rate": 7.806078780495424e-05, + "loss": 0.1192, + "step": 52920 + }, + { + "epoch": 14.89, + "learning_rate": 7.804204541904851e-05, + "loss": 0.1352, + "step": 52950 + }, + { + "epoch": 14.89, + "learning_rate": 7.802330303314279e-05, + "loss": 0.1102, + "step": 52980 + }, + { + "epoch": 14.9, + "learning_rate": 7.800456064723707e-05, + "loss": 0.1233, + "step": 53010 + }, + { + "epoch": 14.91, + "learning_rate": 7.798581826133134e-05, + "loss": 0.1162, + "step": 53040 + }, + { + "epoch": 14.92, + "learning_rate": 7.79670758754256e-05, + "loss": 0.1214, + "step": 53070 + }, + { + "epoch": 14.93, + "learning_rate": 7.794833348951989e-05, + "loss": 0.1302, + "step": 53100 + }, + { + "epoch": 14.94, + "learning_rate": 7.792959110361417e-05, + "loss": 0.1029, + "step": 53130 + }, + { + "epoch": 14.95, + "learning_rate": 7.791084871770844e-05, + "loss": 0.1164, + "step": 53160 + }, + { + "epoch": 14.95, + "learning_rate": 7.78921063318027e-05, + "loss": 0.1147, + "step": 53190 + }, + { + "epoch": 14.96, + "learning_rate": 7.787336394589698e-05, + "loss": 0.1186, + "step": 53220 + }, + { + "epoch": 14.97, + "learning_rate": 7.785462155999126e-05, + "loss": 0.1225, + "step": 53250 + }, + { + "epoch": 14.98, + "learning_rate": 7.783587917408553e-05, + "loss": 0.1043, + "step": 53280 + }, + { + "epoch": 14.99, + "learning_rate": 7.78171367881798e-05, + "loss": 0.1225, + "step": 53310 + }, + { + "epoch": 15.0, + "learning_rate": 7.779839440227408e-05, + "loss": 0.1112, + "step": 53340 + }, + { + "epoch": 15.0, + "eval_loss": 0.18052412569522858, + "eval_runtime": 480.525, + "eval_samples_per_second": 33.366, + "eval_steps_per_second": 1.045, + "eval_wer": 0.16497209067460047, + "step": 53355 + }, + { + "epoch": 15.0, + "learning_rate": 7.777965201636835e-05, + "loss": 0.1152, + "step": 53370 + }, + { + "epoch": 15.01, + "learning_rate": 7.776090963046263e-05, + "loss": 0.1118, + "step": 53400 + }, + { + "epoch": 15.02, + "learning_rate": 7.774216724455691e-05, + "loss": 0.1098, + "step": 53430 + }, + { + "epoch": 15.03, + "learning_rate": 7.772342485865118e-05, + "loss": 0.1218, + "step": 53460 + }, + { + "epoch": 15.04, + "learning_rate": 7.770468247274544e-05, + "loss": 0.1046, + "step": 53490 + }, + { + "epoch": 15.05, + "learning_rate": 7.768594008683973e-05, + "loss": 0.1181, + "step": 53520 + }, + { + "epoch": 15.05, + "learning_rate": 7.7667197700934e-05, + "loss": 0.11, + "step": 53550 + }, + { + "epoch": 15.06, + "learning_rate": 7.764845531502827e-05, + "loss": 0.1103, + "step": 53580 + }, + { + "epoch": 15.07, + "learning_rate": 7.762971292912254e-05, + "loss": 0.1236, + "step": 53610 + }, + { + "epoch": 15.08, + "learning_rate": 7.761097054321682e-05, + "loss": 0.1036, + "step": 53640 + }, + { + "epoch": 15.09, + "learning_rate": 7.75922281573111e-05, + "loss": 0.1174, + "step": 53670 + }, + { + "epoch": 15.1, + "learning_rate": 7.757348577140537e-05, + "loss": 0.1093, + "step": 53700 + }, + { + "epoch": 15.11, + "learning_rate": 7.755474338549964e-05, + "loss": 0.1113, + "step": 53730 + }, + { + "epoch": 15.11, + "learning_rate": 7.753600099959392e-05, + "loss": 0.1227, + "step": 53760 + }, + { + "epoch": 15.12, + "learning_rate": 7.751725861368819e-05, + "loss": 0.1027, + "step": 53790 + }, + { + "epoch": 15.13, + "learning_rate": 7.749851622778247e-05, + "loss": 0.1183, + "step": 53820 + }, + { + "epoch": 15.14, + "learning_rate": 7.747977384187675e-05, + "loss": 0.109, + "step": 53850 + }, + { + "epoch": 15.15, + "learning_rate": 7.746103145597102e-05, + "loss": 0.1085, + "step": 53880 + }, + { + "epoch": 15.16, + "learning_rate": 7.744228907006528e-05, + "loss": 0.1211, + "step": 53910 + }, + { + "epoch": 15.16, + "learning_rate": 7.742354668415956e-05, + "loss": 0.1044, + "step": 53940 + }, + { + "epoch": 15.17, + "learning_rate": 7.740480429825385e-05, + "loss": 0.1217, + "step": 53970 + }, + { + "epoch": 15.18, + "learning_rate": 7.738606191234811e-05, + "loss": 0.116, + "step": 54000 + }, + { + "epoch": 15.19, + "learning_rate": 7.736731952644238e-05, + "loss": 0.1133, + "step": 54030 + }, + { + "epoch": 15.2, + "learning_rate": 7.734857714053666e-05, + "loss": 0.1236, + "step": 54060 + }, + { + "epoch": 15.21, + "learning_rate": 7.732983475463094e-05, + "loss": 0.1054, + "step": 54090 + }, + { + "epoch": 15.22, + "learning_rate": 7.731109236872521e-05, + "loss": 0.1137, + "step": 54120 + }, + { + "epoch": 15.22, + "learning_rate": 7.729234998281948e-05, + "loss": 0.1101, + "step": 54150 + }, + { + "epoch": 15.23, + "learning_rate": 7.727360759691376e-05, + "loss": 0.1095, + "step": 54180 + }, + { + "epoch": 15.24, + "learning_rate": 7.725486521100803e-05, + "loss": 0.125, + "step": 54210 + }, + { + "epoch": 15.25, + "learning_rate": 7.72361228251023e-05, + "loss": 0.1027, + "step": 54240 + }, + { + "epoch": 15.26, + "learning_rate": 7.721738043919659e-05, + "loss": 0.1194, + "step": 54270 + }, + { + "epoch": 15.27, + "learning_rate": 7.719863805329085e-05, + "loss": 0.1073, + "step": 54300 + }, + { + "epoch": 15.27, + "learning_rate": 7.717989566738512e-05, + "loss": 0.1084, + "step": 54330 + }, + { + "epoch": 15.28, + "learning_rate": 7.71611532814794e-05, + "loss": 0.123, + "step": 54360 + }, + { + "epoch": 15.29, + "learning_rate": 7.714241089557368e-05, + "loss": 0.1038, + "step": 54390 + }, + { + "epoch": 15.3, + "learning_rate": 7.712366850966795e-05, + "loss": 0.1195, + "step": 54420 + }, + { + "epoch": 15.31, + "learning_rate": 7.710492612376222e-05, + "loss": 0.1125, + "step": 54450 + }, + { + "epoch": 15.32, + "learning_rate": 7.70861837378565e-05, + "loss": 0.1089, + "step": 54480 + }, + { + "epoch": 15.32, + "learning_rate": 7.706744135195078e-05, + "loss": 0.1225, + "step": 54510 + }, + { + "epoch": 15.33, + "learning_rate": 7.704869896604505e-05, + "loss": 0.1016, + "step": 54540 + }, + { + "epoch": 15.34, + "learning_rate": 7.702995658013932e-05, + "loss": 0.1209, + "step": 54570 + }, + { + "epoch": 15.35, + "learning_rate": 7.70112141942336e-05, + "loss": 0.1101, + "step": 54600 + }, + { + "epoch": 15.36, + "learning_rate": 7.699247180832786e-05, + "loss": 0.1126, + "step": 54630 + }, + { + "epoch": 15.37, + "learning_rate": 7.697372942242214e-05, + "loss": 0.1198, + "step": 54660 + }, + { + "epoch": 15.38, + "learning_rate": 7.695498703651643e-05, + "loss": 0.1039, + "step": 54690 + }, + { + "epoch": 15.38, + "learning_rate": 7.69362446506107e-05, + "loss": 0.1164, + "step": 54720 + }, + { + "epoch": 15.39, + "learning_rate": 7.691750226470496e-05, + "loss": 0.1102, + "step": 54750 + }, + { + "epoch": 15.4, + "learning_rate": 7.689875987879924e-05, + "loss": 0.1078, + "step": 54780 + }, + { + "epoch": 15.41, + "learning_rate": 7.688001749289352e-05, + "loss": 0.1205, + "step": 54810 + }, + { + "epoch": 15.42, + "learning_rate": 7.686127510698779e-05, + "loss": 0.1061, + "step": 54840 + }, + { + "epoch": 15.43, + "learning_rate": 7.684253272108206e-05, + "loss": 0.1205, + "step": 54870 + }, + { + "epoch": 15.43, + "learning_rate": 7.682379033517634e-05, + "loss": 0.1128, + "step": 54900 + }, + { + "epoch": 15.44, + "learning_rate": 7.680504794927062e-05, + "loss": 0.109, + "step": 54930 + }, + { + "epoch": 15.45, + "learning_rate": 7.678630556336489e-05, + "loss": 0.1243, + "step": 54960 + }, + { + "epoch": 15.46, + "learning_rate": 7.676756317745915e-05, + "loss": 0.1044, + "step": 54990 + }, + { + "epoch": 15.47, + "learning_rate": 7.674882079155344e-05, + "loss": 0.1143, + "step": 55020 + }, + { + "epoch": 15.48, + "learning_rate": 7.673007840564772e-05, + "loss": 0.1105, + "step": 55050 + }, + { + "epoch": 15.48, + "learning_rate": 7.671133601974198e-05, + "loss": 0.1089, + "step": 55080 + }, + { + "epoch": 15.49, + "learning_rate": 7.669259363383626e-05, + "loss": 0.1214, + "step": 55110 + }, + { + "epoch": 15.5, + "learning_rate": 7.667385124793053e-05, + "loss": 0.1021, + "step": 55140 + }, + { + "epoch": 15.51, + "learning_rate": 7.66551088620248e-05, + "loss": 0.124, + "step": 55170 + }, + { + "epoch": 15.52, + "learning_rate": 7.663636647611908e-05, + "loss": 0.1125, + "step": 55200 + }, + { + "epoch": 15.53, + "learning_rate": 7.661762409021336e-05, + "loss": 0.1154, + "step": 55230 + }, + { + "epoch": 15.54, + "learning_rate": 7.659888170430763e-05, + "loss": 0.125, + "step": 55260 + }, + { + "epoch": 15.54, + "learning_rate": 7.65801393184019e-05, + "loss": 0.1042, + "step": 55290 + }, + { + "epoch": 15.55, + "learning_rate": 7.656139693249618e-05, + "loss": 0.1173, + "step": 55320 + }, + { + "epoch": 15.56, + "learning_rate": 7.654265454659046e-05, + "loss": 0.1201, + "step": 55350 + }, + { + "epoch": 15.57, + "learning_rate": 7.652391216068473e-05, + "loss": 0.1115, + "step": 55380 + }, + { + "epoch": 15.58, + "learning_rate": 7.650516977477899e-05, + "loss": 0.1237, + "step": 55410 + }, + { + "epoch": 15.59, + "learning_rate": 7.648642738887327e-05, + "loss": 0.11, + "step": 55440 + }, + { + "epoch": 15.59, + "learning_rate": 7.64683097491644e-05, + "loss": 0.1174, + "step": 55470 + }, + { + "epoch": 15.6, + "learning_rate": 7.644956736325868e-05, + "loss": 0.1106, + "step": 55500 + }, + { + "epoch": 15.61, + "learning_rate": 7.643082497735295e-05, + "loss": 0.1088, + "step": 55530 + }, + { + "epoch": 15.62, + "learning_rate": 7.641208259144723e-05, + "loss": 0.1248, + "step": 55560 + }, + { + "epoch": 15.63, + "learning_rate": 7.63933402055415e-05, + "loss": 0.1051, + "step": 55590 + }, + { + "epoch": 15.64, + "learning_rate": 7.637459781963578e-05, + "loss": 0.121, + "step": 55620 + }, + { + "epoch": 15.65, + "learning_rate": 7.635585543373005e-05, + "loss": 0.1185, + "step": 55650 + }, + { + "epoch": 15.65, + "learning_rate": 7.633711304782433e-05, + "loss": 0.1174, + "step": 55680 + }, + { + "epoch": 15.66, + "learning_rate": 7.631837066191861e-05, + "loss": 0.1173, + "step": 55710 + }, + { + "epoch": 15.67, + "learning_rate": 7.629962827601286e-05, + "loss": 0.1022, + "step": 55740 + }, + { + "epoch": 15.68, + "learning_rate": 7.628088589010714e-05, + "loss": 0.1189, + "step": 55770 + }, + { + "epoch": 15.69, + "learning_rate": 7.626214350420142e-05, + "loss": 0.1106, + "step": 55800 + }, + { + "epoch": 15.7, + "learning_rate": 7.62434011182957e-05, + "loss": 0.1096, + "step": 55830 + }, + { + "epoch": 15.7, + "learning_rate": 7.622465873238997e-05, + "loss": 0.122, + "step": 55860 + }, + { + "epoch": 15.71, + "learning_rate": 7.620591634648424e-05, + "loss": 0.1078, + "step": 55890 + }, + { + "epoch": 15.72, + "learning_rate": 7.618717396057852e-05, + "loss": 0.1106, + "step": 55920 + }, + { + "epoch": 15.73, + "learning_rate": 7.616843157467279e-05, + "loss": 0.1087, + "step": 55950 + }, + { + "epoch": 15.74, + "learning_rate": 7.614968918876707e-05, + "loss": 0.115, + "step": 55980 + }, + { + "epoch": 15.75, + "learning_rate": 7.613094680286134e-05, + "loss": 0.1257, + "step": 56010 + }, + { + "epoch": 15.75, + "learning_rate": 7.611220441695562e-05, + "loss": 0.1011, + "step": 56040 + }, + { + "epoch": 15.76, + "learning_rate": 7.609346203104989e-05, + "loss": 0.1181, + "step": 56070 + }, + { + "epoch": 15.77, + "learning_rate": 7.607471964514417e-05, + "loss": 0.1134, + "step": 56100 + }, + { + "epoch": 15.78, + "learning_rate": 7.605597725923845e-05, + "loss": 0.1146, + "step": 56130 + }, + { + "epoch": 15.79, + "learning_rate": 7.603723487333271e-05, + "loss": 0.1225, + "step": 56160 + }, + { + "epoch": 15.8, + "learning_rate": 7.601849248742698e-05, + "loss": 0.1049, + "step": 56190 + }, + { + "epoch": 15.81, + "learning_rate": 7.599975010152126e-05, + "loss": 0.1238, + "step": 56220 + }, + { + "epoch": 15.81, + "learning_rate": 7.598100771561554e-05, + "loss": 0.1097, + "step": 56250 + }, + { + "epoch": 15.82, + "learning_rate": 7.596226532970981e-05, + "loss": 0.1109, + "step": 56280 + }, + { + "epoch": 15.83, + "learning_rate": 7.594352294380408e-05, + "loss": 0.1233, + "step": 56310 + }, + { + "epoch": 15.84, + "learning_rate": 7.592478055789836e-05, + "loss": 0.0993, + "step": 56340 + }, + { + "epoch": 15.85, + "learning_rate": 7.590603817199263e-05, + "loss": 0.1169, + "step": 56370 + }, + { + "epoch": 15.86, + "learning_rate": 7.588729578608691e-05, + "loss": 0.1185, + "step": 56400 + }, + { + "epoch": 15.86, + "learning_rate": 7.586855340018118e-05, + "loss": 0.1075, + "step": 56430 + }, + { + "epoch": 15.87, + "learning_rate": 7.584981101427546e-05, + "loss": 0.1231, + "step": 56460 + }, + { + "epoch": 15.88, + "learning_rate": 7.583106862836972e-05, + "loss": 0.1021, + "step": 56490 + }, + { + "epoch": 15.89, + "learning_rate": 7.5812326242464e-05, + "loss": 0.1184, + "step": 56520 + }, + { + "epoch": 15.9, + "learning_rate": 7.579358385655829e-05, + "loss": 0.1124, + "step": 56550 + }, + { + "epoch": 15.91, + "learning_rate": 7.577484147065255e-05, + "loss": 0.1109, + "step": 56580 + }, + { + "epoch": 15.91, + "learning_rate": 7.575609908474682e-05, + "loss": 0.1229, + "step": 56610 + }, + { + "epoch": 15.92, + "learning_rate": 7.57373566988411e-05, + "loss": 0.106, + "step": 56640 + }, + { + "epoch": 15.93, + "learning_rate": 7.571861431293538e-05, + "loss": 0.1108, + "step": 56670 + }, + { + "epoch": 15.94, + "learning_rate": 7.569987192702965e-05, + "loss": 0.1108, + "step": 56700 + }, + { + "epoch": 15.95, + "learning_rate": 7.568112954112392e-05, + "loss": 0.1114, + "step": 56730 + }, + { + "epoch": 15.96, + "learning_rate": 7.56623871552182e-05, + "loss": 0.1179, + "step": 56760 + }, + { + "epoch": 15.97, + "learning_rate": 7.564364476931247e-05, + "loss": 0.1047, + "step": 56790 + }, + { + "epoch": 15.97, + "learning_rate": 7.562490238340675e-05, + "loss": 0.1134, + "step": 56820 + }, + { + "epoch": 15.98, + "learning_rate": 7.560615999750101e-05, + "loss": 0.1205, + "step": 56850 + }, + { + "epoch": 15.99, + "learning_rate": 7.55874176115953e-05, + "loss": 0.1121, + "step": 56880 + }, + { + "epoch": 16.0, + "learning_rate": 7.556867522568956e-05, + "loss": 0.1209, + "step": 56910 + }, + { + "epoch": 16.0, + "eval_loss": 0.18599531054496765, + "eval_runtime": 482.85, + "eval_samples_per_second": 33.205, + "eval_steps_per_second": 1.04, + "eval_wer": 0.16138959780546722, + "step": 56912 + }, + { + "epoch": 16.01, + "learning_rate": 7.554993283978384e-05, + "loss": 0.1057, + "step": 56940 + }, + { + "epoch": 16.02, + "learning_rate": 7.553119045387812e-05, + "loss": 0.1149, + "step": 56970 + }, + { + "epoch": 16.02, + "learning_rate": 7.551244806797239e-05, + "loss": 0.104, + "step": 57000 + }, + { + "epoch": 16.03, + "learning_rate": 7.549370568206666e-05, + "loss": 0.1114, + "step": 57030 + }, + { + "epoch": 16.04, + "learning_rate": 7.547496329616094e-05, + "loss": 0.1081, + "step": 57060 + }, + { + "epoch": 16.05, + "learning_rate": 7.545622091025522e-05, + "loss": 0.1041, + "step": 57090 + }, + { + "epoch": 16.06, + "learning_rate": 7.543747852434949e-05, + "loss": 0.1169, + "step": 57120 + }, + { + "epoch": 16.07, + "learning_rate": 7.541873613844376e-05, + "loss": 0.0974, + "step": 57150 + }, + { + "epoch": 16.08, + "learning_rate": 7.539999375253804e-05, + "loss": 0.1164, + "step": 57180 + }, + { + "epoch": 16.08, + "learning_rate": 7.53812513666323e-05, + "loss": 0.1173, + "step": 57210 + }, + { + "epoch": 16.09, + "learning_rate": 7.536250898072659e-05, + "loss": 0.1016, + "step": 57240 + }, + { + "epoch": 16.1, + "learning_rate": 7.534376659482085e-05, + "loss": 0.1165, + "step": 57270 + }, + { + "epoch": 16.11, + "learning_rate": 7.532502420891513e-05, + "loss": 0.102, + "step": 57300 + }, + { + "epoch": 16.12, + "learning_rate": 7.53062818230094e-05, + "loss": 0.1141, + "step": 57330 + }, + { + "epoch": 16.13, + "learning_rate": 7.528753943710368e-05, + "loss": 0.1121, + "step": 57360 + }, + { + "epoch": 16.13, + "learning_rate": 7.526879705119796e-05, + "loss": 0.104, + "step": 57390 + }, + { + "epoch": 16.14, + "learning_rate": 7.525005466529223e-05, + "loss": 0.1166, + "step": 57420 + }, + { + "epoch": 16.15, + "learning_rate": 7.52313122793865e-05, + "loss": 0.104, + "step": 57450 + }, + { + "epoch": 16.16, + "learning_rate": 7.521256989348078e-05, + "loss": 0.113, + "step": 57480 + }, + { + "epoch": 16.17, + "learning_rate": 7.519382750757506e-05, + "loss": 0.1123, + "step": 57510 + }, + { + "epoch": 16.18, + "learning_rate": 7.517508512166933e-05, + "loss": 0.1082, + "step": 57540 + }, + { + "epoch": 16.18, + "learning_rate": 7.51563427357636e-05, + "loss": 0.1162, + "step": 57570 + }, + { + "epoch": 16.19, + "learning_rate": 7.513760034985788e-05, + "loss": 0.104, + "step": 57600 + }, + { + "epoch": 16.2, + "learning_rate": 7.511885796395214e-05, + "loss": 0.1072, + "step": 57630 + }, + { + "epoch": 16.21, + "learning_rate": 7.510011557804642e-05, + "loss": 0.1094, + "step": 57660 + }, + { + "epoch": 16.22, + "learning_rate": 7.508137319214069e-05, + "loss": 0.1076, + "step": 57690 + }, + { + "epoch": 16.23, + "learning_rate": 7.506263080623497e-05, + "loss": 0.113, + "step": 57720 + }, + { + "epoch": 16.24, + "learning_rate": 7.504388842032924e-05, + "loss": 0.0999, + "step": 57750 + }, + { + "epoch": 16.24, + "learning_rate": 7.502514603442352e-05, + "loss": 0.1131, + "step": 57780 + }, + { + "epoch": 16.25, + "learning_rate": 7.50064036485178e-05, + "loss": 0.1118, + "step": 57810 + }, + { + "epoch": 16.26, + "learning_rate": 7.498766126261207e-05, + "loss": 0.1039, + "step": 57840 + }, + { + "epoch": 16.27, + "learning_rate": 7.496891887670634e-05, + "loss": 0.1186, + "step": 57870 + }, + { + "epoch": 16.28, + "learning_rate": 7.495017649080062e-05, + "loss": 0.1026, + "step": 57900 + }, + { + "epoch": 16.29, + "learning_rate": 7.49314341048949e-05, + "loss": 0.1134, + "step": 57930 + }, + { + "epoch": 16.29, + "learning_rate": 7.491269171898917e-05, + "loss": 0.1138, + "step": 57960 + }, + { + "epoch": 16.3, + "learning_rate": 7.489394933308343e-05, + "loss": 0.1086, + "step": 57990 + }, + { + "epoch": 16.31, + "learning_rate": 7.487520694717771e-05, + "loss": 0.1149, + "step": 58020 + }, + { + "epoch": 16.32, + "learning_rate": 7.485646456127198e-05, + "loss": 0.1041, + "step": 58050 + }, + { + "epoch": 16.33, + "learning_rate": 7.483772217536626e-05, + "loss": 0.132, + "step": 58080 + }, + { + "epoch": 16.34, + "learning_rate": 7.481897978946053e-05, + "loss": 0.114, + "step": 58110 + }, + { + "epoch": 16.35, + "learning_rate": 7.480086214975167e-05, + "loss": 0.1066, + "step": 58140 + }, + { + "epoch": 16.35, + "learning_rate": 7.478211976384594e-05, + "loss": 0.1142, + "step": 58170 + }, + { + "epoch": 16.36, + "learning_rate": 7.476337737794022e-05, + "loss": 0.1037, + "step": 58200 + }, + { + "epoch": 16.37, + "learning_rate": 7.474463499203449e-05, + "loss": 0.1154, + "step": 58230 + }, + { + "epoch": 16.38, + "learning_rate": 7.472589260612877e-05, + "loss": 0.109, + "step": 58260 + }, + { + "epoch": 16.39, + "learning_rate": 7.470715022022305e-05, + "loss": 0.1069, + "step": 58290 + }, + { + "epoch": 16.4, + "learning_rate": 7.46884078343173e-05, + "loss": 0.118, + "step": 58320 + }, + { + "epoch": 16.4, + "learning_rate": 7.466966544841158e-05, + "loss": 0.1016, + "step": 58350 + }, + { + "epoch": 16.41, + "learning_rate": 7.465092306250586e-05, + "loss": 0.1086, + "step": 58380 + }, + { + "epoch": 16.42, + "learning_rate": 7.463218067660013e-05, + "loss": 0.1108, + "step": 58410 + }, + { + "epoch": 16.43, + "learning_rate": 7.46134382906944e-05, + "loss": 0.1, + "step": 58440 + }, + { + "epoch": 16.44, + "learning_rate": 7.459469590478868e-05, + "loss": 0.1183, + "step": 58470 + }, + { + "epoch": 16.45, + "learning_rate": 7.457595351888296e-05, + "loss": 0.1011, + "step": 58500 + }, + { + "epoch": 16.45, + "learning_rate": 7.455721113297723e-05, + "loss": 0.1147, + "step": 58530 + }, + { + "epoch": 16.46, + "learning_rate": 7.453846874707151e-05, + "loss": 0.1079, + "step": 58560 + }, + { + "epoch": 16.47, + "learning_rate": 7.451972636116578e-05, + "loss": 0.1054, + "step": 58590 + }, + { + "epoch": 16.48, + "learning_rate": 7.450098397526006e-05, + "loss": 0.1135, + "step": 58620 + }, + { + "epoch": 16.49, + "learning_rate": 7.448224158935433e-05, + "loss": 0.1066, + "step": 58650 + }, + { + "epoch": 16.5, + "learning_rate": 7.44634992034486e-05, + "loss": 0.1149, + "step": 58680 + }, + { + "epoch": 16.51, + "learning_rate": 7.444475681754289e-05, + "loss": 0.1198, + "step": 58710 + }, + { + "epoch": 16.51, + "learning_rate": 7.442601443163714e-05, + "loss": 0.1022, + "step": 58740 + }, + { + "epoch": 16.52, + "learning_rate": 7.440727204573142e-05, + "loss": 0.1136, + "step": 58770 + }, + { + "epoch": 16.53, + "learning_rate": 7.43885296598257e-05, + "loss": 0.1034, + "step": 58800 + }, + { + "epoch": 16.54, + "learning_rate": 7.436978727391997e-05, + "loss": 0.1126, + "step": 58830 + }, + { + "epoch": 16.55, + "learning_rate": 7.435104488801424e-05, + "loss": 0.1137, + "step": 58860 + }, + { + "epoch": 16.56, + "learning_rate": 7.433230250210852e-05, + "loss": 0.102, + "step": 58890 + }, + { + "epoch": 16.56, + "learning_rate": 7.43135601162028e-05, + "loss": 0.1154, + "step": 58920 + }, + { + "epoch": 16.57, + "learning_rate": 7.429481773029707e-05, + "loss": 0.098, + "step": 58950 + }, + { + "epoch": 16.58, + "learning_rate": 7.427607534439135e-05, + "loss": 0.1214, + "step": 58980 + }, + { + "epoch": 16.59, + "learning_rate": 7.425733295848562e-05, + "loss": 0.1157, + "step": 59010 + }, + { + "epoch": 16.6, + "learning_rate": 7.42385905725799e-05, + "loss": 0.1017, + "step": 59040 + }, + { + "epoch": 16.61, + "learning_rate": 7.421984818667416e-05, + "loss": 0.1129, + "step": 59070 + }, + { + "epoch": 16.62, + "learning_rate": 7.420110580076845e-05, + "loss": 0.1024, + "step": 59100 + }, + { + "epoch": 16.62, + "learning_rate": 7.418236341486273e-05, + "loss": 0.1134, + "step": 59130 + }, + { + "epoch": 16.63, + "learning_rate": 7.416362102895698e-05, + "loss": 0.1085, + "step": 59160 + }, + { + "epoch": 16.64, + "learning_rate": 7.414487864305126e-05, + "loss": 0.1083, + "step": 59190 + }, + { + "epoch": 16.65, + "learning_rate": 7.412613625714554e-05, + "loss": 0.1192, + "step": 59220 + }, + { + "epoch": 16.66, + "learning_rate": 7.410739387123982e-05, + "loss": 0.1021, + "step": 59250 + }, + { + "epoch": 16.67, + "learning_rate": 7.408865148533408e-05, + "loss": 0.1139, + "step": 59280 + }, + { + "epoch": 16.67, + "learning_rate": 7.406990909942836e-05, + "loss": 0.1098, + "step": 59310 + }, + { + "epoch": 16.68, + "learning_rate": 7.405116671352264e-05, + "loss": 0.1042, + "step": 59340 + }, + { + "epoch": 16.69, + "learning_rate": 7.40324243276169e-05, + "loss": 0.1161, + "step": 59370 + }, + { + "epoch": 16.7, + "learning_rate": 7.401368194171119e-05, + "loss": 0.104, + "step": 59400 + }, + { + "epoch": 16.71, + "learning_rate": 7.399493955580545e-05, + "loss": 0.1136, + "step": 59430 + }, + { + "epoch": 16.72, + "learning_rate": 7.397619716989974e-05, + "loss": 0.1141, + "step": 59460 + }, + { + "epoch": 16.72, + "learning_rate": 7.3957454783994e-05, + "loss": 0.1043, + "step": 59490 + }, + { + "epoch": 16.73, + "learning_rate": 7.393871239808828e-05, + "loss": 0.1129, + "step": 59520 + }, + { + "epoch": 16.74, + "learning_rate": 7.391997001218255e-05, + "loss": 0.1023, + "step": 59550 + }, + { + "epoch": 16.75, + "learning_rate": 7.390185237247369e-05, + "loss": 0.1085, + "step": 59580 + }, + { + "epoch": 16.76, + "learning_rate": 7.388310998656796e-05, + "loss": 0.1074, + "step": 59610 + }, + { + "epoch": 16.77, + "learning_rate": 7.386436760066223e-05, + "loss": 0.1013, + "step": 59640 + }, + { + "epoch": 16.78, + "learning_rate": 7.384562521475651e-05, + "loss": 0.1198, + "step": 59670 + }, + { + "epoch": 16.78, + "learning_rate": 7.382688282885079e-05, + "loss": 0.0998, + "step": 59700 + }, + { + "epoch": 16.79, + "learning_rate": 7.380814044294506e-05, + "loss": 0.1151, + "step": 59730 + }, + { + "epoch": 16.8, + "learning_rate": 7.378939805703932e-05, + "loss": 0.11, + "step": 59760 + }, + { + "epoch": 16.81, + "learning_rate": 7.37706556711336e-05, + "loss": 0.1066, + "step": 59790 + }, + { + "epoch": 16.82, + "learning_rate": 7.375191328522789e-05, + "loss": 0.1179, + "step": 59820 + }, + { + "epoch": 16.83, + "learning_rate": 7.373317089932215e-05, + "loss": 0.0971, + "step": 59850 + }, + { + "epoch": 16.83, + "learning_rate": 7.371442851341643e-05, + "loss": 0.1134, + "step": 59880 + }, + { + "epoch": 16.84, + "learning_rate": 7.36956861275107e-05, + "loss": 0.1158, + "step": 59910 + }, + { + "epoch": 16.85, + "learning_rate": 7.367694374160497e-05, + "loss": 0.1018, + "step": 59940 + }, + { + "epoch": 16.86, + "learning_rate": 7.365820135569925e-05, + "loss": 0.1129, + "step": 59970 + }, + { + "epoch": 16.87, + "learning_rate": 7.363945896979353e-05, + "loss": 0.1013, + "step": 60000 + }, + { + "epoch": 16.88, + "learning_rate": 7.36207165838878e-05, + "loss": 0.1144, + "step": 60030 + }, + { + "epoch": 16.88, + "learning_rate": 7.360197419798207e-05, + "loss": 0.1108, + "step": 60060 + }, + { + "epoch": 16.89, + "learning_rate": 7.358323181207635e-05, + "loss": 0.1038, + "step": 60090 + }, + { + "epoch": 16.9, + "learning_rate": 7.356448942617063e-05, + "loss": 0.1161, + "step": 60120 + }, + { + "epoch": 16.91, + "learning_rate": 7.35457470402649e-05, + "loss": 0.1002, + "step": 60150 + }, + { + "epoch": 16.92, + "learning_rate": 7.352700465435916e-05, + "loss": 0.1178, + "step": 60180 + }, + { + "epoch": 16.93, + "learning_rate": 7.350826226845344e-05, + "loss": 0.1102, + "step": 60210 + }, + { + "epoch": 16.94, + "learning_rate": 7.348951988254772e-05, + "loss": 0.1, + "step": 60240 + }, + { + "epoch": 16.94, + "learning_rate": 7.347077749664199e-05, + "loss": 0.1173, + "step": 60270 + }, + { + "epoch": 16.95, + "learning_rate": 7.345203511073626e-05, + "loss": 0.1006, + "step": 60300 + }, + { + "epoch": 16.96, + "learning_rate": 7.343329272483054e-05, + "loss": 0.107, + "step": 60330 + }, + { + "epoch": 16.97, + "learning_rate": 7.341455033892482e-05, + "loss": 0.1133, + "step": 60360 + }, + { + "epoch": 16.98, + "learning_rate": 7.339580795301909e-05, + "loss": 0.1079, + "step": 60390 + }, + { + "epoch": 16.99, + "learning_rate": 7.337706556711337e-05, + "loss": 0.1203, + "step": 60420 + }, + { + "epoch": 16.99, + "learning_rate": 7.335832318120764e-05, + "loss": 0.1002, + "step": 60450 + }, + { + "epoch": 17.0, + "eval_loss": 0.18275776505470276, + "eval_runtime": 488.8565, + "eval_samples_per_second": 32.797, + "eval_steps_per_second": 1.027, + "eval_wer": 0.16040697118993352, + "step": 60469 + }, + { + "epoch": 17.0, + "learning_rate": 7.33395807953019e-05, + "loss": 0.1185, + "step": 60480 + }, + { + "epoch": 17.01, + "learning_rate": 7.332083840939619e-05, + "loss": 0.1053, + "step": 60510 + }, + { + "epoch": 17.02, + "learning_rate": 7.330209602349047e-05, + "loss": 0.1076, + "step": 60540 + }, + { + "epoch": 17.03, + "learning_rate": 7.328335363758473e-05, + "loss": 0.1197, + "step": 60570 + }, + { + "epoch": 17.04, + "learning_rate": 7.3264611251679e-05, + "loss": 0.0961, + "step": 60600 + }, + { + "epoch": 17.05, + "learning_rate": 7.324586886577328e-05, + "loss": 0.1129, + "step": 60630 + }, + { + "epoch": 17.05, + "learning_rate": 7.322712647986756e-05, + "loss": 0.1, + "step": 60660 + }, + { + "epoch": 17.06, + "learning_rate": 7.320838409396183e-05, + "loss": 0.1019, + "step": 60690 + }, + { + "epoch": 17.07, + "learning_rate": 7.31896417080561e-05, + "loss": 0.1202, + "step": 60720 + }, + { + "epoch": 17.08, + "learning_rate": 7.317089932215038e-05, + "loss": 0.0919, + "step": 60750 + }, + { + "epoch": 17.09, + "learning_rate": 7.315215693624466e-05, + "loss": 0.1064, + "step": 60780 + }, + { + "epoch": 17.1, + "learning_rate": 7.313341455033893e-05, + "loss": 0.0991, + "step": 60810 + }, + { + "epoch": 17.1, + "learning_rate": 7.311467216443321e-05, + "loss": 0.1061, + "step": 60840 + }, + { + "epoch": 17.11, + "learning_rate": 7.309592977852748e-05, + "loss": 0.1117, + "step": 60870 + }, + { + "epoch": 17.12, + "learning_rate": 7.307718739262174e-05, + "loss": 0.0942, + "step": 60900 + }, + { + "epoch": 17.13, + "learning_rate": 7.305844500671602e-05, + "loss": 0.111, + "step": 60930 + }, + { + "epoch": 17.14, + "learning_rate": 7.30397026208103e-05, + "loss": 0.1044, + "step": 60960 + }, + { + "epoch": 17.15, + "learning_rate": 7.302096023490457e-05, + "loss": 0.1077, + "step": 60990 + }, + { + "epoch": 17.15, + "learning_rate": 7.300221784899884e-05, + "loss": 0.1103, + "step": 61020 + }, + { + "epoch": 17.16, + "learning_rate": 7.298347546309312e-05, + "loss": 0.094, + "step": 61050 + }, + { + "epoch": 17.17, + "learning_rate": 7.29647330771874e-05, + "loss": 0.1097, + "step": 61080 + }, + { + "epoch": 17.18, + "learning_rate": 7.294599069128167e-05, + "loss": 0.0986, + "step": 61110 + }, + { + "epoch": 17.19, + "learning_rate": 7.292724830537594e-05, + "loss": 0.1039, + "step": 61140 + }, + { + "epoch": 17.2, + "learning_rate": 7.290850591947022e-05, + "loss": 0.1066, + "step": 61170 + }, + { + "epoch": 17.21, + "learning_rate": 7.28897635335645e-05, + "loss": 0.0945, + "step": 61200 + }, + { + "epoch": 17.21, + "learning_rate": 7.287102114765877e-05, + "loss": 0.1213, + "step": 61230 + }, + { + "epoch": 17.22, + "learning_rate": 7.285227876175305e-05, + "loss": 0.1002, + "step": 61260 + }, + { + "epoch": 17.23, + "learning_rate": 7.283353637584731e-05, + "loss": 0.11, + "step": 61290 + }, + { + "epoch": 17.24, + "learning_rate": 7.281479398994158e-05, + "loss": 0.1133, + "step": 61320 + }, + { + "epoch": 17.25, + "learning_rate": 7.279605160403586e-05, + "loss": 0.0981, + "step": 61350 + }, + { + "epoch": 17.26, + "learning_rate": 7.277730921813014e-05, + "loss": 0.1163, + "step": 61380 + }, + { + "epoch": 17.26, + "learning_rate": 7.275856683222441e-05, + "loss": 0.0986, + "step": 61410 + }, + { + "epoch": 17.27, + "learning_rate": 7.273982444631868e-05, + "loss": 0.1054, + "step": 61440 + }, + { + "epoch": 17.28, + "learning_rate": 7.272108206041296e-05, + "loss": 0.1176, + "step": 61470 + }, + { + "epoch": 17.29, + "learning_rate": 7.270233967450724e-05, + "loss": 0.0973, + "step": 61500 + }, + { + "epoch": 17.3, + "learning_rate": 7.268359728860151e-05, + "loss": 0.1126, + "step": 61530 + }, + { + "epoch": 17.31, + "learning_rate": 7.266485490269578e-05, + "loss": 0.1053, + "step": 61560 + }, + { + "epoch": 17.32, + "learning_rate": 7.264611251679006e-05, + "loss": 0.1058, + "step": 61590 + }, + { + "epoch": 17.32, + "learning_rate": 7.262737013088434e-05, + "loss": 0.1189, + "step": 61620 + }, + { + "epoch": 17.33, + "learning_rate": 7.26086277449786e-05, + "loss": 0.0924, + "step": 61650 + }, + { + "epoch": 17.34, + "learning_rate": 7.258988535907289e-05, + "loss": 0.1132, + "step": 61680 + }, + { + "epoch": 17.35, + "learning_rate": 7.257114297316715e-05, + "loss": 0.1037, + "step": 61710 + }, + { + "epoch": 17.36, + "learning_rate": 7.255240058726142e-05, + "loss": 0.1031, + "step": 61740 + }, + { + "epoch": 17.37, + "learning_rate": 7.25336582013557e-05, + "loss": 0.1161, + "step": 61770 + }, + { + "epoch": 17.37, + "learning_rate": 7.251491581544998e-05, + "loss": 0.0959, + "step": 61800 + }, + { + "epoch": 17.38, + "learning_rate": 7.249617342954425e-05, + "loss": 0.111, + "step": 61830 + }, + { + "epoch": 17.39, + "learning_rate": 7.247743104363852e-05, + "loss": 0.1024, + "step": 61860 + }, + { + "epoch": 17.4, + "learning_rate": 7.24586886577328e-05, + "loss": 0.1058, + "step": 61890 + }, + { + "epoch": 17.41, + "learning_rate": 7.243994627182708e-05, + "loss": 0.1188, + "step": 61920 + }, + { + "epoch": 17.42, + "learning_rate": 7.242120388592135e-05, + "loss": 0.097, + "step": 61950 + }, + { + "epoch": 17.42, + "learning_rate": 7.240246150001561e-05, + "loss": 0.1079, + "step": 61980 + }, + { + "epoch": 17.43, + "learning_rate": 7.23837191141099e-05, + "loss": 0.0996, + "step": 62010 + }, + { + "epoch": 17.44, + "learning_rate": 7.236497672820418e-05, + "loss": 0.1152, + "step": 62040 + }, + { + "epoch": 17.45, + "learning_rate": 7.234623434229844e-05, + "loss": 0.1167, + "step": 62070 + }, + { + "epoch": 17.46, + "learning_rate": 7.232749195639272e-05, + "loss": 0.0957, + "step": 62100 + }, + { + "epoch": 17.47, + "learning_rate": 7.230874957048699e-05, + "loss": 0.1087, + "step": 62130 + }, + { + "epoch": 17.48, + "learning_rate": 7.229000718458126e-05, + "loss": 0.1013, + "step": 62160 + }, + { + "epoch": 17.48, + "learning_rate": 7.227126479867554e-05, + "loss": 0.1123, + "step": 62190 + }, + { + "epoch": 17.49, + "learning_rate": 7.225252241276982e-05, + "loss": 0.1183, + "step": 62220 + }, + { + "epoch": 17.5, + "learning_rate": 7.223378002686409e-05, + "loss": 0.0954, + "step": 62250 + }, + { + "epoch": 17.51, + "learning_rate": 7.221503764095836e-05, + "loss": 0.1181, + "step": 62280 + }, + { + "epoch": 17.52, + "learning_rate": 7.219629525505264e-05, + "loss": 0.1007, + "step": 62310 + }, + { + "epoch": 17.53, + "learning_rate": 7.217755286914692e-05, + "loss": 0.106, + "step": 62340 + }, + { + "epoch": 17.53, + "learning_rate": 7.215881048324119e-05, + "loss": 0.1131, + "step": 62370 + }, + { + "epoch": 17.54, + "learning_rate": 7.214006809733545e-05, + "loss": 0.0923, + "step": 62400 + }, + { + "epoch": 17.55, + "learning_rate": 7.21219504576266e-05, + "loss": 0.1169, + "step": 62430 + }, + { + "epoch": 17.56, + "learning_rate": 7.210320807172086e-05, + "loss": 0.1009, + "step": 62460 + }, + { + "epoch": 17.57, + "learning_rate": 7.208446568581514e-05, + "loss": 0.1042, + "step": 62490 + }, + { + "epoch": 17.58, + "learning_rate": 7.206572329990941e-05, + "loss": 0.1077, + "step": 62520 + }, + { + "epoch": 17.58, + "learning_rate": 7.204698091400369e-05, + "loss": 0.0955, + "step": 62550 + }, + { + "epoch": 17.59, + "learning_rate": 7.202823852809797e-05, + "loss": 0.1196, + "step": 62580 + }, + { + "epoch": 17.6, + "learning_rate": 7.200949614219224e-05, + "loss": 0.1006, + "step": 62610 + }, + { + "epoch": 17.61, + "learning_rate": 7.19907537562865e-05, + "loss": 0.1077, + "step": 62640 + }, + { + "epoch": 17.62, + "learning_rate": 7.197201137038079e-05, + "loss": 0.1178, + "step": 62670 + }, + { + "epoch": 17.63, + "learning_rate": 7.195326898447507e-05, + "loss": 0.0981, + "step": 62700 + }, + { + "epoch": 17.64, + "learning_rate": 7.193452659856934e-05, + "loss": 0.1185, + "step": 62730 + }, + { + "epoch": 17.64, + "learning_rate": 7.19157842126636e-05, + "loss": 0.1058, + "step": 62760 + }, + { + "epoch": 17.65, + "learning_rate": 7.189704182675788e-05, + "loss": 0.1062, + "step": 62790 + }, + { + "epoch": 17.66, + "learning_rate": 7.187829944085216e-05, + "loss": 0.1159, + "step": 62820 + }, + { + "epoch": 17.67, + "learning_rate": 7.185955705494643e-05, + "loss": 0.0978, + "step": 62850 + }, + { + "epoch": 17.68, + "learning_rate": 7.18408146690407e-05, + "loss": 0.1161, + "step": 62880 + }, + { + "epoch": 17.69, + "learning_rate": 7.182207228313498e-05, + "loss": 0.104, + "step": 62910 + }, + { + "epoch": 17.69, + "learning_rate": 7.180332989722925e-05, + "loss": 0.1077, + "step": 62940 + }, + { + "epoch": 17.7, + "learning_rate": 7.178458751132353e-05, + "loss": 0.1148, + "step": 62970 + }, + { + "epoch": 17.71, + "learning_rate": 7.176584512541781e-05, + "loss": 0.1019, + "step": 63000 + }, + { + "epoch": 17.72, + "learning_rate": 7.174710273951208e-05, + "loss": 0.1124, + "step": 63030 + }, + { + "epoch": 17.73, + "learning_rate": 7.172836035360634e-05, + "loss": 0.102, + "step": 63060 + }, + { + "epoch": 17.74, + "learning_rate": 7.170961796770063e-05, + "loss": 0.1031, + "step": 63090 + }, + { + "epoch": 17.75, + "learning_rate": 7.169087558179491e-05, + "loss": 0.1219, + "step": 63120 + }, + { + "epoch": 17.75, + "learning_rate": 7.167213319588917e-05, + "loss": 0.096, + "step": 63150 + }, + { + "epoch": 17.76, + "learning_rate": 7.165339080998344e-05, + "loss": 0.1223, + "step": 63180 + }, + { + "epoch": 17.77, + "learning_rate": 7.163464842407772e-05, + "loss": 0.1004, + "step": 63210 + }, + { + "epoch": 17.78, + "learning_rate": 7.1615906038172e-05, + "loss": 0.1006, + "step": 63240 + }, + { + "epoch": 17.79, + "learning_rate": 7.159716365226627e-05, + "loss": 0.1104, + "step": 63270 + }, + { + "epoch": 17.8, + "learning_rate": 7.157842126636054e-05, + "loss": 0.0967, + "step": 63300 + }, + { + "epoch": 17.8, + "learning_rate": 7.155967888045482e-05, + "loss": 0.1117, + "step": 63330 + }, + { + "epoch": 17.81, + "learning_rate": 7.154093649454909e-05, + "loss": 0.1049, + "step": 63360 + }, + { + "epoch": 17.82, + "learning_rate": 7.152219410864337e-05, + "loss": 0.1011, + "step": 63390 + }, + { + "epoch": 17.83, + "learning_rate": 7.150345172273765e-05, + "loss": 0.1216, + "step": 63420 + }, + { + "epoch": 17.84, + "learning_rate": 7.148470933683192e-05, + "loss": 0.0968, + "step": 63450 + }, + { + "epoch": 17.85, + "learning_rate": 7.146596695092618e-05, + "loss": 0.1151, + "step": 63480 + }, + { + "epoch": 17.85, + "learning_rate": 7.144722456502046e-05, + "loss": 0.1018, + "step": 63510 + }, + { + "epoch": 17.86, + "learning_rate": 7.142848217911475e-05, + "loss": 0.1079, + "step": 63540 + }, + { + "epoch": 17.87, + "learning_rate": 7.140973979320901e-05, + "loss": 0.1129, + "step": 63570 + }, + { + "epoch": 17.88, + "learning_rate": 7.139099740730328e-05, + "loss": 0.0953, + "step": 63600 + }, + { + "epoch": 17.89, + "learning_rate": 7.137225502139756e-05, + "loss": 0.1147, + "step": 63630 + }, + { + "epoch": 17.9, + "learning_rate": 7.135351263549184e-05, + "loss": 0.1023, + "step": 63660 + }, + { + "epoch": 17.91, + "learning_rate": 7.133477024958611e-05, + "loss": 0.106, + "step": 63690 + }, + { + "epoch": 17.91, + "learning_rate": 7.131602786368038e-05, + "loss": 0.1124, + "step": 63720 + }, + { + "epoch": 17.92, + "learning_rate": 7.129728547777466e-05, + "loss": 0.1036, + "step": 63750 + }, + { + "epoch": 17.93, + "learning_rate": 7.127854309186894e-05, + "loss": 0.1174, + "step": 63780 + }, + { + "epoch": 17.94, + "learning_rate": 7.12598007059632e-05, + "loss": 0.1006, + "step": 63810 + }, + { + "epoch": 17.95, + "learning_rate": 7.124105832005749e-05, + "loss": 0.1088, + "step": 63840 + }, + { + "epoch": 17.96, + "learning_rate": 7.122231593415175e-05, + "loss": 0.1132, + "step": 63870 + }, + { + "epoch": 17.96, + "learning_rate": 7.120357354824602e-05, + "loss": 0.0997, + "step": 63900 + }, + { + "epoch": 17.97, + "learning_rate": 7.11848311623403e-05, + "loss": 0.1125, + "step": 63930 + }, + { + "epoch": 17.98, + "learning_rate": 7.116608877643458e-05, + "loss": 0.0998, + "step": 63960 + }, + { + "epoch": 17.99, + "learning_rate": 7.114734639052885e-05, + "loss": 0.1046, + "step": 63990 + }, + { + "epoch": 18.0, + "learning_rate": 7.112860400462312e-05, + "loss": 0.118, + "step": 64020 + }, + { + "epoch": 18.0, + "eval_loss": 0.18319498002529144, + "eval_runtime": 490.7803, + "eval_samples_per_second": 32.668, + "eval_steps_per_second": 1.023, + "eval_wer": 0.15797769983486415, + "step": 64026 + }, + { + "epoch": 18.01, + "learning_rate": 7.11098616187174e-05, + "loss": 0.0957, + "step": 64050 + }, + { + "epoch": 18.02, + "learning_rate": 7.109111923281168e-05, + "loss": 0.1128, + "step": 64080 + }, + { + "epoch": 18.02, + "learning_rate": 7.107237684690595e-05, + "loss": 0.0958, + "step": 64110 + }, + { + "epoch": 18.03, + "learning_rate": 7.105363446100022e-05, + "loss": 0.1036, + "step": 64140 + }, + { + "epoch": 18.04, + "learning_rate": 7.10348920750945e-05, + "loss": 0.0984, + "step": 64170 + }, + { + "epoch": 18.05, + "learning_rate": 7.101614968918878e-05, + "loss": 0.0978, + "step": 64200 + }, + { + "epoch": 18.06, + "learning_rate": 7.099740730328305e-05, + "loss": 0.1047, + "step": 64230 + }, + { + "epoch": 18.07, + "learning_rate": 7.097866491737733e-05, + "loss": 0.0965, + "step": 64260 + }, + { + "epoch": 18.07, + "learning_rate": 7.09599225314716e-05, + "loss": 0.1093, + "step": 64290 + }, + { + "epoch": 18.08, + "learning_rate": 7.094118014556586e-05, + "loss": 0.0999, + "step": 64320 + }, + { + "epoch": 18.09, + "learning_rate": 7.092243775966014e-05, + "loss": 0.1039, + "step": 64350 + }, + { + "epoch": 18.1, + "learning_rate": 7.090369537375442e-05, + "loss": 0.113, + "step": 64380 + }, + { + "epoch": 18.11, + "learning_rate": 7.088495298784869e-05, + "loss": 0.0963, + "step": 64410 + }, + { + "epoch": 18.12, + "learning_rate": 7.086621060194296e-05, + "loss": 0.1074, + "step": 64440 + }, + { + "epoch": 18.12, + "learning_rate": 7.084746821603724e-05, + "loss": 0.1056, + "step": 64470 + }, + { + "epoch": 18.13, + "learning_rate": 7.082872583013152e-05, + "loss": 0.1032, + "step": 64500 + }, + { + "epoch": 18.14, + "learning_rate": 7.080998344422579e-05, + "loss": 0.113, + "step": 64530 + }, + { + "epoch": 18.15, + "learning_rate": 7.079124105832005e-05, + "loss": 0.092, + "step": 64560 + }, + { + "epoch": 18.16, + "learning_rate": 7.077249867241434e-05, + "loss": 0.1066, + "step": 64590 + }, + { + "epoch": 18.17, + "learning_rate": 7.075375628650862e-05, + "loss": 0.0995, + "step": 64620 + }, + { + "epoch": 18.18, + "learning_rate": 7.073501390060288e-05, + "loss": 0.106, + "step": 64650 + }, + { + "epoch": 18.18, + "learning_rate": 7.071627151469715e-05, + "loss": 0.1113, + "step": 64680 + }, + { + "epoch": 18.19, + "learning_rate": 7.069752912879143e-05, + "loss": 0.0944, + "step": 64710 + }, + { + "epoch": 18.2, + "learning_rate": 7.06787867428857e-05, + "loss": 0.1118, + "step": 64740 + }, + { + "epoch": 18.21, + "learning_rate": 7.066004435697998e-05, + "loss": 0.1007, + "step": 64770 + }, + { + "epoch": 18.22, + "learning_rate": 7.064130197107426e-05, + "loss": 0.0998, + "step": 64800 + }, + { + "epoch": 18.23, + "learning_rate": 7.062255958516853e-05, + "loss": 0.1093, + "step": 64830 + }, + { + "epoch": 18.23, + "learning_rate": 7.06038171992628e-05, + "loss": 0.095, + "step": 64860 + }, + { + "epoch": 18.24, + "learning_rate": 7.058507481335708e-05, + "loss": 0.1087, + "step": 64890 + }, + { + "epoch": 18.25, + "learning_rate": 7.056633242745136e-05, + "loss": 0.101, + "step": 64920 + }, + { + "epoch": 18.26, + "learning_rate": 7.054759004154563e-05, + "loss": 0.1046, + "step": 64950 + }, + { + "epoch": 18.27, + "learning_rate": 7.052884765563989e-05, + "loss": 0.1116, + "step": 64980 + }, + { + "epoch": 18.28, + "learning_rate": 7.051010526973417e-05, + "loss": 0.0912, + "step": 65010 + }, + { + "epoch": 18.29, + "learning_rate": 7.049136288382845e-05, + "loss": 0.1096, + "step": 65040 + }, + { + "epoch": 18.29, + "learning_rate": 7.047262049792272e-05, + "loss": 0.1093, + "step": 65070 + }, + { + "epoch": 18.3, + "learning_rate": 7.045387811201699e-05, + "loss": 0.0976, + "step": 65100 + }, + { + "epoch": 18.31, + "learning_rate": 7.043513572611127e-05, + "loss": 0.1079, + "step": 65130 + }, + { + "epoch": 18.32, + "learning_rate": 7.041639334020554e-05, + "loss": 0.0989, + "step": 65160 + }, + { + "epoch": 18.33, + "learning_rate": 7.039765095429982e-05, + "loss": 0.1051, + "step": 65190 + }, + { + "epoch": 18.34, + "learning_rate": 7.03789085683941e-05, + "loss": 0.1016, + "step": 65220 + }, + { + "epoch": 18.34, + "learning_rate": 7.036016618248837e-05, + "loss": 0.1046, + "step": 65250 + }, + { + "epoch": 18.35, + "learning_rate": 7.034142379658263e-05, + "loss": 0.11, + "step": 65280 + }, + { + "epoch": 18.36, + "learning_rate": 7.032268141067692e-05, + "loss": 0.0949, + "step": 65310 + }, + { + "epoch": 18.37, + "learning_rate": 7.03039390247712e-05, + "loss": 0.1015, + "step": 65340 + }, + { + "epoch": 18.38, + "learning_rate": 7.028519663886546e-05, + "loss": 0.0995, + "step": 65370 + }, + { + "epoch": 18.39, + "learning_rate": 7.026645425295973e-05, + "loss": 0.1011, + "step": 65400 + }, + { + "epoch": 18.39, + "learning_rate": 7.024771186705401e-05, + "loss": 0.1081, + "step": 65430 + }, + { + "epoch": 18.4, + "learning_rate": 7.02289694811483e-05, + "loss": 0.0955, + "step": 65460 + }, + { + "epoch": 18.41, + "learning_rate": 7.021022709524256e-05, + "loss": 0.1054, + "step": 65490 + }, + { + "epoch": 18.42, + "learning_rate": 7.019148470933683e-05, + "loss": 0.0987, + "step": 65520 + }, + { + "epoch": 18.43, + "learning_rate": 7.017274232343111e-05, + "loss": 0.1082, + "step": 65550 + }, + { + "epoch": 18.44, + "learning_rate": 7.015399993752538e-05, + "loss": 0.116, + "step": 65580 + }, + { + "epoch": 18.45, + "learning_rate": 7.013525755161966e-05, + "loss": 0.0965, + "step": 65610 + }, + { + "epoch": 18.45, + "learning_rate": 7.011651516571394e-05, + "loss": 0.1075, + "step": 65640 + }, + { + "epoch": 18.46, + "learning_rate": 7.00977727798082e-05, + "loss": 0.0992, + "step": 65670 + }, + { + "epoch": 18.47, + "learning_rate": 7.007903039390247e-05, + "loss": 0.1035, + "step": 65700 + }, + { + "epoch": 18.48, + "learning_rate": 7.006028800799675e-05, + "loss": 0.1175, + "step": 65730 + }, + { + "epoch": 18.49, + "learning_rate": 7.004154562209104e-05, + "loss": 0.1027, + "step": 65760 + }, + { + "epoch": 18.5, + "learning_rate": 7.00228032361853e-05, + "loss": 0.1049, + "step": 65790 + }, + { + "epoch": 18.5, + "learning_rate": 7.000406085027957e-05, + "loss": 0.096, + "step": 65820 + }, + { + "epoch": 18.51, + "learning_rate": 6.998531846437385e-05, + "loss": 0.0972, + "step": 65850 + }, + { + "epoch": 18.52, + "learning_rate": 6.996657607846813e-05, + "loss": 0.1071, + "step": 65880 + }, + { + "epoch": 18.53, + "learning_rate": 6.99478336925624e-05, + "loss": 0.0942, + "step": 65910 + }, + { + "epoch": 18.54, + "learning_rate": 6.992909130665667e-05, + "loss": 0.1089, + "step": 65940 + }, + { + "epoch": 18.55, + "learning_rate": 6.991034892075095e-05, + "loss": 0.0967, + "step": 65970 + }, + { + "epoch": 18.55, + "learning_rate": 6.989160653484522e-05, + "loss": 0.1021, + "step": 66000 + }, + { + "epoch": 18.56, + "learning_rate": 6.98728641489395e-05, + "loss": 0.1093, + "step": 66030 + }, + { + "epoch": 18.57, + "learning_rate": 6.985412176303378e-05, + "loss": 0.0913, + "step": 66060 + }, + { + "epoch": 18.58, + "learning_rate": 6.983537937712804e-05, + "loss": 0.1137, + "step": 66090 + }, + { + "epoch": 18.59, + "learning_rate": 6.981663699122231e-05, + "loss": 0.0984, + "step": 66120 + }, + { + "epoch": 18.6, + "learning_rate": 6.97978946053166e-05, + "loss": 0.1054, + "step": 66150 + }, + { + "epoch": 18.61, + "learning_rate": 6.977915221941087e-05, + "loss": 0.1143, + "step": 66180 + }, + { + "epoch": 18.61, + "learning_rate": 6.976040983350514e-05, + "loss": 0.09, + "step": 66210 + }, + { + "epoch": 18.62, + "learning_rate": 6.974166744759941e-05, + "loss": 0.1103, + "step": 66240 + }, + { + "epoch": 18.63, + "learning_rate": 6.972292506169369e-05, + "loss": 0.0995, + "step": 66270 + }, + { + "epoch": 18.64, + "learning_rate": 6.970418267578797e-05, + "loss": 0.1061, + "step": 66300 + }, + { + "epoch": 18.65, + "learning_rate": 6.968544028988224e-05, + "loss": 0.1125, + "step": 66330 + }, + { + "epoch": 18.66, + "learning_rate": 6.96666979039765e-05, + "loss": 0.0972, + "step": 66360 + }, + { + "epoch": 18.66, + "learning_rate": 6.964795551807079e-05, + "loss": 0.1121, + "step": 66390 + }, + { + "epoch": 18.67, + "learning_rate": 6.962921313216505e-05, + "loss": 0.1064, + "step": 66420 + }, + { + "epoch": 18.68, + "learning_rate": 6.961047074625934e-05, + "loss": 0.1025, + "step": 66450 + }, + { + "epoch": 18.69, + "learning_rate": 6.959172836035362e-05, + "loss": 0.1122, + "step": 66480 + }, + { + "epoch": 18.7, + "learning_rate": 6.957298597444788e-05, + "loss": 0.0927, + "step": 66510 + }, + { + "epoch": 18.71, + "learning_rate": 6.955424358854215e-05, + "loss": 0.1043, + "step": 66540 + }, + { + "epoch": 18.72, + "learning_rate": 6.953550120263643e-05, + "loss": 0.1014, + "step": 66570 + }, + { + "epoch": 18.72, + "learning_rate": 6.951675881673071e-05, + "loss": 0.1046, + "step": 66600 + }, + { + "epoch": 18.73, + "learning_rate": 6.949801643082498e-05, + "loss": 0.1095, + "step": 66630 + }, + { + "epoch": 18.74, + "learning_rate": 6.947927404491925e-05, + "loss": 0.0927, + "step": 66660 + }, + { + "epoch": 18.75, + "learning_rate": 6.946053165901353e-05, + "loss": 0.1151, + "step": 66690 + }, + { + "epoch": 18.76, + "learning_rate": 6.944178927310781e-05, + "loss": 0.0999, + "step": 66720 + }, + { + "epoch": 18.77, + "learning_rate": 6.942304688720208e-05, + "loss": 0.1028, + "step": 66750 + }, + { + "epoch": 18.77, + "learning_rate": 6.940430450129634e-05, + "loss": 0.1076, + "step": 66780 + }, + { + "epoch": 18.78, + "learning_rate": 6.938556211539063e-05, + "loss": 0.0961, + "step": 66810 + }, + { + "epoch": 18.79, + "learning_rate": 6.93668197294849e-05, + "loss": 0.1088, + "step": 66840 + }, + { + "epoch": 18.8, + "learning_rate": 6.934807734357917e-05, + "loss": 0.1009, + "step": 66870 + }, + { + "epoch": 18.81, + "learning_rate": 6.932933495767345e-05, + "loss": 0.0993, + "step": 66900 + }, + { + "epoch": 18.82, + "learning_rate": 6.931059257176772e-05, + "loss": 0.1104, + "step": 66930 + }, + { + "epoch": 18.82, + "learning_rate": 6.929185018586199e-05, + "loss": 0.093, + "step": 66960 + }, + { + "epoch": 18.83, + "learning_rate": 6.927310779995627e-05, + "loss": 0.1068, + "step": 66990 + }, + { + "epoch": 18.84, + "learning_rate": 6.925436541405055e-05, + "loss": 0.1026, + "step": 67020 + }, + { + "epoch": 18.85, + "learning_rate": 6.923562302814482e-05, + "loss": 0.1081, + "step": 67050 + }, + { + "epoch": 18.86, + "learning_rate": 6.921688064223909e-05, + "loss": 0.1129, + "step": 67080 + }, + { + "epoch": 18.87, + "learning_rate": 6.919813825633337e-05, + "loss": 0.0944, + "step": 67110 + }, + { + "epoch": 18.88, + "learning_rate": 6.917939587042765e-05, + "loss": 0.1052, + "step": 67140 + }, + { + "epoch": 18.88, + "learning_rate": 6.916065348452192e-05, + "loss": 0.1053, + "step": 67170 + }, + { + "epoch": 18.89, + "learning_rate": 6.914191109861618e-05, + "loss": 0.0995, + "step": 67200 + }, + { + "epoch": 18.9, + "learning_rate": 6.912316871271046e-05, + "loss": 0.1094, + "step": 67230 + }, + { + "epoch": 18.91, + "learning_rate": 6.910442632680475e-05, + "loss": 0.0939, + "step": 67260 + }, + { + "epoch": 18.92, + "learning_rate": 6.908568394089901e-05, + "loss": 0.1072, + "step": 67290 + }, + { + "epoch": 18.93, + "learning_rate": 6.90669415549933e-05, + "loss": 0.1008, + "step": 67320 + }, + { + "epoch": 18.93, + "learning_rate": 6.904819916908756e-05, + "loss": 0.0974, + "step": 67350 + }, + { + "epoch": 18.94, + "learning_rate": 6.902945678318183e-05, + "loss": 0.1133, + "step": 67380 + }, + { + "epoch": 18.95, + "learning_rate": 6.901071439727611e-05, + "loss": 0.0942, + "step": 67410 + }, + { + "epoch": 18.96, + "learning_rate": 6.899197201137039e-05, + "loss": 0.1098, + "step": 67440 + }, + { + "epoch": 18.97, + "learning_rate": 6.897322962546466e-05, + "loss": 0.1027, + "step": 67470 + }, + { + "epoch": 18.98, + "learning_rate": 6.895448723955893e-05, + "loss": 0.0993, + "step": 67500 + }, + { + "epoch": 18.98, + "learning_rate": 6.89357448536532e-05, + "loss": 0.1138, + "step": 67530 + }, + { + "epoch": 18.99, + "learning_rate": 6.891700246774749e-05, + "loss": 0.0974, + "step": 67560 + }, + { + "epoch": 19.0, + "eval_loss": 0.1771358996629715, + "eval_runtime": 488.1062, + "eval_samples_per_second": 32.847, + "eval_steps_per_second": 1.028, + "eval_wer": 0.15545289533661785, + "step": 67583 + }, + { + "epoch": 19.0, + "learning_rate": 6.889826008184175e-05, + "loss": 0.1123, + "step": 67590 + }, + { + "epoch": 19.01, + "learning_rate": 6.887951769593602e-05, + "loss": 0.0894, + "step": 67620 + }, + { + "epoch": 19.02, + "learning_rate": 6.886140005622716e-05, + "loss": 0.0998, + "step": 67650 + }, + { + "epoch": 19.03, + "learning_rate": 6.884265767032143e-05, + "loss": 0.0999, + "step": 67680 + }, + { + "epoch": 19.04, + "learning_rate": 6.882391528441571e-05, + "loss": 0.093, + "step": 67710 + }, + { + "epoch": 19.04, + "learning_rate": 6.880517289850998e-05, + "loss": 0.111, + "step": 67740 + }, + { + "epoch": 19.05, + "learning_rate": 6.878643051260426e-05, + "loss": 0.0922, + "step": 67770 + }, + { + "epoch": 19.06, + "learning_rate": 6.876768812669854e-05, + "loss": 0.1035, + "step": 67800 + }, + { + "epoch": 19.07, + "learning_rate": 6.874894574079281e-05, + "loss": 0.1017, + "step": 67830 + }, + { + "epoch": 19.08, + "learning_rate": 6.873020335488708e-05, + "loss": 0.0932, + "step": 67860 + }, + { + "epoch": 19.09, + "learning_rate": 6.871146096898136e-05, + "loss": 0.1098, + "step": 67890 + }, + { + "epoch": 19.09, + "learning_rate": 6.869271858307564e-05, + "loss": 0.0905, + "step": 67920 + }, + { + "epoch": 19.1, + "learning_rate": 6.867460094336676e-05, + "loss": 0.1092, + "step": 67950 + }, + { + "epoch": 19.11, + "learning_rate": 6.865585855746105e-05, + "loss": 0.108, + "step": 67980 + }, + { + "epoch": 19.12, + "learning_rate": 6.86371161715553e-05, + "loss": 0.0963, + "step": 68010 + }, + { + "epoch": 19.13, + "learning_rate": 6.861837378564958e-05, + "loss": 0.105, + "step": 68040 + }, + { + "epoch": 19.14, + "learning_rate": 6.859963139974386e-05, + "loss": 0.0944, + "step": 68070 + }, + { + "epoch": 19.15, + "learning_rate": 6.858088901383813e-05, + "loss": 0.099, + "step": 68100 + }, + { + "epoch": 19.15, + "learning_rate": 6.856214662793241e-05, + "loss": 0.1086, + "step": 68130 + }, + { + "epoch": 19.16, + "learning_rate": 6.854340424202668e-05, + "loss": 0.0993, + "step": 68160 + }, + { + "epoch": 19.17, + "learning_rate": 6.852466185612096e-05, + "loss": 0.1077, + "step": 68190 + }, + { + "epoch": 19.18, + "learning_rate": 6.850591947021523e-05, + "loss": 0.0953, + "step": 68220 + }, + { + "epoch": 19.19, + "learning_rate": 6.84871770843095e-05, + "loss": 0.1038, + "step": 68250 + }, + { + "epoch": 19.2, + "learning_rate": 6.846843469840377e-05, + "loss": 0.1011, + "step": 68280 + }, + { + "epoch": 19.2, + "learning_rate": 6.844969231249806e-05, + "loss": 0.0969, + "step": 68310 + }, + { + "epoch": 19.21, + "learning_rate": 6.843094992659232e-05, + "loss": 0.1042, + "step": 68340 + }, + { + "epoch": 19.22, + "learning_rate": 6.84122075406866e-05, + "loss": 0.0889, + "step": 68370 + }, + { + "epoch": 19.23, + "learning_rate": 6.839346515478088e-05, + "loss": 0.1036, + "step": 68400 + }, + { + "epoch": 19.24, + "learning_rate": 6.837472276887514e-05, + "loss": 0.101, + "step": 68430 + }, + { + "epoch": 19.25, + "learning_rate": 6.835598038296942e-05, + "loss": 0.0987, + "step": 68460 + }, + { + "epoch": 19.25, + "learning_rate": 6.83372379970637e-05, + "loss": 0.106, + "step": 68490 + }, + { + "epoch": 19.26, + "learning_rate": 6.831849561115797e-05, + "loss": 0.0906, + "step": 68520 + }, + { + "epoch": 19.27, + "learning_rate": 6.829975322525225e-05, + "loss": 0.099, + "step": 68550 + }, + { + "epoch": 19.28, + "learning_rate": 6.828101083934652e-05, + "loss": 0.1017, + "step": 68580 + }, + { + "epoch": 19.29, + "learning_rate": 6.82622684534408e-05, + "loss": 0.102, + "step": 68610 + }, + { + "epoch": 19.3, + "learning_rate": 6.824352606753506e-05, + "loss": 0.1098, + "step": 68640 + }, + { + "epoch": 19.31, + "learning_rate": 6.822478368162935e-05, + "loss": 0.1002, + "step": 68670 + }, + { + "epoch": 19.31, + "learning_rate": 6.820604129572361e-05, + "loss": 0.1032, + "step": 68700 + }, + { + "epoch": 19.32, + "learning_rate": 6.81872989098179e-05, + "loss": 0.1009, + "step": 68730 + }, + { + "epoch": 19.33, + "learning_rate": 6.816855652391216e-05, + "loss": 0.094, + "step": 68760 + }, + { + "epoch": 19.34, + "learning_rate": 6.814981413800644e-05, + "loss": 0.1047, + "step": 68790 + }, + { + "epoch": 19.35, + "learning_rate": 6.813107175210072e-05, + "loss": 0.0919, + "step": 68820 + }, + { + "epoch": 19.36, + "learning_rate": 6.811232936619498e-05, + "loss": 0.1049, + "step": 68850 + }, + { + "epoch": 19.36, + "learning_rate": 6.809358698028926e-05, + "loss": 0.0989, + "step": 68880 + }, + { + "epoch": 19.37, + "learning_rate": 6.807484459438354e-05, + "loss": 0.0982, + "step": 68910 + }, + { + "epoch": 19.38, + "learning_rate": 6.80561022084778e-05, + "loss": 0.1088, + "step": 68940 + }, + { + "epoch": 19.39, + "learning_rate": 6.803735982257209e-05, + "loss": 0.0919, + "step": 68970 + }, + { + "epoch": 19.4, + "learning_rate": 6.801861743666635e-05, + "loss": 0.1043, + "step": 69000 + }, + { + "epoch": 19.41, + "learning_rate": 6.799987505076064e-05, + "loss": 0.1, + "step": 69030 + }, + { + "epoch": 19.42, + "learning_rate": 6.79811326648549e-05, + "loss": 0.0997, + "step": 69060 + }, + { + "epoch": 19.42, + "learning_rate": 6.796239027894918e-05, + "loss": 0.1081, + "step": 69090 + }, + { + "epoch": 19.43, + "learning_rate": 6.794364789304345e-05, + "loss": 0.0879, + "step": 69120 + }, + { + "epoch": 19.44, + "learning_rate": 6.792490550713773e-05, + "loss": 0.1077, + "step": 69150 + }, + { + "epoch": 19.45, + "learning_rate": 6.7906163121232e-05, + "loss": 0.1, + "step": 69180 + }, + { + "epoch": 19.46, + "learning_rate": 6.788742073532628e-05, + "loss": 0.0995, + "step": 69210 + }, + { + "epoch": 19.47, + "learning_rate": 6.786867834942056e-05, + "loss": 0.1106, + "step": 69240 + }, + { + "epoch": 19.47, + "learning_rate": 6.784993596351482e-05, + "loss": 0.0973, + "step": 69270 + }, + { + "epoch": 19.48, + "learning_rate": 6.78311935776091e-05, + "loss": 0.102, + "step": 69300 + }, + { + "epoch": 19.49, + "learning_rate": 6.781245119170338e-05, + "loss": 0.1005, + "step": 69330 + }, + { + "epoch": 19.5, + "learning_rate": 6.779370880579764e-05, + "loss": 0.0957, + "step": 69360 + }, + { + "epoch": 19.51, + "learning_rate": 6.777496641989193e-05, + "loss": 0.1084, + "step": 69390 + }, + { + "epoch": 19.52, + "learning_rate": 6.77562240339862e-05, + "loss": 0.0951, + "step": 69420 + }, + { + "epoch": 19.52, + "learning_rate": 6.773748164808047e-05, + "loss": 0.1102, + "step": 69450 + }, + { + "epoch": 19.53, + "learning_rate": 6.771873926217474e-05, + "loss": 0.1024, + "step": 69480 + }, + { + "epoch": 19.54, + "learning_rate": 6.769999687626902e-05, + "loss": 0.0908, + "step": 69510 + }, + { + "epoch": 19.55, + "learning_rate": 6.768125449036329e-05, + "loss": 0.1097, + "step": 69540 + }, + { + "epoch": 19.56, + "learning_rate": 6.766251210445757e-05, + "loss": 0.0884, + "step": 69570 + }, + { + "epoch": 19.57, + "learning_rate": 6.764376971855184e-05, + "loss": 0.1043, + "step": 69600 + }, + { + "epoch": 19.58, + "learning_rate": 6.762502733264612e-05, + "loss": 0.1006, + "step": 69630 + }, + { + "epoch": 19.58, + "learning_rate": 6.76062849467404e-05, + "loss": 0.0977, + "step": 69660 + }, + { + "epoch": 19.59, + "learning_rate": 6.758754256083465e-05, + "loss": 0.1091, + "step": 69690 + }, + { + "epoch": 19.6, + "learning_rate": 6.756880017492894e-05, + "loss": 0.0919, + "step": 69720 + }, + { + "epoch": 19.61, + "learning_rate": 6.755005778902322e-05, + "loss": 0.1035, + "step": 69750 + }, + { + "epoch": 19.62, + "learning_rate": 6.753131540311748e-05, + "loss": 0.0988, + "step": 69780 + }, + { + "epoch": 19.63, + "learning_rate": 6.751257301721175e-05, + "loss": 0.0976, + "step": 69810 + }, + { + "epoch": 19.63, + "learning_rate": 6.749383063130603e-05, + "loss": 0.1107, + "step": 69840 + }, + { + "epoch": 19.64, + "learning_rate": 6.747508824540031e-05, + "loss": 0.0914, + "step": 69870 + }, + { + "epoch": 19.65, + "learning_rate": 6.745634585949458e-05, + "loss": 0.103, + "step": 69900 + }, + { + "epoch": 19.66, + "learning_rate": 6.743760347358886e-05, + "loss": 0.1086, + "step": 69930 + }, + { + "epoch": 19.67, + "learning_rate": 6.741886108768313e-05, + "loss": 0.0938, + "step": 69960 + }, + { + "epoch": 19.68, + "learning_rate": 6.740011870177741e-05, + "loss": 0.1071, + "step": 69990 + }, + { + "epoch": 19.69, + "learning_rate": 6.738137631587168e-05, + "loss": 0.093, + "step": 70020 + }, + { + "epoch": 19.69, + "learning_rate": 6.736263392996596e-05, + "loss": 0.1046, + "step": 70050 + }, + { + "epoch": 19.7, + "learning_rate": 6.734389154406024e-05, + "loss": 0.1021, + "step": 70080 + }, + { + "epoch": 19.71, + "learning_rate": 6.732514915815449e-05, + "loss": 0.0982, + "step": 70110 + }, + { + "epoch": 19.72, + "learning_rate": 6.730640677224877e-05, + "loss": 0.1069, + "step": 70140 + }, + { + "epoch": 19.73, + "learning_rate": 6.728766438634305e-05, + "loss": 0.0912, + "step": 70170 + }, + { + "epoch": 19.74, + "learning_rate": 6.726892200043732e-05, + "loss": 0.1036, + "step": 70200 + }, + { + "epoch": 19.74, + "learning_rate": 6.725017961453159e-05, + "loss": 0.1075, + "step": 70230 + }, + { + "epoch": 19.75, + "learning_rate": 6.723143722862587e-05, + "loss": 0.0996, + "step": 70260 + }, + { + "epoch": 19.76, + "learning_rate": 6.721269484272015e-05, + "loss": 0.1122, + "step": 70290 + }, + { + "epoch": 19.77, + "learning_rate": 6.719395245681442e-05, + "loss": 0.0951, + "step": 70320 + }, + { + "epoch": 19.78, + "learning_rate": 6.71752100709087e-05, + "loss": 0.1156, + "step": 70350 + }, + { + "epoch": 19.79, + "learning_rate": 6.715646768500297e-05, + "loss": 0.1007, + "step": 70380 + }, + { + "epoch": 19.79, + "learning_rate": 6.713772529909725e-05, + "loss": 0.0958, + "step": 70410 + }, + { + "epoch": 19.8, + "learning_rate": 6.711898291319152e-05, + "loss": 0.1101, + "step": 70440 + }, + { + "epoch": 19.81, + "learning_rate": 6.71002405272858e-05, + "loss": 0.0887, + "step": 70470 + }, + { + "epoch": 19.82, + "learning_rate": 6.708149814138008e-05, + "loss": 0.1066, + "step": 70500 + }, + { + "epoch": 19.83, + "learning_rate": 6.706275575547433e-05, + "loss": 0.0971, + "step": 70530 + }, + { + "epoch": 19.84, + "learning_rate": 6.704401336956861e-05, + "loss": 0.0976, + "step": 70560 + }, + { + "epoch": 19.85, + "learning_rate": 6.70252709836629e-05, + "loss": 0.1099, + "step": 70590 + }, + { + "epoch": 19.85, + "learning_rate": 6.700652859775717e-05, + "loss": 0.091, + "step": 70620 + }, + { + "epoch": 19.86, + "learning_rate": 6.698778621185143e-05, + "loss": 0.1028, + "step": 70650 + }, + { + "epoch": 19.87, + "learning_rate": 6.696904382594571e-05, + "loss": 0.0995, + "step": 70680 + }, + { + "epoch": 19.88, + "learning_rate": 6.695030144003999e-05, + "loss": 0.0949, + "step": 70710 + }, + { + "epoch": 19.89, + "learning_rate": 6.693155905413426e-05, + "loss": 0.1015, + "step": 70740 + }, + { + "epoch": 19.9, + "learning_rate": 6.691281666822854e-05, + "loss": 0.0958, + "step": 70770 + }, + { + "epoch": 19.9, + "learning_rate": 6.68940742823228e-05, + "loss": 0.107, + "step": 70800 + }, + { + "epoch": 19.91, + "learning_rate": 6.687533189641709e-05, + "loss": 0.1014, + "step": 70830 + }, + { + "epoch": 19.92, + "learning_rate": 6.685658951051135e-05, + "loss": 0.0955, + "step": 70860 + }, + { + "epoch": 19.93, + "learning_rate": 6.683784712460564e-05, + "loss": 0.1046, + "step": 70890 + }, + { + "epoch": 19.94, + "learning_rate": 6.681910473869992e-05, + "loss": 0.0939, + "step": 70920 + }, + { + "epoch": 19.95, + "learning_rate": 6.680036235279417e-05, + "loss": 0.1079, + "step": 70950 + }, + { + "epoch": 19.95, + "learning_rate": 6.678161996688845e-05, + "loss": 0.1017, + "step": 70980 + }, + { + "epoch": 19.96, + "learning_rate": 6.676287758098273e-05, + "loss": 0.0968, + "step": 71010 + }, + { + "epoch": 19.97, + "learning_rate": 6.674413519507701e-05, + "loss": 0.1056, + "step": 71040 + }, + { + "epoch": 19.98, + "learning_rate": 6.672539280917127e-05, + "loss": 0.094, + "step": 71070 + }, + { + "epoch": 19.99, + "learning_rate": 6.670665042326555e-05, + "loss": 0.1013, + "step": 71100 + }, + { + "epoch": 20.0, + "learning_rate": 6.668790803735983e-05, + "loss": 0.1007, + "step": 71130 + }, + { + "epoch": 20.0, + "eval_loss": 0.18122704327106476, + "eval_runtime": 490.4096, + "eval_samples_per_second": 32.693, + "eval_steps_per_second": 1.024, + "eval_wer": 0.1531873950841374, + "step": 71140 + }, + { + "epoch": 20.01, + "learning_rate": 6.66691656514541e-05, + "loss": 0.0832, + "step": 71160 + }, + { + "epoch": 20.01, + "learning_rate": 6.665042326554838e-05, + "loss": 0.1068, + "step": 71190 + }, + { + "epoch": 20.02, + "learning_rate": 6.663168087964264e-05, + "loss": 0.0816, + "step": 71220 + }, + { + "epoch": 20.03, + "learning_rate": 6.661293849373693e-05, + "loss": 0.1002, + "step": 71250 + }, + { + "epoch": 20.04, + "learning_rate": 6.659419610783119e-05, + "loss": 0.087, + "step": 71280 + }, + { + "epoch": 20.05, + "learning_rate": 6.657545372192547e-05, + "loss": 0.0935, + "step": 71310 + }, + { + "epoch": 20.06, + "learning_rate": 6.655671133601976e-05, + "loss": 0.1067, + "step": 71340 + }, + { + "epoch": 20.06, + "learning_rate": 6.653796895011402e-05, + "loss": 0.0843, + "step": 71370 + }, + { + "epoch": 20.07, + "learning_rate": 6.651922656420829e-05, + "loss": 0.0997, + "step": 71400 + }, + { + "epoch": 20.08, + "learning_rate": 6.650048417830257e-05, + "loss": 0.0902, + "step": 71430 + }, + { + "epoch": 20.09, + "learning_rate": 6.648174179239685e-05, + "loss": 0.0941, + "step": 71460 + }, + { + "epoch": 20.1, + "learning_rate": 6.64629994064911e-05, + "loss": 0.1033, + "step": 71490 + }, + { + "epoch": 20.11, + "learning_rate": 6.644425702058539e-05, + "loss": 0.0856, + "step": 71520 + }, + { + "epoch": 20.12, + "learning_rate": 6.642551463467967e-05, + "loss": 0.1067, + "step": 71550 + }, + { + "epoch": 20.12, + "learning_rate": 6.640677224877394e-05, + "loss": 0.0924, + "step": 71580 + }, + { + "epoch": 20.13, + "learning_rate": 6.638802986286822e-05, + "loss": 0.0941, + "step": 71610 + }, + { + "epoch": 20.14, + "learning_rate": 6.636928747696248e-05, + "loss": 0.1004, + "step": 71640 + }, + { + "epoch": 20.15, + "learning_rate": 6.635054509105676e-05, + "loss": 0.0873, + "step": 71670 + }, + { + "epoch": 20.16, + "learning_rate": 6.633180270515103e-05, + "loss": 0.1021, + "step": 71700 + }, + { + "epoch": 20.17, + "learning_rate": 6.631306031924531e-05, + "loss": 0.0882, + "step": 71730 + }, + { + "epoch": 20.17, + "learning_rate": 6.62943179333396e-05, + "loss": 0.0968, + "step": 71760 + }, + { + "epoch": 20.18, + "learning_rate": 6.627557554743386e-05, + "loss": 0.1072, + "step": 71790 + }, + { + "epoch": 20.19, + "learning_rate": 6.625683316152813e-05, + "loss": 0.0872, + "step": 71820 + }, + { + "epoch": 20.2, + "learning_rate": 6.623809077562241e-05, + "loss": 0.1014, + "step": 71850 + }, + { + "epoch": 20.21, + "learning_rate": 6.621934838971669e-05, + "loss": 0.0874, + "step": 71880 + }, + { + "epoch": 20.22, + "learning_rate": 6.620060600381094e-05, + "loss": 0.0957, + "step": 71910 + }, + { + "epoch": 20.22, + "learning_rate": 6.618186361790523e-05, + "loss": 0.1076, + "step": 71940 + }, + { + "epoch": 20.23, + "learning_rate": 6.61631212319995e-05, + "loss": 0.0835, + "step": 71970 + }, + { + "epoch": 20.24, + "learning_rate": 6.614437884609377e-05, + "loss": 0.0982, + "step": 72000 + }, + { + "epoch": 20.25, + "learning_rate": 6.612563646018805e-05, + "loss": 0.0887, + "step": 72030 + }, + { + "epoch": 20.26, + "learning_rate": 6.610689407428232e-05, + "loss": 0.095, + "step": 72060 + }, + { + "epoch": 20.27, + "learning_rate": 6.60881516883766e-05, + "loss": 0.1108, + "step": 72090 + }, + { + "epoch": 20.28, + "learning_rate": 6.606940930247087e-05, + "loss": 0.0951, + "step": 72120 + }, + { + "epoch": 20.28, + "learning_rate": 6.605066691656515e-05, + "loss": 0.1091, + "step": 72150 + }, + { + "epoch": 20.29, + "learning_rate": 6.603192453065943e-05, + "loss": 0.0897, + "step": 72180 + }, + { + "epoch": 20.3, + "learning_rate": 6.60131821447537e-05, + "loss": 0.0941, + "step": 72210 + }, + { + "epoch": 20.31, + "learning_rate": 6.599443975884797e-05, + "loss": 0.1009, + "step": 72240 + }, + { + "epoch": 20.32, + "learning_rate": 6.597569737294225e-05, + "loss": 0.0877, + "step": 72270 + }, + { + "epoch": 20.33, + "learning_rate": 6.595695498703653e-05, + "loss": 0.1032, + "step": 72300 + }, + { + "epoch": 20.33, + "learning_rate": 6.593821260113078e-05, + "loss": 0.0901, + "step": 72330 + }, + { + "epoch": 20.34, + "learning_rate": 6.591947021522506e-05, + "loss": 0.0985, + "step": 72360 + }, + { + "epoch": 20.35, + "learning_rate": 6.590072782931934e-05, + "loss": 0.1042, + "step": 72390 + }, + { + "epoch": 20.36, + "learning_rate": 6.588198544341361e-05, + "loss": 0.0863, + "step": 72420 + }, + { + "epoch": 20.37, + "learning_rate": 6.586386780370475e-05, + "loss": 0.0994, + "step": 72450 + }, + { + "epoch": 20.38, + "learning_rate": 6.584512541779902e-05, + "loss": 0.09, + "step": 72480 + }, + { + "epoch": 20.39, + "learning_rate": 6.58263830318933e-05, + "loss": 0.0919, + "step": 72510 + }, + { + "epoch": 20.39, + "learning_rate": 6.580764064598757e-05, + "loss": 0.1083, + "step": 72540 + }, + { + "epoch": 20.4, + "learning_rate": 6.578889826008185e-05, + "loss": 0.0856, + "step": 72570 + }, + { + "epoch": 20.41, + "learning_rate": 6.577015587417612e-05, + "loss": 0.1011, + "step": 72600 + }, + { + "epoch": 20.42, + "learning_rate": 6.57514134882704e-05, + "loss": 0.0931, + "step": 72630 + }, + { + "epoch": 20.43, + "learning_rate": 6.573267110236467e-05, + "loss": 0.1012, + "step": 72660 + }, + { + "epoch": 20.44, + "learning_rate": 6.571392871645893e-05, + "loss": 0.1066, + "step": 72690 + }, + { + "epoch": 20.44, + "learning_rate": 6.569518633055321e-05, + "loss": 0.0876, + "step": 72720 + }, + { + "epoch": 20.45, + "learning_rate": 6.56764439446475e-05, + "loss": 0.1006, + "step": 72750 + }, + { + "epoch": 20.46, + "learning_rate": 6.565770155874176e-05, + "loss": 0.0882, + "step": 72780 + }, + { + "epoch": 20.47, + "learning_rate": 6.563895917283603e-05, + "loss": 0.0945, + "step": 72810 + }, + { + "epoch": 20.48, + "learning_rate": 6.562021678693031e-05, + "loss": 0.1038, + "step": 72840 + }, + { + "epoch": 20.49, + "learning_rate": 6.560147440102459e-05, + "loss": 0.0908, + "step": 72870 + }, + { + "epoch": 20.49, + "learning_rate": 6.558273201511886e-05, + "loss": 0.0993, + "step": 72900 + }, + { + "epoch": 20.5, + "learning_rate": 6.556398962921314e-05, + "loss": 0.087, + "step": 72930 + }, + { + "epoch": 20.51, + "learning_rate": 6.554524724330741e-05, + "loss": 0.1007, + "step": 72960 + }, + { + "epoch": 20.52, + "learning_rate": 6.552650485740169e-05, + "loss": 0.1041, + "step": 72990 + }, + { + "epoch": 20.53, + "learning_rate": 6.550776247149596e-05, + "loss": 0.0845, + "step": 73020 + }, + { + "epoch": 20.54, + "learning_rate": 6.548902008559024e-05, + "loss": 0.0989, + "step": 73050 + }, + { + "epoch": 20.55, + "learning_rate": 6.54702776996845e-05, + "loss": 0.085, + "step": 73080 + }, + { + "epoch": 20.55, + "learning_rate": 6.545153531377877e-05, + "loss": 0.098, + "step": 73110 + }, + { + "epoch": 20.56, + "learning_rate": 6.543279292787305e-05, + "loss": 0.1048, + "step": 73140 + }, + { + "epoch": 20.57, + "learning_rate": 6.541405054196733e-05, + "loss": 0.0855, + "step": 73170 + }, + { + "epoch": 20.58, + "learning_rate": 6.53953081560616e-05, + "loss": 0.0995, + "step": 73200 + }, + { + "epoch": 20.59, + "learning_rate": 6.537656577015587e-05, + "loss": 0.0978, + "step": 73230 + }, + { + "epoch": 20.6, + "learning_rate": 6.535782338425015e-05, + "loss": 0.1018, + "step": 73260 + }, + { + "epoch": 20.6, + "learning_rate": 6.533908099834443e-05, + "loss": 0.1015, + "step": 73290 + }, + { + "epoch": 20.61, + "learning_rate": 6.53203386124387e-05, + "loss": 0.0896, + "step": 73320 + }, + { + "epoch": 20.62, + "learning_rate": 6.530159622653298e-05, + "loss": 0.1, + "step": 73350 + }, + { + "epoch": 20.63, + "learning_rate": 6.528285384062725e-05, + "loss": 0.0872, + "step": 73380 + }, + { + "epoch": 20.64, + "learning_rate": 6.526411145472153e-05, + "loss": 0.1023, + "step": 73410 + }, + { + "epoch": 20.65, + "learning_rate": 6.52453690688158e-05, + "loss": 0.106, + "step": 73440 + }, + { + "epoch": 20.65, + "learning_rate": 6.522662668291008e-05, + "loss": 0.0848, + "step": 73470 + }, + { + "epoch": 20.66, + "learning_rate": 6.520788429700434e-05, + "loss": 0.0971, + "step": 73500 + }, + { + "epoch": 20.67, + "learning_rate": 6.518914191109861e-05, + "loss": 0.0956, + "step": 73530 + }, + { + "epoch": 20.68, + "learning_rate": 6.517039952519289e-05, + "loss": 0.0994, + "step": 73560 + }, + { + "epoch": 20.69, + "learning_rate": 6.515165713928717e-05, + "loss": 0.1042, + "step": 73590 + }, + { + "epoch": 20.7, + "learning_rate": 6.513291475338144e-05, + "loss": 0.0823, + "step": 73620 + }, + { + "epoch": 20.71, + "learning_rate": 6.511417236747571e-05, + "loss": 0.0984, + "step": 73650 + }, + { + "epoch": 20.71, + "learning_rate": 6.509542998156999e-05, + "loss": 0.0931, + "step": 73680 + }, + { + "epoch": 20.72, + "learning_rate": 6.507668759566427e-05, + "loss": 0.1084, + "step": 73710 + }, + { + "epoch": 20.73, + "learning_rate": 6.505794520975854e-05, + "loss": 0.1032, + "step": 73740 + }, + { + "epoch": 20.74, + "learning_rate": 6.503920282385282e-05, + "loss": 0.0868, + "step": 73770 + }, + { + "epoch": 20.75, + "learning_rate": 6.502046043794709e-05, + "loss": 0.1069, + "step": 73800 + }, + { + "epoch": 20.76, + "learning_rate": 6.500171805204137e-05, + "loss": 0.0901, + "step": 73830 + }, + { + "epoch": 20.76, + "learning_rate": 6.498297566613563e-05, + "loss": 0.1024, + "step": 73860 + }, + { + "epoch": 20.77, + "learning_rate": 6.496423328022991e-05, + "loss": 0.1037, + "step": 73890 + }, + { + "epoch": 20.78, + "learning_rate": 6.494549089432418e-05, + "loss": 0.0885, + "step": 73920 + }, + { + "epoch": 20.79, + "learning_rate": 6.492674850841845e-05, + "loss": 0.1046, + "step": 73950 + }, + { + "epoch": 20.8, + "learning_rate": 6.490800612251273e-05, + "loss": 0.0902, + "step": 73980 + }, + { + "epoch": 20.81, + "learning_rate": 6.488926373660701e-05, + "loss": 0.0999, + "step": 74010 + }, + { + "epoch": 20.82, + "learning_rate": 6.487052135070128e-05, + "loss": 0.1074, + "step": 74040 + }, + { + "epoch": 20.82, + "learning_rate": 6.485177896479555e-05, + "loss": 0.0874, + "step": 74070 + }, + { + "epoch": 20.83, + "learning_rate": 6.483303657888983e-05, + "loss": 0.1052, + "step": 74100 + }, + { + "epoch": 20.84, + "learning_rate": 6.481429419298411e-05, + "loss": 0.093, + "step": 74130 + }, + { + "epoch": 20.85, + "learning_rate": 6.479555180707838e-05, + "loss": 0.0919, + "step": 74160 + }, + { + "epoch": 20.86, + "learning_rate": 6.477680942117264e-05, + "loss": 0.1047, + "step": 74190 + }, + { + "epoch": 20.87, + "learning_rate": 6.475806703526692e-05, + "loss": 0.0858, + "step": 74220 + }, + { + "epoch": 20.87, + "learning_rate": 6.47393246493612e-05, + "loss": 0.1063, + "step": 74250 + }, + { + "epoch": 20.88, + "learning_rate": 6.472058226345547e-05, + "loss": 0.0914, + "step": 74280 + }, + { + "epoch": 20.89, + "learning_rate": 6.470183987754975e-05, + "loss": 0.0996, + "step": 74310 + }, + { + "epoch": 20.9, + "learning_rate": 6.468309749164402e-05, + "loss": 0.1036, + "step": 74340 + }, + { + "epoch": 20.91, + "learning_rate": 6.466435510573829e-05, + "loss": 0.0895, + "step": 74370 + }, + { + "epoch": 20.92, + "learning_rate": 6.464561271983257e-05, + "loss": 0.1012, + "step": 74400 + }, + { + "epoch": 20.92, + "learning_rate": 6.462687033392685e-05, + "loss": 0.0939, + "step": 74430 + }, + { + "epoch": 20.93, + "learning_rate": 6.460812794802113e-05, + "loss": 0.0999, + "step": 74460 + }, + { + "epoch": 20.94, + "learning_rate": 6.458938556211538e-05, + "loss": 0.1043, + "step": 74490 + }, + { + "epoch": 20.95, + "learning_rate": 6.457064317620967e-05, + "loss": 0.0844, + "step": 74520 + }, + { + "epoch": 20.96, + "learning_rate": 6.455190079030395e-05, + "loss": 0.098, + "step": 74550 + }, + { + "epoch": 20.97, + "learning_rate": 6.453315840439821e-05, + "loss": 0.0859, + "step": 74580 + }, + { + "epoch": 20.98, + "learning_rate": 6.451441601849248e-05, + "loss": 0.0982, + "step": 74610 + }, + { + "epoch": 20.98, + "learning_rate": 6.449567363258676e-05, + "loss": 0.1069, + "step": 74640 + }, + { + "epoch": 20.99, + "learning_rate": 6.447693124668104e-05, + "loss": 0.0866, + "step": 74670 + }, + { + "epoch": 21.0, + "eval_loss": 0.17515245079994202, + "eval_runtime": 503.7384, + "eval_samples_per_second": 31.828, + "eval_steps_per_second": 0.997, + "eval_wer": 0.1504169339320077, + "step": 74697 + }, + { + "epoch": 21.0, + "learning_rate": 6.445818886077531e-05, + "loss": 0.11, + "step": 74700 + }, + { + "epoch": 21.01, + "learning_rate": 6.443944647486959e-05, + "loss": 0.0902, + "step": 74730 + }, + { + "epoch": 21.02, + "learning_rate": 6.442132883516072e-05, + "loss": 0.1021, + "step": 74760 + }, + { + "epoch": 21.03, + "learning_rate": 6.4402586449255e-05, + "loss": 0.0912, + "step": 74790 + }, + { + "epoch": 21.03, + "learning_rate": 6.438384406334927e-05, + "loss": 0.0911, + "step": 74820 + }, + { + "epoch": 21.04, + "learning_rate": 6.436510167744354e-05, + "loss": 0.0956, + "step": 74850 + }, + { + "epoch": 21.05, + "learning_rate": 6.434635929153782e-05, + "loss": 0.0848, + "step": 74880 + }, + { + "epoch": 21.06, + "learning_rate": 6.43276169056321e-05, + "loss": 0.0995, + "step": 74910 + }, + { + "epoch": 21.07, + "learning_rate": 6.430887451972636e-05, + "loss": 0.0897, + "step": 74940 + }, + { + "epoch": 21.08, + "learning_rate": 6.429013213382063e-05, + "loss": 0.0911, + "step": 74970 + }, + { + "epoch": 21.09, + "learning_rate": 6.427138974791491e-05, + "loss": 0.0971, + "step": 75000 + }, + { + "epoch": 21.09, + "learning_rate": 6.42526473620092e-05, + "loss": 0.084, + "step": 75030 + }, + { + "epoch": 21.1, + "learning_rate": 6.423390497610346e-05, + "loss": 0.098, + "step": 75060 + }, + { + "epoch": 21.11, + "learning_rate": 6.421516259019773e-05, + "loss": 0.0882, + "step": 75090 + }, + { + "epoch": 21.12, + "learning_rate": 6.419642020429201e-05, + "loss": 0.0931, + "step": 75120 + }, + { + "epoch": 21.13, + "learning_rate": 6.417767781838628e-05, + "loss": 0.0954, + "step": 75150 + }, + { + "epoch": 21.14, + "learning_rate": 6.415893543248056e-05, + "loss": 0.0813, + "step": 75180 + }, + { + "epoch": 21.14, + "learning_rate": 6.414019304657484e-05, + "loss": 0.0998, + "step": 75210 + }, + { + "epoch": 21.15, + "learning_rate": 6.41214506606691e-05, + "loss": 0.0874, + "step": 75240 + }, + { + "epoch": 21.16, + "learning_rate": 6.410270827476337e-05, + "loss": 0.0928, + "step": 75270 + }, + { + "epoch": 21.17, + "learning_rate": 6.408396588885765e-05, + "loss": 0.097, + "step": 75300 + }, + { + "epoch": 21.18, + "learning_rate": 6.406522350295194e-05, + "loss": 0.0841, + "step": 75330 + }, + { + "epoch": 21.19, + "learning_rate": 6.40464811170462e-05, + "loss": 0.0913, + "step": 75360 + }, + { + "epoch": 21.19, + "learning_rate": 6.402773873114047e-05, + "loss": 0.0924, + "step": 75390 + }, + { + "epoch": 21.2, + "learning_rate": 6.400899634523475e-05, + "loss": 0.0949, + "step": 75420 + }, + { + "epoch": 21.21, + "learning_rate": 6.399025395932903e-05, + "loss": 0.1002, + "step": 75450 + }, + { + "epoch": 21.22, + "learning_rate": 6.39715115734233e-05, + "loss": 0.0857, + "step": 75480 + }, + { + "epoch": 21.23, + "learning_rate": 6.395276918751757e-05, + "loss": 0.0921, + "step": 75510 + }, + { + "epoch": 21.24, + "learning_rate": 6.393402680161185e-05, + "loss": 0.1005, + "step": 75540 + }, + { + "epoch": 21.25, + "learning_rate": 6.391528441570613e-05, + "loss": 0.097, + "step": 75570 + }, + { + "epoch": 21.25, + "learning_rate": 6.38965420298004e-05, + "loss": 0.098, + "step": 75600 + }, + { + "epoch": 21.26, + "learning_rate": 6.387779964389468e-05, + "loss": 0.0828, + "step": 75630 + }, + { + "epoch": 21.27, + "learning_rate": 6.385905725798894e-05, + "loss": 0.0935, + "step": 75660 + }, + { + "epoch": 21.28, + "learning_rate": 6.384031487208321e-05, + "loss": 0.0942, + "step": 75690 + }, + { + "epoch": 21.29, + "learning_rate": 6.38215724861775e-05, + "loss": 0.0906, + "step": 75720 + }, + { + "epoch": 21.3, + "learning_rate": 6.380283010027177e-05, + "loss": 0.1015, + "step": 75750 + }, + { + "epoch": 21.3, + "learning_rate": 6.378408771436604e-05, + "loss": 0.0827, + "step": 75780 + }, + { + "epoch": 21.31, + "learning_rate": 6.376534532846031e-05, + "loss": 0.0985, + "step": 75810 + }, + { + "epoch": 21.32, + "learning_rate": 6.374660294255459e-05, + "loss": 0.0928, + "step": 75840 + }, + { + "epoch": 21.33, + "learning_rate": 6.372786055664887e-05, + "loss": 0.0897, + "step": 75870 + }, + { + "epoch": 21.34, + "learning_rate": 6.370911817074314e-05, + "loss": 0.0953, + "step": 75900 + }, + { + "epoch": 21.35, + "learning_rate": 6.36903757848374e-05, + "loss": 0.0837, + "step": 75930 + }, + { + "epoch": 21.36, + "learning_rate": 6.367163339893169e-05, + "loss": 0.0935, + "step": 75960 + }, + { + "epoch": 21.36, + "learning_rate": 6.365289101302597e-05, + "loss": 0.0962, + "step": 75990 + }, + { + "epoch": 21.37, + "learning_rate": 6.363414862712024e-05, + "loss": 0.0919, + "step": 76020 + }, + { + "epoch": 21.38, + "learning_rate": 6.361540624121452e-05, + "loss": 0.0988, + "step": 76050 + }, + { + "epoch": 21.39, + "learning_rate": 6.359666385530878e-05, + "loss": 0.0867, + "step": 76080 + }, + { + "epoch": 21.4, + "learning_rate": 6.357792146940305e-05, + "loss": 0.0975, + "step": 76110 + }, + { + "epoch": 21.41, + "learning_rate": 6.355917908349733e-05, + "loss": 0.0979, + "step": 76140 + }, + { + "epoch": 21.41, + "learning_rate": 6.354043669759161e-05, + "loss": 0.0924, + "step": 76170 + }, + { + "epoch": 21.42, + "learning_rate": 6.352169431168588e-05, + "loss": 0.1027, + "step": 76200 + }, + { + "epoch": 21.43, + "learning_rate": 6.350295192578015e-05, + "loss": 0.0862, + "step": 76230 + }, + { + "epoch": 21.44, + "learning_rate": 6.348420953987443e-05, + "loss": 0.1067, + "step": 76260 + }, + { + "epoch": 21.45, + "learning_rate": 6.346546715396871e-05, + "loss": 0.0912, + "step": 76290 + }, + { + "epoch": 21.46, + "learning_rate": 6.344672476806298e-05, + "loss": 0.0943, + "step": 76320 + }, + { + "epoch": 21.46, + "learning_rate": 6.342860712835412e-05, + "loss": 0.1022, + "step": 76350 + }, + { + "epoch": 21.47, + "learning_rate": 6.340986474244839e-05, + "loss": 0.0851, + "step": 76380 + }, + { + "epoch": 21.48, + "learning_rate": 6.339112235654265e-05, + "loss": 0.0982, + "step": 76410 + }, + { + "epoch": 21.49, + "learning_rate": 6.337237997063693e-05, + "loss": 0.09, + "step": 76440 + }, + { + "epoch": 21.5, + "learning_rate": 6.33536375847312e-05, + "loss": 0.0955, + "step": 76470 + }, + { + "epoch": 21.51, + "learning_rate": 6.333489519882548e-05, + "loss": 0.0966, + "step": 76500 + }, + { + "epoch": 21.52, + "learning_rate": 6.331615281291975e-05, + "loss": 0.083, + "step": 76530 + }, + { + "epoch": 21.52, + "learning_rate": 6.329741042701403e-05, + "loss": 0.093, + "step": 76560 + }, + { + "epoch": 21.53, + "learning_rate": 6.32786680411083e-05, + "loss": 0.0922, + "step": 76590 + }, + { + "epoch": 21.54, + "learning_rate": 6.325992565520258e-05, + "loss": 0.0881, + "step": 76620 + }, + { + "epoch": 21.55, + "learning_rate": 6.324118326929686e-05, + "loss": 0.1021, + "step": 76650 + }, + { + "epoch": 21.56, + "learning_rate": 6.322244088339113e-05, + "loss": 0.0838, + "step": 76680 + }, + { + "epoch": 21.57, + "learning_rate": 6.32036984974854e-05, + "loss": 0.1031, + "step": 76710 + }, + { + "epoch": 21.57, + "learning_rate": 6.318495611157968e-05, + "loss": 0.0905, + "step": 76740 + }, + { + "epoch": 21.58, + "learning_rate": 6.316621372567396e-05, + "loss": 0.0944, + "step": 76770 + }, + { + "epoch": 21.59, + "learning_rate": 6.314747133976822e-05, + "loss": 0.0957, + "step": 76800 + }, + { + "epoch": 21.6, + "learning_rate": 6.312872895386249e-05, + "loss": 0.0841, + "step": 76830 + }, + { + "epoch": 21.61, + "learning_rate": 6.310998656795677e-05, + "loss": 0.0977, + "step": 76860 + }, + { + "epoch": 21.62, + "learning_rate": 6.309124418205104e-05, + "loss": 0.0896, + "step": 76890 + }, + { + "epoch": 21.62, + "learning_rate": 6.307250179614532e-05, + "loss": 0.0899, + "step": 76920 + }, + { + "epoch": 21.63, + "learning_rate": 6.305375941023959e-05, + "loss": 0.1022, + "step": 76950 + }, + { + "epoch": 21.64, + "learning_rate": 6.303501702433387e-05, + "loss": 0.0867, + "step": 76980 + }, + { + "epoch": 21.65, + "learning_rate": 6.301627463842814e-05, + "loss": 0.0982, + "step": 77010 + }, + { + "epoch": 21.66, + "learning_rate": 6.299753225252242e-05, + "loss": 0.0916, + "step": 77040 + }, + { + "epoch": 21.67, + "learning_rate": 6.29787898666167e-05, + "loss": 0.094, + "step": 77070 + }, + { + "epoch": 21.68, + "learning_rate": 6.296004748071097e-05, + "loss": 0.1011, + "step": 77100 + }, + { + "epoch": 21.68, + "learning_rate": 6.294130509480523e-05, + "loss": 0.0869, + "step": 77130 + }, + { + "epoch": 21.69, + "learning_rate": 6.292256270889951e-05, + "loss": 0.0969, + "step": 77160 + }, + { + "epoch": 21.7, + "learning_rate": 6.29038203229938e-05, + "loss": 0.0958, + "step": 77190 + }, + { + "epoch": 21.71, + "learning_rate": 6.288507793708806e-05, + "loss": 0.091, + "step": 77220 + }, + { + "epoch": 21.72, + "learning_rate": 6.286633555118233e-05, + "loss": 0.0994, + "step": 77250 + }, + { + "epoch": 21.73, + "learning_rate": 6.284759316527661e-05, + "loss": 0.0838, + "step": 77280 + }, + { + "epoch": 21.73, + "learning_rate": 6.282885077937088e-05, + "loss": 0.1009, + "step": 77310 + }, + { + "epoch": 21.74, + "learning_rate": 6.281010839346516e-05, + "loss": 0.0908, + "step": 77340 + }, + { + "epoch": 21.75, + "learning_rate": 6.279136600755943e-05, + "loss": 0.0974, + "step": 77370 + }, + { + "epoch": 21.76, + "learning_rate": 6.277262362165371e-05, + "loss": 0.1025, + "step": 77400 + }, + { + "epoch": 21.77, + "learning_rate": 6.275388123574798e-05, + "loss": 0.0836, + "step": 77430 + }, + { + "epoch": 21.78, + "learning_rate": 6.273513884984226e-05, + "loss": 0.0997, + "step": 77460 + }, + { + "epoch": 21.79, + "learning_rate": 6.271639646393654e-05, + "loss": 0.0941, + "step": 77490 + }, + { + "epoch": 21.79, + "learning_rate": 6.26976540780308e-05, + "loss": 0.0985, + "step": 77520 + }, + { + "epoch": 21.8, + "learning_rate": 6.267891169212507e-05, + "loss": 0.1066, + "step": 77550 + }, + { + "epoch": 21.81, + "learning_rate": 6.266016930621935e-05, + "loss": 0.0851, + "step": 77580 + }, + { + "epoch": 21.82, + "learning_rate": 6.264142692031363e-05, + "loss": 0.1011, + "step": 77610 + }, + { + "epoch": 21.83, + "learning_rate": 6.26226845344079e-05, + "loss": 0.0937, + "step": 77640 + }, + { + "epoch": 21.84, + "learning_rate": 6.260394214850217e-05, + "loss": 0.0957, + "step": 77670 + }, + { + "epoch": 21.84, + "learning_rate": 6.258519976259645e-05, + "loss": 0.1, + "step": 77700 + }, + { + "epoch": 21.85, + "learning_rate": 6.256645737669072e-05, + "loss": 0.0842, + "step": 77730 + }, + { + "epoch": 21.86, + "learning_rate": 6.2547714990785e-05, + "loss": 0.1, + "step": 77760 + }, + { + "epoch": 21.87, + "learning_rate": 6.252897260487927e-05, + "loss": 0.0912, + "step": 77790 + }, + { + "epoch": 21.88, + "learning_rate": 6.251023021897355e-05, + "loss": 0.0992, + "step": 77820 + }, + { + "epoch": 21.89, + "learning_rate": 6.249148783306781e-05, + "loss": 0.1045, + "step": 77850 + }, + { + "epoch": 21.89, + "learning_rate": 6.24727454471621e-05, + "loss": 0.0867, + "step": 77880 + }, + { + "epoch": 21.9, + "learning_rate": 6.245400306125638e-05, + "loss": 0.1005, + "step": 77910 + }, + { + "epoch": 21.91, + "learning_rate": 6.243526067535064e-05, + "loss": 0.0901, + "step": 77940 + }, + { + "epoch": 21.92, + "learning_rate": 6.241651828944491e-05, + "loss": 0.0971, + "step": 77970 + }, + { + "epoch": 21.93, + "learning_rate": 6.239777590353919e-05, + "loss": 0.1068, + "step": 78000 + }, + { + "epoch": 21.94, + "learning_rate": 6.237903351763347e-05, + "loss": 0.0858, + "step": 78030 + }, + { + "epoch": 21.95, + "learning_rate": 6.236029113172774e-05, + "loss": 0.1032, + "step": 78060 + }, + { + "epoch": 21.95, + "learning_rate": 6.234154874582201e-05, + "loss": 0.0857, + "step": 78090 + }, + { + "epoch": 21.96, + "learning_rate": 6.232280635991629e-05, + "loss": 0.0954, + "step": 78120 + }, + { + "epoch": 21.97, + "learning_rate": 6.230406397401056e-05, + "loss": 0.0997, + "step": 78150 + }, + { + "epoch": 21.98, + "learning_rate": 6.228532158810484e-05, + "loss": 0.0838, + "step": 78180 + }, + { + "epoch": 21.99, + "learning_rate": 6.22665792021991e-05, + "loss": 0.0995, + "step": 78210 + }, + { + "epoch": 22.0, + "learning_rate": 6.224783681629339e-05, + "loss": 0.0901, + "step": 78240 + }, + { + "epoch": 22.0, + "eval_loss": 0.1689508855342865, + "eval_runtime": 503.8188, + "eval_samples_per_second": 31.823, + "eval_steps_per_second": 0.996, + "eval_wer": 0.1476532965758192, + "step": 78254 + }, + { + "epoch": 22.0, + "learning_rate": 6.222909443038765e-05, + "loss": 0.0977, + "step": 78270 + }, + { + "epoch": 22.01, + "learning_rate": 6.221035204448193e-05, + "loss": 0.0944, + "step": 78300 + }, + { + "epoch": 22.02, + "learning_rate": 6.219160965857621e-05, + "loss": 0.0864, + "step": 78330 + }, + { + "epoch": 22.03, + "learning_rate": 6.217286727267048e-05, + "loss": 0.094, + "step": 78360 + }, + { + "epoch": 22.04, + "learning_rate": 6.215412488676475e-05, + "loss": 0.0862, + "step": 78390 + }, + { + "epoch": 22.05, + "learning_rate": 6.213538250085903e-05, + "loss": 0.0935, + "step": 78420 + }, + { + "epoch": 22.06, + "learning_rate": 6.211664011495331e-05, + "loss": 0.0925, + "step": 78450 + }, + { + "epoch": 22.06, + "learning_rate": 6.209789772904758e-05, + "loss": 0.0886, + "step": 78480 + }, + { + "epoch": 22.07, + "learning_rate": 6.207915534314185e-05, + "loss": 0.1043, + "step": 78510 + }, + { + "epoch": 22.08, + "learning_rate": 6.206041295723613e-05, + "loss": 0.0778, + "step": 78540 + }, + { + "epoch": 22.09, + "learning_rate": 6.20416705713304e-05, + "loss": 0.0892, + "step": 78570 + }, + { + "epoch": 22.1, + "learning_rate": 6.202292818542468e-05, + "loss": 0.0946, + "step": 78600 + }, + { + "epoch": 22.11, + "learning_rate": 6.200418579951894e-05, + "loss": 0.0867, + "step": 78630 + }, + { + "epoch": 22.11, + "learning_rate": 6.198544341361322e-05, + "loss": 0.0987, + "step": 78660 + }, + { + "epoch": 22.12, + "learning_rate": 6.196670102770749e-05, + "loss": 0.0858, + "step": 78690 + }, + { + "epoch": 22.13, + "learning_rate": 6.194795864180177e-05, + "loss": 0.0934, + "step": 78720 + }, + { + "epoch": 22.14, + "learning_rate": 6.192921625589605e-05, + "loss": 0.0866, + "step": 78750 + }, + { + "epoch": 22.15, + "learning_rate": 6.191047386999032e-05, + "loss": 0.0881, + "step": 78780 + }, + { + "epoch": 22.16, + "learning_rate": 6.189173148408459e-05, + "loss": 0.0925, + "step": 78810 + }, + { + "epoch": 22.16, + "learning_rate": 6.187298909817887e-05, + "loss": 0.0813, + "step": 78840 + }, + { + "epoch": 22.17, + "learning_rate": 6.185424671227315e-05, + "loss": 0.0971, + "step": 78870 + }, + { + "epoch": 22.18, + "learning_rate": 6.183550432636742e-05, + "loss": 0.09, + "step": 78900 + }, + { + "epoch": 22.19, + "learning_rate": 6.181676194046169e-05, + "loss": 0.087, + "step": 78930 + }, + { + "epoch": 22.2, + "learning_rate": 6.179801955455597e-05, + "loss": 0.0986, + "step": 78960 + }, + { + "epoch": 22.21, + "learning_rate": 6.177927716865025e-05, + "loss": 0.0811, + "step": 78990 + }, + { + "epoch": 22.22, + "learning_rate": 6.176053478274451e-05, + "loss": 0.0936, + "step": 79020 + }, + { + "epoch": 22.22, + "learning_rate": 6.174179239683878e-05, + "loss": 0.0894, + "step": 79050 + }, + { + "epoch": 22.23, + "learning_rate": 6.172305001093306e-05, + "loss": 0.088, + "step": 79080 + }, + { + "epoch": 22.24, + "learning_rate": 6.170430762502733e-05, + "loss": 0.0985, + "step": 79110 + }, + { + "epoch": 22.25, + "learning_rate": 6.168556523912161e-05, + "loss": 0.0785, + "step": 79140 + }, + { + "epoch": 22.26, + "learning_rate": 6.166682285321589e-05, + "loss": 0.0915, + "step": 79170 + }, + { + "epoch": 22.27, + "learning_rate": 6.164808046731016e-05, + "loss": 0.0902, + "step": 79200 + }, + { + "epoch": 22.27, + "learning_rate": 6.162933808140443e-05, + "loss": 0.0908, + "step": 79230 + }, + { + "epoch": 22.28, + "learning_rate": 6.161059569549871e-05, + "loss": 0.0902, + "step": 79260 + }, + { + "epoch": 22.29, + "learning_rate": 6.159185330959299e-05, + "loss": 0.0831, + "step": 79290 + }, + { + "epoch": 22.3, + "learning_rate": 6.157311092368726e-05, + "loss": 0.094, + "step": 79320 + }, + { + "epoch": 22.31, + "learning_rate": 6.155436853778152e-05, + "loss": 0.0895, + "step": 79350 + }, + { + "epoch": 22.32, + "learning_rate": 6.15356261518758e-05, + "loss": 0.0919, + "step": 79380 + }, + { + "epoch": 22.32, + "learning_rate": 6.151688376597009e-05, + "loss": 0.1012, + "step": 79410 + }, + { + "epoch": 22.33, + "learning_rate": 6.149814138006435e-05, + "loss": 0.0853, + "step": 79440 + }, + { + "epoch": 22.34, + "learning_rate": 6.147939899415862e-05, + "loss": 0.0983, + "step": 79470 + }, + { + "epoch": 22.35, + "learning_rate": 6.14606566082529e-05, + "loss": 0.0947, + "step": 79500 + }, + { + "epoch": 22.36, + "learning_rate": 6.144191422234717e-05, + "loss": 0.0862, + "step": 79530 + }, + { + "epoch": 22.37, + "learning_rate": 6.142317183644145e-05, + "loss": 0.1026, + "step": 79560 + }, + { + "epoch": 22.38, + "learning_rate": 6.140442945053573e-05, + "loss": 0.0817, + "step": 79590 + }, + { + "epoch": 22.38, + "learning_rate": 6.138568706463e-05, + "loss": 0.0901, + "step": 79620 + }, + { + "epoch": 22.39, + "learning_rate": 6.136694467872427e-05, + "loss": 0.0937, + "step": 79650 + }, + { + "epoch": 22.4, + "learning_rate": 6.134820229281855e-05, + "loss": 0.088, + "step": 79680 + }, + { + "epoch": 22.41, + "learning_rate": 6.132945990691283e-05, + "loss": 0.0966, + "step": 79710 + }, + { + "epoch": 22.42, + "learning_rate": 6.13107175210071e-05, + "loss": 0.0798, + "step": 79740 + }, + { + "epoch": 22.43, + "learning_rate": 6.129197513510136e-05, + "loss": 0.0895, + "step": 79770 + }, + { + "epoch": 22.43, + "learning_rate": 6.127323274919564e-05, + "loss": 0.0903, + "step": 79800 + }, + { + "epoch": 22.44, + "learning_rate": 6.125449036328992e-05, + "loss": 0.0902, + "step": 79830 + }, + { + "epoch": 22.45, + "learning_rate": 6.123574797738419e-05, + "loss": 0.1, + "step": 79860 + }, + { + "epoch": 22.46, + "learning_rate": 6.121700559147846e-05, + "loss": 0.0843, + "step": 79890 + }, + { + "epoch": 22.47, + "learning_rate": 6.119826320557274e-05, + "loss": 0.0924, + "step": 79920 + }, + { + "epoch": 22.48, + "learning_rate": 6.117952081966701e-05, + "loss": 0.0926, + "step": 79950 + }, + { + "epoch": 22.49, + "learning_rate": 6.116077843376129e-05, + "loss": 0.0866, + "step": 79980 + }, + { + "epoch": 22.49, + "learning_rate": 6.114203604785557e-05, + "loss": 0.0958, + "step": 80010 + }, + { + "epoch": 22.5, + "learning_rate": 6.112329366194984e-05, + "loss": 0.083, + "step": 80040 + }, + { + "epoch": 22.51, + "learning_rate": 6.11045512760441e-05, + "loss": 0.0946, + "step": 80070 + }, + { + "epoch": 22.52, + "learning_rate": 6.108580889013839e-05, + "loss": 0.0865, + "step": 80100 + }, + { + "epoch": 22.53, + "learning_rate": 6.106706650423267e-05, + "loss": 0.086, + "step": 80130 + }, + { + "epoch": 22.54, + "learning_rate": 6.104832411832693e-05, + "loss": 0.0981, + "step": 80160 + }, + { + "epoch": 22.54, + "learning_rate": 6.10295817324212e-05, + "loss": 0.0821, + "step": 80190 + }, + { + "epoch": 22.55, + "learning_rate": 6.101083934651548e-05, + "loss": 0.099, + "step": 80220 + }, + { + "epoch": 22.56, + "learning_rate": 6.0992096960609756e-05, + "loss": 0.0893, + "step": 80250 + }, + { + "epoch": 22.57, + "learning_rate": 6.097335457470403e-05, + "loss": 0.0876, + "step": 80280 + }, + { + "epoch": 22.58, + "learning_rate": 6.09546121887983e-05, + "loss": 0.0959, + "step": 80310 + }, + { + "epoch": 22.59, + "learning_rate": 6.093586980289258e-05, + "loss": 0.0838, + "step": 80340 + }, + { + "epoch": 22.59, + "learning_rate": 6.091712741698685e-05, + "loss": 0.0925, + "step": 80370 + }, + { + "epoch": 22.6, + "learning_rate": 6.089838503108113e-05, + "loss": 0.0904, + "step": 80400 + }, + { + "epoch": 22.61, + "learning_rate": 6.087964264517541e-05, + "loss": 0.0896, + "step": 80430 + }, + { + "epoch": 22.62, + "learning_rate": 6.086090025926967e-05, + "loss": 0.1, + "step": 80460 + }, + { + "epoch": 22.63, + "learning_rate": 6.084215787336395e-05, + "loss": 0.0886, + "step": 80490 + }, + { + "epoch": 22.64, + "learning_rate": 6.082404023365508e-05, + "loss": 0.095, + "step": 80520 + }, + { + "epoch": 22.65, + "learning_rate": 6.080529784774935e-05, + "loss": 0.0905, + "step": 80550 + }, + { + "epoch": 22.65, + "learning_rate": 6.078655546184363e-05, + "loss": 0.0882, + "step": 80580 + }, + { + "epoch": 22.66, + "learning_rate": 6.0767813075937906e-05, + "loss": 0.0944, + "step": 80610 + }, + { + "epoch": 22.67, + "learning_rate": 6.0749070690032174e-05, + "loss": 0.0856, + "step": 80640 + }, + { + "epoch": 22.68, + "learning_rate": 6.073032830412645e-05, + "loss": 0.0946, + "step": 80670 + }, + { + "epoch": 22.69, + "learning_rate": 6.071158591822073e-05, + "loss": 0.0964, + "step": 80700 + }, + { + "epoch": 22.7, + "learning_rate": 6.0692843532315e-05, + "loss": 0.0852, + "step": 80730 + }, + { + "epoch": 22.7, + "learning_rate": 6.067410114640928e-05, + "loss": 0.0985, + "step": 80760 + }, + { + "epoch": 22.71, + "learning_rate": 6.0655358760503545e-05, + "loss": 0.0888, + "step": 80790 + }, + { + "epoch": 22.72, + "learning_rate": 6.063661637459782e-05, + "loss": 0.0967, + "step": 80820 + }, + { + "epoch": 22.73, + "learning_rate": 6.06178739886921e-05, + "loss": 0.0974, + "step": 80850 + }, + { + "epoch": 22.74, + "learning_rate": 6.0599131602786374e-05, + "loss": 0.0877, + "step": 80880 + }, + { + "epoch": 22.75, + "learning_rate": 6.058038921688064e-05, + "loss": 0.108, + "step": 80910 + }, + { + "epoch": 22.76, + "learning_rate": 6.0561646830974916e-05, + "loss": 0.0797, + "step": 80940 + }, + { + "epoch": 22.76, + "learning_rate": 6.054290444506919e-05, + "loss": 0.0985, + "step": 80970 + }, + { + "epoch": 22.77, + "learning_rate": 6.052416205916347e-05, + "loss": 0.0904, + "step": 81000 + }, + { + "epoch": 22.78, + "learning_rate": 6.0505419673257745e-05, + "loss": 0.0913, + "step": 81030 + }, + { + "epoch": 22.79, + "learning_rate": 6.048667728735201e-05, + "loss": 0.1001, + "step": 81060 + }, + { + "epoch": 22.8, + "learning_rate": 6.046793490144629e-05, + "loss": 0.0899, + "step": 81090 + }, + { + "epoch": 22.81, + "learning_rate": 6.044919251554057e-05, + "loss": 0.0933, + "step": 81120 + }, + { + "epoch": 22.81, + "learning_rate": 6.043045012963484e-05, + "loss": 0.0877, + "step": 81150 + }, + { + "epoch": 22.82, + "learning_rate": 6.0411707743729116e-05, + "loss": 0.0882, + "step": 81180 + }, + { + "epoch": 22.83, + "learning_rate": 6.0392965357823384e-05, + "loss": 0.0974, + "step": 81210 + }, + { + "epoch": 22.84, + "learning_rate": 6.037422297191766e-05, + "loss": 0.0882, + "step": 81240 + }, + { + "epoch": 22.85, + "learning_rate": 6.035548058601194e-05, + "loss": 0.0925, + "step": 81270 + }, + { + "epoch": 22.86, + "learning_rate": 6.033673820010621e-05, + "loss": 0.0925, + "step": 81300 + }, + { + "epoch": 22.86, + "learning_rate": 6.031799581420048e-05, + "loss": 0.084, + "step": 81330 + }, + { + "epoch": 22.87, + "learning_rate": 6.0299253428294754e-05, + "loss": 0.0994, + "step": 81360 + }, + { + "epoch": 22.88, + "learning_rate": 6.028051104238903e-05, + "loss": 0.0873, + "step": 81390 + }, + { + "epoch": 22.89, + "learning_rate": 6.026176865648331e-05, + "loss": 0.098, + "step": 81420 + }, + { + "epoch": 22.9, + "learning_rate": 6.0243026270577584e-05, + "loss": 0.0902, + "step": 81450 + }, + { + "epoch": 22.91, + "learning_rate": 6.022428388467185e-05, + "loss": 0.0894, + "step": 81480 + }, + { + "epoch": 22.92, + "learning_rate": 6.0205541498766125e-05, + "loss": 0.0956, + "step": 81510 + }, + { + "epoch": 22.92, + "learning_rate": 6.0186799112860406e-05, + "loss": 0.0848, + "step": 81540 + }, + { + "epoch": 22.93, + "learning_rate": 6.016805672695468e-05, + "loss": 0.0961, + "step": 81570 + }, + { + "epoch": 22.94, + "learning_rate": 6.0149314341048955e-05, + "loss": 0.0908, + "step": 81600 + }, + { + "epoch": 22.95, + "learning_rate": 6.013057195514322e-05, + "loss": 0.0901, + "step": 81630 + }, + { + "epoch": 22.96, + "learning_rate": 6.0111829569237496e-05, + "loss": 0.1035, + "step": 81660 + }, + { + "epoch": 22.97, + "learning_rate": 6.009308718333178e-05, + "loss": 0.0859, + "step": 81690 + }, + { + "epoch": 22.97, + "learning_rate": 6.007434479742605e-05, + "loss": 0.0979, + "step": 81720 + }, + { + "epoch": 22.98, + "learning_rate": 6.005560241152032e-05, + "loss": 0.0898, + "step": 81750 + }, + { + "epoch": 22.99, + "learning_rate": 6.003686002561459e-05, + "loss": 0.0918, + "step": 81780 + }, + { + "epoch": 23.0, + "learning_rate": 6.001811763970887e-05, + "loss": 0.0964, + "step": 81810 + }, + { + "epoch": 23.0, + "eval_loss": 0.17729832231998444, + "eval_runtime": 539.2851, + "eval_samples_per_second": 29.73, + "eval_steps_per_second": 0.931, + "eval_wer": 0.14893617021276595, + "step": 81811 + }, + { + "epoch": 23.01, + "learning_rate": 5.999937525380315e-05, + "loss": 0.0783, + "step": 81840 + }, + { + "epoch": 23.02, + "learning_rate": 5.998063286789742e-05, + "loss": 0.0958, + "step": 81870 + }, + { + "epoch": 23.03, + "learning_rate": 5.996189048199169e-05, + "loss": 0.0909, + "step": 81900 + }, + { + "epoch": 23.03, + "learning_rate": 5.9943148096085964e-05, + "loss": 0.0884, + "step": 81930 + }, + { + "epoch": 23.04, + "learning_rate": 5.9924405710180245e-05, + "loss": 0.0905, + "step": 81960 + }, + { + "epoch": 23.05, + "learning_rate": 5.990566332427452e-05, + "loss": 0.0843, + "step": 81990 + }, + { + "epoch": 23.06, + "learning_rate": 5.9886920938368793e-05, + "loss": 0.091, + "step": 82020 + }, + { + "epoch": 23.07, + "learning_rate": 5.986817855246306e-05, + "loss": 0.0833, + "step": 82050 + }, + { + "epoch": 23.08, + "learning_rate": 5.9849436166557335e-05, + "loss": 0.0912, + "step": 82080 + }, + { + "epoch": 23.08, + "learning_rate": 5.9830693780651616e-05, + "loss": 0.0961, + "step": 82110 + }, + { + "epoch": 23.09, + "learning_rate": 5.981195139474589e-05, + "loss": 0.0854, + "step": 82140 + }, + { + "epoch": 23.1, + "learning_rate": 5.979320900884016e-05, + "loss": 0.0906, + "step": 82170 + }, + { + "epoch": 23.11, + "learning_rate": 5.977446662293443e-05, + "loss": 0.0793, + "step": 82200 + }, + { + "epoch": 23.12, + "learning_rate": 5.975572423702871e-05, + "loss": 0.0893, + "step": 82230 + }, + { + "epoch": 23.13, + "learning_rate": 5.973698185112299e-05, + "loss": 0.0944, + "step": 82260 + }, + { + "epoch": 23.13, + "learning_rate": 5.971823946521726e-05, + "loss": 0.0794, + "step": 82290 + }, + { + "epoch": 23.14, + "learning_rate": 5.969949707931153e-05, + "loss": 0.0943, + "step": 82320 + }, + { + "epoch": 23.15, + "learning_rate": 5.96807546934058e-05, + "loss": 0.0816, + "step": 82350 + }, + { + "epoch": 23.16, + "learning_rate": 5.9662012307500084e-05, + "loss": 0.0886, + "step": 82380 + }, + { + "epoch": 23.17, + "learning_rate": 5.964326992159436e-05, + "loss": 0.0915, + "step": 82410 + }, + { + "epoch": 23.18, + "learning_rate": 5.962452753568863e-05, + "loss": 0.0844, + "step": 82440 + }, + { + "epoch": 23.19, + "learning_rate": 5.96057851497829e-05, + "loss": 0.0913, + "step": 82470 + }, + { + "epoch": 23.19, + "learning_rate": 5.9587042763877174e-05, + "loss": 0.0835, + "step": 82500 + }, + { + "epoch": 23.2, + "learning_rate": 5.9568300377971455e-05, + "loss": 0.0888, + "step": 82530 + }, + { + "epoch": 23.21, + "learning_rate": 5.954955799206573e-05, + "loss": 0.0953, + "step": 82560 + }, + { + "epoch": 23.22, + "learning_rate": 5.9530815606159996e-05, + "loss": 0.0812, + "step": 82590 + }, + { + "epoch": 23.23, + "learning_rate": 5.951207322025427e-05, + "loss": 0.0925, + "step": 82620 + }, + { + "epoch": 23.24, + "learning_rate": 5.949333083434855e-05, + "loss": 0.0802, + "step": 82650 + }, + { + "epoch": 23.24, + "learning_rate": 5.9474588448442826e-05, + "loss": 0.0954, + "step": 82680 + }, + { + "epoch": 23.25, + "learning_rate": 5.94558460625371e-05, + "loss": 0.0904, + "step": 82710 + }, + { + "epoch": 23.26, + "learning_rate": 5.943710367663137e-05, + "loss": 0.0817, + "step": 82740 + }, + { + "epoch": 23.27, + "learning_rate": 5.941836129072564e-05, + "loss": 0.0938, + "step": 82770 + }, + { + "epoch": 23.28, + "learning_rate": 5.939961890481992e-05, + "loss": 0.0842, + "step": 82800 + }, + { + "epoch": 23.29, + "learning_rate": 5.9380876518914197e-05, + "loss": 0.0955, + "step": 82830 + }, + { + "epoch": 23.29, + "learning_rate": 5.936213413300847e-05, + "loss": 0.0901, + "step": 82860 + }, + { + "epoch": 23.3, + "learning_rate": 5.934339174710274e-05, + "loss": 0.0798, + "step": 82890 + }, + { + "epoch": 23.31, + "learning_rate": 5.932464936119701e-05, + "loss": 0.0934, + "step": 82920 + }, + { + "epoch": 23.32, + "learning_rate": 5.930590697529129e-05, + "loss": 0.0869, + "step": 82950 + }, + { + "epoch": 23.33, + "learning_rate": 5.928716458938557e-05, + "loss": 0.0874, + "step": 82980 + }, + { + "epoch": 23.34, + "learning_rate": 5.9268422203479835e-05, + "loss": 0.0876, + "step": 83010 + }, + { + "epoch": 23.35, + "learning_rate": 5.924967981757411e-05, + "loss": 0.0826, + "step": 83040 + }, + { + "epoch": 23.35, + "learning_rate": 5.923093743166839e-05, + "loss": 0.0966, + "step": 83070 + }, + { + "epoch": 23.36, + "learning_rate": 5.9212195045762664e-05, + "loss": 0.0846, + "step": 83100 + }, + { + "epoch": 23.37, + "learning_rate": 5.919345265985694e-05, + "loss": 0.0957, + "step": 83130 + }, + { + "epoch": 23.38, + "learning_rate": 5.917533502014807e-05, + "loss": 0.0924, + "step": 83160 + }, + { + "epoch": 23.39, + "learning_rate": 5.915659263424235e-05, + "loss": 0.0834, + "step": 83190 + }, + { + "epoch": 23.4, + "learning_rate": 5.9137850248336614e-05, + "loss": 0.0944, + "step": 83220 + }, + { + "epoch": 23.4, + "learning_rate": 5.911973260862774e-05, + "loss": 0.0815, + "step": 83250 + }, + { + "epoch": 23.41, + "learning_rate": 5.9100990222722016e-05, + "loss": 0.0868, + "step": 83280 + }, + { + "epoch": 23.42, + "learning_rate": 5.90822478368163e-05, + "loss": 0.0916, + "step": 83310 + }, + { + "epoch": 23.43, + "learning_rate": 5.906350545091057e-05, + "loss": 0.0816, + "step": 83340 + }, + { + "epoch": 23.44, + "learning_rate": 5.904476306500485e-05, + "loss": 0.0977, + "step": 83370 + }, + { + "epoch": 23.45, + "learning_rate": 5.902602067909911e-05, + "loss": 0.0878, + "step": 83400 + }, + { + "epoch": 23.46, + "learning_rate": 5.9007278293193394e-05, + "loss": 0.0923, + "step": 83430 + }, + { + "epoch": 23.46, + "learning_rate": 5.898853590728767e-05, + "loss": 0.0945, + "step": 83460 + }, + { + "epoch": 23.47, + "learning_rate": 5.896979352138194e-05, + "loss": 0.0828, + "step": 83490 + }, + { + "epoch": 23.48, + "learning_rate": 5.895105113547622e-05, + "loss": 0.0895, + "step": 83520 + }, + { + "epoch": 23.49, + "learning_rate": 5.8932308749570484e-05, + "loss": 0.0831, + "step": 83550 + }, + { + "epoch": 23.5, + "learning_rate": 5.8913566363664765e-05, + "loss": 0.0948, + "step": 83580 + }, + { + "epoch": 23.51, + "learning_rate": 5.889482397775904e-05, + "loss": 0.093, + "step": 83610 + }, + { + "epoch": 23.51, + "learning_rate": 5.887608159185331e-05, + "loss": 0.0808, + "step": 83640 + }, + { + "epoch": 23.52, + "learning_rate": 5.885733920594758e-05, + "loss": 0.0978, + "step": 83670 + }, + { + "epoch": 23.53, + "learning_rate": 5.883859682004186e-05, + "loss": 0.0801, + "step": 83700 + }, + { + "epoch": 23.54, + "learning_rate": 5.8819854434136136e-05, + "loss": 0.0915, + "step": 83730 + }, + { + "epoch": 23.55, + "learning_rate": 5.880111204823041e-05, + "loss": 0.0922, + "step": 83760 + }, + { + "epoch": 23.56, + "learning_rate": 5.878236966232469e-05, + "loss": 0.0833, + "step": 83790 + }, + { + "epoch": 23.56, + "learning_rate": 5.876362727641895e-05, + "loss": 0.0937, + "step": 83820 + }, + { + "epoch": 23.57, + "learning_rate": 5.874488489051323e-05, + "loss": 0.0798, + "step": 83850 + }, + { + "epoch": 23.58, + "learning_rate": 5.8726142504607506e-05, + "loss": 0.0898, + "step": 83880 + }, + { + "epoch": 23.59, + "learning_rate": 5.870740011870178e-05, + "loss": 0.0969, + "step": 83910 + }, + { + "epoch": 23.6, + "learning_rate": 5.868865773279606e-05, + "loss": 0.0818, + "step": 83940 + }, + { + "epoch": 23.61, + "learning_rate": 5.866991534689032e-05, + "loss": 0.0928, + "step": 83970 + }, + { + "epoch": 23.62, + "learning_rate": 5.86511729609846e-05, + "loss": 0.0825, + "step": 84000 + }, + { + "epoch": 23.62, + "learning_rate": 5.863243057507888e-05, + "loss": 0.0906, + "step": 84030 + }, + { + "epoch": 23.63, + "learning_rate": 5.861368818917315e-05, + "loss": 0.0972, + "step": 84060 + }, + { + "epoch": 23.64, + "learning_rate": 5.859494580326742e-05, + "loss": 0.0819, + "step": 84090 + }, + { + "epoch": 23.65, + "learning_rate": 5.85762034173617e-05, + "loss": 0.0984, + "step": 84120 + }, + { + "epoch": 23.66, + "learning_rate": 5.8557461031455974e-05, + "loss": 0.0816, + "step": 84150 + }, + { + "epoch": 23.67, + "learning_rate": 5.853871864555025e-05, + "loss": 0.0893, + "step": 84180 + }, + { + "epoch": 23.67, + "learning_rate": 5.851997625964453e-05, + "loss": 0.0938, + "step": 84210 + }, + { + "epoch": 23.68, + "learning_rate": 5.850123387373879e-05, + "loss": 0.0804, + "step": 84240 + }, + { + "epoch": 23.69, + "learning_rate": 5.848249148783307e-05, + "loss": 0.0994, + "step": 84270 + }, + { + "epoch": 23.7, + "learning_rate": 5.8463749101927345e-05, + "loss": 0.0842, + "step": 84300 + }, + { + "epoch": 23.71, + "learning_rate": 5.844500671602162e-05, + "loss": 0.0933, + "step": 84330 + }, + { + "epoch": 23.72, + "learning_rate": 5.84262643301159e-05, + "loss": 0.0918, + "step": 84360 + }, + { + "epoch": 23.72, + "learning_rate": 5.840752194421016e-05, + "loss": 0.0801, + "step": 84390 + }, + { + "epoch": 23.73, + "learning_rate": 5.838877955830444e-05, + "loss": 0.0955, + "step": 84420 + }, + { + "epoch": 23.74, + "learning_rate": 5.8370037172398716e-05, + "loss": 0.0861, + "step": 84450 + }, + { + "epoch": 23.75, + "learning_rate": 5.8351294786493e-05, + "loss": 0.089, + "step": 84480 + }, + { + "epoch": 23.76, + "learning_rate": 5.833255240058726e-05, + "loss": 0.0879, + "step": 84510 + }, + { + "epoch": 23.77, + "learning_rate": 5.831381001468154e-05, + "loss": 0.0822, + "step": 84540 + }, + { + "epoch": 23.78, + "learning_rate": 5.829506762877581e-05, + "loss": 0.0994, + "step": 84570 + }, + { + "epoch": 23.78, + "learning_rate": 5.827632524287009e-05, + "loss": 0.0891, + "step": 84600 + }, + { + "epoch": 23.79, + "learning_rate": 5.825758285696437e-05, + "loss": 0.0924, + "step": 84630 + }, + { + "epoch": 23.8, + "learning_rate": 5.823884047105863e-05, + "loss": 0.0912, + "step": 84660 + }, + { + "epoch": 23.81, + "learning_rate": 5.822009808515291e-05, + "loss": 0.0844, + "step": 84690 + }, + { + "epoch": 23.82, + "learning_rate": 5.8201355699247184e-05, + "loss": 0.099, + "step": 84720 + }, + { + "epoch": 23.83, + "learning_rate": 5.818261331334146e-05, + "loss": 0.0802, + "step": 84750 + }, + { + "epoch": 23.83, + "learning_rate": 5.816387092743574e-05, + "loss": 0.0929, + "step": 84780 + }, + { + "epoch": 23.84, + "learning_rate": 5.814512854153e-05, + "loss": 0.095, + "step": 84810 + }, + { + "epoch": 23.85, + "learning_rate": 5.812638615562428e-05, + "loss": 0.083, + "step": 84840 + }, + { + "epoch": 23.86, + "learning_rate": 5.8107643769718555e-05, + "loss": 0.092, + "step": 84870 + }, + { + "epoch": 23.87, + "learning_rate": 5.8088901383812836e-05, + "loss": 0.0865, + "step": 84900 + }, + { + "epoch": 23.88, + "learning_rate": 5.8070158997907096e-05, + "loss": 0.0936, + "step": 84930 + }, + { + "epoch": 23.89, + "learning_rate": 5.805141661200138e-05, + "loss": 0.0945, + "step": 84960 + }, + { + "epoch": 23.89, + "learning_rate": 5.803267422609565e-05, + "loss": 0.0826, + "step": 84990 + }, + { + "epoch": 23.9, + "learning_rate": 5.8013931840189926e-05, + "loss": 0.0921, + "step": 85020 + }, + { + "epoch": 23.91, + "learning_rate": 5.799518945428421e-05, + "loss": 0.0818, + "step": 85050 + }, + { + "epoch": 23.92, + "learning_rate": 5.797644706837847e-05, + "loss": 0.0931, + "step": 85080 + }, + { + "epoch": 23.93, + "learning_rate": 5.795770468247275e-05, + "loss": 0.0912, + "step": 85110 + }, + { + "epoch": 23.94, + "learning_rate": 5.793896229656702e-05, + "loss": 0.0818, + "step": 85140 + }, + { + "epoch": 23.94, + "learning_rate": 5.79202199106613e-05, + "loss": 0.0919, + "step": 85170 + }, + { + "epoch": 23.95, + "learning_rate": 5.790147752475558e-05, + "loss": 0.0816, + "step": 85200 + }, + { + "epoch": 23.96, + "learning_rate": 5.7882735138849845e-05, + "loss": 0.0941, + "step": 85230 + }, + { + "epoch": 23.97, + "learning_rate": 5.786399275294412e-05, + "loss": 0.0885, + "step": 85260 + }, + { + "epoch": 23.98, + "learning_rate": 5.7845250367038393e-05, + "loss": 0.0825, + "step": 85290 + }, + { + "epoch": 23.99, + "learning_rate": 5.7826507981132674e-05, + "loss": 0.0936, + "step": 85320 + }, + { + "epoch": 23.99, + "learning_rate": 5.7807765595226935e-05, + "loss": 0.085, + "step": 85350 + }, + { + "epoch": 24.0, + "eval_loss": 0.17761550843715668, + "eval_runtime": 505.4452, + "eval_samples_per_second": 31.721, + "eval_steps_per_second": 0.993, + "eval_wer": 0.1455515674259277, + "step": 85368 + }, + { + "epoch": 24.0, + "learning_rate": 5.7789023209321216e-05, + "loss": 0.0938, + "step": 85380 + }, + { + "epoch": 24.01, + "learning_rate": 5.777028082341549e-05, + "loss": 0.0848, + "step": 85410 + }, + { + "epoch": 24.02, + "learning_rate": 5.7751538437509764e-05, + "loss": 0.079, + "step": 85440 + }, + { + "epoch": 24.03, + "learning_rate": 5.7732796051604045e-05, + "loss": 0.0943, + "step": 85470 + }, + { + "epoch": 24.04, + "learning_rate": 5.7714053665698306e-05, + "loss": 0.0719, + "step": 85500 + }, + { + "epoch": 24.05, + "learning_rate": 5.769531127979259e-05, + "loss": 0.0914, + "step": 85530 + }, + { + "epoch": 24.05, + "learning_rate": 5.767656889388686e-05, + "loss": 0.0834, + "step": 85560 + }, + { + "epoch": 24.06, + "learning_rate": 5.7657826507981135e-05, + "loss": 0.0936, + "step": 85590 + }, + { + "epoch": 24.07, + "learning_rate": 5.76390841220754e-05, + "loss": 0.0898, + "step": 85620 + }, + { + "epoch": 24.08, + "learning_rate": 5.7620341736169684e-05, + "loss": 0.0802, + "step": 85650 + }, + { + "epoch": 24.09, + "learning_rate": 5.760159935026396e-05, + "loss": 0.0914, + "step": 85680 + }, + { + "epoch": 24.1, + "learning_rate": 5.758285696435823e-05, + "loss": 0.0822, + "step": 85710 + }, + { + "epoch": 24.1, + "learning_rate": 5.756411457845251e-05, + "loss": 0.086, + "step": 85740 + }, + { + "epoch": 24.11, + "learning_rate": 5.7545372192546774e-05, + "loss": 0.0894, + "step": 85770 + }, + { + "epoch": 24.12, + "learning_rate": 5.7526629806641055e-05, + "loss": 0.0769, + "step": 85800 + }, + { + "epoch": 24.13, + "learning_rate": 5.750851216693218e-05, + "loss": 0.0922, + "step": 85830 + }, + { + "epoch": 24.14, + "learning_rate": 5.7489769781026456e-05, + "loss": 0.0828, + "step": 85860 + }, + { + "epoch": 24.15, + "learning_rate": 5.747102739512074e-05, + "loss": 0.0821, + "step": 85890 + }, + { + "epoch": 24.16, + "learning_rate": 5.745228500921501e-05, + "loss": 0.0929, + "step": 85920 + }, + { + "epoch": 24.16, + "learning_rate": 5.7433542623309286e-05, + "loss": 0.0779, + "step": 85950 + }, + { + "epoch": 24.17, + "learning_rate": 5.741480023740355e-05, + "loss": 0.0938, + "step": 85980 + }, + { + "epoch": 24.18, + "learning_rate": 5.7396057851497834e-05, + "loss": 0.0811, + "step": 86010 + }, + { + "epoch": 24.19, + "learning_rate": 5.737731546559211e-05, + "loss": 0.0861, + "step": 86040 + }, + { + "epoch": 24.2, + "learning_rate": 5.735857307968638e-05, + "loss": 0.0949, + "step": 86070 + }, + { + "epoch": 24.21, + "learning_rate": 5.733983069378065e-05, + "loss": 0.0736, + "step": 86100 + }, + { + "epoch": 24.21, + "learning_rate": 5.7321088307874924e-05, + "loss": 0.092, + "step": 86130 + }, + { + "epoch": 24.22, + "learning_rate": 5.7302345921969205e-05, + "loss": 0.083, + "step": 86160 + }, + { + "epoch": 24.23, + "learning_rate": 5.728360353606348e-05, + "loss": 0.0861, + "step": 86190 + }, + { + "epoch": 24.24, + "learning_rate": 5.726486115015775e-05, + "loss": 0.0967, + "step": 86220 + }, + { + "epoch": 24.25, + "learning_rate": 5.724611876425202e-05, + "loss": 0.0779, + "step": 86250 + }, + { + "epoch": 24.26, + "learning_rate": 5.7227376378346295e-05, + "loss": 0.0899, + "step": 86280 + }, + { + "epoch": 24.26, + "learning_rate": 5.7208633992440576e-05, + "loss": 0.0845, + "step": 86310 + }, + { + "epoch": 24.27, + "learning_rate": 5.718989160653485e-05, + "loss": 0.0825, + "step": 86340 + }, + { + "epoch": 24.28, + "learning_rate": 5.7171149220629124e-05, + "loss": 0.0979, + "step": 86370 + }, + { + "epoch": 24.29, + "learning_rate": 5.715240683472339e-05, + "loss": 0.0793, + "step": 86400 + }, + { + "epoch": 24.3, + "learning_rate": 5.713366444881767e-05, + "loss": 0.0925, + "step": 86430 + }, + { + "epoch": 24.31, + "learning_rate": 5.711492206291195e-05, + "loss": 0.0805, + "step": 86460 + }, + { + "epoch": 24.32, + "learning_rate": 5.709617967700622e-05, + "loss": 0.0881, + "step": 86490 + }, + { + "epoch": 24.32, + "learning_rate": 5.707743729110049e-05, + "loss": 0.1005, + "step": 86520 + }, + { + "epoch": 24.33, + "learning_rate": 5.705869490519476e-05, + "loss": 0.0788, + "step": 86550 + }, + { + "epoch": 24.34, + "learning_rate": 5.7039952519289044e-05, + "loss": 0.0922, + "step": 86580 + }, + { + "epoch": 24.35, + "learning_rate": 5.702121013338332e-05, + "loss": 0.0865, + "step": 86610 + }, + { + "epoch": 24.36, + "learning_rate": 5.700246774747759e-05, + "loss": 0.0883, + "step": 86640 + }, + { + "epoch": 24.37, + "learning_rate": 5.698372536157186e-05, + "loss": 0.0973, + "step": 86670 + }, + { + "epoch": 24.37, + "learning_rate": 5.6964982975666134e-05, + "loss": 0.0847, + "step": 86700 + }, + { + "epoch": 24.38, + "learning_rate": 5.6946240589760415e-05, + "loss": 0.0917, + "step": 86730 + }, + { + "epoch": 24.39, + "learning_rate": 5.692749820385469e-05, + "loss": 0.0784, + "step": 86760 + }, + { + "epoch": 24.4, + "learning_rate": 5.6908755817948956e-05, + "loss": 0.0854, + "step": 86790 + }, + { + "epoch": 24.41, + "learning_rate": 5.689001343204323e-05, + "loss": 0.0945, + "step": 86820 + }, + { + "epoch": 24.42, + "learning_rate": 5.687127104613751e-05, + "loss": 0.0747, + "step": 86850 + }, + { + "epoch": 24.43, + "learning_rate": 5.6852528660231786e-05, + "loss": 0.0845, + "step": 86880 + }, + { + "epoch": 24.43, + "learning_rate": 5.683378627432606e-05, + "loss": 0.0821, + "step": 86910 + }, + { + "epoch": 24.44, + "learning_rate": 5.681504388842033e-05, + "loss": 0.0873, + "step": 86940 + }, + { + "epoch": 24.45, + "learning_rate": 5.67963015025146e-05, + "loss": 0.0975, + "step": 86970 + }, + { + "epoch": 24.46, + "learning_rate": 5.677755911660888e-05, + "loss": 0.0812, + "step": 87000 + }, + { + "epoch": 24.47, + "learning_rate": 5.6758816730703157e-05, + "loss": 0.0905, + "step": 87030 + }, + { + "epoch": 24.48, + "learning_rate": 5.674007434479743e-05, + "loss": 0.0812, + "step": 87060 + }, + { + "epoch": 24.48, + "learning_rate": 5.67213319588917e-05, + "loss": 0.0782, + "step": 87090 + }, + { + "epoch": 24.49, + "learning_rate": 5.670258957298598e-05, + "loss": 0.0969, + "step": 87120 + }, + { + "epoch": 24.5, + "learning_rate": 5.668384718708025e-05, + "loss": 0.079, + "step": 87150 + }, + { + "epoch": 24.51, + "learning_rate": 5.666510480117453e-05, + "loss": 0.0904, + "step": 87180 + }, + { + "epoch": 24.52, + "learning_rate": 5.6646362415268795e-05, + "loss": 0.0841, + "step": 87210 + }, + { + "epoch": 24.53, + "learning_rate": 5.662762002936307e-05, + "loss": 0.0867, + "step": 87240 + }, + { + "epoch": 24.53, + "learning_rate": 5.660887764345735e-05, + "loss": 0.0931, + "step": 87270 + }, + { + "epoch": 24.54, + "learning_rate": 5.6590135257551624e-05, + "loss": 0.0781, + "step": 87300 + }, + { + "epoch": 24.55, + "learning_rate": 5.65713928716459e-05, + "loss": 0.0932, + "step": 87330 + }, + { + "epoch": 24.56, + "learning_rate": 5.6552650485740166e-05, + "loss": 0.0797, + "step": 87360 + }, + { + "epoch": 24.57, + "learning_rate": 5.653390809983444e-05, + "loss": 0.0857, + "step": 87390 + }, + { + "epoch": 24.58, + "learning_rate": 5.651516571392872e-05, + "loss": 0.095, + "step": 87420 + }, + { + "epoch": 24.59, + "learning_rate": 5.6496423328022995e-05, + "loss": 0.0788, + "step": 87450 + }, + { + "epoch": 24.59, + "learning_rate": 5.647768094211727e-05, + "loss": 0.0921, + "step": 87480 + }, + { + "epoch": 24.6, + "learning_rate": 5.645893855621154e-05, + "loss": 0.0822, + "step": 87510 + }, + { + "epoch": 24.61, + "learning_rate": 5.644019617030582e-05, + "loss": 0.0886, + "step": 87540 + }, + { + "epoch": 24.62, + "learning_rate": 5.642145378440009e-05, + "loss": 0.0961, + "step": 87570 + }, + { + "epoch": 24.63, + "learning_rate": 5.6402711398494366e-05, + "loss": 0.0757, + "step": 87600 + }, + { + "epoch": 24.64, + "learning_rate": 5.6383969012588634e-05, + "loss": 0.0877, + "step": 87630 + }, + { + "epoch": 24.64, + "learning_rate": 5.636522662668291e-05, + "loss": 0.0839, + "step": 87660 + }, + { + "epoch": 24.65, + "learning_rate": 5.634648424077719e-05, + "loss": 0.0847, + "step": 87690 + }, + { + "epoch": 24.66, + "learning_rate": 5.632774185487146e-05, + "loss": 0.0956, + "step": 87720 + }, + { + "epoch": 24.67, + "learning_rate": 5.630899946896574e-05, + "loss": 0.0766, + "step": 87750 + }, + { + "epoch": 24.68, + "learning_rate": 5.6290257083060005e-05, + "loss": 0.0869, + "step": 87780 + }, + { + "epoch": 24.69, + "learning_rate": 5.627151469715428e-05, + "loss": 0.0878, + "step": 87810 + }, + { + "epoch": 24.69, + "learning_rate": 5.625277231124856e-05, + "loss": 0.0876, + "step": 87840 + }, + { + "epoch": 24.7, + "learning_rate": 5.6234029925342834e-05, + "loss": 0.0916, + "step": 87870 + }, + { + "epoch": 24.71, + "learning_rate": 5.6215287539437115e-05, + "loss": 0.0781, + "step": 87900 + }, + { + "epoch": 24.72, + "learning_rate": 5.6196545153531375e-05, + "loss": 0.0873, + "step": 87930 + }, + { + "epoch": 24.73, + "learning_rate": 5.6177802767625656e-05, + "loss": 0.0825, + "step": 87960 + }, + { + "epoch": 24.74, + "learning_rate": 5.615906038171993e-05, + "loss": 0.0903, + "step": 87990 + }, + { + "epoch": 24.75, + "learning_rate": 5.6140317995814205e-05, + "loss": 0.0974, + "step": 88020 + }, + { + "epoch": 24.75, + "learning_rate": 5.612157560990847e-05, + "loss": 0.0757, + "step": 88050 + }, + { + "epoch": 24.76, + "learning_rate": 5.6102833224002746e-05, + "loss": 0.0975, + "step": 88080 + }, + { + "epoch": 24.77, + "learning_rate": 5.608409083809703e-05, + "loss": 0.0821, + "step": 88110 + }, + { + "epoch": 24.78, + "learning_rate": 5.60653484521913e-05, + "loss": 0.0868, + "step": 88140 + }, + { + "epoch": 24.79, + "learning_rate": 5.6046606066285576e-05, + "loss": 0.0895, + "step": 88170 + }, + { + "epoch": 24.8, + "learning_rate": 5.602786368037984e-05, + "loss": 0.079, + "step": 88200 + }, + { + "epoch": 24.8, + "learning_rate": 5.600912129447412e-05, + "loss": 0.0896, + "step": 88230 + }, + { + "epoch": 24.81, + "learning_rate": 5.59903789085684e-05, + "loss": 0.0845, + "step": 88260 + }, + { + "epoch": 24.82, + "learning_rate": 5.597163652266267e-05, + "loss": 0.0872, + "step": 88290 + }, + { + "epoch": 24.83, + "learning_rate": 5.5952894136756954e-05, + "loss": 0.0924, + "step": 88320 + }, + { + "epoch": 24.84, + "learning_rate": 5.5934151750851214e-05, + "loss": 0.0772, + "step": 88350 + }, + { + "epoch": 24.85, + "learning_rate": 5.5915409364945495e-05, + "loss": 0.096, + "step": 88380 + }, + { + "epoch": 24.86, + "learning_rate": 5.589666697903977e-05, + "loss": 0.0867, + "step": 88410 + }, + { + "epoch": 24.86, + "learning_rate": 5.5877924593134043e-05, + "loss": 0.0925, + "step": 88440 + }, + { + "epoch": 24.87, + "learning_rate": 5.585918220722831e-05, + "loss": 0.098, + "step": 88470 + }, + { + "epoch": 24.88, + "learning_rate": 5.5840439821322585e-05, + "loss": 0.0773, + "step": 88500 + }, + { + "epoch": 24.89, + "learning_rate": 5.5821697435416866e-05, + "loss": 0.0894, + "step": 88530 + }, + { + "epoch": 24.9, + "learning_rate": 5.580295504951114e-05, + "loss": 0.0833, + "step": 88560 + }, + { + "epoch": 24.91, + "learning_rate": 5.5784212663605414e-05, + "loss": 0.0885, + "step": 88590 + }, + { + "epoch": 24.91, + "learning_rate": 5.576547027769968e-05, + "loss": 0.0983, + "step": 88620 + }, + { + "epoch": 24.92, + "learning_rate": 5.574672789179396e-05, + "loss": 0.0771, + "step": 88650 + }, + { + "epoch": 24.93, + "learning_rate": 5.572798550588824e-05, + "loss": 0.091, + "step": 88680 + }, + { + "epoch": 24.94, + "learning_rate": 5.570924311998251e-05, + "loss": 0.0824, + "step": 88710 + }, + { + "epoch": 24.95, + "learning_rate": 5.569050073407679e-05, + "loss": 0.082, + "step": 88740 + }, + { + "epoch": 24.96, + "learning_rate": 5.567175834817105e-05, + "loss": 0.0929, + "step": 88770 + }, + { + "epoch": 24.96, + "learning_rate": 5.5653015962265334e-05, + "loss": 0.0785, + "step": 88800 + }, + { + "epoch": 24.97, + "learning_rate": 5.563427357635961e-05, + "loss": 0.0907, + "step": 88830 + }, + { + "epoch": 24.98, + "learning_rate": 5.561553119045388e-05, + "loss": 0.0865, + "step": 88860 + }, + { + "epoch": 24.99, + "learning_rate": 5.559678880454815e-05, + "loss": 0.0906, + "step": 88890 + }, + { + "epoch": 25.0, + "learning_rate": 5.5578046418642424e-05, + "loss": 0.0945, + "step": 88920 + }, + { + "epoch": 25.0, + "eval_loss": 0.17860166728496552, + "eval_runtime": 503.6267, + "eval_samples_per_second": 31.835, + "eval_steps_per_second": 0.997, + "eval_wer": 0.142815225253504, + "step": 88925 + }, + { + "epoch": 25.01, + "learning_rate": 5.5559304032736705e-05, + "loss": 0.0802, + "step": 88950 + }, + { + "epoch": 25.02, + "learning_rate": 5.554056164683098e-05, + "loss": 0.0906, + "step": 88980 + }, + { + "epoch": 25.02, + "learning_rate": 5.552181926092525e-05, + "loss": 0.076, + "step": 89010 + }, + { + "epoch": 25.03, + "learning_rate": 5.550307687501952e-05, + "loss": 0.0857, + "step": 89040 + }, + { + "epoch": 25.04, + "learning_rate": 5.54843344891138e-05, + "loss": 0.0802, + "step": 89070 + }, + { + "epoch": 25.05, + "learning_rate": 5.5465592103208076e-05, + "loss": 0.0799, + "step": 89100 + }, + { + "epoch": 25.06, + "learning_rate": 5.544684971730235e-05, + "loss": 0.0861, + "step": 89130 + }, + { + "epoch": 25.07, + "learning_rate": 5.542810733139663e-05, + "loss": 0.0751, + "step": 89160 + }, + { + "epoch": 25.07, + "learning_rate": 5.540936494549089e-05, + "loss": 0.0899, + "step": 89190 + }, + { + "epoch": 25.08, + "learning_rate": 5.539062255958517e-05, + "loss": 0.0826, + "step": 89220 + }, + { + "epoch": 25.09, + "learning_rate": 5.537188017367945e-05, + "loss": 0.0856, + "step": 89250 + }, + { + "epoch": 25.1, + "learning_rate": 5.535313778777372e-05, + "loss": 0.0859, + "step": 89280 + }, + { + "epoch": 25.11, + "learning_rate": 5.533439540186799e-05, + "loss": 0.0768, + "step": 89310 + }, + { + "epoch": 25.12, + "learning_rate": 5.531565301596226e-05, + "loss": 0.088, + "step": 89340 + }, + { + "epoch": 25.13, + "learning_rate": 5.5296910630056543e-05, + "loss": 0.0799, + "step": 89370 + }, + { + "epoch": 25.13, + "learning_rate": 5.527816824415082e-05, + "loss": 0.0803, + "step": 89400 + }, + { + "epoch": 25.14, + "learning_rate": 5.52594258582451e-05, + "loss": 0.0905, + "step": 89430 + }, + { + "epoch": 25.15, + "learning_rate": 5.524068347233936e-05, + "loss": 0.0751, + "step": 89460 + }, + { + "epoch": 25.16, + "learning_rate": 5.522194108643364e-05, + "loss": 0.0891, + "step": 89490 + }, + { + "epoch": 25.17, + "learning_rate": 5.5203198700527914e-05, + "loss": 0.0835, + "step": 89520 + }, + { + "epoch": 25.18, + "learning_rate": 5.518445631462219e-05, + "loss": 0.0835, + "step": 89550 + }, + { + "epoch": 25.18, + "learning_rate": 5.516571392871647e-05, + "loss": 0.0896, + "step": 89580 + }, + { + "epoch": 25.19, + "learning_rate": 5.514697154281073e-05, + "loss": 0.0741, + "step": 89610 + }, + { + "epoch": 25.2, + "learning_rate": 5.512822915690501e-05, + "loss": 0.0939, + "step": 89640 + }, + { + "epoch": 25.21, + "learning_rate": 5.5109486770999285e-05, + "loss": 0.0849, + "step": 89670 + }, + { + "epoch": 25.22, + "learning_rate": 5.509074438509356e-05, + "loss": 0.0864, + "step": 89700 + }, + { + "epoch": 25.23, + "learning_rate": 5.507200199918783e-05, + "loss": 0.089, + "step": 89730 + }, + { + "epoch": 25.23, + "learning_rate": 5.50532596132821e-05, + "loss": 0.0745, + "step": 89760 + }, + { + "epoch": 25.24, + "learning_rate": 5.503451722737638e-05, + "loss": 0.091, + "step": 89790 + }, + { + "epoch": 25.25, + "learning_rate": 5.5015774841470656e-05, + "loss": 0.0839, + "step": 89820 + }, + { + "epoch": 25.26, + "learning_rate": 5.499703245556494e-05, + "loss": 0.0847, + "step": 89850 + }, + { + "epoch": 25.27, + "learning_rate": 5.49782900696592e-05, + "loss": 0.0913, + "step": 89880 + }, + { + "epoch": 25.28, + "learning_rate": 5.495954768375348e-05, + "loss": 0.0784, + "step": 89910 + }, + { + "epoch": 25.29, + "learning_rate": 5.494080529784775e-05, + "loss": 0.0875, + "step": 89940 + }, + { + "epoch": 25.29, + "learning_rate": 5.492206291194203e-05, + "loss": 0.0846, + "step": 89970 + }, + { + "epoch": 25.3, + "learning_rate": 5.4903320526036295e-05, + "loss": 0.0829, + "step": 90000 + }, + { + "epoch": 25.31, + "learning_rate": 5.488457814013057e-05, + "loss": 0.0905, + "step": 90030 + }, + { + "epoch": 25.32, + "learning_rate": 5.486583575422485e-05, + "loss": 0.0742, + "step": 90060 + }, + { + "epoch": 25.33, + "learning_rate": 5.4847093368319124e-05, + "loss": 0.0862, + "step": 90090 + }, + { + "epoch": 25.34, + "learning_rate": 5.48283509824134e-05, + "loss": 0.0776, + "step": 90120 + }, + { + "epoch": 25.34, + "learning_rate": 5.4809608596507666e-05, + "loss": 0.0821, + "step": 90150 + }, + { + "epoch": 25.35, + "learning_rate": 5.4790866210601947e-05, + "loss": 0.0918, + "step": 90180 + }, + { + "epoch": 25.36, + "learning_rate": 5.477212382469622e-05, + "loss": 0.0777, + "step": 90210 + }, + { + "epoch": 25.37, + "learning_rate": 5.4753381438790495e-05, + "loss": 0.0873, + "step": 90240 + }, + { + "epoch": 25.38, + "learning_rate": 5.4734639052884776e-05, + "loss": 0.0833, + "step": 90270 + }, + { + "epoch": 25.39, + "learning_rate": 5.4715896666979037e-05, + "loss": 0.0772, + "step": 90300 + }, + { + "epoch": 25.39, + "learning_rate": 5.469715428107332e-05, + "loss": 0.0882, + "step": 90330 + }, + { + "epoch": 25.4, + "learning_rate": 5.467841189516759e-05, + "loss": 0.0788, + "step": 90360 + }, + { + "epoch": 25.41, + "learning_rate": 5.4659669509261866e-05, + "loss": 0.0884, + "step": 90390 + }, + { + "epoch": 25.42, + "learning_rate": 5.464092712335613e-05, + "loss": 0.085, + "step": 90420 + }, + { + "epoch": 25.43, + "learning_rate": 5.462218473745041e-05, + "loss": 0.0803, + "step": 90450 + }, + { + "epoch": 25.44, + "learning_rate": 5.460344235154469e-05, + "loss": 0.091, + "step": 90480 + }, + { + "epoch": 25.45, + "learning_rate": 5.458469996563896e-05, + "loss": 0.0763, + "step": 90510 + }, + { + "epoch": 25.45, + "learning_rate": 5.456595757973324e-05, + "loss": 0.0876, + "step": 90540 + }, + { + "epoch": 25.46, + "learning_rate": 5.4547215193827504e-05, + "loss": 0.0865, + "step": 90570 + }, + { + "epoch": 25.47, + "learning_rate": 5.4528472807921785e-05, + "loss": 0.0815, + "step": 90600 + }, + { + "epoch": 25.48, + "learning_rate": 5.450973042201606e-05, + "loss": 0.0901, + "step": 90630 + }, + { + "epoch": 25.49, + "learning_rate": 5.4490988036110334e-05, + "loss": 0.0757, + "step": 90660 + }, + { + "epoch": 25.5, + "learning_rate": 5.4472245650204615e-05, + "loss": 0.0904, + "step": 90690 + }, + { + "epoch": 25.5, + "learning_rate": 5.4453503264298875e-05, + "loss": 0.0849, + "step": 90720 + }, + { + "epoch": 25.51, + "learning_rate": 5.4434760878393156e-05, + "loss": 0.0843, + "step": 90750 + }, + { + "epoch": 25.52, + "learning_rate": 5.4416643238684284e-05, + "loss": 0.0941, + "step": 90780 + }, + { + "epoch": 25.53, + "learning_rate": 5.439790085277856e-05, + "loss": 0.0802, + "step": 90810 + }, + { + "epoch": 25.54, + "learning_rate": 5.437915846687284e-05, + "loss": 0.0852, + "step": 90840 + }, + { + "epoch": 25.55, + "learning_rate": 5.436041608096711e-05, + "loss": 0.0793, + "step": 90870 + }, + { + "epoch": 25.56, + "learning_rate": 5.434167369506138e-05, + "loss": 0.086, + "step": 90900 + }, + { + "epoch": 25.56, + "learning_rate": 5.4322931309155655e-05, + "loss": 0.0929, + "step": 90930 + }, + { + "epoch": 25.57, + "learning_rate": 5.4304188923249936e-05, + "loss": 0.0805, + "step": 90960 + }, + { + "epoch": 25.58, + "learning_rate": 5.428544653734421e-05, + "loss": 0.087, + "step": 90990 + }, + { + "epoch": 25.59, + "learning_rate": 5.4266704151438484e-05, + "loss": 0.0838, + "step": 91020 + }, + { + "epoch": 25.6, + "learning_rate": 5.424796176553275e-05, + "loss": 0.0808, + "step": 91050 + }, + { + "epoch": 25.61, + "learning_rate": 5.4229219379627026e-05, + "loss": 0.0901, + "step": 91080 + }, + { + "epoch": 25.61, + "learning_rate": 5.4210476993721306e-05, + "loss": 0.0757, + "step": 91110 + }, + { + "epoch": 25.62, + "learning_rate": 5.419173460781558e-05, + "loss": 0.0876, + "step": 91140 + }, + { + "epoch": 25.63, + "learning_rate": 5.417299222190985e-05, + "loss": 0.0828, + "step": 91170 + }, + { + "epoch": 25.64, + "learning_rate": 5.415424983600412e-05, + "loss": 0.0881, + "step": 91200 + }, + { + "epoch": 25.65, + "learning_rate": 5.4135507450098396e-05, + "loss": 0.0927, + "step": 91230 + }, + { + "epoch": 25.66, + "learning_rate": 5.411676506419268e-05, + "loss": 0.0833, + "step": 91260 + }, + { + "epoch": 25.66, + "learning_rate": 5.409802267828695e-05, + "loss": 0.0837, + "step": 91290 + }, + { + "epoch": 25.67, + "learning_rate": 5.407928029238122e-05, + "loss": 0.0846, + "step": 91320 + }, + { + "epoch": 25.68, + "learning_rate": 5.406053790647549e-05, + "loss": 0.0863, + "step": 91350 + }, + { + "epoch": 25.69, + "learning_rate": 5.4041795520569774e-05, + "loss": 0.0921, + "step": 91380 + }, + { + "epoch": 25.7, + "learning_rate": 5.402305313466405e-05, + "loss": 0.0763, + "step": 91410 + }, + { + "epoch": 25.71, + "learning_rate": 5.400431074875832e-05, + "loss": 0.0872, + "step": 91440 + }, + { + "epoch": 25.72, + "learning_rate": 5.398556836285259e-05, + "loss": 0.0823, + "step": 91470 + }, + { + "epoch": 25.72, + "learning_rate": 5.3966825976946864e-05, + "loss": 0.0841, + "step": 91500 + }, + { + "epoch": 25.73, + "learning_rate": 5.3948083591041145e-05, + "loss": 0.09, + "step": 91530 + }, + { + "epoch": 25.74, + "learning_rate": 5.392934120513542e-05, + "loss": 0.0763, + "step": 91560 + }, + { + "epoch": 25.75, + "learning_rate": 5.391059881922969e-05, + "loss": 0.094, + "step": 91590 + }, + { + "epoch": 25.76, + "learning_rate": 5.389185643332396e-05, + "loss": 0.0783, + "step": 91620 + }, + { + "epoch": 25.77, + "learning_rate": 5.3873114047418235e-05, + "loss": 0.0808, + "step": 91650 + }, + { + "epoch": 25.77, + "learning_rate": 5.3854371661512516e-05, + "loss": 0.0896, + "step": 91680 + }, + { + "epoch": 25.78, + "learning_rate": 5.383562927560679e-05, + "loss": 0.0768, + "step": 91710 + }, + { + "epoch": 25.79, + "learning_rate": 5.381688688970106e-05, + "loss": 0.0888, + "step": 91740 + }, + { + "epoch": 25.8, + "learning_rate": 5.379814450379533e-05, + "loss": 0.0829, + "step": 91770 + }, + { + "epoch": 25.81, + "learning_rate": 5.377940211788961e-05, + "loss": 0.0793, + "step": 91800 + }, + { + "epoch": 25.82, + "learning_rate": 5.376065973198389e-05, + "loss": 0.1, + "step": 91830 + }, + { + "epoch": 25.83, + "learning_rate": 5.374191734607816e-05, + "loss": 0.0743, + "step": 91860 + }, + { + "epoch": 25.83, + "learning_rate": 5.372317496017243e-05, + "loss": 0.0834, + "step": 91890 + }, + { + "epoch": 25.84, + "learning_rate": 5.37044325742667e-05, + "loss": 0.0844, + "step": 91920 + }, + { + "epoch": 25.85, + "learning_rate": 5.3685690188360984e-05, + "loss": 0.0853, + "step": 91950 + }, + { + "epoch": 25.86, + "learning_rate": 5.366694780245526e-05, + "loss": 0.0876, + "step": 91980 + }, + { + "epoch": 25.87, + "learning_rate": 5.3648205416549525e-05, + "loss": 0.0716, + "step": 92010 + }, + { + "epoch": 25.88, + "learning_rate": 5.36294630306438e-05, + "loss": 0.0894, + "step": 92040 + }, + { + "epoch": 25.88, + "learning_rate": 5.361072064473808e-05, + "loss": 0.0869, + "step": 92070 + }, + { + "epoch": 25.89, + "learning_rate": 5.3591978258832355e-05, + "loss": 0.0816, + "step": 92100 + }, + { + "epoch": 25.9, + "learning_rate": 5.357323587292663e-05, + "loss": 0.0904, + "step": 92130 + }, + { + "epoch": 25.91, + "learning_rate": 5.3554493487020896e-05, + "loss": 0.0765, + "step": 92160 + }, + { + "epoch": 25.92, + "learning_rate": 5.353575110111517e-05, + "loss": 0.086, + "step": 92190 + }, + { + "epoch": 25.93, + "learning_rate": 5.351700871520945e-05, + "loss": 0.0827, + "step": 92220 + }, + { + "epoch": 25.93, + "learning_rate": 5.3498266329303726e-05, + "loss": 0.0785, + "step": 92250 + }, + { + "epoch": 25.94, + "learning_rate": 5.3479523943398e-05, + "loss": 0.0921, + "step": 92280 + }, + { + "epoch": 25.95, + "learning_rate": 5.346078155749227e-05, + "loss": 0.0794, + "step": 92310 + }, + { + "epoch": 25.96, + "learning_rate": 5.344203917158654e-05, + "loss": 0.0864, + "step": 92340 + }, + { + "epoch": 25.97, + "learning_rate": 5.342329678568082e-05, + "loss": 0.083, + "step": 92370 + }, + { + "epoch": 25.98, + "learning_rate": 5.34045543997751e-05, + "loss": 0.0854, + "step": 92400 + }, + { + "epoch": 25.99, + "learning_rate": 5.3385812013869364e-05, + "loss": 0.0924, + "step": 92430 + }, + { + "epoch": 25.99, + "learning_rate": 5.336706962796364e-05, + "loss": 0.0804, + "step": 92460 + }, + { + "epoch": 26.0, + "eval_loss": 0.17371097207069397, + "eval_runtime": 507.5317, + "eval_samples_per_second": 31.59, + "eval_steps_per_second": 0.989, + "eval_wer": 0.14286981562103368, + "step": 92482 + }, + { + "epoch": 26.0, + "learning_rate": 5.334832724205792e-05, + "loss": 0.0943, + "step": 92490 + }, + { + "epoch": 26.01, + "learning_rate": 5.3329584856152193e-05, + "loss": 0.0759, + "step": 92520 + }, + { + "epoch": 26.02, + "learning_rate": 5.331084247024647e-05, + "loss": 0.0836, + "step": 92550 + }, + { + "epoch": 26.03, + "learning_rate": 5.3292100084340735e-05, + "loss": 0.0859, + "step": 92580 + }, + { + "epoch": 26.04, + "learning_rate": 5.327335769843501e-05, + "loss": 0.0722, + "step": 92610 + }, + { + "epoch": 26.04, + "learning_rate": 5.325461531252929e-05, + "loss": 0.0867, + "step": 92640 + }, + { + "epoch": 26.05, + "learning_rate": 5.3235872926623564e-05, + "loss": 0.0756, + "step": 92670 + }, + { + "epoch": 26.06, + "learning_rate": 5.321713054071784e-05, + "loss": 0.0839, + "step": 92700 + }, + { + "epoch": 26.07, + "learning_rate": 5.3198388154812106e-05, + "loss": 0.0798, + "step": 92730 + }, + { + "epoch": 26.08, + "learning_rate": 5.317964576890638e-05, + "loss": 0.0787, + "step": 92760 + }, + { + "epoch": 26.09, + "learning_rate": 5.316090338300066e-05, + "loss": 0.0854, + "step": 92790 + }, + { + "epoch": 26.1, + "learning_rate": 5.3142160997094935e-05, + "loss": 0.0816, + "step": 92820 + }, + { + "epoch": 26.1, + "learning_rate": 5.31234186111892e-05, + "loss": 0.0817, + "step": 92850 + }, + { + "epoch": 26.11, + "learning_rate": 5.310467622528348e-05, + "loss": 0.0864, + "step": 92880 + }, + { + "epoch": 26.12, + "learning_rate": 5.308593383937776e-05, + "loss": 0.0767, + "step": 92910 + }, + { + "epoch": 26.13, + "learning_rate": 5.306719145347203e-05, + "loss": 0.0918, + "step": 92940 + }, + { + "epoch": 26.14, + "learning_rate": 5.3048449067566306e-05, + "loss": 0.0748, + "step": 92970 + }, + { + "epoch": 26.15, + "learning_rate": 5.3029706681660574e-05, + "loss": 0.0878, + "step": 93000 + }, + { + "epoch": 26.15, + "learning_rate": 5.301096429575485e-05, + "loss": 0.0877, + "step": 93030 + }, + { + "epoch": 26.16, + "learning_rate": 5.299222190984913e-05, + "loss": 0.0787, + "step": 93060 + }, + { + "epoch": 26.17, + "learning_rate": 5.29734795239434e-05, + "loss": 0.0941, + "step": 93090 + }, + { + "epoch": 26.18, + "learning_rate": 5.295473713803768e-05, + "loss": 0.078, + "step": 93120 + }, + { + "epoch": 26.19, + "learning_rate": 5.2935994752131945e-05, + "loss": 0.0847, + "step": 93150 + }, + { + "epoch": 26.2, + "learning_rate": 5.291725236622622e-05, + "loss": 0.0847, + "step": 93180 + }, + { + "epoch": 26.2, + "learning_rate": 5.28985099803205e-05, + "loss": 0.0773, + "step": 93210 + }, + { + "epoch": 26.21, + "learning_rate": 5.2879767594414774e-05, + "loss": 0.0865, + "step": 93240 + }, + { + "epoch": 26.22, + "learning_rate": 5.286102520850904e-05, + "loss": 0.0835, + "step": 93270 + }, + { + "epoch": 26.23, + "learning_rate": 5.2842282822603316e-05, + "loss": 0.082, + "step": 93300 + }, + { + "epoch": 26.24, + "learning_rate": 5.2823540436697597e-05, + "loss": 0.0851, + "step": 93330 + }, + { + "epoch": 26.25, + "learning_rate": 5.280479805079187e-05, + "loss": 0.0791, + "step": 93360 + }, + { + "epoch": 26.26, + "learning_rate": 5.2786055664886145e-05, + "loss": 0.0868, + "step": 93390 + }, + { + "epoch": 26.26, + "learning_rate": 5.276731327898041e-05, + "loss": 0.0789, + "step": 93420 + }, + { + "epoch": 26.27, + "learning_rate": 5.2748570893074687e-05, + "loss": 0.0805, + "step": 93450 + }, + { + "epoch": 26.28, + "learning_rate": 5.272982850716897e-05, + "loss": 0.0849, + "step": 93480 + }, + { + "epoch": 26.29, + "learning_rate": 5.271108612126324e-05, + "loss": 0.0753, + "step": 93510 + }, + { + "epoch": 26.3, + "learning_rate": 5.269296848155437e-05, + "loss": 0.086, + "step": 93540 + }, + { + "epoch": 26.31, + "learning_rate": 5.267422609564865e-05, + "loss": 0.0782, + "step": 93570 + }, + { + "epoch": 26.31, + "learning_rate": 5.265548370974292e-05, + "loss": 0.0837, + "step": 93600 + }, + { + "epoch": 26.32, + "learning_rate": 5.263674132383719e-05, + "loss": 0.0847, + "step": 93630 + }, + { + "epoch": 26.33, + "learning_rate": 5.2617998937931466e-05, + "loss": 0.0776, + "step": 93660 + }, + { + "epoch": 26.34, + "learning_rate": 5.259925655202575e-05, + "loss": 0.0878, + "step": 93690 + }, + { + "epoch": 26.35, + "learning_rate": 5.258051416612002e-05, + "loss": 0.0804, + "step": 93720 + }, + { + "epoch": 26.36, + "learning_rate": 5.256177178021429e-05, + "loss": 0.0843, + "step": 93750 + }, + { + "epoch": 26.36, + "learning_rate": 5.254302939430856e-05, + "loss": 0.0802, + "step": 93780 + }, + { + "epoch": 26.37, + "learning_rate": 5.252428700840284e-05, + "loss": 0.0787, + "step": 93810 + }, + { + "epoch": 26.38, + "learning_rate": 5.250554462249712e-05, + "loss": 0.0851, + "step": 93840 + }, + { + "epoch": 26.39, + "learning_rate": 5.248680223659139e-05, + "loss": 0.0785, + "step": 93870 + }, + { + "epoch": 26.4, + "learning_rate": 5.246805985068566e-05, + "loss": 0.0848, + "step": 93900 + }, + { + "epoch": 26.41, + "learning_rate": 5.2449317464779934e-05, + "loss": 0.0807, + "step": 93930 + }, + { + "epoch": 26.42, + "learning_rate": 5.243057507887421e-05, + "loss": 0.079, + "step": 93960 + }, + { + "epoch": 26.42, + "learning_rate": 5.241183269296849e-05, + "loss": 0.088, + "step": 93990 + }, + { + "epoch": 26.43, + "learning_rate": 5.2393090307062756e-05, + "loss": 0.0778, + "step": 94020 + }, + { + "epoch": 26.44, + "learning_rate": 5.237434792115703e-05, + "loss": 0.0871, + "step": 94050 + }, + { + "epoch": 26.45, + "learning_rate": 5.2355605535251305e-05, + "loss": 0.0805, + "step": 94080 + }, + { + "epoch": 26.46, + "learning_rate": 5.2336863149345586e-05, + "loss": 0.0832, + "step": 94110 + }, + { + "epoch": 26.47, + "learning_rate": 5.231812076343986e-05, + "loss": 0.0872, + "step": 94140 + }, + { + "epoch": 26.47, + "learning_rate": 5.229937837753413e-05, + "loss": 0.0773, + "step": 94170 + }, + { + "epoch": 26.48, + "learning_rate": 5.22806359916284e-05, + "loss": 0.0886, + "step": 94200 + }, + { + "epoch": 26.49, + "learning_rate": 5.2261893605722676e-05, + "loss": 0.0831, + "step": 94230 + }, + { + "epoch": 26.5, + "learning_rate": 5.2243151219816957e-05, + "loss": 0.0801, + "step": 94260 + }, + { + "epoch": 26.51, + "learning_rate": 5.222440883391123e-05, + "loss": 0.0872, + "step": 94290 + }, + { + "epoch": 26.52, + "learning_rate": 5.22056664480055e-05, + "loss": 0.0794, + "step": 94320 + }, + { + "epoch": 26.53, + "learning_rate": 5.218692406209977e-05, + "loss": 0.083, + "step": 94350 + }, + { + "epoch": 26.53, + "learning_rate": 5.216818167619405e-05, + "loss": 0.0816, + "step": 94380 + }, + { + "epoch": 26.54, + "learning_rate": 5.214943929028833e-05, + "loss": 0.0771, + "step": 94410 + }, + { + "epoch": 26.55, + "learning_rate": 5.2130696904382595e-05, + "loss": 0.0885, + "step": 94440 + }, + { + "epoch": 26.56, + "learning_rate": 5.211195451847687e-05, + "loss": 0.0748, + "step": 94470 + }, + { + "epoch": 26.57, + "learning_rate": 5.209321213257114e-05, + "loss": 0.0867, + "step": 94500 + }, + { + "epoch": 26.58, + "learning_rate": 5.2074469746665424e-05, + "loss": 0.0869, + "step": 94530 + }, + { + "epoch": 26.58, + "learning_rate": 5.20557273607597e-05, + "loss": 0.0754, + "step": 94560 + }, + { + "epoch": 26.59, + "learning_rate": 5.2036984974853966e-05, + "loss": 0.0903, + "step": 94590 + }, + { + "epoch": 26.6, + "learning_rate": 5.201824258894824e-05, + "loss": 0.0746, + "step": 94620 + }, + { + "epoch": 26.61, + "learning_rate": 5.1999500203042514e-05, + "loss": 0.0859, + "step": 94650 + }, + { + "epoch": 26.62, + "learning_rate": 5.1980757817136795e-05, + "loss": 0.0879, + "step": 94680 + }, + { + "epoch": 26.63, + "learning_rate": 5.196201543123107e-05, + "loss": 0.0744, + "step": 94710 + }, + { + "epoch": 26.63, + "learning_rate": 5.194327304532534e-05, + "loss": 0.0881, + "step": 94740 + }, + { + "epoch": 26.64, + "learning_rate": 5.192453065941961e-05, + "loss": 0.0761, + "step": 94770 + }, + { + "epoch": 26.65, + "learning_rate": 5.190578827351389e-05, + "loss": 0.0849, + "step": 94800 + }, + { + "epoch": 26.66, + "learning_rate": 5.1887045887608166e-05, + "loss": 0.0855, + "step": 94830 + }, + { + "epoch": 26.67, + "learning_rate": 5.1868303501702434e-05, + "loss": 0.076, + "step": 94860 + }, + { + "epoch": 26.68, + "learning_rate": 5.184956111579671e-05, + "loss": 0.0815, + "step": 94890 + }, + { + "epoch": 26.69, + "learning_rate": 5.183081872989098e-05, + "loss": 0.0818, + "step": 94920 + }, + { + "epoch": 26.69, + "learning_rate": 5.181207634398526e-05, + "loss": 0.0862, + "step": 94950 + }, + { + "epoch": 26.7, + "learning_rate": 5.179333395807954e-05, + "loss": 0.0882, + "step": 94980 + }, + { + "epoch": 26.71, + "learning_rate": 5.1774591572173804e-05, + "loss": 0.0773, + "step": 95010 + }, + { + "epoch": 26.72, + "learning_rate": 5.175584918626808e-05, + "loss": 0.0928, + "step": 95040 + }, + { + "epoch": 26.73, + "learning_rate": 5.173710680036235e-05, + "loss": 0.0805, + "step": 95070 + }, + { + "epoch": 26.74, + "learning_rate": 5.1718364414456634e-05, + "loss": 0.0857, + "step": 95100 + }, + { + "epoch": 26.74, + "learning_rate": 5.169962202855091e-05, + "loss": 0.0881, + "step": 95130 + }, + { + "epoch": 26.75, + "learning_rate": 5.1680879642645175e-05, + "loss": 0.0795, + "step": 95160 + }, + { + "epoch": 26.76, + "learning_rate": 5.166213725673945e-05, + "loss": 0.083, + "step": 95190 + }, + { + "epoch": 26.77, + "learning_rate": 5.164339487083373e-05, + "loss": 0.075, + "step": 95220 + }, + { + "epoch": 26.78, + "learning_rate": 5.1624652484928005e-05, + "loss": 0.082, + "step": 95250 + }, + { + "epoch": 26.79, + "learning_rate": 5.160591009902227e-05, + "loss": 0.0811, + "step": 95280 + }, + { + "epoch": 26.79, + "learning_rate": 5.1587167713116546e-05, + "loss": 0.0798, + "step": 95310 + }, + { + "epoch": 26.8, + "learning_rate": 5.156842532721082e-05, + "loss": 0.0893, + "step": 95340 + }, + { + "epoch": 26.81, + "learning_rate": 5.15496829413051e-05, + "loss": 0.0768, + "step": 95370 + }, + { + "epoch": 26.82, + "learning_rate": 5.1530940555399376e-05, + "loss": 0.0892, + "step": 95400 + }, + { + "epoch": 26.83, + "learning_rate": 5.151219816949364e-05, + "loss": 0.084, + "step": 95430 + }, + { + "epoch": 26.84, + "learning_rate": 5.149345578358792e-05, + "loss": 0.079, + "step": 95460 + }, + { + "epoch": 26.85, + "learning_rate": 5.147471339768219e-05, + "loss": 0.0995, + "step": 95490 + }, + { + "epoch": 26.85, + "learning_rate": 5.145597101177647e-05, + "loss": 0.0821, + "step": 95520 + }, + { + "epoch": 26.86, + "learning_rate": 5.143722862587074e-05, + "loss": 0.0874, + "step": 95550 + }, + { + "epoch": 26.87, + "learning_rate": 5.1418486239965014e-05, + "loss": 0.0838, + "step": 95580 + }, + { + "epoch": 26.88, + "learning_rate": 5.139974385405929e-05, + "loss": 0.0803, + "step": 95610 + }, + { + "epoch": 26.89, + "learning_rate": 5.138100146815357e-05, + "loss": 0.089, + "step": 95640 + }, + { + "epoch": 26.9, + "learning_rate": 5.1362259082247843e-05, + "loss": 0.0766, + "step": 95670 + }, + { + "epoch": 26.9, + "learning_rate": 5.134351669634211e-05, + "loss": 0.0893, + "step": 95700 + }, + { + "epoch": 26.91, + "learning_rate": 5.1324774310436385e-05, + "loss": 0.0878, + "step": 95730 + }, + { + "epoch": 26.92, + "learning_rate": 5.130603192453066e-05, + "loss": 0.0833, + "step": 95760 + }, + { + "epoch": 26.93, + "learning_rate": 5.128728953862494e-05, + "loss": 0.0942, + "step": 95790 + }, + { + "epoch": 26.94, + "learning_rate": 5.1268547152719214e-05, + "loss": 0.0756, + "step": 95820 + }, + { + "epoch": 26.95, + "learning_rate": 5.124980476681348e-05, + "loss": 0.0826, + "step": 95850 + }, + { + "epoch": 26.96, + "learning_rate": 5.1231062380907756e-05, + "loss": 0.0812, + "step": 95880 + }, + { + "epoch": 26.96, + "learning_rate": 5.121231999500204e-05, + "loss": 0.0837, + "step": 95910 + }, + { + "epoch": 26.97, + "learning_rate": 5.1194202355293164e-05, + "loss": 0.0896, + "step": 95940 + }, + { + "epoch": 26.98, + "learning_rate": 5.117545996938744e-05, + "loss": 0.0797, + "step": 95970 + }, + { + "epoch": 26.99, + "learning_rate": 5.115671758348172e-05, + "loss": 0.0854, + "step": 96000 + }, + { + "epoch": 27.0, + "learning_rate": 5.113797519757598e-05, + "loss": 0.0832, + "step": 96030 + }, + { + "epoch": 27.0, + "eval_loss": 0.17894543707370758, + "eval_runtime": 507.5418, + "eval_samples_per_second": 31.59, + "eval_steps_per_second": 0.989, + "eval_wer": 0.13943062246666577, + "step": 96039 + }, + { + "epoch": 27.01, + "learning_rate": 5.111923281167026e-05, + "loss": 0.081, + "step": 96060 + }, + { + "epoch": 27.01, + "learning_rate": 5.1100490425764535e-05, + "loss": 0.0886, + "step": 96090 + }, + { + "epoch": 27.02, + "learning_rate": 5.108174803985881e-05, + "loss": 0.0685, + "step": 96120 + }, + { + "epoch": 27.03, + "learning_rate": 5.106300565395309e-05, + "loss": 0.0845, + "step": 96150 + }, + { + "epoch": 27.04, + "learning_rate": 5.104488801424422e-05, + "loss": 0.0777, + "step": 96180 + }, + { + "epoch": 27.05, + "learning_rate": 5.102614562833849e-05, + "loss": 0.0776, + "step": 96210 + }, + { + "epoch": 27.06, + "learning_rate": 5.100740324243276e-05, + "loss": 0.086, + "step": 96240 + }, + { + "epoch": 27.06, + "learning_rate": 5.098866085652704e-05, + "loss": 0.0698, + "step": 96270 + }, + { + "epoch": 27.07, + "learning_rate": 5.0969918470621315e-05, + "loss": 0.082, + "step": 96300 + }, + { + "epoch": 27.08, + "learning_rate": 5.095117608471559e-05, + "loss": 0.0777, + "step": 96330 + }, + { + "epoch": 27.09, + "learning_rate": 5.0932433698809856e-05, + "loss": 0.0844, + "step": 96360 + }, + { + "epoch": 27.1, + "learning_rate": 5.091369131290413e-05, + "loss": 0.0874, + "step": 96390 + }, + { + "epoch": 27.11, + "learning_rate": 5.089494892699841e-05, + "loss": 0.0745, + "step": 96420 + }, + { + "epoch": 27.12, + "learning_rate": 5.0876206541092686e-05, + "loss": 0.0863, + "step": 96450 + }, + { + "epoch": 27.12, + "learning_rate": 5.085746415518696e-05, + "loss": 0.0814, + "step": 96480 + }, + { + "epoch": 27.13, + "learning_rate": 5.083872176928123e-05, + "loss": 0.0806, + "step": 96510 + }, + { + "epoch": 27.14, + "learning_rate": 5.08199793833755e-05, + "loss": 0.0872, + "step": 96540 + }, + { + "epoch": 27.15, + "learning_rate": 5.080123699746978e-05, + "loss": 0.0735, + "step": 96570 + }, + { + "epoch": 27.16, + "learning_rate": 5.078249461156406e-05, + "loss": 0.0811, + "step": 96600 + }, + { + "epoch": 27.17, + "learning_rate": 5.076375222565834e-05, + "loss": 0.0789, + "step": 96630 + }, + { + "epoch": 27.17, + "learning_rate": 5.07450098397526e-05, + "loss": 0.0836, + "step": 96660 + }, + { + "epoch": 27.18, + "learning_rate": 5.072626745384688e-05, + "loss": 0.0919, + "step": 96690 + }, + { + "epoch": 27.19, + "learning_rate": 5.0707525067941153e-05, + "loss": 0.0715, + "step": 96720 + }, + { + "epoch": 27.2, + "learning_rate": 5.068878268203543e-05, + "loss": 0.0844, + "step": 96750 + }, + { + "epoch": 27.21, + "learning_rate": 5.0670040296129695e-05, + "loss": 0.0794, + "step": 96780 + }, + { + "epoch": 27.22, + "learning_rate": 5.065129791022397e-05, + "loss": 0.0876, + "step": 96810 + }, + { + "epoch": 27.23, + "learning_rate": 5.063255552431825e-05, + "loss": 0.0904, + "step": 96840 + }, + { + "epoch": 27.23, + "learning_rate": 5.0613813138412524e-05, + "loss": 0.0739, + "step": 96870 + }, + { + "epoch": 27.24, + "learning_rate": 5.05950707525068e-05, + "loss": 0.0841, + "step": 96900 + }, + { + "epoch": 27.25, + "learning_rate": 5.0576328366601066e-05, + "loss": 0.0775, + "step": 96930 + }, + { + "epoch": 27.26, + "learning_rate": 5.055758598069534e-05, + "loss": 0.0806, + "step": 96960 + }, + { + "epoch": 27.27, + "learning_rate": 5.053884359478962e-05, + "loss": 0.0901, + "step": 96990 + }, + { + "epoch": 27.28, + "learning_rate": 5.0520101208883895e-05, + "loss": 0.0717, + "step": 97020 + }, + { + "epoch": 27.28, + "learning_rate": 5.050135882297816e-05, + "loss": 0.0798, + "step": 97050 + }, + { + "epoch": 27.29, + "learning_rate": 5.048261643707244e-05, + "loss": 0.0796, + "step": 97080 + }, + { + "epoch": 27.3, + "learning_rate": 5.046387405116672e-05, + "loss": 0.0857, + "step": 97110 + }, + { + "epoch": 27.31, + "learning_rate": 5.044513166526099e-05, + "loss": 0.0905, + "step": 97140 + }, + { + "epoch": 27.32, + "learning_rate": 5.0426389279355266e-05, + "loss": 0.0728, + "step": 97170 + }, + { + "epoch": 27.33, + "learning_rate": 5.0407646893449534e-05, + "loss": 0.0853, + "step": 97200 + }, + { + "epoch": 27.33, + "learning_rate": 5.038890450754381e-05, + "loss": 0.0789, + "step": 97230 + }, + { + "epoch": 27.34, + "learning_rate": 5.037016212163809e-05, + "loss": 0.0774, + "step": 97260 + }, + { + "epoch": 27.35, + "learning_rate": 5.035141973573236e-05, + "loss": 0.0922, + "step": 97290 + }, + { + "epoch": 27.36, + "learning_rate": 5.033267734982664e-05, + "loss": 0.072, + "step": 97320 + }, + { + "epoch": 27.37, + "learning_rate": 5.0313934963920905e-05, + "loss": 0.0839, + "step": 97350 + }, + { + "epoch": 27.38, + "learning_rate": 5.0295192578015186e-05, + "loss": 0.0781, + "step": 97380 + }, + { + "epoch": 27.39, + "learning_rate": 5.027645019210946e-05, + "loss": 0.082, + "step": 97410 + }, + { + "epoch": 27.39, + "learning_rate": 5.0257707806203734e-05, + "loss": 0.0847, + "step": 97440 + }, + { + "epoch": 27.4, + "learning_rate": 5.0238965420298e-05, + "loss": 0.0744, + "step": 97470 + }, + { + "epoch": 27.41, + "learning_rate": 5.0220223034392276e-05, + "loss": 0.0853, + "step": 97500 + }, + { + "epoch": 27.42, + "learning_rate": 5.0201480648486557e-05, + "loss": 0.073, + "step": 97530 + }, + { + "epoch": 27.43, + "learning_rate": 5.018273826258083e-05, + "loss": 0.0738, + "step": 97560 + }, + { + "epoch": 27.44, + "learning_rate": 5.0163995876675105e-05, + "loss": 0.0832, + "step": 97590 + }, + { + "epoch": 27.44, + "learning_rate": 5.014525349076937e-05, + "loss": 0.0737, + "step": 97620 + }, + { + "epoch": 27.45, + "learning_rate": 5.0126511104863647e-05, + "loss": 0.0899, + "step": 97650 + }, + { + "epoch": 27.46, + "learning_rate": 5.010776871895793e-05, + "loss": 0.0724, + "step": 97680 + }, + { + "epoch": 27.47, + "learning_rate": 5.00890263330522e-05, + "loss": 0.0775, + "step": 97710 + }, + { + "epoch": 27.48, + "learning_rate": 5.0070283947146476e-05, + "loss": 0.0845, + "step": 97740 + }, + { + "epoch": 27.49, + "learning_rate": 5.005154156124074e-05, + "loss": 0.0731, + "step": 97770 + }, + { + "epoch": 27.5, + "learning_rate": 5.0032799175335024e-05, + "loss": 0.0887, + "step": 97800 + }, + { + "epoch": 27.5, + "learning_rate": 5.00140567894293e-05, + "loss": 0.0752, + "step": 97830 + }, + { + "epoch": 27.51, + "learning_rate": 4.9995314403523566e-05, + "loss": 0.0789, + "step": 97860 + }, + { + "epoch": 27.52, + "learning_rate": 4.997657201761785e-05, + "loss": 0.088, + "step": 97890 + }, + { + "epoch": 27.53, + "learning_rate": 4.995782963171212e-05, + "loss": 0.0717, + "step": 97920 + }, + { + "epoch": 27.54, + "learning_rate": 4.9939711992003255e-05, + "loss": 0.0812, + "step": 97950 + }, + { + "epoch": 27.55, + "learning_rate": 4.992096960609752e-05, + "loss": 0.0775, + "step": 97980 + }, + { + "epoch": 27.55, + "learning_rate": 4.99022272201918e-05, + "loss": 0.0838, + "step": 98010 + }, + { + "epoch": 27.56, + "learning_rate": 4.988348483428608e-05, + "loss": 0.0828, + "step": 98040 + }, + { + "epoch": 27.57, + "learning_rate": 4.9864742448380345e-05, + "loss": 0.0754, + "step": 98070 + }, + { + "epoch": 27.58, + "learning_rate": 4.9846000062474626e-05, + "loss": 0.0857, + "step": 98100 + }, + { + "epoch": 27.59, + "learning_rate": 4.9827257676568894e-05, + "loss": 0.0792, + "step": 98130 + }, + { + "epoch": 27.6, + "learning_rate": 4.9808515290663175e-05, + "loss": 0.081, + "step": 98160 + }, + { + "epoch": 27.6, + "learning_rate": 4.978977290475744e-05, + "loss": 0.0903, + "step": 98190 + }, + { + "epoch": 27.61, + "learning_rate": 4.9771030518851716e-05, + "loss": 0.0697, + "step": 98220 + }, + { + "epoch": 27.62, + "learning_rate": 4.9752288132946e-05, + "loss": 0.0831, + "step": 98250 + }, + { + "epoch": 27.63, + "learning_rate": 4.9733545747040265e-05, + "loss": 0.0775, + "step": 98280 + }, + { + "epoch": 27.64, + "learning_rate": 4.9714803361134546e-05, + "loss": 0.0806, + "step": 98310 + }, + { + "epoch": 27.65, + "learning_rate": 4.969606097522881e-05, + "loss": 0.0896, + "step": 98340 + }, + { + "epoch": 27.66, + "learning_rate": 4.9677318589323094e-05, + "loss": 0.0721, + "step": 98370 + }, + { + "epoch": 27.66, + "learning_rate": 4.965857620341736e-05, + "loss": 0.0842, + "step": 98400 + }, + { + "epoch": 27.67, + "learning_rate": 4.9639833817511635e-05, + "loss": 0.0806, + "step": 98430 + }, + { + "epoch": 27.68, + "learning_rate": 4.9621091431605916e-05, + "loss": 0.0837, + "step": 98460 + }, + { + "epoch": 27.69, + "learning_rate": 4.9602349045700184e-05, + "loss": 0.0857, + "step": 98490 + }, + { + "epoch": 27.7, + "learning_rate": 4.9583606659794465e-05, + "loss": 0.072, + "step": 98520 + }, + { + "epoch": 27.71, + "learning_rate": 4.956486427388873e-05, + "loss": 0.0852, + "step": 98550 + }, + { + "epoch": 27.71, + "learning_rate": 4.954612188798301e-05, + "loss": 0.0756, + "step": 98580 + }, + { + "epoch": 27.72, + "learning_rate": 4.952737950207728e-05, + "loss": 0.0751, + "step": 98610 + }, + { + "epoch": 27.73, + "learning_rate": 4.9508637116171555e-05, + "loss": 0.0875, + "step": 98640 + }, + { + "epoch": 27.74, + "learning_rate": 4.9489894730265836e-05, + "loss": 0.0756, + "step": 98670 + }, + { + "epoch": 27.75, + "learning_rate": 4.94711523443601e-05, + "loss": 0.0835, + "step": 98700 + }, + { + "epoch": 27.76, + "learning_rate": 4.9452409958454384e-05, + "loss": 0.0758, + "step": 98730 + }, + { + "epoch": 27.76, + "learning_rate": 4.943366757254865e-05, + "loss": 0.0805, + "step": 98760 + }, + { + "epoch": 27.77, + "learning_rate": 4.941492518664293e-05, + "loss": 0.0908, + "step": 98790 + }, + { + "epoch": 27.78, + "learning_rate": 4.93961828007372e-05, + "loss": 0.0686, + "step": 98820 + }, + { + "epoch": 27.79, + "learning_rate": 4.9377440414831474e-05, + "loss": 0.0823, + "step": 98850 + }, + { + "epoch": 27.8, + "learning_rate": 4.9358698028925755e-05, + "loss": 0.0782, + "step": 98880 + }, + { + "epoch": 27.81, + "learning_rate": 4.933995564302002e-05, + "loss": 0.0835, + "step": 98910 + }, + { + "epoch": 27.82, + "learning_rate": 4.9321213257114304e-05, + "loss": 0.0905, + "step": 98940 + }, + { + "epoch": 27.82, + "learning_rate": 4.930247087120857e-05, + "loss": 0.0749, + "step": 98970 + }, + { + "epoch": 27.83, + "learning_rate": 4.928372848530285e-05, + "loss": 0.0906, + "step": 99000 + }, + { + "epoch": 27.84, + "learning_rate": 4.926498609939712e-05, + "loss": 0.0759, + "step": 99030 + }, + { + "epoch": 27.85, + "learning_rate": 4.9246243713491394e-05, + "loss": 0.0774, + "step": 99060 + }, + { + "epoch": 27.86, + "learning_rate": 4.9227501327585674e-05, + "loss": 0.0854, + "step": 99090 + }, + { + "epoch": 27.87, + "learning_rate": 4.920875894167994e-05, + "loss": 0.0737, + "step": 99120 + }, + { + "epoch": 27.87, + "learning_rate": 4.919001655577422e-05, + "loss": 0.0804, + "step": 99150 + }, + { + "epoch": 27.88, + "learning_rate": 4.917127416986849e-05, + "loss": 0.0797, + "step": 99180 + }, + { + "epoch": 27.89, + "learning_rate": 4.915253178396277e-05, + "loss": 0.0857, + "step": 99210 + }, + { + "epoch": 27.9, + "learning_rate": 4.913378939805704e-05, + "loss": 0.0884, + "step": 99240 + }, + { + "epoch": 27.91, + "learning_rate": 4.911504701215131e-05, + "loss": 0.071, + "step": 99270 + }, + { + "epoch": 27.92, + "learning_rate": 4.9096304626245594e-05, + "loss": 0.0831, + "step": 99300 + }, + { + "epoch": 27.93, + "learning_rate": 4.907756224033986e-05, + "loss": 0.077, + "step": 99330 + }, + { + "epoch": 27.93, + "learning_rate": 4.905881985443414e-05, + "loss": 0.0806, + "step": 99360 + }, + { + "epoch": 27.94, + "learning_rate": 4.904007746852841e-05, + "loss": 0.0897, + "step": 99390 + }, + { + "epoch": 27.95, + "learning_rate": 4.902133508262269e-05, + "loss": 0.0747, + "step": 99420 + }, + { + "epoch": 27.96, + "learning_rate": 4.900259269671696e-05, + "loss": 0.0819, + "step": 99450 + }, + { + "epoch": 27.97, + "learning_rate": 4.898385031081124e-05, + "loss": 0.0781, + "step": 99480 + }, + { + "epoch": 27.98, + "learning_rate": 4.896510792490551e-05, + "loss": 0.0808, + "step": 99510 + }, + { + "epoch": 27.98, + "learning_rate": 4.894636553899978e-05, + "loss": 0.0893, + "step": 99540 + }, + { + "epoch": 27.99, + "learning_rate": 4.892762315309406e-05, + "loss": 0.0683, + "step": 99570 + }, + { + "epoch": 28.0, + "eval_loss": 0.17405028641223907, + "eval_runtime": 504.0127, + "eval_samples_per_second": 31.811, + "eval_steps_per_second": 0.996, + "eval_wer": 0.1390484898939582, + "step": 99596 + }, + { + "epoch": 28.0, + "learning_rate": 4.890888076718833e-05, + "loss": 0.0901, + "step": 99600 + }, + { + "epoch": 28.01, + "learning_rate": 4.889013838128261e-05, + "loss": 0.0696, + "step": 99630 + }, + { + "epoch": 28.02, + "learning_rate": 4.887139599537688e-05, + "loss": 0.0792, + "step": 99660 + }, + { + "epoch": 28.03, + "learning_rate": 4.885265360947116e-05, + "loss": 0.0727, + "step": 99690 + }, + { + "epoch": 28.03, + "learning_rate": 4.8833911223565426e-05, + "loss": 0.0806, + "step": 99720 + }, + { + "epoch": 28.04, + "learning_rate": 4.88151688376597e-05, + "loss": 0.0846, + "step": 99750 + }, + { + "epoch": 28.05, + "learning_rate": 4.879642645175398e-05, + "loss": 0.0689, + "step": 99780 + }, + { + "epoch": 28.06, + "learning_rate": 4.877768406584825e-05, + "loss": 0.0813, + "step": 99810 + }, + { + "epoch": 28.07, + "learning_rate": 4.875894167994253e-05, + "loss": 0.0765, + "step": 99840 + }, + { + "epoch": 28.08, + "learning_rate": 4.87401992940368e-05, + "loss": 0.0702, + "step": 99870 + }, + { + "epoch": 28.09, + "learning_rate": 4.872145690813108e-05, + "loss": 0.084, + "step": 99900 + }, + { + "epoch": 28.09, + "learning_rate": 4.8702714522225345e-05, + "loss": 0.0721, + "step": 99930 + }, + { + "epoch": 28.1, + "learning_rate": 4.868397213631962e-05, + "loss": 0.0775, + "step": 99960 + }, + { + "epoch": 28.11, + "learning_rate": 4.86652297504139e-05, + "loss": 0.0758, + "step": 99990 + }, + { + "epoch": 28.12, + "learning_rate": 4.864648736450817e-05, + "loss": 0.0764, + "step": 100020 + }, + { + "epoch": 28.13, + "learning_rate": 4.862774497860245e-05, + "loss": 0.0849, + "step": 100050 + }, + { + "epoch": 28.14, + "learning_rate": 4.8609002592696716e-05, + "loss": 0.0691, + "step": 100080 + }, + { + "epoch": 28.14, + "learning_rate": 4.8590260206791e-05, + "loss": 0.079, + "step": 100110 + }, + { + "epoch": 28.15, + "learning_rate": 4.8571517820885264e-05, + "loss": 0.0777, + "step": 100140 + }, + { + "epoch": 28.16, + "learning_rate": 4.855277543497954e-05, + "loss": 0.0761, + "step": 100170 + }, + { + "epoch": 28.17, + "learning_rate": 4.853403304907382e-05, + "loss": 0.0843, + "step": 100200 + }, + { + "epoch": 28.18, + "learning_rate": 4.851529066316809e-05, + "loss": 0.071, + "step": 100230 + }, + { + "epoch": 28.19, + "learning_rate": 4.849654827726237e-05, + "loss": 0.0842, + "step": 100260 + }, + { + "epoch": 28.2, + "learning_rate": 4.8477805891356635e-05, + "loss": 0.0778, + "step": 100290 + }, + { + "epoch": 28.2, + "learning_rate": 4.8459063505450916e-05, + "loss": 0.0767, + "step": 100320 + }, + { + "epoch": 28.21, + "learning_rate": 4.8440321119545184e-05, + "loss": 0.0876, + "step": 100350 + }, + { + "epoch": 28.22, + "learning_rate": 4.842157873363946e-05, + "loss": 0.0721, + "step": 100380 + }, + { + "epoch": 28.23, + "learning_rate": 4.840283634773374e-05, + "loss": 0.0829, + "step": 100410 + }, + { + "epoch": 28.24, + "learning_rate": 4.8384093961828006e-05, + "loss": 0.0797, + "step": 100440 + }, + { + "epoch": 28.25, + "learning_rate": 4.836535157592229e-05, + "loss": 0.0775, + "step": 100470 + }, + { + "epoch": 28.25, + "learning_rate": 4.8346609190016555e-05, + "loss": 0.081, + "step": 100500 + }, + { + "epoch": 28.26, + "learning_rate": 4.8327866804110836e-05, + "loss": 0.0684, + "step": 100530 + }, + { + "epoch": 28.27, + "learning_rate": 4.83091244182051e-05, + "loss": 0.0847, + "step": 100560 + }, + { + "epoch": 28.28, + "learning_rate": 4.829038203229938e-05, + "loss": 0.0765, + "step": 100590 + }, + { + "epoch": 28.29, + "learning_rate": 4.827163964639366e-05, + "loss": 0.0819, + "step": 100620 + }, + { + "epoch": 28.3, + "learning_rate": 4.8252897260487926e-05, + "loss": 0.0865, + "step": 100650 + }, + { + "epoch": 28.3, + "learning_rate": 4.8234154874582207e-05, + "loss": 0.0685, + "step": 100680 + }, + { + "epoch": 28.31, + "learning_rate": 4.8215412488676474e-05, + "loss": 0.0824, + "step": 100710 + }, + { + "epoch": 28.32, + "learning_rate": 4.8196670102770755e-05, + "loss": 0.0759, + "step": 100740 + }, + { + "epoch": 28.33, + "learning_rate": 4.817792771686502e-05, + "loss": 0.076, + "step": 100770 + }, + { + "epoch": 28.34, + "learning_rate": 4.81591853309593e-05, + "loss": 0.0874, + "step": 100800 + }, + { + "epoch": 28.35, + "learning_rate": 4.814044294505358e-05, + "loss": 0.0693, + "step": 100830 + }, + { + "epoch": 28.36, + "learning_rate": 4.8121700559147845e-05, + "loss": 0.079, + "step": 100860 + }, + { + "epoch": 28.36, + "learning_rate": 4.8102958173242126e-05, + "loss": 0.0758, + "step": 100890 + }, + { + "epoch": 28.37, + "learning_rate": 4.808421578733639e-05, + "loss": 0.0777, + "step": 100920 + }, + { + "epoch": 28.38, + "learning_rate": 4.8065473401430674e-05, + "loss": 0.0839, + "step": 100950 + }, + { + "epoch": 28.39, + "learning_rate": 4.804673101552494e-05, + "loss": 0.0735, + "step": 100980 + }, + { + "epoch": 28.4, + "learning_rate": 4.802798862961922e-05, + "loss": 0.0807, + "step": 101010 + }, + { + "epoch": 28.41, + "learning_rate": 4.80092462437135e-05, + "loss": 0.0827, + "step": 101040 + }, + { + "epoch": 28.41, + "learning_rate": 4.7990503857807764e-05, + "loss": 0.0817, + "step": 101070 + }, + { + "epoch": 28.42, + "learning_rate": 4.7971761471902045e-05, + "loss": 0.083, + "step": 101100 + }, + { + "epoch": 28.43, + "learning_rate": 4.795301908599631e-05, + "loss": 0.0715, + "step": 101130 + }, + { + "epoch": 28.44, + "learning_rate": 4.7934276700090594e-05, + "loss": 0.0833, + "step": 101160 + }, + { + "epoch": 28.45, + "learning_rate": 4.791553431418486e-05, + "loss": 0.0769, + "step": 101190 + }, + { + "epoch": 28.46, + "learning_rate": 4.789679192827914e-05, + "loss": 0.0804, + "step": 101220 + }, + { + "epoch": 28.46, + "learning_rate": 4.7878049542373416e-05, + "loss": 0.0848, + "step": 101250 + }, + { + "epoch": 28.47, + "learning_rate": 4.7859307156467684e-05, + "loss": 0.066, + "step": 101280 + }, + { + "epoch": 28.48, + "learning_rate": 4.7840564770561965e-05, + "loss": 0.0854, + "step": 101310 + }, + { + "epoch": 28.49, + "learning_rate": 4.782182238465623e-05, + "loss": 0.0778, + "step": 101340 + }, + { + "epoch": 28.5, + "learning_rate": 4.780307999875051e-05, + "loss": 0.0797, + "step": 101370 + }, + { + "epoch": 28.51, + "learning_rate": 4.778433761284478e-05, + "loss": 0.0888, + "step": 101400 + }, + { + "epoch": 28.52, + "learning_rate": 4.776559522693906e-05, + "loss": 0.0721, + "step": 101430 + }, + { + "epoch": 28.52, + "learning_rate": 4.7746852841033336e-05, + "loss": 0.0865, + "step": 101460 + }, + { + "epoch": 28.53, + "learning_rate": 4.77281104551276e-05, + "loss": 0.0771, + "step": 101490 + }, + { + "epoch": 28.54, + "learning_rate": 4.7709368069221884e-05, + "loss": 0.0756, + "step": 101520 + }, + { + "epoch": 28.55, + "learning_rate": 4.769062568331615e-05, + "loss": 0.0855, + "step": 101550 + }, + { + "epoch": 28.56, + "learning_rate": 4.767188329741043e-05, + "loss": 0.0727, + "step": 101580 + }, + { + "epoch": 28.57, + "learning_rate": 4.76531409115047e-05, + "loss": 0.0831, + "step": 101610 + }, + { + "epoch": 28.57, + "learning_rate": 4.763439852559898e-05, + "loss": 0.08, + "step": 101640 + }, + { + "epoch": 28.58, + "learning_rate": 4.7615656139693255e-05, + "loss": 0.076, + "step": 101670 + }, + { + "epoch": 28.59, + "learning_rate": 4.759691375378752e-05, + "loss": 0.0856, + "step": 101700 + }, + { + "epoch": 28.6, + "learning_rate": 4.75781713678818e-05, + "loss": 0.0746, + "step": 101730 + }, + { + "epoch": 28.61, + "learning_rate": 4.755942898197607e-05, + "loss": 0.0843, + "step": 101760 + }, + { + "epoch": 28.62, + "learning_rate": 4.754068659607035e-05, + "loss": 0.0768, + "step": 101790 + }, + { + "epoch": 28.63, + "learning_rate": 4.752194421016462e-05, + "loss": 0.0799, + "step": 101820 + }, + { + "epoch": 28.63, + "learning_rate": 4.75032018242589e-05, + "loss": 0.0891, + "step": 101850 + }, + { + "epoch": 28.64, + "learning_rate": 4.7484459438353174e-05, + "loss": 0.0719, + "step": 101880 + }, + { + "epoch": 28.65, + "learning_rate": 4.746571705244744e-05, + "loss": 0.0836, + "step": 101910 + }, + { + "epoch": 28.66, + "learning_rate": 4.744697466654172e-05, + "loss": 0.0736, + "step": 101940 + }, + { + "epoch": 28.67, + "learning_rate": 4.742823228063599e-05, + "loss": 0.0755, + "step": 101970 + }, + { + "epoch": 28.68, + "learning_rate": 4.740948989473027e-05, + "loss": 0.0851, + "step": 102000 + }, + { + "epoch": 28.68, + "learning_rate": 4.739074750882454e-05, + "loss": 0.0715, + "step": 102030 + }, + { + "epoch": 28.69, + "learning_rate": 4.737200512291882e-05, + "loss": 0.0837, + "step": 102060 + }, + { + "epoch": 28.7, + "learning_rate": 4.7353262737013094e-05, + "loss": 0.079, + "step": 102090 + }, + { + "epoch": 28.71, + "learning_rate": 4.733452035110736e-05, + "loss": 0.0755, + "step": 102120 + }, + { + "epoch": 28.72, + "learning_rate": 4.731577796520164e-05, + "loss": 0.0904, + "step": 102150 + }, + { + "epoch": 28.73, + "learning_rate": 4.729703557929591e-05, + "loss": 0.0769, + "step": 102180 + }, + { + "epoch": 28.73, + "learning_rate": 4.727829319339019e-05, + "loss": 0.0791, + "step": 102210 + }, + { + "epoch": 28.74, + "learning_rate": 4.725955080748446e-05, + "loss": 0.0824, + "step": 102240 + }, + { + "epoch": 28.75, + "learning_rate": 4.724080842157874e-05, + "loss": 0.0743, + "step": 102270 + }, + { + "epoch": 28.76, + "learning_rate": 4.722206603567301e-05, + "loss": 0.0833, + "step": 102300 + }, + { + "epoch": 28.77, + "learning_rate": 4.720332364976729e-05, + "loss": 0.0729, + "step": 102330 + }, + { + "epoch": 28.78, + "learning_rate": 4.718458126386156e-05, + "loss": 0.0796, + "step": 102360 + }, + { + "epoch": 28.79, + "learning_rate": 4.716583887795583e-05, + "loss": 0.0812, + "step": 102390 + }, + { + "epoch": 28.79, + "learning_rate": 4.714709649205011e-05, + "loss": 0.0808, + "step": 102420 + }, + { + "epoch": 28.8, + "learning_rate": 4.712835410614438e-05, + "loss": 0.0863, + "step": 102450 + }, + { + "epoch": 28.81, + "learning_rate": 4.710961172023866e-05, + "loss": 0.072, + "step": 102480 + }, + { + "epoch": 28.82, + "learning_rate": 4.709086933433293e-05, + "loss": 0.0865, + "step": 102510 + }, + { + "epoch": 28.83, + "learning_rate": 4.7072126948427206e-05, + "loss": 0.077, + "step": 102540 + }, + { + "epoch": 28.84, + "learning_rate": 4.705338456252148e-05, + "loss": 0.0726, + "step": 102570 + }, + { + "epoch": 28.84, + "learning_rate": 4.703464217661575e-05, + "loss": 0.0873, + "step": 102600 + }, + { + "epoch": 28.85, + "learning_rate": 4.701589979071003e-05, + "loss": 0.0751, + "step": 102630 + }, + { + "epoch": 28.86, + "learning_rate": 4.6997157404804296e-05, + "loss": 0.0856, + "step": 102660 + }, + { + "epoch": 28.87, + "learning_rate": 4.697841501889858e-05, + "loss": 0.0805, + "step": 102690 + }, + { + "epoch": 28.88, + "learning_rate": 4.695967263299285e-05, + "loss": 0.0808, + "step": 102720 + }, + { + "epoch": 28.89, + "learning_rate": 4.6940930247087126e-05, + "loss": 0.0881, + "step": 102750 + }, + { + "epoch": 28.9, + "learning_rate": 4.69221878611814e-05, + "loss": 0.0678, + "step": 102780 + }, + { + "epoch": 28.9, + "learning_rate": 4.690344547527567e-05, + "loss": 0.0798, + "step": 102810 + }, + { + "epoch": 28.91, + "learning_rate": 4.688470308936995e-05, + "loss": 0.0816, + "step": 102840 + }, + { + "epoch": 28.92, + "learning_rate": 4.6865960703464216e-05, + "loss": 0.0761, + "step": 102870 + }, + { + "epoch": 28.93, + "learning_rate": 4.68472183175585e-05, + "loss": 0.081, + "step": 102900 + }, + { + "epoch": 28.94, + "learning_rate": 4.682847593165277e-05, + "loss": 0.0742, + "step": 102930 + }, + { + "epoch": 28.95, + "learning_rate": 4.6809733545747045e-05, + "loss": 0.0839, + "step": 102960 + }, + { + "epoch": 28.95, + "learning_rate": 4.679099115984132e-05, + "loss": 0.0795, + "step": 102990 + }, + { + "epoch": 28.96, + "learning_rate": 4.677287352013245e-05, + "loss": 0.0747, + "step": 103020 + }, + { + "epoch": 28.97, + "learning_rate": 4.675413113422673e-05, + "loss": 0.0859, + "step": 103050 + }, + { + "epoch": 28.98, + "learning_rate": 4.6735388748320995e-05, + "loss": 0.0709, + "step": 103080 + }, + { + "epoch": 28.99, + "learning_rate": 4.6716646362415276e-05, + "loss": 0.0851, + "step": 103110 + }, + { + "epoch": 29.0, + "learning_rate": 4.6697903976509543e-05, + "loss": 0.0761, + "step": 103140 + }, + { + "epoch": 29.0, + "eval_loss": 0.16884161531925201, + "eval_runtime": 504.2221, + "eval_samples_per_second": 31.797, + "eval_steps_per_second": 0.996, + "eval_wer": 0.1379225635636592, + "step": 103153 + }, + { + "epoch": 29.0, + "learning_rate": 4.667916159060382e-05, + "loss": 0.0795, + "step": 103170 + }, + { + "epoch": 29.01, + "learning_rate": 4.666041920469809e-05, + "loss": 0.0801, + "step": 103200 + }, + { + "epoch": 29.02, + "learning_rate": 4.6641676818792366e-05, + "loss": 0.078, + "step": 103230 + }, + { + "epoch": 29.03, + "learning_rate": 4.662293443288665e-05, + "loss": 0.0773, + "step": 103260 + }, + { + "epoch": 29.04, + "learning_rate": 4.6604192046980914e-05, + "loss": 0.073, + "step": 103290 + }, + { + "epoch": 29.05, + "learning_rate": 4.6585449661075195e-05, + "loss": 0.0767, + "step": 103320 + }, + { + "epoch": 29.06, + "learning_rate": 4.656670727516946e-05, + "loss": 0.0747, + "step": 103350 + }, + { + "epoch": 29.06, + "learning_rate": 4.654796488926374e-05, + "loss": 0.0705, + "step": 103380 + }, + { + "epoch": 29.07, + "learning_rate": 4.652922250335801e-05, + "loss": 0.0811, + "step": 103410 + }, + { + "epoch": 29.08, + "learning_rate": 4.6510480117452285e-05, + "loss": 0.0723, + "step": 103440 + }, + { + "epoch": 29.09, + "learning_rate": 4.6491737731546566e-05, + "loss": 0.0787, + "step": 103470 + }, + { + "epoch": 29.1, + "learning_rate": 4.6472995345640834e-05, + "loss": 0.0768, + "step": 103500 + }, + { + "epoch": 29.11, + "learning_rate": 4.6454252959735115e-05, + "loss": 0.0724, + "step": 103530 + }, + { + "epoch": 29.11, + "learning_rate": 4.643551057382938e-05, + "loss": 0.0837, + "step": 103560 + }, + { + "epoch": 29.12, + "learning_rate": 4.6416768187923656e-05, + "loss": 0.0678, + "step": 103590 + }, + { + "epoch": 29.13, + "learning_rate": 4.639802580201793e-05, + "loss": 0.0787, + "step": 103620 + }, + { + "epoch": 29.14, + "learning_rate": 4.6379283416112205e-05, + "loss": 0.0766, + "step": 103650 + }, + { + "epoch": 29.15, + "learning_rate": 4.6360541030206486e-05, + "loss": 0.0735, + "step": 103680 + }, + { + "epoch": 29.16, + "learning_rate": 4.634179864430075e-05, + "loss": 0.0764, + "step": 103710 + }, + { + "epoch": 29.17, + "learning_rate": 4.6323056258395034e-05, + "loss": 0.0708, + "step": 103740 + }, + { + "epoch": 29.17, + "learning_rate": 4.63043138724893e-05, + "loss": 0.0829, + "step": 103770 + }, + { + "epoch": 29.18, + "learning_rate": 4.6285571486583576e-05, + "loss": 0.079, + "step": 103800 + }, + { + "epoch": 29.19, + "learning_rate": 4.626682910067785e-05, + "loss": 0.0735, + "step": 103830 + }, + { + "epoch": 29.2, + "learning_rate": 4.6248086714772124e-05, + "loss": 0.0796, + "step": 103860 + }, + { + "epoch": 29.21, + "learning_rate": 4.6229344328866405e-05, + "loss": 0.0697, + "step": 103890 + }, + { + "epoch": 29.22, + "learning_rate": 4.621060194296067e-05, + "loss": 0.0766, + "step": 103920 + }, + { + "epoch": 29.22, + "learning_rate": 4.619185955705495e-05, + "loss": 0.0761, + "step": 103950 + }, + { + "epoch": 29.23, + "learning_rate": 4.617311717114922e-05, + "loss": 0.0731, + "step": 103980 + }, + { + "epoch": 29.24, + "learning_rate": 4.6154374785243495e-05, + "loss": 0.0812, + "step": 104010 + }, + { + "epoch": 29.25, + "learning_rate": 4.613563239933777e-05, + "loss": 0.0717, + "step": 104040 + }, + { + "epoch": 29.26, + "learning_rate": 4.611689001343204e-05, + "loss": 0.0798, + "step": 104070 + }, + { + "epoch": 29.27, + "learning_rate": 4.609814762752632e-05, + "loss": 0.0769, + "step": 104100 + }, + { + "epoch": 29.27, + "learning_rate": 4.607940524162059e-05, + "loss": 0.0744, + "step": 104130 + }, + { + "epoch": 29.28, + "learning_rate": 4.606066285571487e-05, + "loss": 0.0809, + "step": 104160 + }, + { + "epoch": 29.29, + "learning_rate": 4.604192046980914e-05, + "loss": 0.0728, + "step": 104190 + }, + { + "epoch": 29.3, + "learning_rate": 4.6023178083903414e-05, + "loss": 0.0783, + "step": 104220 + }, + { + "epoch": 29.31, + "learning_rate": 4.600443569799769e-05, + "loss": 0.0741, + "step": 104250 + }, + { + "epoch": 29.32, + "learning_rate": 4.598569331209196e-05, + "loss": 0.0725, + "step": 104280 + }, + { + "epoch": 29.33, + "learning_rate": 4.596695092618624e-05, + "loss": 0.0855, + "step": 104310 + }, + { + "epoch": 29.33, + "learning_rate": 4.594820854028051e-05, + "loss": 0.0706, + "step": 104340 + }, + { + "epoch": 29.34, + "learning_rate": 4.592946615437479e-05, + "loss": 0.0829, + "step": 104370 + }, + { + "epoch": 29.35, + "learning_rate": 4.591072376846906e-05, + "loss": 0.0805, + "step": 104400 + }, + { + "epoch": 29.36, + "learning_rate": 4.589198138256334e-05, + "loss": 0.0733, + "step": 104430 + }, + { + "epoch": 29.37, + "learning_rate": 4.587323899665761e-05, + "loss": 0.0785, + "step": 104460 + }, + { + "epoch": 29.38, + "learning_rate": 4.585449661075188e-05, + "loss": 0.067, + "step": 104490 + }, + { + "epoch": 29.38, + "learning_rate": 4.5835754224846156e-05, + "loss": 0.0796, + "step": 104520 + }, + { + "epoch": 29.39, + "learning_rate": 4.581701183894043e-05, + "loss": 0.079, + "step": 104550 + }, + { + "epoch": 29.4, + "learning_rate": 4.579826945303471e-05, + "loss": 0.0743, + "step": 104580 + }, + { + "epoch": 29.41, + "learning_rate": 4.577952706712898e-05, + "loss": 0.0806, + "step": 104610 + }, + { + "epoch": 29.42, + "learning_rate": 4.576078468122326e-05, + "loss": 0.0676, + "step": 104640 + }, + { + "epoch": 29.43, + "learning_rate": 4.574204229531753e-05, + "loss": 0.0739, + "step": 104670 + }, + { + "epoch": 29.43, + "learning_rate": 4.57232999094118e-05, + "loss": 0.0772, + "step": 104700 + }, + { + "epoch": 29.44, + "learning_rate": 4.5704557523506076e-05, + "loss": 0.0772, + "step": 104730 + }, + { + "epoch": 29.45, + "learning_rate": 4.568581513760035e-05, + "loss": 0.0837, + "step": 104760 + }, + { + "epoch": 29.46, + "learning_rate": 4.566707275169463e-05, + "loss": 0.0748, + "step": 104790 + }, + { + "epoch": 29.47, + "learning_rate": 4.56483303657889e-05, + "loss": 0.0779, + "step": 104820 + }, + { + "epoch": 29.48, + "learning_rate": 4.562958797988318e-05, + "loss": 0.0797, + "step": 104850 + }, + { + "epoch": 29.49, + "learning_rate": 4.5610845593977447e-05, + "loss": 0.079, + "step": 104880 + }, + { + "epoch": 29.49, + "learning_rate": 4.559210320807172e-05, + "loss": 0.0863, + "step": 104910 + }, + { + "epoch": 29.5, + "learning_rate": 4.5573360822165995e-05, + "loss": 0.0685, + "step": 104940 + }, + { + "epoch": 29.51, + "learning_rate": 4.555461843626027e-05, + "loss": 0.0788, + "step": 104970 + }, + { + "epoch": 29.52, + "learning_rate": 4.553587605035455e-05, + "loss": 0.0795, + "step": 105000 + }, + { + "epoch": 29.53, + "learning_rate": 4.551713366444882e-05, + "loss": 0.0681, + "step": 105030 + }, + { + "epoch": 29.54, + "learning_rate": 4.549901602473995e-05, + "loss": 0.0824, + "step": 105060 + }, + { + "epoch": 29.54, + "learning_rate": 4.5480273638834226e-05, + "loss": 0.07, + "step": 105090 + }, + { + "epoch": 29.55, + "learning_rate": 4.54615312529285e-05, + "loss": 0.0744, + "step": 105120 + }, + { + "epoch": 29.56, + "learning_rate": 4.5442788867022774e-05, + "loss": 0.0818, + "step": 105150 + }, + { + "epoch": 29.57, + "learning_rate": 4.542404648111705e-05, + "loss": 0.0759, + "step": 105180 + }, + { + "epoch": 29.58, + "learning_rate": 4.540530409521132e-05, + "loss": 0.0817, + "step": 105210 + }, + { + "epoch": 29.59, + "learning_rate": 4.53865617093056e-05, + "loss": 0.0694, + "step": 105240 + }, + { + "epoch": 29.6, + "learning_rate": 4.536781932339987e-05, + "loss": 0.0796, + "step": 105270 + }, + { + "epoch": 29.6, + "learning_rate": 4.5349076937494145e-05, + "loss": 0.0778, + "step": 105300 + }, + { + "epoch": 29.61, + "learning_rate": 4.533033455158842e-05, + "loss": 0.0717, + "step": 105330 + }, + { + "epoch": 29.62, + "learning_rate": 4.5311592165682694e-05, + "loss": 0.0786, + "step": 105360 + }, + { + "epoch": 29.63, + "learning_rate": 4.529284977977697e-05, + "loss": 0.075, + "step": 105390 + }, + { + "epoch": 29.64, + "learning_rate": 4.527410739387124e-05, + "loss": 0.0798, + "step": 105420 + }, + { + "epoch": 29.65, + "learning_rate": 4.5255365007965516e-05, + "loss": 0.0775, + "step": 105450 + }, + { + "epoch": 29.65, + "learning_rate": 4.523662262205979e-05, + "loss": 0.0785, + "step": 105480 + }, + { + "epoch": 29.66, + "learning_rate": 4.5217880236154065e-05, + "loss": 0.0831, + "step": 105510 + }, + { + "epoch": 29.67, + "learning_rate": 4.519913785024834e-05, + "loss": 0.0715, + "step": 105540 + }, + { + "epoch": 29.68, + "learning_rate": 4.518039546434261e-05, + "loss": 0.0793, + "step": 105570 + }, + { + "epoch": 29.69, + "learning_rate": 4.516165307843689e-05, + "loss": 0.079, + "step": 105600 + }, + { + "epoch": 29.7, + "learning_rate": 4.514291069253116e-05, + "loss": 0.0714, + "step": 105630 + }, + { + "epoch": 29.7, + "learning_rate": 4.5124168306625435e-05, + "loss": 0.081, + "step": 105660 + }, + { + "epoch": 29.71, + "learning_rate": 4.510542592071971e-05, + "loss": 0.0654, + "step": 105690 + }, + { + "epoch": 29.72, + "learning_rate": 4.5086683534813984e-05, + "loss": 0.0782, + "step": 105720 + }, + { + "epoch": 29.73, + "learning_rate": 4.506794114890826e-05, + "loss": 0.0768, + "step": 105750 + }, + { + "epoch": 29.74, + "learning_rate": 4.504919876300253e-05, + "loss": 0.0735, + "step": 105780 + }, + { + "epoch": 29.75, + "learning_rate": 4.5030456377096806e-05, + "loss": 0.08, + "step": 105810 + }, + { + "epoch": 29.76, + "learning_rate": 4.501171399119108e-05, + "loss": 0.0737, + "step": 105840 + }, + { + "epoch": 29.76, + "learning_rate": 4.4992971605285355e-05, + "loss": 0.0811, + "step": 105870 + }, + { + "epoch": 29.77, + "learning_rate": 4.497422921937963e-05, + "loss": 0.0814, + "step": 105900 + }, + { + "epoch": 29.78, + "learning_rate": 4.49554868334739e-05, + "loss": 0.0803, + "step": 105930 + }, + { + "epoch": 29.79, + "learning_rate": 4.493674444756818e-05, + "loss": 0.0851, + "step": 105960 + }, + { + "epoch": 29.8, + "learning_rate": 4.491800206166245e-05, + "loss": 0.0689, + "step": 105990 + }, + { + "epoch": 29.81, + "learning_rate": 4.4899259675756726e-05, + "loss": 0.0775, + "step": 106020 + }, + { + "epoch": 29.81, + "learning_rate": 4.4880517289851e-05, + "loss": 0.0799, + "step": 106050 + }, + { + "epoch": 29.82, + "learning_rate": 4.4861774903945274e-05, + "loss": 0.0739, + "step": 106080 + }, + { + "epoch": 29.83, + "learning_rate": 4.484303251803955e-05, + "loss": 0.0798, + "step": 106110 + }, + { + "epoch": 29.84, + "learning_rate": 4.482429013213382e-05, + "loss": 0.0688, + "step": 106140 + }, + { + "epoch": 29.85, + "learning_rate": 4.48055477462281e-05, + "loss": 0.0817, + "step": 106170 + }, + { + "epoch": 29.86, + "learning_rate": 4.478680536032237e-05, + "loss": 0.0755, + "step": 106200 + }, + { + "epoch": 29.86, + "learning_rate": 4.4768062974416645e-05, + "loss": 0.0779, + "step": 106230 + }, + { + "epoch": 29.87, + "learning_rate": 4.474932058851092e-05, + "loss": 0.0822, + "step": 106260 + }, + { + "epoch": 29.88, + "learning_rate": 4.4730578202605193e-05, + "loss": 0.0724, + "step": 106290 + }, + { + "epoch": 29.89, + "learning_rate": 4.471183581669947e-05, + "loss": 0.0782, + "step": 106320 + }, + { + "epoch": 29.9, + "learning_rate": 4.469309343079374e-05, + "loss": 0.0734, + "step": 106350 + }, + { + "epoch": 29.91, + "learning_rate": 4.4674351044888016e-05, + "loss": 0.0763, + "step": 106380 + }, + { + "epoch": 29.92, + "learning_rate": 4.465560865898229e-05, + "loss": 0.0879, + "step": 106410 + }, + { + "epoch": 29.92, + "learning_rate": 4.4636866273076564e-05, + "loss": 0.0741, + "step": 106440 + }, + { + "epoch": 29.93, + "learning_rate": 4.461812388717084e-05, + "loss": 0.0808, + "step": 106470 + }, + { + "epoch": 29.94, + "learning_rate": 4.459938150126511e-05, + "loss": 0.0785, + "step": 106500 + }, + { + "epoch": 29.95, + "learning_rate": 4.458063911535939e-05, + "loss": 0.0715, + "step": 106530 + }, + { + "epoch": 29.96, + "learning_rate": 4.456189672945366e-05, + "loss": 0.0826, + "step": 106560 + }, + { + "epoch": 29.97, + "learning_rate": 4.4543154343547935e-05, + "loss": 0.0769, + "step": 106590 + }, + { + "epoch": 29.97, + "learning_rate": 4.452441195764221e-05, + "loss": 0.0789, + "step": 106620 + }, + { + "epoch": 29.98, + "learning_rate": 4.4505669571736484e-05, + "loss": 0.0756, + "step": 106650 + }, + { + "epoch": 29.99, + "learning_rate": 4.448692718583076e-05, + "loss": 0.0798, + "step": 106680 + }, + { + "epoch": 30.0, + "learning_rate": 4.446818479992503e-05, + "loss": 0.0833, + "step": 106710 + }, + { + "epoch": 30.0, + "eval_loss": 0.17258290946483612, + "eval_runtime": 506.0764, + "eval_samples_per_second": 31.681, + "eval_steps_per_second": 0.992, + "eval_wer": 0.13696040833594914, + "step": 106710 + }, + { + "epoch": 30.01, + "learning_rate": 4.4449442414019306e-05, + "loss": 0.0671, + "step": 106740 + }, + { + "epoch": 30.02, + "learning_rate": 4.443070002811358e-05, + "loss": 0.0827, + "step": 106770 + }, + { + "epoch": 30.03, + "learning_rate": 4.4411957642207855e-05, + "loss": 0.0711, + "step": 106800 + }, + { + "epoch": 30.03, + "learning_rate": 4.439321525630213e-05, + "loss": 0.0783, + "step": 106830 + }, + { + "epoch": 30.04, + "learning_rate": 4.43744728703964e-05, + "loss": 0.0789, + "step": 106860 + }, + { + "epoch": 30.05, + "learning_rate": 4.435573048449068e-05, + "loss": 0.0674, + "step": 106890 + }, + { + "epoch": 30.06, + "learning_rate": 4.433698809858495e-05, + "loss": 0.0807, + "step": 106920 + }, + { + "epoch": 30.07, + "learning_rate": 4.4318245712679226e-05, + "loss": 0.069, + "step": 106950 + }, + { + "epoch": 30.08, + "learning_rate": 4.42995033267735e-05, + "loss": 0.0757, + "step": 106980 + }, + { + "epoch": 30.08, + "learning_rate": 4.4280760940867774e-05, + "loss": 0.0769, + "step": 107010 + }, + { + "epoch": 30.09, + "learning_rate": 4.426201855496205e-05, + "loss": 0.0683, + "step": 107040 + }, + { + "epoch": 30.1, + "learning_rate": 4.424327616905632e-05, + "loss": 0.0827, + "step": 107070 + }, + { + "epoch": 30.11, + "learning_rate": 4.42245337831506e-05, + "loss": 0.0689, + "step": 107100 + }, + { + "epoch": 30.12, + "learning_rate": 4.420579139724487e-05, + "loss": 0.075, + "step": 107130 + }, + { + "epoch": 30.13, + "learning_rate": 4.4187049011339145e-05, + "loss": 0.0843, + "step": 107160 + }, + { + "epoch": 30.13, + "learning_rate": 4.416830662543342e-05, + "loss": 0.0668, + "step": 107190 + }, + { + "epoch": 30.14, + "learning_rate": 4.4149564239527693e-05, + "loss": 0.0776, + "step": 107220 + }, + { + "epoch": 30.15, + "learning_rate": 4.413082185362197e-05, + "loss": 0.0678, + "step": 107250 + }, + { + "epoch": 30.16, + "learning_rate": 4.411207946771624e-05, + "loss": 0.0759, + "step": 107280 + }, + { + "epoch": 30.17, + "learning_rate": 4.4093337081810516e-05, + "loss": 0.0749, + "step": 107310 + }, + { + "epoch": 30.18, + "learning_rate": 4.407459469590479e-05, + "loss": 0.0633, + "step": 107340 + }, + { + "epoch": 30.19, + "learning_rate": 4.4055852309999064e-05, + "loss": 0.075, + "step": 107370 + }, + { + "epoch": 30.19, + "learning_rate": 4.403710992409334e-05, + "loss": 0.0706, + "step": 107400 + }, + { + "epoch": 30.2, + "learning_rate": 4.401836753818761e-05, + "loss": 0.0728, + "step": 107430 + }, + { + "epoch": 30.21, + "learning_rate": 4.399962515228189e-05, + "loss": 0.0838, + "step": 107460 + }, + { + "epoch": 30.22, + "learning_rate": 4.398088276637616e-05, + "loss": 0.0633, + "step": 107490 + }, + { + "epoch": 30.23, + "learning_rate": 4.3962140380470435e-05, + "loss": 0.0811, + "step": 107520 + }, + { + "epoch": 30.24, + "learning_rate": 4.394339799456471e-05, + "loss": 0.0734, + "step": 107550 + }, + { + "epoch": 30.24, + "learning_rate": 4.3924655608658984e-05, + "loss": 0.074, + "step": 107580 + }, + { + "epoch": 30.25, + "learning_rate": 4.390591322275326e-05, + "loss": 0.0857, + "step": 107610 + }, + { + "epoch": 30.26, + "learning_rate": 4.388717083684753e-05, + "loss": 0.067, + "step": 107640 + }, + { + "epoch": 30.27, + "learning_rate": 4.3868428450941806e-05, + "loss": 0.0819, + "step": 107670 + }, + { + "epoch": 30.28, + "learning_rate": 4.384968606503608e-05, + "loss": 0.0696, + "step": 107700 + }, + { + "epoch": 30.29, + "learning_rate": 4.3830943679130355e-05, + "loss": 0.0794, + "step": 107730 + }, + { + "epoch": 30.3, + "learning_rate": 4.381220129322463e-05, + "loss": 0.0793, + "step": 107760 + }, + { + "epoch": 30.3, + "learning_rate": 4.37934589073189e-05, + "loss": 0.0663, + "step": 107790 + }, + { + "epoch": 30.31, + "learning_rate": 4.377471652141318e-05, + "loss": 0.0837, + "step": 107820 + }, + { + "epoch": 30.32, + "learning_rate": 4.375597413550746e-05, + "loss": 0.0678, + "step": 107850 + }, + { + "epoch": 30.33, + "learning_rate": 4.3737231749601726e-05, + "loss": 0.0759, + "step": 107880 + }, + { + "epoch": 30.34, + "learning_rate": 4.3718489363696e-05, + "loss": 0.0829, + "step": 107910 + }, + { + "epoch": 30.35, + "learning_rate": 4.3699746977790274e-05, + "loss": 0.0726, + "step": 107940 + }, + { + "epoch": 30.35, + "learning_rate": 4.368100459188455e-05, + "loss": 0.0777, + "step": 107970 + }, + { + "epoch": 30.36, + "learning_rate": 4.366226220597882e-05, + "loss": 0.0726, + "step": 108000 + }, + { + "epoch": 30.37, + "learning_rate": 4.3643519820073097e-05, + "loss": 0.0811, + "step": 108030 + }, + { + "epoch": 30.38, + "learning_rate": 4.362477743416738e-05, + "loss": 0.082, + "step": 108060 + }, + { + "epoch": 30.39, + "learning_rate": 4.3606035048261645e-05, + "loss": 0.0697, + "step": 108090 + }, + { + "epoch": 30.4, + "learning_rate": 4.358729266235592e-05, + "loss": 0.0796, + "step": 108120 + }, + { + "epoch": 30.4, + "learning_rate": 4.356855027645019e-05, + "loss": 0.0698, + "step": 108150 + }, + { + "epoch": 30.41, + "learning_rate": 4.354980789054447e-05, + "loss": 0.079, + "step": 108180 + }, + { + "epoch": 30.42, + "learning_rate": 4.353106550463874e-05, + "loss": 0.0828, + "step": 108210 + }, + { + "epoch": 30.43, + "learning_rate": 4.3512323118733016e-05, + "loss": 0.0682, + "step": 108240 + }, + { + "epoch": 30.44, + "learning_rate": 4.34935807328273e-05, + "loss": 0.0858, + "step": 108270 + }, + { + "epoch": 30.45, + "learning_rate": 4.3474838346921564e-05, + "loss": 0.076, + "step": 108300 + }, + { + "epoch": 30.46, + "learning_rate": 4.345609596101584e-05, + "loss": 0.0731, + "step": 108330 + }, + { + "epoch": 30.46, + "learning_rate": 4.343735357511011e-05, + "loss": 0.0752, + "step": 108360 + }, + { + "epoch": 30.47, + "learning_rate": 4.341861118920439e-05, + "loss": 0.0666, + "step": 108390 + }, + { + "epoch": 30.48, + "learning_rate": 4.339986880329866e-05, + "loss": 0.0776, + "step": 108420 + }, + { + "epoch": 30.49, + "learning_rate": 4.3381126417392935e-05, + "loss": 0.0693, + "step": 108450 + }, + { + "epoch": 30.5, + "learning_rate": 4.336238403148721e-05, + "loss": 0.072, + "step": 108480 + }, + { + "epoch": 30.51, + "learning_rate": 4.3343641645581484e-05, + "loss": 0.0791, + "step": 108510 + }, + { + "epoch": 30.51, + "learning_rate": 4.332489925967576e-05, + "loss": 0.0724, + "step": 108540 + }, + { + "epoch": 30.52, + "learning_rate": 4.330615687377003e-05, + "loss": 0.0732, + "step": 108570 + }, + { + "epoch": 30.53, + "learning_rate": 4.3287414487864306e-05, + "loss": 0.0653, + "step": 108600 + }, + { + "epoch": 30.54, + "learning_rate": 4.326867210195858e-05, + "loss": 0.0739, + "step": 108630 + }, + { + "epoch": 30.55, + "learning_rate": 4.3249929716052855e-05, + "loss": 0.0801, + "step": 108660 + }, + { + "epoch": 30.56, + "learning_rate": 4.323118733014713e-05, + "loss": 0.0671, + "step": 108690 + }, + { + "epoch": 30.57, + "learning_rate": 4.32124449442414e-05, + "loss": 0.0822, + "step": 108720 + }, + { + "epoch": 30.57, + "learning_rate": 4.319370255833568e-05, + "loss": 0.071, + "step": 108750 + }, + { + "epoch": 30.58, + "learning_rate": 4.317496017242995e-05, + "loss": 0.0774, + "step": 108780 + }, + { + "epoch": 30.59, + "learning_rate": 4.3156217786524225e-05, + "loss": 0.082, + "step": 108810 + }, + { + "epoch": 30.6, + "learning_rate": 4.31374754006185e-05, + "loss": 0.0675, + "step": 108840 + }, + { + "epoch": 30.61, + "learning_rate": 4.3118733014712774e-05, + "loss": 0.0816, + "step": 108870 + }, + { + "epoch": 30.62, + "learning_rate": 4.309999062880705e-05, + "loss": 0.0709, + "step": 108900 + }, + { + "epoch": 30.62, + "learning_rate": 4.308124824290132e-05, + "loss": 0.0743, + "step": 108930 + }, + { + "epoch": 30.63, + "learning_rate": 4.3062505856995596e-05, + "loss": 0.0817, + "step": 108960 + }, + { + "epoch": 30.64, + "learning_rate": 4.304376347108987e-05, + "loss": 0.072, + "step": 108990 + }, + { + "epoch": 30.65, + "learning_rate": 4.3025021085184145e-05, + "loss": 0.0858, + "step": 109020 + }, + { + "epoch": 30.66, + "learning_rate": 4.300627869927842e-05, + "loss": 0.0747, + "step": 109050 + }, + { + "epoch": 30.67, + "learning_rate": 4.298753631337269e-05, + "loss": 0.076, + "step": 109080 + }, + { + "epoch": 30.67, + "learning_rate": 4.296879392746697e-05, + "loss": 0.0823, + "step": 109110 + }, + { + "epoch": 30.68, + "learning_rate": 4.295005154156124e-05, + "loss": 0.0695, + "step": 109140 + }, + { + "epoch": 30.69, + "learning_rate": 4.2931933901852376e-05, + "loss": 0.0779, + "step": 109170 + }, + { + "epoch": 30.7, + "learning_rate": 4.291319151594665e-05, + "loss": 0.0732, + "step": 109200 + }, + { + "epoch": 30.71, + "learning_rate": 4.289507387623778e-05, + "loss": 0.079, + "step": 109230 + }, + { + "epoch": 30.72, + "learning_rate": 4.287633149033206e-05, + "loss": 0.083, + "step": 109260 + }, + { + "epoch": 30.73, + "learning_rate": 4.2857589104426326e-05, + "loss": 0.0726, + "step": 109290 + }, + { + "epoch": 30.73, + "learning_rate": 4.28388467185206e-05, + "loss": 0.0793, + "step": 109320 + }, + { + "epoch": 30.74, + "learning_rate": 4.282010433261488e-05, + "loss": 0.0714, + "step": 109350 + }, + { + "epoch": 30.75, + "learning_rate": 4.280136194670915e-05, + "loss": 0.0753, + "step": 109380 + }, + { + "epoch": 30.76, + "learning_rate": 4.278261956080343e-05, + "loss": 0.0886, + "step": 109410 + }, + { + "epoch": 30.77, + "learning_rate": 4.27638771748977e-05, + "loss": 0.0705, + "step": 109440 + }, + { + "epoch": 30.78, + "learning_rate": 4.274513478899198e-05, + "loss": 0.0826, + "step": 109470 + }, + { + "epoch": 30.78, + "learning_rate": 4.2726392403086245e-05, + "loss": 0.0712, + "step": 109500 + }, + { + "epoch": 30.79, + "learning_rate": 4.2707650017180526e-05, + "loss": 0.0717, + "step": 109530 + }, + { + "epoch": 30.8, + "learning_rate": 4.26889076312748e-05, + "loss": 0.0787, + "step": 109560 + }, + { + "epoch": 30.81, + "learning_rate": 4.267016524536907e-05, + "loss": 0.0677, + "step": 109590 + }, + { + "epoch": 30.82, + "learning_rate": 4.265142285946335e-05, + "loss": 0.0852, + "step": 109620 + }, + { + "epoch": 30.83, + "learning_rate": 4.2632680473557616e-05, + "loss": 0.0714, + "step": 109650 + }, + { + "epoch": 30.83, + "learning_rate": 4.26139380876519e-05, + "loss": 0.0792, + "step": 109680 + }, + { + "epoch": 30.84, + "learning_rate": 4.2595195701746164e-05, + "loss": 0.0828, + "step": 109710 + }, + { + "epoch": 30.85, + "learning_rate": 4.2576453315840445e-05, + "loss": 0.0699, + "step": 109740 + }, + { + "epoch": 30.86, + "learning_rate": 4.255771092993472e-05, + "loss": 0.0783, + "step": 109770 + }, + { + "epoch": 30.87, + "learning_rate": 4.253896854402899e-05, + "loss": 0.076, + "step": 109800 + }, + { + "epoch": 30.88, + "learning_rate": 4.252022615812327e-05, + "loss": 0.079, + "step": 109830 + }, + { + "epoch": 30.89, + "learning_rate": 4.2501483772217535e-05, + "loss": 0.0754, + "step": 109860 + }, + { + "epoch": 30.89, + "learning_rate": 4.2482741386311816e-05, + "loss": 0.066, + "step": 109890 + }, + { + "epoch": 30.9, + "learning_rate": 4.2463999000406084e-05, + "loss": 0.0786, + "step": 109920 + }, + { + "epoch": 30.91, + "learning_rate": 4.2445256614500365e-05, + "loss": 0.0684, + "step": 109950 + }, + { + "epoch": 30.92, + "learning_rate": 4.242651422859464e-05, + "loss": 0.076, + "step": 109980 + }, + { + "epoch": 30.93, + "learning_rate": 4.2407771842688906e-05, + "loss": 0.0846, + "step": 110010 + }, + { + "epoch": 30.94, + "learning_rate": 4.238902945678319e-05, + "loss": 0.0667, + "step": 110040 + }, + { + "epoch": 30.94, + "learning_rate": 4.2370287070877455e-05, + "loss": 0.0792, + "step": 110070 + }, + { + "epoch": 30.95, + "learning_rate": 4.2351544684971736e-05, + "loss": 0.0701, + "step": 110100 + }, + { + "epoch": 30.96, + "learning_rate": 4.2332802299066e-05, + "loss": 0.076, + "step": 110130 + }, + { + "epoch": 30.97, + "learning_rate": 4.2314059913160284e-05, + "loss": 0.0851, + "step": 110160 + }, + { + "epoch": 30.98, + "learning_rate": 4.229531752725455e-05, + "loss": 0.069, + "step": 110190 + }, + { + "epoch": 30.99, + "learning_rate": 4.2276575141348826e-05, + "loss": 0.0819, + "step": 110220 + }, + { + "epoch": 31.0, + "learning_rate": 4.225783275544311e-05, + "loss": 0.0753, + "step": 110250 + }, + { + "epoch": 31.0, + "eval_loss": 0.17743565142154694, + "eval_runtime": 503.5026, + "eval_samples_per_second": 31.843, + "eval_steps_per_second": 0.997, + "eval_wer": 0.13531587351411845, + "step": 110267 + }, + { + "epoch": 31.0, + "learning_rate": 4.2239090369537374e-05, + "loss": 0.0764, + "step": 110280 + }, + { + "epoch": 31.01, + "learning_rate": 4.2220347983631655e-05, + "loss": 0.0728, + "step": 110310 + }, + { + "epoch": 31.02, + "learning_rate": 4.220160559772592e-05, + "loss": 0.0717, + "step": 110340 + }, + { + "epoch": 31.03, + "learning_rate": 4.2182863211820203e-05, + "loss": 0.0774, + "step": 110370 + }, + { + "epoch": 31.04, + "learning_rate": 4.216412082591447e-05, + "loss": 0.0677, + "step": 110400 + }, + { + "epoch": 31.05, + "learning_rate": 4.2145378440008745e-05, + "loss": 0.0734, + "step": 110430 + }, + { + "epoch": 31.05, + "learning_rate": 4.2126636054103026e-05, + "loss": 0.0719, + "step": 110460 + }, + { + "epoch": 31.06, + "learning_rate": 4.2107893668197293e-05, + "loss": 0.0743, + "step": 110490 + }, + { + "epoch": 31.07, + "learning_rate": 4.2089151282291574e-05, + "loss": 0.0812, + "step": 110520 + }, + { + "epoch": 31.08, + "learning_rate": 4.207040889638584e-05, + "loss": 0.0674, + "step": 110550 + }, + { + "epoch": 31.09, + "learning_rate": 4.205166651048012e-05, + "loss": 0.0747, + "step": 110580 + }, + { + "epoch": 31.1, + "learning_rate": 4.203292412457439e-05, + "loss": 0.0694, + "step": 110610 + }, + { + "epoch": 31.1, + "learning_rate": 4.2014181738668664e-05, + "loss": 0.0727, + "step": 110640 + }, + { + "epoch": 31.11, + "learning_rate": 4.1995439352762945e-05, + "loss": 0.0805, + "step": 110670 + }, + { + "epoch": 31.12, + "learning_rate": 4.197669696685721e-05, + "loss": 0.0661, + "step": 110700 + }, + { + "epoch": 31.13, + "learning_rate": 4.1957954580951494e-05, + "loss": 0.0732, + "step": 110730 + }, + { + "epoch": 31.14, + "learning_rate": 4.193921219504576e-05, + "loss": 0.0737, + "step": 110760 + }, + { + "epoch": 31.15, + "learning_rate": 4.192046980914004e-05, + "loss": 0.0691, + "step": 110790 + }, + { + "epoch": 31.16, + "learning_rate": 4.190172742323431e-05, + "loss": 0.0802, + "step": 110820 + }, + { + "epoch": 31.16, + "learning_rate": 4.1882985037328584e-05, + "loss": 0.0687, + "step": 110850 + }, + { + "epoch": 31.17, + "learning_rate": 4.1864242651422865e-05, + "loss": 0.0741, + "step": 110880 + }, + { + "epoch": 31.18, + "learning_rate": 4.184550026551713e-05, + "loss": 0.0684, + "step": 110910 + }, + { + "epoch": 31.19, + "learning_rate": 4.182675787961141e-05, + "loss": 0.0706, + "step": 110940 + }, + { + "epoch": 31.2, + "learning_rate": 4.180801549370568e-05, + "loss": 0.0806, + "step": 110970 + }, + { + "epoch": 31.21, + "learning_rate": 4.178927310779996e-05, + "loss": 0.067, + "step": 111000 + }, + { + "epoch": 31.21, + "learning_rate": 4.177053072189423e-05, + "loss": 0.0762, + "step": 111030 + }, + { + "epoch": 31.22, + "learning_rate": 4.175178833598851e-05, + "loss": 0.0692, + "step": 111060 + }, + { + "epoch": 31.23, + "learning_rate": 4.1733045950082784e-05, + "loss": 0.0731, + "step": 111090 + }, + { + "epoch": 31.24, + "learning_rate": 4.171430356417705e-05, + "loss": 0.0766, + "step": 111120 + }, + { + "epoch": 31.25, + "learning_rate": 4.169556117827133e-05, + "loss": 0.0659, + "step": 111150 + }, + { + "epoch": 31.26, + "learning_rate": 4.16768187923656e-05, + "loss": 0.0748, + "step": 111180 + }, + { + "epoch": 31.27, + "learning_rate": 4.165807640645988e-05, + "loss": 0.0704, + "step": 111210 + }, + { + "epoch": 31.27, + "learning_rate": 4.163933402055415e-05, + "loss": 0.0729, + "step": 111240 + }, + { + "epoch": 31.28, + "learning_rate": 4.162059163464843e-05, + "loss": 0.0836, + "step": 111270 + }, + { + "epoch": 31.29, + "learning_rate": 4.16018492487427e-05, + "loss": 0.0654, + "step": 111300 + }, + { + "epoch": 31.3, + "learning_rate": 4.158310686283697e-05, + "loss": 0.0783, + "step": 111330 + }, + { + "epoch": 31.31, + "learning_rate": 4.156436447693125e-05, + "loss": 0.0718, + "step": 111360 + }, + { + "epoch": 31.32, + "learning_rate": 4.154562209102552e-05, + "loss": 0.0779, + "step": 111390 + }, + { + "epoch": 31.32, + "learning_rate": 4.15268797051198e-05, + "loss": 0.0802, + "step": 111420 + }, + { + "epoch": 31.33, + "learning_rate": 4.150813731921407e-05, + "loss": 0.0666, + "step": 111450 + }, + { + "epoch": 31.34, + "learning_rate": 4.148939493330835e-05, + "loss": 0.0749, + "step": 111480 + }, + { + "epoch": 31.35, + "learning_rate": 4.147065254740262e-05, + "loss": 0.0723, + "step": 111510 + }, + { + "epoch": 31.36, + "learning_rate": 4.145191016149689e-05, + "loss": 0.0714, + "step": 111540 + }, + { + "epoch": 31.37, + "learning_rate": 4.143316777559117e-05, + "loss": 0.0817, + "step": 111570 + }, + { + "epoch": 31.37, + "learning_rate": 4.141442538968544e-05, + "loss": 0.06, + "step": 111600 + }, + { + "epoch": 31.38, + "learning_rate": 4.139568300377972e-05, + "loss": 0.076, + "step": 111630 + }, + { + "epoch": 31.39, + "learning_rate": 4.137694061787399e-05, + "loss": 0.0739, + "step": 111660 + }, + { + "epoch": 31.4, + "learning_rate": 4.135819823196827e-05, + "loss": 0.0708, + "step": 111690 + }, + { + "epoch": 31.41, + "learning_rate": 4.133945584606254e-05, + "loss": 0.0807, + "step": 111720 + }, + { + "epoch": 31.42, + "learning_rate": 4.132071346015681e-05, + "loss": 0.065, + "step": 111750 + }, + { + "epoch": 31.43, + "learning_rate": 4.130197107425109e-05, + "loss": 0.0744, + "step": 111780 + }, + { + "epoch": 31.43, + "learning_rate": 4.128322868834536e-05, + "loss": 0.0714, + "step": 111810 + }, + { + "epoch": 31.44, + "learning_rate": 4.126448630243964e-05, + "loss": 0.0724, + "step": 111840 + }, + { + "epoch": 31.45, + "learning_rate": 4.1245743916533906e-05, + "loss": 0.0763, + "step": 111870 + }, + { + "epoch": 31.46, + "learning_rate": 4.122700153062819e-05, + "loss": 0.0647, + "step": 111900 + }, + { + "epoch": 31.47, + "learning_rate": 4.120825914472246e-05, + "loss": 0.0724, + "step": 111930 + }, + { + "epoch": 31.48, + "learning_rate": 4.118951675881673e-05, + "loss": 0.0729, + "step": 111960 + }, + { + "epoch": 31.48, + "learning_rate": 4.117077437291101e-05, + "loss": 0.0748, + "step": 111990 + }, + { + "epoch": 31.49, + "learning_rate": 4.115203198700528e-05, + "loss": 0.0776, + "step": 112020 + }, + { + "epoch": 31.5, + "learning_rate": 4.113328960109956e-05, + "loss": 0.0696, + "step": 112050 + }, + { + "epoch": 31.51, + "learning_rate": 4.1114547215193826e-05, + "loss": 0.0803, + "step": 112080 + }, + { + "epoch": 31.52, + "learning_rate": 4.1095804829288106e-05, + "loss": 0.0692, + "step": 112110 + }, + { + "epoch": 31.53, + "learning_rate": 4.107706244338238e-05, + "loss": 0.0719, + "step": 112140 + }, + { + "epoch": 31.53, + "learning_rate": 4.105832005747665e-05, + "loss": 0.0827, + "step": 112170 + }, + { + "epoch": 31.54, + "learning_rate": 4.103957767157093e-05, + "loss": 0.0664, + "step": 112200 + }, + { + "epoch": 31.55, + "learning_rate": 4.1020835285665196e-05, + "loss": 0.0749, + "step": 112230 + }, + { + "epoch": 31.56, + "learning_rate": 4.100209289975948e-05, + "loss": 0.0766, + "step": 112260 + }, + { + "epoch": 31.57, + "learning_rate": 4.0983350513853745e-05, + "loss": 0.0713, + "step": 112290 + }, + { + "epoch": 31.58, + "learning_rate": 4.0964608127948026e-05, + "loss": 0.0797, + "step": 112320 + }, + { + "epoch": 31.59, + "learning_rate": 4.09458657420423e-05, + "loss": 0.0632, + "step": 112350 + }, + { + "epoch": 31.59, + "learning_rate": 4.092712335613657e-05, + "loss": 0.0828, + "step": 112380 + }, + { + "epoch": 31.6, + "learning_rate": 4.090838097023085e-05, + "loss": 0.0671, + "step": 112410 + }, + { + "epoch": 31.61, + "learning_rate": 4.0889638584325116e-05, + "loss": 0.0722, + "step": 112440 + }, + { + "epoch": 31.62, + "learning_rate": 4.08708961984194e-05, + "loss": 0.0797, + "step": 112470 + }, + { + "epoch": 31.63, + "learning_rate": 4.0852153812513664e-05, + "loss": 0.0683, + "step": 112500 + }, + { + "epoch": 31.64, + "learning_rate": 4.0833411426607945e-05, + "loss": 0.0732, + "step": 112530 + }, + { + "epoch": 31.64, + "learning_rate": 4.081466904070222e-05, + "loss": 0.0758, + "step": 112560 + }, + { + "epoch": 31.65, + "learning_rate": 4.0795926654796494e-05, + "loss": 0.0727, + "step": 112590 + }, + { + "epoch": 31.66, + "learning_rate": 4.077718426889077e-05, + "loss": 0.0804, + "step": 112620 + }, + { + "epoch": 31.67, + "learning_rate": 4.0758441882985035e-05, + "loss": 0.0671, + "step": 112650 + }, + { + "epoch": 31.68, + "learning_rate": 4.0739699497079316e-05, + "loss": 0.078, + "step": 112680 + }, + { + "epoch": 31.69, + "learning_rate": 4.0720957111173584e-05, + "loss": 0.0729, + "step": 112710 + }, + { + "epoch": 31.7, + "learning_rate": 4.0702214725267864e-05, + "loss": 0.0754, + "step": 112740 + }, + { + "epoch": 31.7, + "learning_rate": 4.068347233936214e-05, + "loss": 0.0798, + "step": 112770 + }, + { + "epoch": 31.71, + "learning_rate": 4.066472995345641e-05, + "loss": 0.0683, + "step": 112800 + }, + { + "epoch": 31.72, + "learning_rate": 4.064598756755069e-05, + "loss": 0.0776, + "step": 112830 + }, + { + "epoch": 31.73, + "learning_rate": 4.0627245181644954e-05, + "loss": 0.0702, + "step": 112860 + }, + { + "epoch": 31.74, + "learning_rate": 4.0608502795739235e-05, + "loss": 0.0764, + "step": 112890 + }, + { + "epoch": 31.75, + "learning_rate": 4.05897604098335e-05, + "loss": 0.0824, + "step": 112920 + }, + { + "epoch": 31.75, + "learning_rate": 4.0571018023927784e-05, + "loss": 0.0669, + "step": 112950 + }, + { + "epoch": 31.76, + "learning_rate": 4.055227563802206e-05, + "loss": 0.0786, + "step": 112980 + }, + { + "epoch": 31.77, + "learning_rate": 4.053353325211633e-05, + "loss": 0.0693, + "step": 113010 + }, + { + "epoch": 31.78, + "learning_rate": 4.0514790866210606e-05, + "loss": 0.0786, + "step": 113040 + }, + { + "epoch": 31.79, + "learning_rate": 4.0496048480304874e-05, + "loss": 0.0769, + "step": 113070 + }, + { + "epoch": 31.8, + "learning_rate": 4.0477306094399155e-05, + "loss": 0.0667, + "step": 113100 + }, + { + "epoch": 31.8, + "learning_rate": 4.045856370849342e-05, + "loss": 0.0788, + "step": 113130 + }, + { + "epoch": 31.81, + "learning_rate": 4.04398213225877e-05, + "loss": 0.0712, + "step": 113160 + }, + { + "epoch": 31.82, + "learning_rate": 4.042107893668198e-05, + "loss": 0.0721, + "step": 113190 + }, + { + "epoch": 31.83, + "learning_rate": 4.040233655077625e-05, + "loss": 0.0794, + "step": 113220 + }, + { + "epoch": 31.84, + "learning_rate": 4.0383594164870526e-05, + "loss": 0.0639, + "step": 113250 + }, + { + "epoch": 31.85, + "learning_rate": 4.036485177896479e-05, + "loss": 0.081, + "step": 113280 + }, + { + "epoch": 31.86, + "learning_rate": 4.0346109393059074e-05, + "loss": 0.0683, + "step": 113310 + }, + { + "epoch": 31.86, + "learning_rate": 4.032736700715334e-05, + "loss": 0.0754, + "step": 113340 + }, + { + "epoch": 31.87, + "learning_rate": 4.030862462124762e-05, + "loss": 0.0803, + "step": 113370 + }, + { + "epoch": 31.88, + "learning_rate": 4.02898822353419e-05, + "loss": 0.0671, + "step": 113400 + }, + { + "epoch": 31.89, + "learning_rate": 4.027113984943617e-05, + "loss": 0.0778, + "step": 113430 + }, + { + "epoch": 31.9, + "learning_rate": 4.0252397463530445e-05, + "loss": 0.071, + "step": 113460 + }, + { + "epoch": 31.91, + "learning_rate": 4.023365507762471e-05, + "loss": 0.0723, + "step": 113490 + }, + { + "epoch": 31.91, + "learning_rate": 4.0214912691718993e-05, + "loss": 0.0788, + "step": 113520 + }, + { + "epoch": 31.92, + "learning_rate": 4.019617030581326e-05, + "loss": 0.0643, + "step": 113550 + }, + { + "epoch": 31.93, + "learning_rate": 4.017742791990754e-05, + "loss": 0.0819, + "step": 113580 + }, + { + "epoch": 31.94, + "learning_rate": 4.0158685534001816e-05, + "loss": 0.0708, + "step": 113610 + }, + { + "epoch": 31.95, + "learning_rate": 4.013994314809609e-05, + "loss": 0.0754, + "step": 113640 + }, + { + "epoch": 31.96, + "learning_rate": 4.0121200762190364e-05, + "loss": 0.0797, + "step": 113670 + }, + { + "epoch": 31.97, + "learning_rate": 4.010245837628463e-05, + "loss": 0.0661, + "step": 113700 + }, + { + "epoch": 31.97, + "learning_rate": 4.008434073657577e-05, + "loss": 0.0755, + "step": 113730 + }, + { + "epoch": 31.98, + "learning_rate": 4.006559835067004e-05, + "loss": 0.0708, + "step": 113760 + }, + { + "epoch": 31.99, + "learning_rate": 4.004685596476432e-05, + "loss": 0.07, + "step": 113790 + }, + { + "epoch": 32.0, + "learning_rate": 4.002873832505545e-05, + "loss": 0.08, + "step": 113820 + }, + { + "epoch": 32.0, + "eval_loss": 0.17339888215065002, + "eval_runtime": 504.4941, + "eval_samples_per_second": 31.78, + "eval_steps_per_second": 0.995, + "eval_wer": 0.1343946610620556, + "step": 113824 + }, + { + "epoch": 32.01, + "learning_rate": 4.000999593914972e-05, + "loss": 0.0651, + "step": 113850 + }, + { + "epoch": 32.02, + "learning_rate": 3.9991253553244e-05, + "loss": 0.0778, + "step": 113880 + }, + { + "epoch": 32.02, + "learning_rate": 3.997251116733827e-05, + "loss": 0.0642, + "step": 113910 + }, + { + "epoch": 32.03, + "learning_rate": 3.9953768781432545e-05, + "loss": 0.0787, + "step": 113940 + }, + { + "epoch": 32.04, + "learning_rate": 3.993502639552682e-05, + "loss": 0.0719, + "step": 113970 + }, + { + "epoch": 32.05, + "learning_rate": 3.9916284009621094e-05, + "loss": 0.0725, + "step": 114000 + }, + { + "epoch": 32.06, + "learning_rate": 3.989754162371537e-05, + "loss": 0.0718, + "step": 114030 + }, + { + "epoch": 32.07, + "learning_rate": 3.987879923780964e-05, + "loss": 0.0685, + "step": 114060 + }, + { + "epoch": 32.07, + "learning_rate": 3.9860056851903916e-05, + "loss": 0.0722, + "step": 114090 + }, + { + "epoch": 32.08, + "learning_rate": 3.984131446599819e-05, + "loss": 0.0678, + "step": 114120 + }, + { + "epoch": 32.09, + "learning_rate": 3.9822572080092465e-05, + "loss": 0.0681, + "step": 114150 + }, + { + "epoch": 32.1, + "learning_rate": 3.980382969418674e-05, + "loss": 0.0781, + "step": 114180 + }, + { + "epoch": 32.11, + "learning_rate": 3.978508730828101e-05, + "loss": 0.0688, + "step": 114210 + }, + { + "epoch": 32.12, + "learning_rate": 3.976634492237529e-05, + "loss": 0.0761, + "step": 114240 + }, + { + "epoch": 32.13, + "learning_rate": 3.974760253646956e-05, + "loss": 0.07, + "step": 114270 + }, + { + "epoch": 32.13, + "learning_rate": 3.9728860150563836e-05, + "loss": 0.0743, + "step": 114300 + }, + { + "epoch": 32.14, + "learning_rate": 3.971011776465811e-05, + "loss": 0.0765, + "step": 114330 + }, + { + "epoch": 32.15, + "learning_rate": 3.9691375378752384e-05, + "loss": 0.062, + "step": 114360 + }, + { + "epoch": 32.16, + "learning_rate": 3.967263299284666e-05, + "loss": 0.0747, + "step": 114390 + }, + { + "epoch": 32.17, + "learning_rate": 3.965389060694093e-05, + "loss": 0.0753, + "step": 114420 + }, + { + "epoch": 32.18, + "learning_rate": 3.963514822103521e-05, + "loss": 0.0737, + "step": 114450 + }, + { + "epoch": 32.18, + "learning_rate": 3.961640583512948e-05, + "loss": 0.0771, + "step": 114480 + }, + { + "epoch": 32.19, + "learning_rate": 3.9597663449223755e-05, + "loss": 0.0675, + "step": 114510 + }, + { + "epoch": 32.2, + "learning_rate": 3.957892106331803e-05, + "loss": 0.0757, + "step": 114540 + }, + { + "epoch": 32.21, + "learning_rate": 3.95601786774123e-05, + "loss": 0.0698, + "step": 114570 + }, + { + "epoch": 32.22, + "learning_rate": 3.954143629150658e-05, + "loss": 0.0689, + "step": 114600 + }, + { + "epoch": 32.23, + "learning_rate": 3.952269390560085e-05, + "loss": 0.0773, + "step": 114630 + }, + { + "epoch": 32.23, + "learning_rate": 3.9503951519695126e-05, + "loss": 0.0695, + "step": 114660 + }, + { + "epoch": 32.24, + "learning_rate": 3.94852091337894e-05, + "loss": 0.0754, + "step": 114690 + }, + { + "epoch": 32.25, + "learning_rate": 3.9466466747883674e-05, + "loss": 0.0689, + "step": 114720 + }, + { + "epoch": 32.26, + "learning_rate": 3.944772436197795e-05, + "loss": 0.0677, + "step": 114750 + }, + { + "epoch": 32.27, + "learning_rate": 3.942898197607222e-05, + "loss": 0.0772, + "step": 114780 + }, + { + "epoch": 32.28, + "learning_rate": 3.94102395901665e-05, + "loss": 0.0616, + "step": 114810 + }, + { + "epoch": 32.29, + "learning_rate": 3.939149720426077e-05, + "loss": 0.068, + "step": 114840 + }, + { + "epoch": 32.29, + "learning_rate": 3.9372754818355045e-05, + "loss": 0.0726, + "step": 114870 + }, + { + "epoch": 32.3, + "learning_rate": 3.935401243244932e-05, + "loss": 0.0765, + "step": 114900 + }, + { + "epoch": 32.31, + "learning_rate": 3.9335270046543594e-05, + "loss": 0.076, + "step": 114930 + }, + { + "epoch": 32.32, + "learning_rate": 3.931652766063787e-05, + "loss": 0.0674, + "step": 114960 + }, + { + "epoch": 32.33, + "learning_rate": 3.929778527473214e-05, + "loss": 0.0703, + "step": 114990 + }, + { + "epoch": 32.34, + "learning_rate": 3.9279042888826416e-05, + "loss": 0.0698, + "step": 115020 + }, + { + "epoch": 32.34, + "learning_rate": 3.926030050292069e-05, + "loss": 0.0699, + "step": 115050 + }, + { + "epoch": 32.35, + "learning_rate": 3.9241558117014965e-05, + "loss": 0.0794, + "step": 115080 + }, + { + "epoch": 32.36, + "learning_rate": 3.922281573110924e-05, + "loss": 0.0702, + "step": 115110 + }, + { + "epoch": 32.37, + "learning_rate": 3.920407334520351e-05, + "loss": 0.0742, + "step": 115140 + }, + { + "epoch": 32.38, + "learning_rate": 3.918533095929779e-05, + "loss": 0.0728, + "step": 115170 + }, + { + "epoch": 32.39, + "learning_rate": 3.916658857339206e-05, + "loss": 0.0682, + "step": 115200 + }, + { + "epoch": 32.4, + "learning_rate": 3.9147846187486336e-05, + "loss": 0.0743, + "step": 115230 + }, + { + "epoch": 32.4, + "learning_rate": 3.912910380158061e-05, + "loss": 0.0833, + "step": 115260 + }, + { + "epoch": 32.41, + "learning_rate": 3.9110361415674884e-05, + "loss": 0.0739, + "step": 115290 + }, + { + "epoch": 32.42, + "learning_rate": 3.909161902976916e-05, + "loss": 0.0723, + "step": 115320 + }, + { + "epoch": 32.43, + "learning_rate": 3.907287664386343e-05, + "loss": 0.0676, + "step": 115350 + }, + { + "epoch": 32.44, + "learning_rate": 3.9054134257957707e-05, + "loss": 0.0776, + "step": 115380 + }, + { + "epoch": 32.45, + "learning_rate": 3.903539187205198e-05, + "loss": 0.0676, + "step": 115410 + }, + { + "epoch": 32.45, + "learning_rate": 3.9016649486146255e-05, + "loss": 0.0735, + "step": 115440 + }, + { + "epoch": 32.46, + "learning_rate": 3.899790710024053e-05, + "loss": 0.0732, + "step": 115470 + }, + { + "epoch": 32.47, + "learning_rate": 3.89791647143348e-05, + "loss": 0.0712, + "step": 115500 + }, + { + "epoch": 32.48, + "learning_rate": 3.896042232842908e-05, + "loss": 0.0762, + "step": 115530 + }, + { + "epoch": 32.49, + "learning_rate": 3.894167994252335e-05, + "loss": 0.0624, + "step": 115560 + }, + { + "epoch": 32.5, + "learning_rate": 3.8922937556617626e-05, + "loss": 0.0805, + "step": 115590 + }, + { + "epoch": 32.5, + "learning_rate": 3.89041951707119e-05, + "loss": 0.0696, + "step": 115620 + }, + { + "epoch": 32.51, + "learning_rate": 3.8885452784806174e-05, + "loss": 0.0691, + "step": 115650 + }, + { + "epoch": 32.52, + "learning_rate": 3.886671039890045e-05, + "loss": 0.0795, + "step": 115680 + }, + { + "epoch": 32.53, + "learning_rate": 3.884796801299472e-05, + "loss": 0.0689, + "step": 115710 + }, + { + "epoch": 32.54, + "learning_rate": 3.8829225627089e-05, + "loss": 0.0736, + "step": 115740 + }, + { + "epoch": 32.55, + "learning_rate": 3.881048324118327e-05, + "loss": 0.0689, + "step": 115770 + }, + { + "epoch": 32.56, + "learning_rate": 3.8791740855277545e-05, + "loss": 0.0721, + "step": 115800 + }, + { + "epoch": 32.56, + "learning_rate": 3.877299846937182e-05, + "loss": 0.0763, + "step": 115830 + }, + { + "epoch": 32.57, + "learning_rate": 3.8754256083466094e-05, + "loss": 0.0676, + "step": 115860 + }, + { + "epoch": 32.58, + "learning_rate": 3.873551369756037e-05, + "loss": 0.0779, + "step": 115890 + }, + { + "epoch": 32.59, + "learning_rate": 3.871677131165464e-05, + "loss": 0.0727, + "step": 115920 + }, + { + "epoch": 32.6, + "learning_rate": 3.8698028925748916e-05, + "loss": 0.0716, + "step": 115950 + }, + { + "epoch": 32.61, + "learning_rate": 3.867928653984319e-05, + "loss": 0.0728, + "step": 115980 + }, + { + "epoch": 32.61, + "learning_rate": 3.8660544153937465e-05, + "loss": 0.0667, + "step": 116010 + }, + { + "epoch": 32.62, + "learning_rate": 3.864180176803174e-05, + "loss": 0.0741, + "step": 116040 + }, + { + "epoch": 32.63, + "learning_rate": 3.862305938212601e-05, + "loss": 0.073, + "step": 116070 + }, + { + "epoch": 32.64, + "learning_rate": 3.860431699622029e-05, + "loss": 0.07, + "step": 116100 + }, + { + "epoch": 32.65, + "learning_rate": 3.858557461031456e-05, + "loss": 0.0731, + "step": 116130 + }, + { + "epoch": 32.66, + "learning_rate": 3.8566832224408835e-05, + "loss": 0.0615, + "step": 116160 + }, + { + "epoch": 32.67, + "learning_rate": 3.854808983850311e-05, + "loss": 0.0712, + "step": 116190 + }, + { + "epoch": 32.67, + "learning_rate": 3.8529347452597384e-05, + "loss": 0.0686, + "step": 116220 + }, + { + "epoch": 32.68, + "learning_rate": 3.851060506669166e-05, + "loss": 0.0717, + "step": 116250 + }, + { + "epoch": 32.69, + "learning_rate": 3.849186268078593e-05, + "loss": 0.0768, + "step": 116280 + }, + { + "epoch": 32.7, + "learning_rate": 3.8473120294880206e-05, + "loss": 0.069, + "step": 116310 + }, + { + "epoch": 32.71, + "learning_rate": 3.845437790897448e-05, + "loss": 0.0742, + "step": 116340 + }, + { + "epoch": 32.72, + "learning_rate": 3.8435635523068755e-05, + "loss": 0.0685, + "step": 116370 + }, + { + "epoch": 32.72, + "learning_rate": 3.841689313716303e-05, + "loss": 0.066, + "step": 116400 + }, + { + "epoch": 32.73, + "learning_rate": 3.83981507512573e-05, + "loss": 0.0743, + "step": 116430 + }, + { + "epoch": 32.74, + "learning_rate": 3.837940836535158e-05, + "loss": 0.0687, + "step": 116460 + }, + { + "epoch": 32.75, + "learning_rate": 3.836066597944585e-05, + "loss": 0.0778, + "step": 116490 + }, + { + "epoch": 32.76, + "learning_rate": 3.8341923593540126e-05, + "loss": 0.0695, + "step": 116520 + }, + { + "epoch": 32.77, + "learning_rate": 3.83231812076344e-05, + "loss": 0.071, + "step": 116550 + }, + { + "epoch": 32.77, + "learning_rate": 3.8304438821728674e-05, + "loss": 0.0755, + "step": 116580 + }, + { + "epoch": 32.78, + "learning_rate": 3.828569643582295e-05, + "loss": 0.0654, + "step": 116610 + }, + { + "epoch": 32.79, + "learning_rate": 3.826695404991722e-05, + "loss": 0.0739, + "step": 116640 + }, + { + "epoch": 32.8, + "learning_rate": 3.82482116640115e-05, + "loss": 0.0711, + "step": 116670 + }, + { + "epoch": 32.81, + "learning_rate": 3.822946927810577e-05, + "loss": 0.0727, + "step": 116700 + }, + { + "epoch": 32.82, + "learning_rate": 3.8210726892200045e-05, + "loss": 0.0772, + "step": 116730 + }, + { + "epoch": 32.83, + "learning_rate": 3.819198450629432e-05, + "loss": 0.0666, + "step": 116760 + }, + { + "epoch": 32.83, + "learning_rate": 3.8173242120388593e-05, + "loss": 0.0703, + "step": 116790 + }, + { + "epoch": 32.84, + "learning_rate": 3.815449973448287e-05, + "loss": 0.0709, + "step": 116820 + }, + { + "epoch": 32.85, + "learning_rate": 3.813575734857714e-05, + "loss": 0.0669, + "step": 116850 + }, + { + "epoch": 32.86, + "learning_rate": 3.8117014962671416e-05, + "loss": 0.0814, + "step": 116880 + }, + { + "epoch": 32.87, + "learning_rate": 3.809827257676569e-05, + "loss": 0.0667, + "step": 116910 + }, + { + "epoch": 32.88, + "learning_rate": 3.8079530190859964e-05, + "loss": 0.0762, + "step": 116940 + }, + { + "epoch": 32.88, + "learning_rate": 3.806078780495424e-05, + "loss": 0.0712, + "step": 116970 + }, + { + "epoch": 32.89, + "learning_rate": 3.804204541904851e-05, + "loss": 0.0705, + "step": 117000 + }, + { + "epoch": 32.9, + "learning_rate": 3.802330303314279e-05, + "loss": 0.0774, + "step": 117030 + }, + { + "epoch": 32.91, + "learning_rate": 3.800456064723706e-05, + "loss": 0.0662, + "step": 117060 + }, + { + "epoch": 32.92, + "learning_rate": 3.7985818261331335e-05, + "loss": 0.0753, + "step": 117090 + }, + { + "epoch": 32.93, + "learning_rate": 3.796707587542561e-05, + "loss": 0.0716, + "step": 117120 + }, + { + "epoch": 32.93, + "learning_rate": 3.7948333489519884e-05, + "loss": 0.0707, + "step": 117150 + }, + { + "epoch": 32.94, + "learning_rate": 3.792959110361416e-05, + "loss": 0.0788, + "step": 117180 + }, + { + "epoch": 32.95, + "learning_rate": 3.791084871770843e-05, + "loss": 0.0658, + "step": 117210 + }, + { + "epoch": 32.96, + "learning_rate": 3.7892106331802706e-05, + "loss": 0.0779, + "step": 117240 + }, + { + "epoch": 32.97, + "learning_rate": 3.787336394589698e-05, + "loss": 0.0709, + "step": 117270 + }, + { + "epoch": 32.98, + "learning_rate": 3.7854621559991255e-05, + "loss": 0.0752, + "step": 117300 + }, + { + "epoch": 32.99, + "learning_rate": 3.783587917408553e-05, + "loss": 0.083, + "step": 117330 + }, + { + "epoch": 32.99, + "learning_rate": 3.78171367881798e-05, + "loss": 0.0644, + "step": 117360 + }, + { + "epoch": 33.0, + "eval_loss": 0.1736820936203003, + "eval_runtime": 505.177, + "eval_samples_per_second": 31.737, + "eval_steps_per_second": 0.994, + "eval_wer": 0.13342568203840433, + "step": 117381 + }, + { + "epoch": 33.0, + "learning_rate": 3.779839440227408e-05, + "loss": 0.0821, + "step": 117390 + }, + { + "epoch": 33.01, + "learning_rate": 3.777965201636835e-05, + "loss": 0.0647, + "step": 117420 + }, + { + "epoch": 33.02, + "learning_rate": 3.7760909630462626e-05, + "loss": 0.072, + "step": 117450 + }, + { + "epoch": 33.03, + "learning_rate": 3.77421672445569e-05, + "loss": 0.07, + "step": 117480 + }, + { + "epoch": 33.04, + "learning_rate": 3.7723424858651174e-05, + "loss": 0.0648, + "step": 117510 + }, + { + "epoch": 33.04, + "learning_rate": 3.770468247274545e-05, + "loss": 0.0759, + "step": 117540 + }, + { + "epoch": 33.05, + "learning_rate": 3.768594008683972e-05, + "loss": 0.0648, + "step": 117570 + }, + { + "epoch": 33.06, + "learning_rate": 3.7667197700934e-05, + "loss": 0.0713, + "step": 117600 + }, + { + "epoch": 33.07, + "learning_rate": 3.764845531502827e-05, + "loss": 0.0697, + "step": 117630 + }, + { + "epoch": 33.08, + "learning_rate": 3.7629712929122545e-05, + "loss": 0.0647, + "step": 117660 + }, + { + "epoch": 33.09, + "learning_rate": 3.761097054321682e-05, + "loss": 0.0765, + "step": 117690 + }, + { + "epoch": 33.1, + "learning_rate": 3.7592228157311093e-05, + "loss": 0.0637, + "step": 117720 + }, + { + "epoch": 33.1, + "learning_rate": 3.757348577140537e-05, + "loss": 0.0722, + "step": 117750 + }, + { + "epoch": 33.11, + "learning_rate": 3.755474338549964e-05, + "loss": 0.0717, + "step": 117780 + }, + { + "epoch": 33.12, + "learning_rate": 3.7536000999593916e-05, + "loss": 0.0668, + "step": 117810 + }, + { + "epoch": 33.13, + "learning_rate": 3.751725861368819e-05, + "loss": 0.0749, + "step": 117840 + }, + { + "epoch": 33.14, + "learning_rate": 3.7498516227782464e-05, + "loss": 0.0646, + "step": 117870 + }, + { + "epoch": 33.15, + "learning_rate": 3.747977384187674e-05, + "loss": 0.0745, + "step": 117900 + }, + { + "epoch": 33.15, + "learning_rate": 3.746103145597101e-05, + "loss": 0.0757, + "step": 117930 + }, + { + "epoch": 33.16, + "learning_rate": 3.744228907006529e-05, + "loss": 0.0638, + "step": 117960 + }, + { + "epoch": 33.17, + "learning_rate": 3.742354668415956e-05, + "loss": 0.0761, + "step": 117990 + }, + { + "epoch": 33.18, + "learning_rate": 3.7404804298253835e-05, + "loss": 0.0671, + "step": 118020 + }, + { + "epoch": 33.19, + "learning_rate": 3.738606191234811e-05, + "loss": 0.0693, + "step": 118050 + }, + { + "epoch": 33.2, + "learning_rate": 3.7367319526442384e-05, + "loss": 0.0707, + "step": 118080 + }, + { + "epoch": 33.2, + "learning_rate": 3.734920188673352e-05, + "loss": 0.0654, + "step": 118110 + }, + { + "epoch": 33.21, + "learning_rate": 3.733108424702465e-05, + "loss": 0.0924, + "step": 118140 + }, + { + "epoch": 33.22, + "learning_rate": 3.731234186111892e-05, + "loss": 0.0655, + "step": 118170 + }, + { + "epoch": 33.23, + "learning_rate": 3.72935994752132e-05, + "loss": 0.0746, + "step": 118200 + }, + { + "epoch": 33.24, + "learning_rate": 3.727485708930747e-05, + "loss": 0.0739, + "step": 118230 + }, + { + "epoch": 33.25, + "learning_rate": 3.725611470340175e-05, + "loss": 0.0618, + "step": 118260 + }, + { + "epoch": 33.26, + "learning_rate": 3.7237372317496016e-05, + "loss": 0.0719, + "step": 118290 + }, + { + "epoch": 33.26, + "learning_rate": 3.721862993159029e-05, + "loss": 0.0637, + "step": 118320 + }, + { + "epoch": 33.27, + "learning_rate": 3.719988754568457e-05, + "loss": 0.0712, + "step": 118350 + }, + { + "epoch": 33.28, + "learning_rate": 3.718114515977884e-05, + "loss": 0.0729, + "step": 118380 + }, + { + "epoch": 33.29, + "learning_rate": 3.716240277387312e-05, + "loss": 0.0642, + "step": 118410 + }, + { + "epoch": 33.3, + "learning_rate": 3.714366038796739e-05, + "loss": 0.0766, + "step": 118440 + }, + { + "epoch": 33.31, + "learning_rate": 3.712491800206167e-05, + "loss": 0.0649, + "step": 118470 + }, + { + "epoch": 33.31, + "learning_rate": 3.7106175616155936e-05, + "loss": 0.0727, + "step": 118500 + }, + { + "epoch": 33.32, + "learning_rate": 3.708743323025021e-05, + "loss": 0.0738, + "step": 118530 + }, + { + "epoch": 33.33, + "learning_rate": 3.706869084434449e-05, + "loss": 0.0699, + "step": 118560 + }, + { + "epoch": 33.34, + "learning_rate": 3.704994845843876e-05, + "loss": 0.0803, + "step": 118590 + }, + { + "epoch": 33.35, + "learning_rate": 3.703120607253304e-05, + "loss": 0.0693, + "step": 118620 + }, + { + "epoch": 33.36, + "learning_rate": 3.7012463686627307e-05, + "loss": 0.0686, + "step": 118650 + }, + { + "epoch": 33.37, + "learning_rate": 3.699372130072159e-05, + "loss": 0.072, + "step": 118680 + }, + { + "epoch": 33.37, + "learning_rate": 3.6974978914815855e-05, + "loss": 0.0638, + "step": 118710 + }, + { + "epoch": 33.38, + "learning_rate": 3.695623652891013e-05, + "loss": 0.0771, + "step": 118740 + }, + { + "epoch": 33.39, + "learning_rate": 3.693749414300441e-05, + "loss": 0.0655, + "step": 118770 + }, + { + "epoch": 33.4, + "learning_rate": 3.691875175709868e-05, + "loss": 0.0731, + "step": 118800 + }, + { + "epoch": 33.41, + "learning_rate": 3.690000937119296e-05, + "loss": 0.0711, + "step": 118830 + }, + { + "epoch": 33.42, + "learning_rate": 3.6881266985287226e-05, + "loss": 0.0667, + "step": 118860 + }, + { + "epoch": 33.42, + "learning_rate": 3.686252459938151e-05, + "loss": 0.0784, + "step": 118890 + }, + { + "epoch": 33.43, + "learning_rate": 3.6843782213475774e-05, + "loss": 0.07, + "step": 118920 + }, + { + "epoch": 33.44, + "learning_rate": 3.682503982757005e-05, + "loss": 0.0707, + "step": 118950 + }, + { + "epoch": 33.45, + "learning_rate": 3.680629744166433e-05, + "loss": 0.0738, + "step": 118980 + }, + { + "epoch": 33.46, + "learning_rate": 3.67875550557586e-05, + "loss": 0.0649, + "step": 119010 + }, + { + "epoch": 33.47, + "learning_rate": 3.676881266985288e-05, + "loss": 0.0812, + "step": 119040 + }, + { + "epoch": 33.47, + "learning_rate": 3.6750070283947145e-05, + "loss": 0.0659, + "step": 119070 + }, + { + "epoch": 33.48, + "learning_rate": 3.6731327898041426e-05, + "loss": 0.0679, + "step": 119100 + }, + { + "epoch": 33.49, + "learning_rate": 3.6712585512135694e-05, + "loss": 0.0721, + "step": 119130 + }, + { + "epoch": 33.5, + "learning_rate": 3.669384312622997e-05, + "loss": 0.0634, + "step": 119160 + }, + { + "epoch": 33.51, + "learning_rate": 3.667510074032425e-05, + "loss": 0.0753, + "step": 119190 + }, + { + "epoch": 33.52, + "learning_rate": 3.6656358354418516e-05, + "loss": 0.0668, + "step": 119220 + }, + { + "epoch": 33.53, + "learning_rate": 3.66376159685128e-05, + "loss": 0.0718, + "step": 119250 + }, + { + "epoch": 33.53, + "learning_rate": 3.6618873582607065e-05, + "loss": 0.0759, + "step": 119280 + }, + { + "epoch": 33.54, + "learning_rate": 3.6600131196701346e-05, + "loss": 0.0681, + "step": 119310 + }, + { + "epoch": 33.55, + "learning_rate": 3.658138881079561e-05, + "loss": 0.0753, + "step": 119340 + }, + { + "epoch": 33.56, + "learning_rate": 3.656264642488989e-05, + "loss": 0.0653, + "step": 119370 + }, + { + "epoch": 33.57, + "learning_rate": 3.654390403898417e-05, + "loss": 0.0715, + "step": 119400 + }, + { + "epoch": 33.58, + "learning_rate": 3.6525161653078436e-05, + "loss": 0.0702, + "step": 119430 + }, + { + "epoch": 33.58, + "learning_rate": 3.6506419267172716e-05, + "loss": 0.0669, + "step": 119460 + }, + { + "epoch": 33.59, + "learning_rate": 3.6487676881266984e-05, + "loss": 0.0732, + "step": 119490 + }, + { + "epoch": 33.6, + "learning_rate": 3.6468934495361265e-05, + "loss": 0.0674, + "step": 119520 + }, + { + "epoch": 33.61, + "learning_rate": 3.645019210945553e-05, + "loss": 0.0692, + "step": 119550 + }, + { + "epoch": 33.62, + "learning_rate": 3.6431449723549806e-05, + "loss": 0.0688, + "step": 119580 + }, + { + "epoch": 33.63, + "learning_rate": 3.641270733764409e-05, + "loss": 0.067, + "step": 119610 + }, + { + "epoch": 33.63, + "learning_rate": 3.6393964951738355e-05, + "loss": 0.0742, + "step": 119640 + }, + { + "epoch": 33.64, + "learning_rate": 3.6375222565832636e-05, + "loss": 0.0663, + "step": 119670 + }, + { + "epoch": 33.65, + "learning_rate": 3.63564801799269e-05, + "loss": 0.0678, + "step": 119700 + }, + { + "epoch": 33.66, + "learning_rate": 3.6337737794021184e-05, + "loss": 0.0758, + "step": 119730 + }, + { + "epoch": 33.67, + "learning_rate": 3.631899540811545e-05, + "loss": 0.067, + "step": 119760 + }, + { + "epoch": 33.68, + "learning_rate": 3.630025302220973e-05, + "loss": 0.0794, + "step": 119790 + }, + { + "epoch": 33.69, + "learning_rate": 3.628151063630401e-05, + "loss": 0.0641, + "step": 119820 + }, + { + "epoch": 33.69, + "learning_rate": 3.6262768250398274e-05, + "loss": 0.0699, + "step": 119850 + }, + { + "epoch": 33.7, + "learning_rate": 3.6244025864492555e-05, + "loss": 0.0687, + "step": 119880 + }, + { + "epoch": 33.71, + "learning_rate": 3.622528347858682e-05, + "loss": 0.0673, + "step": 119910 + }, + { + "epoch": 33.72, + "learning_rate": 3.6206541092681104e-05, + "loss": 0.0728, + "step": 119940 + }, + { + "epoch": 33.73, + "learning_rate": 3.618779870677537e-05, + "loss": 0.065, + "step": 119970 + }, + { + "epoch": 33.74, + "learning_rate": 3.616905632086965e-05, + "loss": 0.0722, + "step": 120000 + }, + { + "epoch": 33.74, + "learning_rate": 3.6150313934963926e-05, + "loss": 0.0713, + "step": 120030 + }, + { + "epoch": 33.75, + "learning_rate": 3.6131571549058194e-05, + "loss": 0.0648, + "step": 120060 + }, + { + "epoch": 33.76, + "learning_rate": 3.6112829163152474e-05, + "loss": 0.072, + "step": 120090 + }, + { + "epoch": 33.77, + "learning_rate": 3.609408677724674e-05, + "loss": 0.0638, + "step": 120120 + }, + { + "epoch": 33.78, + "learning_rate": 3.607534439134102e-05, + "loss": 0.07, + "step": 120150 + }, + { + "epoch": 33.79, + "learning_rate": 3.605660200543529e-05, + "loss": 0.074, + "step": 120180 + }, + { + "epoch": 33.8, + "learning_rate": 3.603785961952957e-05, + "loss": 0.0681, + "step": 120210 + }, + { + "epoch": 33.8, + "learning_rate": 3.6019117233623845e-05, + "loss": 0.0749, + "step": 120240 + }, + { + "epoch": 33.81, + "learning_rate": 3.600037484771811e-05, + "loss": 0.0671, + "step": 120270 + }, + { + "epoch": 33.82, + "learning_rate": 3.5981632461812394e-05, + "loss": 0.0671, + "step": 120300 + }, + { + "epoch": 33.83, + "learning_rate": 3.596289007590666e-05, + "loss": 0.0676, + "step": 120330 + }, + { + "epoch": 33.84, + "learning_rate": 3.594414769000094e-05, + "loss": 0.0637, + "step": 120360 + }, + { + "epoch": 33.85, + "learning_rate": 3.592540530409521e-05, + "loss": 0.0791, + "step": 120390 + }, + { + "epoch": 33.85, + "learning_rate": 3.590666291818949e-05, + "loss": 0.0633, + "step": 120420 + }, + { + "epoch": 33.86, + "learning_rate": 3.5887920532283765e-05, + "loss": 0.0718, + "step": 120450 + }, + { + "epoch": 33.87, + "learning_rate": 3.586917814637803e-05, + "loss": 0.0754, + "step": 120480 + }, + { + "epoch": 33.88, + "learning_rate": 3.585043576047231e-05, + "loss": 0.067, + "step": 120510 + }, + { + "epoch": 33.89, + "learning_rate": 3.583169337456658e-05, + "loss": 0.0729, + "step": 120540 + }, + { + "epoch": 33.9, + "learning_rate": 3.581295098866086e-05, + "loss": 0.0651, + "step": 120570 + }, + { + "epoch": 33.9, + "learning_rate": 3.579420860275513e-05, + "loss": 0.0733, + "step": 120600 + }, + { + "epoch": 33.91, + "learning_rate": 3.577546621684941e-05, + "loss": 0.0754, + "step": 120630 + }, + { + "epoch": 33.92, + "learning_rate": 3.5756723830943684e-05, + "loss": 0.0666, + "step": 120660 + }, + { + "epoch": 33.93, + "learning_rate": 3.573798144503795e-05, + "loss": 0.0755, + "step": 120690 + }, + { + "epoch": 33.94, + "learning_rate": 3.571923905913223e-05, + "loss": 0.0694, + "step": 120720 + }, + { + "epoch": 33.95, + "learning_rate": 3.57004966732265e-05, + "loss": 0.0732, + "step": 120750 + }, + { + "epoch": 33.96, + "learning_rate": 3.568175428732078e-05, + "loss": 0.0734, + "step": 120780 + }, + { + "epoch": 33.96, + "learning_rate": 3.566301190141505e-05, + "loss": 0.0657, + "step": 120810 + }, + { + "epoch": 33.97, + "learning_rate": 3.564426951550933e-05, + "loss": 0.0697, + "step": 120840 + }, + { + "epoch": 33.98, + "learning_rate": 3.56255271296036e-05, + "loss": 0.0639, + "step": 120870 + }, + { + "epoch": 33.99, + "learning_rate": 3.560678474369787e-05, + "loss": 0.0722, + "step": 120900 + }, + { + "epoch": 34.0, + "learning_rate": 3.558804235779215e-05, + "loss": 0.0745, + "step": 120930 + }, + { + "epoch": 34.0, + "eval_loss": 0.17628006637096405, + "eval_runtime": 505.7594, + "eval_samples_per_second": 31.701, + "eval_steps_per_second": 0.993, + "eval_wer": 0.13345297722216914, + "step": 120938 + }, + { + "epoch": 34.01, + "learning_rate": 3.556929997188642e-05, + "loss": 0.0622, + "step": 120960 + }, + { + "epoch": 34.01, + "learning_rate": 3.55505575859807e-05, + "loss": 0.0761, + "step": 120990 + }, + { + "epoch": 34.02, + "learning_rate": 3.553181520007497e-05, + "loss": 0.0592, + "step": 121020 + }, + { + "epoch": 34.03, + "learning_rate": 3.551307281416925e-05, + "loss": 0.0716, + "step": 121050 + }, + { + "epoch": 34.04, + "learning_rate": 3.5494330428263516e-05, + "loss": 0.07, + "step": 121080 + }, + { + "epoch": 34.05, + "learning_rate": 3.547558804235779e-05, + "loss": 0.0654, + "step": 121110 + }, + { + "epoch": 34.06, + "learning_rate": 3.545684565645207e-05, + "loss": 0.0767, + "step": 121140 + }, + { + "epoch": 34.07, + "learning_rate": 3.543810327054634e-05, + "loss": 0.0632, + "step": 121170 + }, + { + "epoch": 34.07, + "learning_rate": 3.541936088464062e-05, + "loss": 0.0701, + "step": 121200 + }, + { + "epoch": 34.08, + "learning_rate": 3.540061849873489e-05, + "loss": 0.0663, + "step": 121230 + }, + { + "epoch": 34.09, + "learning_rate": 3.538187611282917e-05, + "loss": 0.0699, + "step": 121260 + }, + { + "epoch": 34.1, + "learning_rate": 3.5363133726923435e-05, + "loss": 0.0768, + "step": 121290 + }, + { + "epoch": 34.11, + "learning_rate": 3.5344391341017716e-05, + "loss": 0.0639, + "step": 121320 + }, + { + "epoch": 34.12, + "learning_rate": 3.532564895511199e-05, + "loss": 0.0739, + "step": 121350 + }, + { + "epoch": 34.12, + "learning_rate": 3.530690656920626e-05, + "loss": 0.0649, + "step": 121380 + }, + { + "epoch": 34.13, + "learning_rate": 3.528816418330054e-05, + "loss": 0.0691, + "step": 121410 + }, + { + "epoch": 34.14, + "learning_rate": 3.5269421797394806e-05, + "loss": 0.0708, + "step": 121440 + }, + { + "epoch": 34.15, + "learning_rate": 3.525067941148909e-05, + "loss": 0.0601, + "step": 121470 + }, + { + "epoch": 34.16, + "learning_rate": 3.5231937025583355e-05, + "loss": 0.0718, + "step": 121500 + }, + { + "epoch": 34.17, + "learning_rate": 3.5213194639677636e-05, + "loss": 0.072, + "step": 121530 + }, + { + "epoch": 34.17, + "learning_rate": 3.519445225377191e-05, + "loss": 0.063, + "step": 121560 + }, + { + "epoch": 34.18, + "learning_rate": 3.517570986786618e-05, + "loss": 0.078, + "step": 121590 + }, + { + "epoch": 34.19, + "learning_rate": 3.515696748196046e-05, + "loss": 0.0597, + "step": 121620 + }, + { + "epoch": 34.2, + "learning_rate": 3.5138849842251586e-05, + "loss": 0.0781, + "step": 121650 + }, + { + "epoch": 34.21, + "learning_rate": 3.512010745634586e-05, + "loss": 0.0674, + "step": 121680 + }, + { + "epoch": 34.22, + "learning_rate": 3.5101365070440134e-05, + "loss": 0.069, + "step": 121710 + }, + { + "epoch": 34.23, + "learning_rate": 3.508262268453441e-05, + "loss": 0.0778, + "step": 121740 + }, + { + "epoch": 34.23, + "learning_rate": 3.506388029862868e-05, + "loss": 0.0619, + "step": 121770 + }, + { + "epoch": 34.24, + "learning_rate": 3.5045137912722957e-05, + "loss": 0.0716, + "step": 121800 + }, + { + "epoch": 34.25, + "learning_rate": 3.502639552681723e-05, + "loss": 0.0629, + "step": 121830 + }, + { + "epoch": 34.26, + "learning_rate": 3.5007653140911505e-05, + "loss": 0.072, + "step": 121860 + }, + { + "epoch": 34.27, + "learning_rate": 3.4988910755005786e-05, + "loss": 0.0704, + "step": 121890 + }, + { + "epoch": 34.28, + "learning_rate": 3.497016836910005e-05, + "loss": 0.0623, + "step": 121920 + }, + { + "epoch": 34.28, + "learning_rate": 3.495142598319433e-05, + "loss": 0.079, + "step": 121950 + }, + { + "epoch": 34.29, + "learning_rate": 3.49326835972886e-05, + "loss": 0.0659, + "step": 121980 + }, + { + "epoch": 34.3, + "learning_rate": 3.4913941211382876e-05, + "loss": 0.0664, + "step": 122010 + }, + { + "epoch": 34.31, + "learning_rate": 3.489519882547715e-05, + "loss": 0.0731, + "step": 122040 + }, + { + "epoch": 34.32, + "learning_rate": 3.4876456439571424e-05, + "loss": 0.0645, + "step": 122070 + }, + { + "epoch": 34.33, + "learning_rate": 3.4857714053665705e-05, + "loss": 0.0716, + "step": 122100 + }, + { + "epoch": 34.34, + "learning_rate": 3.483897166775997e-05, + "loss": 0.0663, + "step": 122130 + }, + { + "epoch": 34.34, + "learning_rate": 3.482022928185425e-05, + "loss": 0.0694, + "step": 122160 + }, + { + "epoch": 34.35, + "learning_rate": 3.480148689594852e-05, + "loss": 0.0785, + "step": 122190 + }, + { + "epoch": 34.36, + "learning_rate": 3.4782744510042795e-05, + "loss": 0.0592, + "step": 122220 + }, + { + "epoch": 34.37, + "learning_rate": 3.476400212413707e-05, + "loss": 0.0727, + "step": 122250 + }, + { + "epoch": 34.38, + "learning_rate": 3.4745259738231344e-05, + "loss": 0.066, + "step": 122280 + }, + { + "epoch": 34.39, + "learning_rate": 3.4726517352325625e-05, + "loss": 0.0675, + "step": 122310 + }, + { + "epoch": 34.39, + "learning_rate": 3.470777496641989e-05, + "loss": 0.0738, + "step": 122340 + }, + { + "epoch": 34.4, + "learning_rate": 3.4689032580514166e-05, + "loss": 0.0627, + "step": 122370 + }, + { + "epoch": 34.41, + "learning_rate": 3.467029019460844e-05, + "loss": 0.0754, + "step": 122400 + }, + { + "epoch": 34.42, + "learning_rate": 3.4651547808702715e-05, + "loss": 0.0693, + "step": 122430 + }, + { + "epoch": 34.43, + "learning_rate": 3.463280542279699e-05, + "loss": 0.0647, + "step": 122460 + }, + { + "epoch": 34.44, + "learning_rate": 3.461406303689126e-05, + "loss": 0.077, + "step": 122490 + }, + { + "epoch": 34.44, + "learning_rate": 3.4595320650985544e-05, + "loss": 0.0636, + "step": 122520 + }, + { + "epoch": 34.45, + "learning_rate": 3.457657826507981e-05, + "loss": 0.0692, + "step": 122550 + }, + { + "epoch": 34.46, + "learning_rate": 3.4557835879174086e-05, + "loss": 0.0654, + "step": 122580 + }, + { + "epoch": 34.47, + "learning_rate": 3.453909349326836e-05, + "loss": 0.0719, + "step": 122610 + }, + { + "epoch": 34.48, + "learning_rate": 3.4520351107362634e-05, + "loss": 0.0772, + "step": 122640 + }, + { + "epoch": 34.49, + "learning_rate": 3.450160872145691e-05, + "loss": 0.0612, + "step": 122670 + }, + { + "epoch": 34.5, + "learning_rate": 3.448286633555118e-05, + "loss": 0.0712, + "step": 122700 + }, + { + "epoch": 34.5, + "learning_rate": 3.446412394964546e-05, + "loss": 0.0642, + "step": 122730 + }, + { + "epoch": 34.51, + "learning_rate": 3.444538156373973e-05, + "loss": 0.0673, + "step": 122760 + }, + { + "epoch": 34.52, + "learning_rate": 3.4426639177834005e-05, + "loss": 0.0801, + "step": 122790 + }, + { + "epoch": 34.53, + "learning_rate": 3.440789679192828e-05, + "loss": 0.0653, + "step": 122820 + }, + { + "epoch": 34.54, + "learning_rate": 3.438915440602255e-05, + "loss": 0.0733, + "step": 122850 + }, + { + "epoch": 34.55, + "learning_rate": 3.437041202011683e-05, + "loss": 0.0657, + "step": 122880 + }, + { + "epoch": 34.55, + "learning_rate": 3.43516696342111e-05, + "loss": 0.0713, + "step": 122910 + }, + { + "epoch": 34.56, + "learning_rate": 3.433292724830538e-05, + "loss": 0.0749, + "step": 122940 + }, + { + "epoch": 34.57, + "learning_rate": 3.431418486239965e-05, + "loss": 0.0617, + "step": 122970 + }, + { + "epoch": 34.58, + "learning_rate": 3.4295442476493924e-05, + "loss": 0.0714, + "step": 123000 + }, + { + "epoch": 34.59, + "learning_rate": 3.42767000905882e-05, + "loss": 0.0654, + "step": 123030 + }, + { + "epoch": 34.6, + "learning_rate": 3.425795770468247e-05, + "loss": 0.0703, + "step": 123060 + }, + { + "epoch": 34.6, + "learning_rate": 3.423921531877675e-05, + "loss": 0.0721, + "step": 123090 + }, + { + "epoch": 34.61, + "learning_rate": 3.422047293287102e-05, + "loss": 0.0595, + "step": 123120 + }, + { + "epoch": 34.62, + "learning_rate": 3.42017305469653e-05, + "loss": 0.07, + "step": 123150 + }, + { + "epoch": 34.63, + "learning_rate": 3.418298816105957e-05, + "loss": 0.0703, + "step": 123180 + }, + { + "epoch": 34.64, + "learning_rate": 3.416424577515385e-05, + "loss": 0.0674, + "step": 123210 + }, + { + "epoch": 34.65, + "learning_rate": 3.414550338924812e-05, + "loss": 0.0748, + "step": 123240 + }, + { + "epoch": 34.66, + "learning_rate": 3.412676100334239e-05, + "loss": 0.0611, + "step": 123270 + }, + { + "epoch": 34.66, + "learning_rate": 3.4108018617436666e-05, + "loss": 0.0697, + "step": 123300 + }, + { + "epoch": 34.67, + "learning_rate": 3.408927623153094e-05, + "loss": 0.0675, + "step": 123330 + }, + { + "epoch": 34.68, + "learning_rate": 3.407053384562522e-05, + "loss": 0.0681, + "step": 123360 + }, + { + "epoch": 34.69, + "learning_rate": 3.405179145971949e-05, + "loss": 0.0752, + "step": 123390 + }, + { + "epoch": 34.7, + "learning_rate": 3.403304907381377e-05, + "loss": 0.0615, + "step": 123420 + }, + { + "epoch": 34.71, + "learning_rate": 3.401430668790804e-05, + "loss": 0.0723, + "step": 123450 + }, + { + "epoch": 34.71, + "learning_rate": 3.399618904819917e-05, + "loss": 0.0674, + "step": 123480 + }, + { + "epoch": 34.72, + "learning_rate": 3.3977446662293445e-05, + "loss": 0.0747, + "step": 123510 + }, + { + "epoch": 34.73, + "learning_rate": 3.395870427638772e-05, + "loss": 0.0762, + "step": 123540 + }, + { + "epoch": 34.74, + "learning_rate": 3.3939961890481994e-05, + "loss": 0.0643, + "step": 123570 + }, + { + "epoch": 34.75, + "learning_rate": 3.392121950457627e-05, + "loss": 0.0757, + "step": 123600 + }, + { + "epoch": 34.76, + "learning_rate": 3.390247711867054e-05, + "loss": 0.0599, + "step": 123630 + }, + { + "epoch": 34.77, + "learning_rate": 3.3883734732764816e-05, + "loss": 0.0727, + "step": 123660 + }, + { + "epoch": 34.77, + "learning_rate": 3.386499234685909e-05, + "loss": 0.0705, + "step": 123690 + }, + { + "epoch": 34.78, + "learning_rate": 3.3846249960953365e-05, + "loss": 0.0598, + "step": 123720 + }, + { + "epoch": 34.79, + "learning_rate": 3.382750757504764e-05, + "loss": 0.0719, + "step": 123750 + }, + { + "epoch": 34.8, + "learning_rate": 3.380876518914191e-05, + "loss": 0.0674, + "step": 123780 + }, + { + "epoch": 34.81, + "learning_rate": 3.379002280323619e-05, + "loss": 0.0704, + "step": 123810 + }, + { + "epoch": 34.82, + "learning_rate": 3.377128041733046e-05, + "loss": 0.0741, + "step": 123840 + }, + { + "epoch": 34.82, + "learning_rate": 3.3752538031424736e-05, + "loss": 0.063, + "step": 123870 + }, + { + "epoch": 34.83, + "learning_rate": 3.373379564551901e-05, + "loss": 0.0703, + "step": 123900 + }, + { + "epoch": 34.84, + "learning_rate": 3.3715053259613284e-05, + "loss": 0.0686, + "step": 123930 + }, + { + "epoch": 34.85, + "learning_rate": 3.369631087370756e-05, + "loss": 0.0759, + "step": 123960 + }, + { + "epoch": 34.86, + "learning_rate": 3.367756848780183e-05, + "loss": 0.0726, + "step": 123990 + }, + { + "epoch": 34.87, + "learning_rate": 3.365882610189611e-05, + "loss": 0.0641, + "step": 124020 + }, + { + "epoch": 34.87, + "learning_rate": 3.364008371599038e-05, + "loss": 0.0711, + "step": 124050 + }, + { + "epoch": 34.88, + "learning_rate": 3.3621341330084655e-05, + "loss": 0.0667, + "step": 124080 + }, + { + "epoch": 34.89, + "learning_rate": 3.360259894417893e-05, + "loss": 0.0673, + "step": 124110 + }, + { + "epoch": 34.9, + "learning_rate": 3.3583856558273203e-05, + "loss": 0.0793, + "step": 124140 + }, + { + "epoch": 34.91, + "learning_rate": 3.356511417236748e-05, + "loss": 0.0624, + "step": 124170 + }, + { + "epoch": 34.92, + "learning_rate": 3.354637178646175e-05, + "loss": 0.0705, + "step": 124200 + }, + { + "epoch": 34.93, + "learning_rate": 3.3527629400556026e-05, + "loss": 0.0656, + "step": 124230 + }, + { + "epoch": 34.93, + "learning_rate": 3.35088870146503e-05, + "loss": 0.068, + "step": 124260 + }, + { + "epoch": 34.94, + "learning_rate": 3.3490144628744574e-05, + "loss": 0.0793, + "step": 124290 + }, + { + "epoch": 34.95, + "learning_rate": 3.347140224283885e-05, + "loss": 0.0624, + "step": 124320 + }, + { + "epoch": 34.96, + "learning_rate": 3.345265985693312e-05, + "loss": 0.0718, + "step": 124350 + }, + { + "epoch": 34.97, + "learning_rate": 3.34339174710274e-05, + "loss": 0.0681, + "step": 124380 + }, + { + "epoch": 34.98, + "learning_rate": 3.341517508512167e-05, + "loss": 0.067, + "step": 124410 + }, + { + "epoch": 34.98, + "learning_rate": 3.3396432699215945e-05, + "loss": 0.0727, + "step": 124440 + }, + { + "epoch": 34.99, + "learning_rate": 3.337769031331022e-05, + "loss": 0.0629, + "step": 124470 + }, + { + "epoch": 35.0, + "eval_loss": 0.1761113852262497, + "eval_runtime": 507.443, + "eval_samples_per_second": 31.596, + "eval_steps_per_second": 0.989, + "eval_wer": 0.13112606280621783, + "step": 124495 + }, + { + "epoch": 35.0, + "learning_rate": 3.3358947927404494e-05, + "loss": 0.0739, + "step": 124500 + }, + { + "epoch": 35.01, + "learning_rate": 3.334020554149877e-05, + "loss": 0.0606, + "step": 124530 + }, + { + "epoch": 35.02, + "learning_rate": 3.332146315559304e-05, + "loss": 0.0696, + "step": 124560 + }, + { + "epoch": 35.03, + "learning_rate": 3.3302720769687316e-05, + "loss": 0.0621, + "step": 124590 + }, + { + "epoch": 35.04, + "learning_rate": 3.328397838378159e-05, + "loss": 0.0666, + "step": 124620 + }, + { + "epoch": 35.04, + "learning_rate": 3.3265235997875865e-05, + "loss": 0.0742, + "step": 124650 + }, + { + "epoch": 35.05, + "learning_rate": 3.324649361197014e-05, + "loss": 0.0615, + "step": 124680 + }, + { + "epoch": 35.06, + "learning_rate": 3.322775122606441e-05, + "loss": 0.0659, + "step": 124710 + }, + { + "epoch": 35.07, + "learning_rate": 3.320900884015869e-05, + "loss": 0.0686, + "step": 124740 + }, + { + "epoch": 35.08, + "learning_rate": 3.319026645425296e-05, + "loss": 0.0666, + "step": 124770 + }, + { + "epoch": 35.09, + "learning_rate": 3.3171524068347236e-05, + "loss": 0.0668, + "step": 124800 + }, + { + "epoch": 35.09, + "learning_rate": 3.315278168244151e-05, + "loss": 0.0635, + "step": 124830 + }, + { + "epoch": 35.1, + "learning_rate": 3.3134039296535784e-05, + "loss": 0.0668, + "step": 124860 + }, + { + "epoch": 35.11, + "learning_rate": 3.311529691063006e-05, + "loss": 0.0675, + "step": 124890 + }, + { + "epoch": 35.12, + "learning_rate": 3.309655452472433e-05, + "loss": 0.0698, + "step": 124920 + }, + { + "epoch": 35.13, + "learning_rate": 3.307781213881861e-05, + "loss": 0.0706, + "step": 124950 + }, + { + "epoch": 35.14, + "learning_rate": 3.305906975291288e-05, + "loss": 0.0669, + "step": 124980 + }, + { + "epoch": 35.14, + "learning_rate": 3.3040327367007155e-05, + "loss": 0.0731, + "step": 125010 + }, + { + "epoch": 35.15, + "learning_rate": 3.302158498110143e-05, + "loss": 0.0644, + "step": 125040 + }, + { + "epoch": 35.16, + "learning_rate": 3.30028425951957e-05, + "loss": 0.0603, + "step": 125070 + }, + { + "epoch": 35.17, + "learning_rate": 3.298410020928998e-05, + "loss": 0.0705, + "step": 125100 + }, + { + "epoch": 35.18, + "learning_rate": 3.296535782338425e-05, + "loss": 0.0666, + "step": 125130 + }, + { + "epoch": 35.19, + "learning_rate": 3.2946615437478526e-05, + "loss": 0.0695, + "step": 125160 + }, + { + "epoch": 35.2, + "learning_rate": 3.29278730515728e-05, + "loss": 0.0696, + "step": 125190 + }, + { + "epoch": 35.2, + "learning_rate": 3.2909130665667074e-05, + "loss": 0.0649, + "step": 125220 + }, + { + "epoch": 35.21, + "learning_rate": 3.289038827976135e-05, + "loss": 0.0723, + "step": 125250 + }, + { + "epoch": 35.22, + "learning_rate": 3.287164589385562e-05, + "loss": 0.06, + "step": 125280 + }, + { + "epoch": 35.23, + "learning_rate": 3.28529035079499e-05, + "loss": 0.0716, + "step": 125310 + }, + { + "epoch": 35.24, + "learning_rate": 3.283416112204417e-05, + "loss": 0.0679, + "step": 125340 + }, + { + "epoch": 35.25, + "learning_rate": 3.2815418736138445e-05, + "loss": 0.0639, + "step": 125370 + }, + { + "epoch": 35.25, + "learning_rate": 3.279667635023272e-05, + "loss": 0.0715, + "step": 125400 + }, + { + "epoch": 35.26, + "learning_rate": 3.2777933964326994e-05, + "loss": 0.0607, + "step": 125430 + }, + { + "epoch": 35.27, + "learning_rate": 3.275919157842127e-05, + "loss": 0.0664, + "step": 125460 + }, + { + "epoch": 35.28, + "learning_rate": 3.274044919251554e-05, + "loss": 0.066, + "step": 125490 + }, + { + "epoch": 35.29, + "learning_rate": 3.2721706806609816e-05, + "loss": 0.065, + "step": 125520 + }, + { + "epoch": 35.3, + "learning_rate": 3.270296442070409e-05, + "loss": 0.0746, + "step": 125550 + }, + { + "epoch": 35.3, + "learning_rate": 3.2684222034798365e-05, + "loss": 0.0616, + "step": 125580 + }, + { + "epoch": 35.31, + "learning_rate": 3.266547964889264e-05, + "loss": 0.0716, + "step": 125610 + }, + { + "epoch": 35.32, + "learning_rate": 3.264673726298691e-05, + "loss": 0.0714, + "step": 125640 + }, + { + "epoch": 35.33, + "learning_rate": 3.262799487708119e-05, + "loss": 0.0641, + "step": 125670 + }, + { + "epoch": 35.34, + "learning_rate": 3.260925249117546e-05, + "loss": 0.0735, + "step": 125700 + }, + { + "epoch": 35.35, + "learning_rate": 3.2590510105269736e-05, + "loss": 0.0591, + "step": 125730 + }, + { + "epoch": 35.36, + "learning_rate": 3.257176771936401e-05, + "loss": 0.0727, + "step": 125760 + }, + { + "epoch": 35.36, + "learning_rate": 3.2553025333458284e-05, + "loss": 0.0652, + "step": 125790 + }, + { + "epoch": 35.37, + "learning_rate": 3.253428294755256e-05, + "loss": 0.0671, + "step": 125820 + }, + { + "epoch": 35.38, + "learning_rate": 3.251554056164683e-05, + "loss": 0.0725, + "step": 125850 + }, + { + "epoch": 35.39, + "learning_rate": 3.2496798175741107e-05, + "loss": 0.0627, + "step": 125880 + }, + { + "epoch": 35.4, + "learning_rate": 3.247805578983538e-05, + "loss": 0.0703, + "step": 125910 + }, + { + "epoch": 35.41, + "learning_rate": 3.2459313403929655e-05, + "loss": 0.064, + "step": 125940 + }, + { + "epoch": 35.41, + "learning_rate": 3.244057101802393e-05, + "loss": 0.0622, + "step": 125970 + }, + { + "epoch": 35.42, + "learning_rate": 3.24218286321182e-05, + "loss": 0.0756, + "step": 126000 + }, + { + "epoch": 35.43, + "learning_rate": 3.240308624621248e-05, + "loss": 0.063, + "step": 126030 + }, + { + "epoch": 35.44, + "learning_rate": 3.238434386030675e-05, + "loss": 0.0776, + "step": 126060 + }, + { + "epoch": 35.45, + "learning_rate": 3.2365601474401026e-05, + "loss": 0.0668, + "step": 126090 + }, + { + "epoch": 35.46, + "learning_rate": 3.23468590884953e-05, + "loss": 0.0692, + "step": 126120 + }, + { + "epoch": 35.47, + "learning_rate": 3.2328116702589574e-05, + "loss": 0.0752, + "step": 126150 + }, + { + "epoch": 35.47, + "learning_rate": 3.230937431668385e-05, + "loss": 0.0594, + "step": 126180 + }, + { + "epoch": 35.48, + "learning_rate": 3.229063193077812e-05, + "loss": 0.0692, + "step": 126210 + }, + { + "epoch": 35.49, + "learning_rate": 3.22718895448724e-05, + "loss": 0.0669, + "step": 126240 + }, + { + "epoch": 35.5, + "learning_rate": 3.225314715896667e-05, + "loss": 0.0648, + "step": 126270 + }, + { + "epoch": 35.51, + "learning_rate": 3.2234404773060945e-05, + "loss": 0.072, + "step": 126300 + }, + { + "epoch": 35.52, + "learning_rate": 3.221566238715522e-05, + "loss": 0.0603, + "step": 126330 + }, + { + "epoch": 35.52, + "learning_rate": 3.2196920001249494e-05, + "loss": 0.0711, + "step": 126360 + }, + { + "epoch": 35.53, + "learning_rate": 3.217817761534377e-05, + "loss": 0.0703, + "step": 126390 + }, + { + "epoch": 35.54, + "learning_rate": 3.215943522943804e-05, + "loss": 0.0601, + "step": 126420 + }, + { + "epoch": 35.55, + "learning_rate": 3.2140692843532316e-05, + "loss": 0.074, + "step": 126450 + }, + { + "epoch": 35.56, + "learning_rate": 3.212195045762659e-05, + "loss": 0.0598, + "step": 126480 + }, + { + "epoch": 35.57, + "learning_rate": 3.2103208071720865e-05, + "loss": 0.0682, + "step": 126510 + }, + { + "epoch": 35.57, + "learning_rate": 3.208446568581514e-05, + "loss": 0.0702, + "step": 126540 + }, + { + "epoch": 35.58, + "learning_rate": 3.206572329990941e-05, + "loss": 0.0616, + "step": 126570 + }, + { + "epoch": 35.59, + "learning_rate": 3.204698091400369e-05, + "loss": 0.0727, + "step": 126600 + }, + { + "epoch": 35.6, + "learning_rate": 3.202823852809796e-05, + "loss": 0.0639, + "step": 126630 + }, + { + "epoch": 35.61, + "learning_rate": 3.2009496142192235e-05, + "loss": 0.0706, + "step": 126660 + }, + { + "epoch": 35.62, + "learning_rate": 3.199075375628651e-05, + "loss": 0.066, + "step": 126690 + }, + { + "epoch": 35.63, + "learning_rate": 3.1972011370380784e-05, + "loss": 0.0681, + "step": 126720 + }, + { + "epoch": 35.63, + "learning_rate": 3.195326898447506e-05, + "loss": 0.0735, + "step": 126750 + }, + { + "epoch": 35.64, + "learning_rate": 3.193452659856933e-05, + "loss": 0.0624, + "step": 126780 + }, + { + "epoch": 35.65, + "learning_rate": 3.1915784212663606e-05, + "loss": 0.067, + "step": 126810 + }, + { + "epoch": 35.66, + "learning_rate": 3.189704182675788e-05, + "loss": 0.07, + "step": 126840 + }, + { + "epoch": 35.67, + "learning_rate": 3.1878299440852155e-05, + "loss": 0.0624, + "step": 126870 + }, + { + "epoch": 35.68, + "learning_rate": 3.185955705494643e-05, + "loss": 0.0707, + "step": 126900 + }, + { + "epoch": 35.68, + "learning_rate": 3.18408146690407e-05, + "loss": 0.0582, + "step": 126930 + }, + { + "epoch": 35.69, + "learning_rate": 3.182207228313498e-05, + "loss": 0.0675, + "step": 126960 + }, + { + "epoch": 35.7, + "learning_rate": 3.180332989722925e-05, + "loss": 0.0676, + "step": 126990 + }, + { + "epoch": 35.71, + "learning_rate": 3.1784587511323526e-05, + "loss": 0.0668, + "step": 127020 + }, + { + "epoch": 35.72, + "learning_rate": 3.17658451254178e-05, + "loss": 0.0721, + "step": 127050 + }, + { + "epoch": 35.73, + "learning_rate": 3.1747102739512074e-05, + "loss": 0.06, + "step": 127080 + }, + { + "epoch": 35.74, + "learning_rate": 3.172836035360635e-05, + "loss": 0.0674, + "step": 127110 + }, + { + "epoch": 35.74, + "learning_rate": 3.170961796770062e-05, + "loss": 0.0684, + "step": 127140 + }, + { + "epoch": 35.75, + "learning_rate": 3.16908755817949e-05, + "loss": 0.0682, + "step": 127170 + }, + { + "epoch": 35.76, + "learning_rate": 3.167213319588917e-05, + "loss": 0.0729, + "step": 127200 + }, + { + "epoch": 35.77, + "learning_rate": 3.1653390809983445e-05, + "loss": 0.0629, + "step": 127230 + }, + { + "epoch": 35.78, + "learning_rate": 3.163527317027458e-05, + "loss": 0.0674, + "step": 127260 + }, + { + "epoch": 35.79, + "learning_rate": 3.1616530784368854e-05, + "loss": 0.0656, + "step": 127290 + }, + { + "epoch": 35.79, + "learning_rate": 3.159778839846312e-05, + "loss": 0.0672, + "step": 127320 + }, + { + "epoch": 35.8, + "learning_rate": 3.15790460125574e-05, + "loss": 0.073, + "step": 127350 + }, + { + "epoch": 35.81, + "learning_rate": 3.156030362665167e-05, + "loss": 0.063, + "step": 127380 + }, + { + "epoch": 35.82, + "learning_rate": 3.154156124074595e-05, + "loss": 0.0674, + "step": 127410 + }, + { + "epoch": 35.83, + "learning_rate": 3.1522818854840224e-05, + "loss": 0.0636, + "step": 127440 + }, + { + "epoch": 35.84, + "learning_rate": 3.15040764689345e-05, + "loss": 0.0635, + "step": 127470 + }, + { + "epoch": 35.84, + "learning_rate": 3.148533408302877e-05, + "loss": 0.0782, + "step": 127500 + }, + { + "epoch": 35.85, + "learning_rate": 3.146659169712304e-05, + "loss": 0.0609, + "step": 127530 + }, + { + "epoch": 35.86, + "learning_rate": 3.144784931121732e-05, + "loss": 0.0694, + "step": 127560 + }, + { + "epoch": 35.87, + "learning_rate": 3.142910692531159e-05, + "loss": 0.0665, + "step": 127590 + }, + { + "epoch": 35.88, + "learning_rate": 3.141036453940587e-05, + "loss": 0.0686, + "step": 127620 + }, + { + "epoch": 35.89, + "learning_rate": 3.1391622153500144e-05, + "loss": 0.0709, + "step": 127650 + }, + { + "epoch": 35.9, + "learning_rate": 3.137287976759442e-05, + "loss": 0.0598, + "step": 127680 + }, + { + "epoch": 35.9, + "learning_rate": 3.135413738168869e-05, + "loss": 0.0657, + "step": 127710 + }, + { + "epoch": 35.91, + "learning_rate": 3.133539499578296e-05, + "loss": 0.0662, + "step": 127740 + }, + { + "epoch": 35.92, + "learning_rate": 3.131665260987724e-05, + "loss": 0.0667, + "step": 127770 + }, + { + "epoch": 35.93, + "learning_rate": 3.129791022397151e-05, + "loss": 0.0715, + "step": 127800 + }, + { + "epoch": 35.94, + "learning_rate": 3.127916783806579e-05, + "loss": 0.0582, + "step": 127830 + }, + { + "epoch": 35.95, + "learning_rate": 3.126042545216006e-05, + "loss": 0.0724, + "step": 127860 + }, + { + "epoch": 35.95, + "learning_rate": 3.124168306625434e-05, + "loss": 0.0695, + "step": 127890 + }, + { + "epoch": 35.96, + "learning_rate": 3.122294068034861e-05, + "loss": 0.0652, + "step": 127920 + }, + { + "epoch": 35.97, + "learning_rate": 3.1204198294442886e-05, + "loss": 0.0737, + "step": 127950 + }, + { + "epoch": 35.98, + "learning_rate": 3.118545590853716e-05, + "loss": 0.062, + "step": 127980 + }, + { + "epoch": 35.99, + "learning_rate": 3.116671352263143e-05, + "loss": 0.0685, + "step": 128010 + }, + { + "epoch": 36.0, + "learning_rate": 3.114797113672571e-05, + "loss": 0.0654, + "step": 128040 + }, + { + "epoch": 36.0, + "eval_loss": 0.17177008092403412, + "eval_runtime": 506.5545, + "eval_samples_per_second": 31.651, + "eval_steps_per_second": 0.991, + "eval_wer": 0.13024579312980225, + "step": 128052 + }, + { + "epoch": 36.01, + "learning_rate": 3.112922875081998e-05, + "loss": 0.0672, + "step": 128070 + }, + { + "epoch": 36.01, + "learning_rate": 3.111048636491426e-05, + "loss": 0.0701, + "step": 128100 + }, + { + "epoch": 36.02, + "learning_rate": 3.109174397900853e-05, + "loss": 0.0635, + "step": 128130 + }, + { + "epoch": 36.03, + "learning_rate": 3.1073001593102805e-05, + "loss": 0.0681, + "step": 128160 + }, + { + "epoch": 36.04, + "learning_rate": 3.105425920719708e-05, + "loss": 0.0589, + "step": 128190 + }, + { + "epoch": 36.05, + "learning_rate": 3.103551682129135e-05, + "loss": 0.0651, + "step": 128220 + }, + { + "epoch": 36.06, + "learning_rate": 3.101677443538563e-05, + "loss": 0.0698, + "step": 128250 + }, + { + "epoch": 36.06, + "learning_rate": 3.09980320494799e-05, + "loss": 0.0625, + "step": 128280 + }, + { + "epoch": 36.07, + "learning_rate": 3.0979289663574176e-05, + "loss": 0.0688, + "step": 128310 + }, + { + "epoch": 36.08, + "learning_rate": 3.096054727766845e-05, + "loss": 0.0597, + "step": 128340 + }, + { + "epoch": 36.09, + "learning_rate": 3.0941804891762724e-05, + "loss": 0.0728, + "step": 128370 + }, + { + "epoch": 36.1, + "learning_rate": 3.0923062505857e-05, + "loss": 0.0727, + "step": 128400 + }, + { + "epoch": 36.11, + "learning_rate": 3.0904320119951266e-05, + "loss": 0.0589, + "step": 128430 + }, + { + "epoch": 36.11, + "learning_rate": 3.088557773404555e-05, + "loss": 0.0677, + "step": 128460 + }, + { + "epoch": 36.12, + "learning_rate": 3.086683534813982e-05, + "loss": 0.063, + "step": 128490 + }, + { + "epoch": 36.13, + "learning_rate": 3.0848092962234095e-05, + "loss": 0.0649, + "step": 128520 + }, + { + "epoch": 36.14, + "learning_rate": 3.082935057632837e-05, + "loss": 0.0688, + "step": 128550 + }, + { + "epoch": 36.15, + "learning_rate": 3.0810608190422644e-05, + "loss": 0.0653, + "step": 128580 + }, + { + "epoch": 36.16, + "learning_rate": 3.079186580451692e-05, + "loss": 0.0697, + "step": 128610 + }, + { + "epoch": 36.17, + "learning_rate": 3.0773123418611185e-05, + "loss": 0.0592, + "step": 128640 + }, + { + "epoch": 36.17, + "learning_rate": 3.0754381032705466e-05, + "loss": 0.0658, + "step": 128670 + }, + { + "epoch": 36.18, + "learning_rate": 3.073563864679974e-05, + "loss": 0.0678, + "step": 128700 + }, + { + "epoch": 36.19, + "learning_rate": 3.0716896260894015e-05, + "loss": 0.0602, + "step": 128730 + }, + { + "epoch": 36.2, + "learning_rate": 3.069815387498829e-05, + "loss": 0.0697, + "step": 128760 + }, + { + "epoch": 36.21, + "learning_rate": 3.067941148908256e-05, + "loss": 0.0628, + "step": 128790 + }, + { + "epoch": 36.22, + "learning_rate": 3.066066910317684e-05, + "loss": 0.0679, + "step": 128820 + }, + { + "epoch": 36.22, + "learning_rate": 3.0641926717271105e-05, + "loss": 0.0663, + "step": 128850 + }, + { + "epoch": 36.23, + "learning_rate": 3.0623184331365386e-05, + "loss": 0.0629, + "step": 128880 + }, + { + "epoch": 36.24, + "learning_rate": 3.060444194545966e-05, + "loss": 0.0737, + "step": 128910 + }, + { + "epoch": 36.25, + "learning_rate": 3.0585699559553934e-05, + "loss": 0.0578, + "step": 128940 + }, + { + "epoch": 36.26, + "learning_rate": 3.056695717364821e-05, + "loss": 0.0681, + "step": 128970 + }, + { + "epoch": 36.27, + "learning_rate": 3.054821478774248e-05, + "loss": 0.0705, + "step": 129000 + }, + { + "epoch": 36.27, + "learning_rate": 3.0529472401836757e-05, + "loss": 0.063, + "step": 129030 + }, + { + "epoch": 36.28, + "learning_rate": 3.0510730015931027e-05, + "loss": 0.0745, + "step": 129060 + }, + { + "epoch": 36.29, + "learning_rate": 3.0491987630025305e-05, + "loss": 0.0611, + "step": 129090 + }, + { + "epoch": 36.3, + "learning_rate": 3.047324524411958e-05, + "loss": 0.0647, + "step": 129120 + }, + { + "epoch": 36.31, + "learning_rate": 3.045450285821385e-05, + "loss": 0.0706, + "step": 129150 + }, + { + "epoch": 36.32, + "learning_rate": 3.0435760472308128e-05, + "loss": 0.0584, + "step": 129180 + }, + { + "epoch": 36.33, + "learning_rate": 3.04170180864024e-05, + "loss": 0.076, + "step": 129210 + }, + { + "epoch": 36.33, + "learning_rate": 3.0398275700496676e-05, + "loss": 0.0613, + "step": 129240 + }, + { + "epoch": 36.34, + "learning_rate": 3.0379533314590947e-05, + "loss": 0.0734, + "step": 129270 + }, + { + "epoch": 36.35, + "learning_rate": 3.0360790928685224e-05, + "loss": 0.066, + "step": 129300 + }, + { + "epoch": 36.36, + "learning_rate": 3.03420485427795e-05, + "loss": 0.0603, + "step": 129330 + }, + { + "epoch": 36.37, + "learning_rate": 3.032330615687377e-05, + "loss": 0.0732, + "step": 129360 + }, + { + "epoch": 36.38, + "learning_rate": 3.0304563770968047e-05, + "loss": 0.0607, + "step": 129390 + }, + { + "epoch": 36.38, + "learning_rate": 3.0285821385062318e-05, + "loss": 0.068, + "step": 129420 + }, + { + "epoch": 36.39, + "learning_rate": 3.0267078999156595e-05, + "loss": 0.071, + "step": 129450 + }, + { + "epoch": 36.4, + "learning_rate": 3.0248336613250866e-05, + "loss": 0.0636, + "step": 129480 + }, + { + "epoch": 36.41, + "learning_rate": 3.0229594227345144e-05, + "loss": 0.0733, + "step": 129510 + }, + { + "epoch": 36.42, + "learning_rate": 3.0210851841439418e-05, + "loss": 0.0625, + "step": 129540 + }, + { + "epoch": 36.43, + "learning_rate": 3.019210945553369e-05, + "loss": 0.0689, + "step": 129570 + }, + { + "epoch": 36.44, + "learning_rate": 3.0173367069627966e-05, + "loss": 0.0715, + "step": 129600 + }, + { + "epoch": 36.44, + "learning_rate": 3.0154624683722237e-05, + "loss": 0.0599, + "step": 129630 + }, + { + "epoch": 36.45, + "learning_rate": 3.0135882297816515e-05, + "loss": 0.069, + "step": 129660 + }, + { + "epoch": 36.46, + "learning_rate": 3.0117139911910785e-05, + "loss": 0.0635, + "step": 129690 + }, + { + "epoch": 36.47, + "learning_rate": 3.0098397526005063e-05, + "loss": 0.0671, + "step": 129720 + }, + { + "epoch": 36.48, + "learning_rate": 3.0079655140099337e-05, + "loss": 0.0697, + "step": 129750 + }, + { + "epoch": 36.49, + "learning_rate": 3.006091275419361e-05, + "loss": 0.0637, + "step": 129780 + }, + { + "epoch": 36.49, + "learning_rate": 3.0042170368287886e-05, + "loss": 0.0708, + "step": 129810 + }, + { + "epoch": 36.5, + "learning_rate": 3.0023427982382156e-05, + "loss": 0.0637, + "step": 129840 + }, + { + "epoch": 36.51, + "learning_rate": 3.0004685596476434e-05, + "loss": 0.0671, + "step": 129870 + }, + { + "epoch": 36.52, + "learning_rate": 2.9985943210570705e-05, + "loss": 0.066, + "step": 129900 + }, + { + "epoch": 36.53, + "learning_rate": 2.9967200824664982e-05, + "loss": 0.0631, + "step": 129930 + }, + { + "epoch": 36.54, + "learning_rate": 2.9948458438759256e-05, + "loss": 0.0715, + "step": 129960 + }, + { + "epoch": 36.54, + "learning_rate": 2.992971605285353e-05, + "loss": 0.0615, + "step": 129990 + }, + { + "epoch": 36.55, + "learning_rate": 2.9910973666947805e-05, + "loss": 0.0705, + "step": 130020 + }, + { + "epoch": 36.56, + "learning_rate": 2.9892231281042076e-05, + "loss": 0.0685, + "step": 130050 + }, + { + "epoch": 36.57, + "learning_rate": 2.9873488895136353e-05, + "loss": 0.0622, + "step": 130080 + }, + { + "epoch": 36.58, + "learning_rate": 2.9854746509230624e-05, + "loss": 0.0738, + "step": 130110 + }, + { + "epoch": 36.59, + "learning_rate": 2.98360041233249e-05, + "loss": 0.0627, + "step": 130140 + }, + { + "epoch": 36.6, + "learning_rate": 2.981726173741918e-05, + "loss": 0.0689, + "step": 130170 + }, + { + "epoch": 36.6, + "learning_rate": 2.979851935151345e-05, + "loss": 0.0665, + "step": 130200 + }, + { + "epoch": 36.61, + "learning_rate": 2.9779776965607724e-05, + "loss": 0.0591, + "step": 130230 + }, + { + "epoch": 36.62, + "learning_rate": 2.9761034579701995e-05, + "loss": 0.071, + "step": 130260 + }, + { + "epoch": 36.63, + "learning_rate": 2.9742292193796273e-05, + "loss": 0.0637, + "step": 130290 + }, + { + "epoch": 36.64, + "learning_rate": 2.9723549807890543e-05, + "loss": 0.0668, + "step": 130320 + }, + { + "epoch": 36.65, + "learning_rate": 2.970480742198482e-05, + "loss": 0.073, + "step": 130350 + }, + { + "epoch": 36.65, + "learning_rate": 2.96860650360791e-05, + "loss": 0.0632, + "step": 130380 + }, + { + "epoch": 36.66, + "learning_rate": 2.966732265017337e-05, + "loss": 0.07, + "step": 130410 + }, + { + "epoch": 36.67, + "learning_rate": 2.9648580264267644e-05, + "loss": 0.0596, + "step": 130440 + }, + { + "epoch": 36.68, + "learning_rate": 2.9629837878361914e-05, + "loss": 0.0616, + "step": 130470 + }, + { + "epoch": 36.69, + "learning_rate": 2.9611095492456192e-05, + "loss": 0.0632, + "step": 130500 + }, + { + "epoch": 36.7, + "learning_rate": 2.9592353106550463e-05, + "loss": 0.0628, + "step": 130530 + }, + { + "epoch": 36.7, + "learning_rate": 2.957361072064474e-05, + "loss": 0.0701, + "step": 130560 + }, + { + "epoch": 36.71, + "learning_rate": 2.955486833473901e-05, + "loss": 0.0607, + "step": 130590 + }, + { + "epoch": 36.72, + "learning_rate": 2.953612594883329e-05, + "loss": 0.066, + "step": 130620 + }, + { + "epoch": 36.73, + "learning_rate": 2.9517383562927563e-05, + "loss": 0.068, + "step": 130650 + }, + { + "epoch": 36.74, + "learning_rate": 2.9498641177021834e-05, + "loss": 0.0609, + "step": 130680 + }, + { + "epoch": 36.75, + "learning_rate": 2.947989879111611e-05, + "loss": 0.0714, + "step": 130710 + }, + { + "epoch": 36.76, + "learning_rate": 2.9461156405210382e-05, + "loss": 0.0627, + "step": 130740 + }, + { + "epoch": 36.76, + "learning_rate": 2.944241401930466e-05, + "loss": 0.0624, + "step": 130770 + }, + { + "epoch": 36.77, + "learning_rate": 2.942367163339893e-05, + "loss": 0.071, + "step": 130800 + }, + { + "epoch": 36.78, + "learning_rate": 2.9404929247493208e-05, + "loss": 0.0633, + "step": 130830 + }, + { + "epoch": 36.79, + "learning_rate": 2.9386186861587482e-05, + "loss": 0.0703, + "step": 130860 + }, + { + "epoch": 36.8, + "learning_rate": 2.9367444475681753e-05, + "loss": 0.0596, + "step": 130890 + }, + { + "epoch": 36.81, + "learning_rate": 2.934870208977603e-05, + "loss": 0.0656, + "step": 130920 + }, + { + "epoch": 36.81, + "learning_rate": 2.93299597038703e-05, + "loss": 0.0622, + "step": 130950 + }, + { + "epoch": 36.82, + "learning_rate": 2.931121731796458e-05, + "loss": 0.0631, + "step": 130980 + }, + { + "epoch": 36.83, + "learning_rate": 2.929247493205885e-05, + "loss": 0.0717, + "step": 131010 + }, + { + "epoch": 36.84, + "learning_rate": 2.9273732546153127e-05, + "loss": 0.0582, + "step": 131040 + }, + { + "epoch": 36.85, + "learning_rate": 2.92549901602474e-05, + "loss": 0.0676, + "step": 131070 + }, + { + "epoch": 36.86, + "learning_rate": 2.9236247774341676e-05, + "loss": 0.0679, + "step": 131100 + }, + { + "epoch": 36.87, + "learning_rate": 2.921750538843595e-05, + "loss": 0.0596, + "step": 131130 + }, + { + "epoch": 36.87, + "learning_rate": 2.919876300253022e-05, + "loss": 0.0693, + "step": 131160 + }, + { + "epoch": 36.88, + "learning_rate": 2.9180020616624498e-05, + "loss": 0.0609, + "step": 131190 + }, + { + "epoch": 36.89, + "learning_rate": 2.916127823071877e-05, + "loss": 0.0664, + "step": 131220 + }, + { + "epoch": 36.9, + "learning_rate": 2.9142535844813047e-05, + "loss": 0.0642, + "step": 131250 + }, + { + "epoch": 36.91, + "learning_rate": 2.912379345890732e-05, + "loss": 0.0648, + "step": 131280 + }, + { + "epoch": 36.92, + "learning_rate": 2.9105051073001595e-05, + "loss": 0.0705, + "step": 131310 + }, + { + "epoch": 36.92, + "learning_rate": 2.908630868709587e-05, + "loss": 0.0584, + "step": 131340 + }, + { + "epoch": 36.93, + "learning_rate": 2.906756630119014e-05, + "loss": 0.0678, + "step": 131370 + }, + { + "epoch": 36.94, + "learning_rate": 2.9048823915284418e-05, + "loss": 0.073, + "step": 131400 + }, + { + "epoch": 36.95, + "learning_rate": 2.903008152937869e-05, + "loss": 0.0688, + "step": 131430 + }, + { + "epoch": 36.96, + "learning_rate": 2.9011339143472966e-05, + "loss": 0.0712, + "step": 131460 + }, + { + "epoch": 36.97, + "learning_rate": 2.8992596757567244e-05, + "loss": 0.0621, + "step": 131490 + }, + { + "epoch": 36.97, + "learning_rate": 2.8973854371661514e-05, + "loss": 0.066, + "step": 131520 + }, + { + "epoch": 36.98, + "learning_rate": 2.895511198575579e-05, + "loss": 0.0684, + "step": 131550 + }, + { + "epoch": 36.99, + "learning_rate": 2.893636959985006e-05, + "loss": 0.0656, + "step": 131580 + }, + { + "epoch": 37.0, + "eval_loss": 0.16971024870872498, + "eval_runtime": 512.0403, + "eval_samples_per_second": 31.312, + "eval_steps_per_second": 0.98, + "eval_wer": 0.1300888458231545, + "step": 131609 + }, + { + "epoch": 37.0, + "learning_rate": 2.8917627213944337e-05, + "loss": 0.0744, + "step": 131610 + }, + { + "epoch": 37.01, + "learning_rate": 2.8898884828038608e-05, + "loss": 0.0581, + "step": 131640 + }, + { + "epoch": 37.02, + "learning_rate": 2.8880142442132885e-05, + "loss": 0.0647, + "step": 131670 + }, + { + "epoch": 37.03, + "learning_rate": 2.8861400056227163e-05, + "loss": 0.0616, + "step": 131700 + }, + { + "epoch": 37.03, + "learning_rate": 2.8842657670321434e-05, + "loss": 0.0666, + "step": 131730 + }, + { + "epoch": 37.04, + "learning_rate": 2.8823915284415708e-05, + "loss": 0.0673, + "step": 131760 + }, + { + "epoch": 37.05, + "learning_rate": 2.880517289850998e-05, + "loss": 0.0608, + "step": 131790 + }, + { + "epoch": 37.06, + "learning_rate": 2.8786430512604256e-05, + "loss": 0.0646, + "step": 131820 + }, + { + "epoch": 37.07, + "learning_rate": 2.8767688126698527e-05, + "loss": 0.0618, + "step": 131850 + }, + { + "epoch": 37.08, + "learning_rate": 2.8749570486989665e-05, + "loss": 0.0658, + "step": 131880 + }, + { + "epoch": 37.08, + "learning_rate": 2.8730828101083935e-05, + "loss": 0.0694, + "step": 131910 + }, + { + "epoch": 37.09, + "learning_rate": 2.871208571517821e-05, + "loss": 0.0546, + "step": 131940 + }, + { + "epoch": 37.1, + "learning_rate": 2.869334332927248e-05, + "loss": 0.069, + "step": 131970 + }, + { + "epoch": 37.11, + "learning_rate": 2.8675225689563618e-05, + "loss": 0.0626, + "step": 132000 + }, + { + "epoch": 37.12, + "learning_rate": 2.865648330365789e-05, + "loss": 0.0661, + "step": 132030 + }, + { + "epoch": 37.13, + "learning_rate": 2.8637740917752166e-05, + "loss": 0.0661, + "step": 132060 + }, + { + "epoch": 37.14, + "learning_rate": 2.861899853184644e-05, + "loss": 0.055, + "step": 132090 + }, + { + "epoch": 37.14, + "learning_rate": 2.860025614594071e-05, + "loss": 0.0661, + "step": 132120 + }, + { + "epoch": 37.15, + "learning_rate": 2.858151376003499e-05, + "loss": 0.0613, + "step": 132150 + }, + { + "epoch": 37.16, + "learning_rate": 2.856277137412926e-05, + "loss": 0.068, + "step": 132180 + }, + { + "epoch": 37.17, + "learning_rate": 2.8544028988223537e-05, + "loss": 0.0707, + "step": 132210 + }, + { + "epoch": 37.18, + "learning_rate": 2.8525286602317808e-05, + "loss": 0.0566, + "step": 132240 + }, + { + "epoch": 37.19, + "learning_rate": 2.8506544216412086e-05, + "loss": 0.0651, + "step": 132270 + }, + { + "epoch": 37.19, + "learning_rate": 2.8487801830506357e-05, + "loss": 0.0643, + "step": 132300 + }, + { + "epoch": 37.2, + "learning_rate": 2.846905944460063e-05, + "loss": 0.0626, + "step": 132330 + }, + { + "epoch": 37.21, + "learning_rate": 2.845031705869491e-05, + "loss": 0.0681, + "step": 132360 + }, + { + "epoch": 37.22, + "learning_rate": 2.843157467278918e-05, + "loss": 0.0581, + "step": 132390 + }, + { + "epoch": 37.23, + "learning_rate": 2.8412832286883457e-05, + "loss": 0.0708, + "step": 132420 + }, + { + "epoch": 37.24, + "learning_rate": 2.8394089900977728e-05, + "loss": 0.0591, + "step": 132450 + }, + { + "epoch": 37.24, + "learning_rate": 2.8375347515072005e-05, + "loss": 0.0672, + "step": 132480 + }, + { + "epoch": 37.25, + "learning_rate": 2.8356605129166276e-05, + "loss": 0.0694, + "step": 132510 + }, + { + "epoch": 37.26, + "learning_rate": 2.833786274326055e-05, + "loss": 0.0558, + "step": 132540 + }, + { + "epoch": 37.27, + "learning_rate": 2.8319120357354828e-05, + "loss": 0.0692, + "step": 132570 + }, + { + "epoch": 37.28, + "learning_rate": 2.83003779714491e-05, + "loss": 0.0627, + "step": 132600 + }, + { + "epoch": 37.29, + "learning_rate": 2.8281635585543376e-05, + "loss": 0.0657, + "step": 132630 + }, + { + "epoch": 37.3, + "learning_rate": 2.8262893199637647e-05, + "loss": 0.0702, + "step": 132660 + }, + { + "epoch": 37.3, + "learning_rate": 2.8244150813731924e-05, + "loss": 0.0574, + "step": 132690 + }, + { + "epoch": 37.31, + "learning_rate": 2.8225408427826195e-05, + "loss": 0.072, + "step": 132720 + }, + { + "epoch": 37.32, + "learning_rate": 2.820666604192047e-05, + "loss": 0.0657, + "step": 132750 + }, + { + "epoch": 37.33, + "learning_rate": 2.8187923656014747e-05, + "loss": 0.066, + "step": 132780 + }, + { + "epoch": 37.34, + "learning_rate": 2.8169181270109018e-05, + "loss": 0.0695, + "step": 132810 + }, + { + "epoch": 37.35, + "learning_rate": 2.8150438884203295e-05, + "loss": 0.0594, + "step": 132840 + }, + { + "epoch": 37.35, + "learning_rate": 2.8131696498297566e-05, + "loss": 0.0709, + "step": 132870 + }, + { + "epoch": 37.36, + "learning_rate": 2.8112954112391844e-05, + "loss": 0.0587, + "step": 132900 + }, + { + "epoch": 37.37, + "learning_rate": 2.8094211726486115e-05, + "loss": 0.0699, + "step": 132930 + }, + { + "epoch": 37.38, + "learning_rate": 2.807546934058039e-05, + "loss": 0.0726, + "step": 132960 + }, + { + "epoch": 37.39, + "learning_rate": 2.8056726954674666e-05, + "loss": 0.0552, + "step": 132990 + }, + { + "epoch": 37.4, + "learning_rate": 2.8037984568768937e-05, + "loss": 0.0686, + "step": 133020 + }, + { + "epoch": 37.41, + "learning_rate": 2.8019242182863215e-05, + "loss": 0.061, + "step": 133050 + }, + { + "epoch": 37.41, + "learning_rate": 2.8000499796957486e-05, + "loss": 0.0668, + "step": 133080 + }, + { + "epoch": 37.42, + "learning_rate": 2.7981757411051763e-05, + "loss": 0.0683, + "step": 133110 + }, + { + "epoch": 37.43, + "learning_rate": 2.7963015025146034e-05, + "loss": 0.0578, + "step": 133140 + }, + { + "epoch": 37.44, + "learning_rate": 2.7944272639240308e-05, + "loss": 0.0715, + "step": 133170 + }, + { + "epoch": 37.45, + "learning_rate": 2.7925530253334586e-05, + "loss": 0.0643, + "step": 133200 + }, + { + "epoch": 37.46, + "learning_rate": 2.7906787867428857e-05, + "loss": 0.0645, + "step": 133230 + }, + { + "epoch": 37.46, + "learning_rate": 2.7888045481523134e-05, + "loss": 0.0698, + "step": 133260 + }, + { + "epoch": 37.47, + "learning_rate": 2.7869303095617405e-05, + "loss": 0.0554, + "step": 133290 + }, + { + "epoch": 37.48, + "learning_rate": 2.7850560709711682e-05, + "loss": 0.0722, + "step": 133320 + }, + { + "epoch": 37.49, + "learning_rate": 2.7831818323805953e-05, + "loss": 0.0607, + "step": 133350 + }, + { + "epoch": 37.5, + "learning_rate": 2.781307593790023e-05, + "loss": 0.0681, + "step": 133380 + }, + { + "epoch": 37.51, + "learning_rate": 2.7794333551994505e-05, + "loss": 0.0677, + "step": 133410 + }, + { + "epoch": 37.51, + "learning_rate": 2.7775591166088776e-05, + "loss": 0.0576, + "step": 133440 + }, + { + "epoch": 37.52, + "learning_rate": 2.7756848780183053e-05, + "loss": 0.0652, + "step": 133470 + }, + { + "epoch": 37.53, + "learning_rate": 2.7738106394277324e-05, + "loss": 0.0607, + "step": 133500 + }, + { + "epoch": 37.54, + "learning_rate": 2.7719364008371602e-05, + "loss": 0.0645, + "step": 133530 + }, + { + "epoch": 37.55, + "learning_rate": 2.7700621622465873e-05, + "loss": 0.0672, + "step": 133560 + }, + { + "epoch": 37.56, + "learning_rate": 2.768187923656015e-05, + "loss": 0.0513, + "step": 133590 + }, + { + "epoch": 37.57, + "learning_rate": 2.7663136850654424e-05, + "loss": 0.0654, + "step": 133620 + }, + { + "epoch": 37.57, + "learning_rate": 2.7644394464748695e-05, + "loss": 0.0584, + "step": 133650 + }, + { + "epoch": 37.58, + "learning_rate": 2.7625652078842973e-05, + "loss": 0.0637, + "step": 133680 + }, + { + "epoch": 37.59, + "learning_rate": 2.7606909692937244e-05, + "loss": 0.071, + "step": 133710 + }, + { + "epoch": 37.6, + "learning_rate": 2.758816730703152e-05, + "loss": 0.0593, + "step": 133740 + }, + { + "epoch": 37.61, + "learning_rate": 2.7569424921125792e-05, + "loss": 0.0717, + "step": 133770 + }, + { + "epoch": 37.62, + "learning_rate": 2.755068253522007e-05, + "loss": 0.0621, + "step": 133800 + }, + { + "epoch": 37.62, + "learning_rate": 2.7531940149314344e-05, + "loss": 0.0652, + "step": 133830 + }, + { + "epoch": 37.63, + "learning_rate": 2.7513197763408615e-05, + "loss": 0.0706, + "step": 133860 + }, + { + "epoch": 37.64, + "learning_rate": 2.7494455377502892e-05, + "loss": 0.0557, + "step": 133890 + }, + { + "epoch": 37.65, + "learning_rate": 2.7475712991597163e-05, + "loss": 0.0712, + "step": 133920 + }, + { + "epoch": 37.66, + "learning_rate": 2.745697060569144e-05, + "loss": 0.0629, + "step": 133950 + }, + { + "epoch": 37.67, + "learning_rate": 2.743822821978571e-05, + "loss": 0.0655, + "step": 133980 + }, + { + "epoch": 37.67, + "learning_rate": 2.741948583387999e-05, + "loss": 0.0706, + "step": 134010 + }, + { + "epoch": 37.68, + "learning_rate": 2.7400743447974263e-05, + "loss": 0.06, + "step": 134040 + }, + { + "epoch": 37.69, + "learning_rate": 2.7382001062068534e-05, + "loss": 0.07, + "step": 134070 + }, + { + "epoch": 37.7, + "learning_rate": 2.736325867616281e-05, + "loss": 0.0618, + "step": 134100 + }, + { + "epoch": 37.71, + "learning_rate": 2.7344516290257082e-05, + "loss": 0.0618, + "step": 134130 + }, + { + "epoch": 37.72, + "learning_rate": 2.732577390435136e-05, + "loss": 0.0699, + "step": 134160 + }, + { + "epoch": 37.73, + "learning_rate": 2.730703151844563e-05, + "loss": 0.0592, + "step": 134190 + }, + { + "epoch": 37.73, + "learning_rate": 2.7288289132539908e-05, + "loss": 0.0712, + "step": 134220 + }, + { + "epoch": 37.74, + "learning_rate": 2.7269546746634182e-05, + "loss": 0.0622, + "step": 134250 + }, + { + "epoch": 37.75, + "learning_rate": 2.7250804360728453e-05, + "loss": 0.0662, + "step": 134280 + }, + { + "epoch": 37.76, + "learning_rate": 2.723206197482273e-05, + "loss": 0.0715, + "step": 134310 + }, + { + "epoch": 37.77, + "learning_rate": 2.7213319588917e-05, + "loss": 0.0597, + "step": 134340 + }, + { + "epoch": 37.78, + "learning_rate": 2.719457720301128e-05, + "loss": 0.0687, + "step": 134370 + }, + { + "epoch": 37.78, + "learning_rate": 2.717583481710555e-05, + "loss": 0.063, + "step": 134400 + }, + { + "epoch": 37.79, + "learning_rate": 2.7157092431199828e-05, + "loss": 0.0663, + "step": 134430 + }, + { + "epoch": 37.8, + "learning_rate": 2.7138350045294102e-05, + "loss": 0.0702, + "step": 134460 + }, + { + "epoch": 37.81, + "learning_rate": 2.7119607659388373e-05, + "loss": 0.0579, + "step": 134490 + }, + { + "epoch": 37.82, + "learning_rate": 2.710086527348265e-05, + "loss": 0.0695, + "step": 134520 + }, + { + "epoch": 37.83, + "learning_rate": 2.708212288757692e-05, + "loss": 0.0628, + "step": 134550 + }, + { + "epoch": 37.84, + "learning_rate": 2.70633805016712e-05, + "loss": 0.0642, + "step": 134580 + }, + { + "epoch": 37.84, + "learning_rate": 2.704463811576547e-05, + "loss": 0.0705, + "step": 134610 + }, + { + "epoch": 37.85, + "learning_rate": 2.7025895729859747e-05, + "loss": 0.0566, + "step": 134640 + }, + { + "epoch": 37.86, + "learning_rate": 2.700715334395402e-05, + "loss": 0.0691, + "step": 134670 + }, + { + "epoch": 37.87, + "learning_rate": 2.6988410958048295e-05, + "loss": 0.061, + "step": 134700 + }, + { + "epoch": 37.88, + "learning_rate": 2.696966857214257e-05, + "loss": 0.0641, + "step": 134730 + }, + { + "epoch": 37.89, + "learning_rate": 2.695092618623684e-05, + "loss": 0.0707, + "step": 134760 + }, + { + "epoch": 37.89, + "learning_rate": 2.6932183800331118e-05, + "loss": 0.0619, + "step": 134790 + }, + { + "epoch": 37.9, + "learning_rate": 2.691344141442539e-05, + "loss": 0.0681, + "step": 134820 + }, + { + "epoch": 37.91, + "learning_rate": 2.6894699028519666e-05, + "loss": 0.0629, + "step": 134850 + }, + { + "epoch": 37.92, + "learning_rate": 2.687595664261394e-05, + "loss": 0.0627, + "step": 134880 + }, + { + "epoch": 37.93, + "learning_rate": 2.6857214256708215e-05, + "loss": 0.0701, + "step": 134910 + }, + { + "epoch": 37.94, + "learning_rate": 2.683847187080249e-05, + "loss": 0.0587, + "step": 134940 + }, + { + "epoch": 37.94, + "learning_rate": 2.681972948489676e-05, + "loss": 0.0652, + "step": 134970 + }, + { + "epoch": 37.95, + "learning_rate": 2.6800987098991037e-05, + "loss": 0.0597, + "step": 135000 + }, + { + "epoch": 37.96, + "learning_rate": 2.6782244713085308e-05, + "loss": 0.0651, + "step": 135030 + }, + { + "epoch": 37.97, + "learning_rate": 2.6763502327179586e-05, + "loss": 0.0755, + "step": 135060 + }, + { + "epoch": 37.98, + "learning_rate": 2.6744759941273863e-05, + "loss": 0.0553, + "step": 135090 + }, + { + "epoch": 37.99, + "learning_rate": 2.6726017555368134e-05, + "loss": 0.0671, + "step": 135120 + }, + { + "epoch": 38.0, + "learning_rate": 2.6707275169462408e-05, + "loss": 0.0643, + "step": 135150 + }, + { + "epoch": 38.0, + "eval_loss": 0.17159442603588104, + "eval_runtime": 506.1667, + "eval_samples_per_second": 31.675, + "eval_steps_per_second": 0.992, + "eval_wer": 0.1278642883463213, + "step": 135166 + }, + { + "epoch": 38.0, + "learning_rate": 2.668853278355668e-05, + "loss": 0.0666, + "step": 135180 + }, + { + "epoch": 38.01, + "learning_rate": 2.6669790397650956e-05, + "loss": 0.0625, + "step": 135210 + }, + { + "epoch": 38.02, + "learning_rate": 2.6651048011745227e-05, + "loss": 0.0608, + "step": 135240 + }, + { + "epoch": 38.03, + "learning_rate": 2.6632305625839505e-05, + "loss": 0.0697, + "step": 135270 + }, + { + "epoch": 38.04, + "learning_rate": 2.6613563239933782e-05, + "loss": 0.057, + "step": 135300 + }, + { + "epoch": 38.05, + "learning_rate": 2.6594820854028053e-05, + "loss": 0.066, + "step": 135330 + }, + { + "epoch": 38.05, + "learning_rate": 2.6576078468122327e-05, + "loss": 0.0618, + "step": 135360 + }, + { + "epoch": 38.06, + "learning_rate": 2.6557336082216598e-05, + "loss": 0.0627, + "step": 135390 + }, + { + "epoch": 38.07, + "learning_rate": 2.6538593696310876e-05, + "loss": 0.0692, + "step": 135420 + }, + { + "epoch": 38.08, + "learning_rate": 2.6519851310405147e-05, + "loss": 0.0555, + "step": 135450 + }, + { + "epoch": 38.09, + "learning_rate": 2.6501108924499424e-05, + "loss": 0.0611, + "step": 135480 + }, + { + "epoch": 38.1, + "learning_rate": 2.6482366538593702e-05, + "loss": 0.0603, + "step": 135510 + }, + { + "epoch": 38.11, + "learning_rate": 2.6463624152687973e-05, + "loss": 0.0618, + "step": 135540 + }, + { + "epoch": 38.11, + "learning_rate": 2.6444881766782247e-05, + "loss": 0.0688, + "step": 135570 + }, + { + "epoch": 38.12, + "learning_rate": 2.6426139380876518e-05, + "loss": 0.0591, + "step": 135600 + }, + { + "epoch": 38.13, + "learning_rate": 2.6407396994970795e-05, + "loss": 0.0661, + "step": 135630 + }, + { + "epoch": 38.14, + "learning_rate": 2.6388654609065066e-05, + "loss": 0.0619, + "step": 135660 + }, + { + "epoch": 38.15, + "learning_rate": 2.6369912223159344e-05, + "loss": 0.0609, + "step": 135690 + }, + { + "epoch": 38.16, + "learning_rate": 2.6351169837253614e-05, + "loss": 0.0686, + "step": 135720 + }, + { + "epoch": 38.16, + "learning_rate": 2.6332427451347892e-05, + "loss": 0.0557, + "step": 135750 + }, + { + "epoch": 38.17, + "learning_rate": 2.6313685065442166e-05, + "loss": 0.0644, + "step": 135780 + }, + { + "epoch": 38.18, + "learning_rate": 2.6294942679536437e-05, + "loss": 0.0611, + "step": 135810 + }, + { + "epoch": 38.19, + "learning_rate": 2.6276200293630714e-05, + "loss": 0.0602, + "step": 135840 + }, + { + "epoch": 38.2, + "learning_rate": 2.6257457907724985e-05, + "loss": 0.0695, + "step": 135870 + }, + { + "epoch": 38.21, + "learning_rate": 2.6238715521819263e-05, + "loss": 0.0559, + "step": 135900 + }, + { + "epoch": 38.21, + "learning_rate": 2.6219973135913534e-05, + "loss": 0.0652, + "step": 135930 + }, + { + "epoch": 38.22, + "learning_rate": 2.620123075000781e-05, + "loss": 0.0596, + "step": 135960 + }, + { + "epoch": 38.23, + "learning_rate": 2.6182488364102085e-05, + "loss": 0.0575, + "step": 135990 + }, + { + "epoch": 38.24, + "learning_rate": 2.6163745978196356e-05, + "loss": 0.07, + "step": 136020 + }, + { + "epoch": 38.25, + "learning_rate": 2.6145003592290634e-05, + "loss": 0.0574, + "step": 136050 + }, + { + "epoch": 38.26, + "learning_rate": 2.6126261206384905e-05, + "loss": 0.0678, + "step": 136080 + }, + { + "epoch": 38.27, + "learning_rate": 2.6107518820479182e-05, + "loss": 0.0615, + "step": 136110 + }, + { + "epoch": 38.27, + "learning_rate": 2.6088776434573453e-05, + "loss": 0.0627, + "step": 136140 + }, + { + "epoch": 38.28, + "learning_rate": 2.607003404866773e-05, + "loss": 0.068, + "step": 136170 + }, + { + "epoch": 38.29, + "learning_rate": 2.6051291662762005e-05, + "loss": 0.0536, + "step": 136200 + }, + { + "epoch": 38.3, + "learning_rate": 2.603254927685628e-05, + "loss": 0.0641, + "step": 136230 + }, + { + "epoch": 38.31, + "learning_rate": 2.6013806890950553e-05, + "loss": 0.0609, + "step": 136260 + }, + { + "epoch": 38.32, + "learning_rate": 2.5995064505044824e-05, + "loss": 0.0607, + "step": 136290 + }, + { + "epoch": 38.32, + "learning_rate": 2.59763221191391e-05, + "loss": 0.0664, + "step": 136320 + }, + { + "epoch": 38.33, + "learning_rate": 2.5957579733233372e-05, + "loss": 0.0577, + "step": 136350 + }, + { + "epoch": 38.34, + "learning_rate": 2.593883734732765e-05, + "loss": 0.0637, + "step": 136380 + }, + { + "epoch": 38.35, + "learning_rate": 2.5920094961421924e-05, + "loss": 0.0601, + "step": 136410 + }, + { + "epoch": 38.36, + "learning_rate": 2.5901352575516198e-05, + "loss": 0.0567, + "step": 136440 + }, + { + "epoch": 38.37, + "learning_rate": 2.5882610189610472e-05, + "loss": 0.0659, + "step": 136470 + }, + { + "epoch": 38.37, + "learning_rate": 2.5863867803704743e-05, + "loss": 0.0586, + "step": 136500 + }, + { + "epoch": 38.38, + "learning_rate": 2.584512541779902e-05, + "loss": 0.07, + "step": 136530 + }, + { + "epoch": 38.39, + "learning_rate": 2.582638303189329e-05, + "loss": 0.062, + "step": 136560 + }, + { + "epoch": 38.4, + "learning_rate": 2.580764064598757e-05, + "loss": 0.0627, + "step": 136590 + }, + { + "epoch": 38.41, + "learning_rate": 2.5788898260081847e-05, + "loss": 0.0653, + "step": 136620 + }, + { + "epoch": 38.42, + "learning_rate": 2.5770155874176118e-05, + "loss": 0.0578, + "step": 136650 + }, + { + "epoch": 38.43, + "learning_rate": 2.5751413488270392e-05, + "loss": 0.0665, + "step": 136680 + }, + { + "epoch": 38.43, + "learning_rate": 2.5732671102364663e-05, + "loss": 0.0635, + "step": 136710 + }, + { + "epoch": 38.44, + "learning_rate": 2.571392871645894e-05, + "loss": 0.0629, + "step": 136740 + }, + { + "epoch": 38.45, + "learning_rate": 2.569518633055321e-05, + "loss": 0.0676, + "step": 136770 + }, + { + "epoch": 38.46, + "learning_rate": 2.567644394464749e-05, + "loss": 0.0621, + "step": 136800 + }, + { + "epoch": 38.47, + "learning_rate": 2.5657701558741766e-05, + "loss": 0.0614, + "step": 136830 + }, + { + "epoch": 38.48, + "learning_rate": 2.5638959172836037e-05, + "loss": 0.0633, + "step": 136860 + }, + { + "epoch": 38.48, + "learning_rate": 2.562021678693031e-05, + "loss": 0.0576, + "step": 136890 + }, + { + "epoch": 38.49, + "learning_rate": 2.5601474401024582e-05, + "loss": 0.0681, + "step": 136920 + }, + { + "epoch": 38.5, + "learning_rate": 2.558273201511886e-05, + "loss": 0.0561, + "step": 136950 + }, + { + "epoch": 38.51, + "learning_rate": 2.556398962921313e-05, + "loss": 0.0658, + "step": 136980 + }, + { + "epoch": 38.52, + "learning_rate": 2.5545247243307408e-05, + "loss": 0.061, + "step": 137010 + }, + { + "epoch": 38.53, + "learning_rate": 2.5526504857401686e-05, + "loss": 0.0622, + "step": 137040 + }, + { + "epoch": 38.54, + "learning_rate": 2.5507762471495956e-05, + "loss": 0.0692, + "step": 137070 + }, + { + "epoch": 38.54, + "learning_rate": 2.548902008559023e-05, + "loss": 0.0578, + "step": 137100 + }, + { + "epoch": 38.55, + "learning_rate": 2.54702776996845e-05, + "loss": 0.0665, + "step": 137130 + }, + { + "epoch": 38.56, + "learning_rate": 2.545153531377878e-05, + "loss": 0.0652, + "step": 137160 + }, + { + "epoch": 38.57, + "learning_rate": 2.543279292787305e-05, + "loss": 0.0628, + "step": 137190 + }, + { + "epoch": 38.58, + "learning_rate": 2.5414050541967327e-05, + "loss": 0.0734, + "step": 137220 + }, + { + "epoch": 38.59, + "learning_rate": 2.5395308156061605e-05, + "loss": 0.0568, + "step": 137250 + }, + { + "epoch": 38.59, + "learning_rate": 2.5376565770155876e-05, + "loss": 0.0678, + "step": 137280 + }, + { + "epoch": 38.6, + "learning_rate": 2.535782338425015e-05, + "loss": 0.0592, + "step": 137310 + }, + { + "epoch": 38.61, + "learning_rate": 2.533908099834442e-05, + "loss": 0.0614, + "step": 137340 + }, + { + "epoch": 38.62, + "learning_rate": 2.5320338612438698e-05, + "loss": 0.0709, + "step": 137370 + }, + { + "epoch": 38.63, + "learning_rate": 2.530159622653297e-05, + "loss": 0.0609, + "step": 137400 + }, + { + "epoch": 38.64, + "learning_rate": 2.5282853840627247e-05, + "loss": 0.0657, + "step": 137430 + }, + { + "epoch": 38.64, + "learning_rate": 2.5264111454721524e-05, + "loss": 0.0652, + "step": 137460 + }, + { + "epoch": 38.65, + "learning_rate": 2.5245369068815795e-05, + "loss": 0.0643, + "step": 137490 + }, + { + "epoch": 38.66, + "learning_rate": 2.522662668291007e-05, + "loss": 0.0734, + "step": 137520 + }, + { + "epoch": 38.67, + "learning_rate": 2.520788429700434e-05, + "loss": 0.0602, + "step": 137550 + }, + { + "epoch": 38.68, + "learning_rate": 2.5189141911098618e-05, + "loss": 0.0645, + "step": 137580 + }, + { + "epoch": 38.69, + "learning_rate": 2.517039952519289e-05, + "loss": 0.0608, + "step": 137610 + }, + { + "epoch": 38.7, + "learning_rate": 2.5151657139287166e-05, + "loss": 0.0623, + "step": 137640 + }, + { + "epoch": 38.7, + "learning_rate": 2.5132914753381444e-05, + "loss": 0.0656, + "step": 137670 + }, + { + "epoch": 38.71, + "learning_rate": 2.5114172367475714e-05, + "loss": 0.0556, + "step": 137700 + }, + { + "epoch": 38.72, + "learning_rate": 2.509542998156999e-05, + "loss": 0.0627, + "step": 137730 + }, + { + "epoch": 38.73, + "learning_rate": 2.5076687595664263e-05, + "loss": 0.0622, + "step": 137760 + }, + { + "epoch": 38.74, + "learning_rate": 2.5057945209758537e-05, + "loss": 0.0634, + "step": 137790 + }, + { + "epoch": 38.75, + "learning_rate": 2.5039202823852808e-05, + "loss": 0.0677, + "step": 137820 + }, + { + "epoch": 38.75, + "learning_rate": 2.5020460437947085e-05, + "loss": 0.0546, + "step": 137850 + }, + { + "epoch": 38.76, + "learning_rate": 2.5001718052041363e-05, + "loss": 0.0666, + "step": 137880 + }, + { + "epoch": 38.77, + "learning_rate": 2.4982975666135634e-05, + "loss": 0.061, + "step": 137910 + }, + { + "epoch": 38.78, + "learning_rate": 2.4964233280229908e-05, + "loss": 0.0638, + "step": 137940 + }, + { + "epoch": 38.79, + "learning_rate": 2.4945490894324182e-05, + "loss": 0.0704, + "step": 137970 + }, + { + "epoch": 38.8, + "learning_rate": 2.4926748508418456e-05, + "loss": 0.0535, + "step": 138000 + }, + { + "epoch": 38.81, + "learning_rate": 2.4908630868709587e-05, + "loss": 0.0662, + "step": 138030 + }, + { + "epoch": 38.81, + "learning_rate": 2.488988848280386e-05, + "loss": 0.0658, + "step": 138060 + }, + { + "epoch": 38.82, + "learning_rate": 2.487114609689814e-05, + "loss": 0.0631, + "step": 138090 + }, + { + "epoch": 38.83, + "learning_rate": 2.485240371099241e-05, + "loss": 0.0691, + "step": 138120 + }, + { + "epoch": 38.84, + "learning_rate": 2.4833661325086684e-05, + "loss": 0.058, + "step": 138150 + }, + { + "epoch": 38.85, + "learning_rate": 2.4814918939180958e-05, + "loss": 0.07, + "step": 138180 + }, + { + "epoch": 38.86, + "learning_rate": 2.4796176553275232e-05, + "loss": 0.0663, + "step": 138210 + }, + { + "epoch": 38.86, + "learning_rate": 2.4777434167369506e-05, + "loss": 0.0623, + "step": 138240 + }, + { + "epoch": 38.87, + "learning_rate": 2.475869178146378e-05, + "loss": 0.0784, + "step": 138270 + }, + { + "epoch": 38.88, + "learning_rate": 2.4739949395558058e-05, + "loss": 0.0632, + "step": 138300 + }, + { + "epoch": 38.89, + "learning_rate": 2.4721207009652332e-05, + "loss": 0.0666, + "step": 138330 + }, + { + "epoch": 38.9, + "learning_rate": 2.4702464623746603e-05, + "loss": 0.0645, + "step": 138360 + }, + { + "epoch": 38.91, + "learning_rate": 2.4683722237840877e-05, + "loss": 0.0616, + "step": 138390 + }, + { + "epoch": 38.91, + "learning_rate": 2.466497985193515e-05, + "loss": 0.07, + "step": 138420 + }, + { + "epoch": 38.92, + "learning_rate": 2.4646237466029426e-05, + "loss": 0.0581, + "step": 138450 + }, + { + "epoch": 38.93, + "learning_rate": 2.46274950801237e-05, + "loss": 0.0619, + "step": 138480 + }, + { + "epoch": 38.94, + "learning_rate": 2.4608752694217977e-05, + "loss": 0.0605, + "step": 138510 + }, + { + "epoch": 38.95, + "learning_rate": 2.459001030831225e-05, + "loss": 0.0621, + "step": 138540 + }, + { + "epoch": 38.96, + "learning_rate": 2.4571267922406522e-05, + "loss": 0.068, + "step": 138570 + }, + { + "epoch": 38.97, + "learning_rate": 2.4552525536500797e-05, + "loss": 0.054, + "step": 138600 + }, + { + "epoch": 38.97, + "learning_rate": 2.453378315059507e-05, + "loss": 0.0649, + "step": 138630 + }, + { + "epoch": 38.98, + "learning_rate": 2.4515040764689345e-05, + "loss": 0.0632, + "step": 138660 + }, + { + "epoch": 38.99, + "learning_rate": 2.449629837878362e-05, + "loss": 0.0639, + "step": 138690 + }, + { + "epoch": 39.0, + "learning_rate": 2.4477555992877897e-05, + "loss": 0.0683, + "step": 138720 + }, + { + "epoch": 39.0, + "eval_loss": 0.17769518494606018, + "eval_runtime": 505.9269, + "eval_samples_per_second": 31.69, + "eval_steps_per_second": 0.992, + "eval_wer": 0.12791205491790975, + "step": 138723 + }, + { + "epoch": 39.01, + "learning_rate": 2.445881360697217e-05, + "loss": 0.056, + "step": 138750 + }, + { + "epoch": 39.02, + "learning_rate": 2.4440071221066442e-05, + "loss": 0.0672, + "step": 138780 + }, + { + "epoch": 39.02, + "learning_rate": 2.4421328835160716e-05, + "loss": 0.0538, + "step": 138810 + }, + { + "epoch": 39.03, + "learning_rate": 2.440258644925499e-05, + "loss": 0.0613, + "step": 138840 + }, + { + "epoch": 39.04, + "learning_rate": 2.4383844063349264e-05, + "loss": 0.0664, + "step": 138870 + }, + { + "epoch": 39.05, + "learning_rate": 2.436510167744354e-05, + "loss": 0.0597, + "step": 138900 + }, + { + "epoch": 39.06, + "learning_rate": 2.4346984037734673e-05, + "loss": 0.0637, + "step": 138930 + }, + { + "epoch": 39.07, + "learning_rate": 2.4328241651828944e-05, + "loss": 0.0584, + "step": 138960 + }, + { + "epoch": 39.08, + "learning_rate": 2.4309499265923218e-05, + "loss": 0.0651, + "step": 138990 + }, + { + "epoch": 39.08, + "learning_rate": 2.4290756880017492e-05, + "loss": 0.0643, + "step": 139020 + }, + { + "epoch": 39.09, + "learning_rate": 2.427201449411177e-05, + "loss": 0.06, + "step": 139050 + }, + { + "epoch": 39.1, + "learning_rate": 2.4253272108206044e-05, + "loss": 0.0657, + "step": 139080 + }, + { + "epoch": 39.11, + "learning_rate": 2.4234529722300318e-05, + "loss": 0.0607, + "step": 139110 + }, + { + "epoch": 39.12, + "learning_rate": 2.4215787336394592e-05, + "loss": 0.0648, + "step": 139140 + }, + { + "epoch": 39.13, + "learning_rate": 2.4197044950488866e-05, + "loss": 0.0618, + "step": 139170 + }, + { + "epoch": 39.13, + "learning_rate": 2.4178302564583137e-05, + "loss": 0.0586, + "step": 139200 + }, + { + "epoch": 39.14, + "learning_rate": 2.415956017867741e-05, + "loss": 0.0662, + "step": 139230 + }, + { + "epoch": 39.15, + "learning_rate": 2.414081779277169e-05, + "loss": 0.0581, + "step": 139260 + }, + { + "epoch": 39.16, + "learning_rate": 2.4122075406865963e-05, + "loss": 0.0647, + "step": 139290 + }, + { + "epoch": 39.17, + "learning_rate": 2.4103333020960237e-05, + "loss": 0.0656, + "step": 139320 + }, + { + "epoch": 39.18, + "learning_rate": 2.408459063505451e-05, + "loss": 0.0591, + "step": 139350 + }, + { + "epoch": 39.18, + "learning_rate": 2.4065848249148786e-05, + "loss": 0.069, + "step": 139380 + }, + { + "epoch": 39.19, + "learning_rate": 2.4047105863243056e-05, + "loss": 0.0589, + "step": 139410 + }, + { + "epoch": 39.2, + "learning_rate": 2.402836347733733e-05, + "loss": 0.0607, + "step": 139440 + }, + { + "epoch": 39.21, + "learning_rate": 2.4009621091431608e-05, + "loss": 0.062, + "step": 139470 + }, + { + "epoch": 39.22, + "learning_rate": 2.3990878705525882e-05, + "loss": 0.0585, + "step": 139500 + }, + { + "epoch": 39.23, + "learning_rate": 2.3972136319620157e-05, + "loss": 0.0688, + "step": 139530 + }, + { + "epoch": 39.24, + "learning_rate": 2.395339393371443e-05, + "loss": 0.0581, + "step": 139560 + }, + { + "epoch": 39.24, + "learning_rate": 2.3934651547808705e-05, + "loss": 0.0714, + "step": 139590 + }, + { + "epoch": 39.25, + "learning_rate": 2.3915909161902976e-05, + "loss": 0.062, + "step": 139620 + }, + { + "epoch": 39.26, + "learning_rate": 2.389716677599725e-05, + "loss": 0.0565, + "step": 139650 + }, + { + "epoch": 39.27, + "learning_rate": 2.3878424390091528e-05, + "loss": 0.0726, + "step": 139680 + }, + { + "epoch": 39.28, + "learning_rate": 2.3859682004185802e-05, + "loss": 0.056, + "step": 139710 + }, + { + "epoch": 39.29, + "learning_rate": 2.3840939618280076e-05, + "loss": 0.0601, + "step": 139740 + }, + { + "epoch": 39.29, + "learning_rate": 2.382219723237435e-05, + "loss": 0.0627, + "step": 139770 + }, + { + "epoch": 39.3, + "learning_rate": 2.3803454846468624e-05, + "loss": 0.0603, + "step": 139800 + }, + { + "epoch": 39.31, + "learning_rate": 2.37847124605629e-05, + "loss": 0.0623, + "step": 139830 + }, + { + "epoch": 39.32, + "learning_rate": 2.376597007465717e-05, + "loss": 0.0577, + "step": 139860 + }, + { + "epoch": 39.33, + "learning_rate": 2.3747227688751447e-05, + "loss": 0.0633, + "step": 139890 + }, + { + "epoch": 39.34, + "learning_rate": 2.372848530284572e-05, + "loss": 0.0645, + "step": 139920 + }, + { + "epoch": 39.34, + "learning_rate": 2.3709742916939995e-05, + "loss": 0.0568, + "step": 139950 + }, + { + "epoch": 39.35, + "learning_rate": 2.369100053103427e-05, + "loss": 0.0637, + "step": 139980 + }, + { + "epoch": 39.36, + "learning_rate": 2.3672258145128544e-05, + "loss": 0.0589, + "step": 140010 + }, + { + "epoch": 39.37, + "learning_rate": 2.3653515759222818e-05, + "loss": 0.0617, + "step": 140040 + }, + { + "epoch": 39.38, + "learning_rate": 2.363477337331709e-05, + "loss": 0.0622, + "step": 140070 + }, + { + "epoch": 39.39, + "learning_rate": 2.3616030987411363e-05, + "loss": 0.0591, + "step": 140100 + }, + { + "epoch": 39.4, + "learning_rate": 2.359728860150564e-05, + "loss": 0.0652, + "step": 140130 + }, + { + "epoch": 39.4, + "learning_rate": 2.3578546215599915e-05, + "loss": 0.059, + "step": 140160 + }, + { + "epoch": 39.41, + "learning_rate": 2.355980382969419e-05, + "loss": 0.0647, + "step": 140190 + }, + { + "epoch": 39.42, + "learning_rate": 2.3541061443788463e-05, + "loss": 0.0638, + "step": 140220 + }, + { + "epoch": 39.43, + "learning_rate": 2.3522319057882737e-05, + "loss": 0.0575, + "step": 140250 + }, + { + "epoch": 39.44, + "learning_rate": 2.3503576671977008e-05, + "loss": 0.0632, + "step": 140280 + }, + { + "epoch": 39.45, + "learning_rate": 2.3484834286071282e-05, + "loss": 0.0602, + "step": 140310 + }, + { + "epoch": 39.45, + "learning_rate": 2.346609190016556e-05, + "loss": 0.0621, + "step": 140340 + }, + { + "epoch": 39.46, + "learning_rate": 2.3447349514259834e-05, + "loss": 0.0629, + "step": 140370 + }, + { + "epoch": 39.47, + "learning_rate": 2.3428607128354108e-05, + "loss": 0.0601, + "step": 140400 + }, + { + "epoch": 39.48, + "learning_rate": 2.3409864742448382e-05, + "loss": 0.0647, + "step": 140430 + }, + { + "epoch": 39.49, + "learning_rate": 2.3391122356542656e-05, + "loss": 0.058, + "step": 140460 + }, + { + "epoch": 39.5, + "learning_rate": 2.3372379970636927e-05, + "loss": 0.0641, + "step": 140490 + }, + { + "epoch": 39.51, + "learning_rate": 2.33536375847312e-05, + "loss": 0.0642, + "step": 140520 + }, + { + "epoch": 39.51, + "learning_rate": 2.333489519882548e-05, + "loss": 0.0573, + "step": 140550 + }, + { + "epoch": 39.52, + "learning_rate": 2.3316152812919753e-05, + "loss": 0.0669, + "step": 140580 + }, + { + "epoch": 39.53, + "learning_rate": 2.3297410427014027e-05, + "loss": 0.0584, + "step": 140610 + }, + { + "epoch": 39.54, + "learning_rate": 2.32786680411083e-05, + "loss": 0.0648, + "step": 140640 + }, + { + "epoch": 39.55, + "learning_rate": 2.3259925655202576e-05, + "loss": 0.0634, + "step": 140670 + }, + { + "epoch": 39.56, + "learning_rate": 2.324118326929685e-05, + "loss": 0.0604, + "step": 140700 + }, + { + "epoch": 39.56, + "learning_rate": 2.322244088339112e-05, + "loss": 0.07, + "step": 140730 + }, + { + "epoch": 39.57, + "learning_rate": 2.32036984974854e-05, + "loss": 0.0565, + "step": 140760 + }, + { + "epoch": 39.58, + "learning_rate": 2.3184956111579673e-05, + "loss": 0.0623, + "step": 140790 + }, + { + "epoch": 39.59, + "learning_rate": 2.3166213725673947e-05, + "loss": 0.0636, + "step": 140820 + }, + { + "epoch": 39.6, + "learning_rate": 2.314747133976822e-05, + "loss": 0.0595, + "step": 140850 + }, + { + "epoch": 39.61, + "learning_rate": 2.3128728953862495e-05, + "loss": 0.0674, + "step": 140880 + }, + { + "epoch": 39.61, + "learning_rate": 2.310998656795677e-05, + "loss": 0.0563, + "step": 140910 + }, + { + "epoch": 39.62, + "learning_rate": 2.309124418205104e-05, + "loss": 0.0668, + "step": 140940 + }, + { + "epoch": 39.63, + "learning_rate": 2.3072501796145318e-05, + "loss": 0.0648, + "step": 140970 + }, + { + "epoch": 39.64, + "learning_rate": 2.3053759410239592e-05, + "loss": 0.0583, + "step": 141000 + }, + { + "epoch": 39.65, + "learning_rate": 2.3035017024333866e-05, + "loss": 0.0655, + "step": 141030 + }, + { + "epoch": 39.66, + "learning_rate": 2.301627463842814e-05, + "loss": 0.0621, + "step": 141060 + }, + { + "epoch": 39.67, + "learning_rate": 2.2997532252522414e-05, + "loss": 0.0595, + "step": 141090 + }, + { + "epoch": 39.67, + "learning_rate": 2.297878986661669e-05, + "loss": 0.0634, + "step": 141120 + }, + { + "epoch": 39.68, + "learning_rate": 2.296004748071096e-05, + "loss": 0.0637, + "step": 141150 + }, + { + "epoch": 39.69, + "learning_rate": 2.2941305094805237e-05, + "loss": 0.0682, + "step": 141180 + }, + { + "epoch": 39.7, + "learning_rate": 2.292256270889951e-05, + "loss": 0.0651, + "step": 141210 + }, + { + "epoch": 39.71, + "learning_rate": 2.2903820322993785e-05, + "loss": 0.0655, + "step": 141240 + }, + { + "epoch": 39.72, + "learning_rate": 2.288507793708806e-05, + "loss": 0.064, + "step": 141270 + }, + { + "epoch": 39.72, + "learning_rate": 2.2866335551182334e-05, + "loss": 0.0611, + "step": 141300 + }, + { + "epoch": 39.73, + "learning_rate": 2.2847593165276608e-05, + "loss": 0.0695, + "step": 141330 + }, + { + "epoch": 39.74, + "learning_rate": 2.2828850779370882e-05, + "loss": 0.0575, + "step": 141360 + }, + { + "epoch": 39.75, + "learning_rate": 2.2810108393465156e-05, + "loss": 0.0654, + "step": 141390 + }, + { + "epoch": 39.76, + "learning_rate": 2.279136600755943e-05, + "loss": 0.0618, + "step": 141420 + }, + { + "epoch": 39.77, + "learning_rate": 2.2772623621653705e-05, + "loss": 0.0602, + "step": 141450 + }, + { + "epoch": 39.77, + "learning_rate": 2.275388123574798e-05, + "loss": 0.0654, + "step": 141480 + }, + { + "epoch": 39.78, + "learning_rate": 2.2735138849842253e-05, + "loss": 0.0563, + "step": 141510 + }, + { + "epoch": 39.79, + "learning_rate": 2.2716396463936527e-05, + "loss": 0.0671, + "step": 141540 + }, + { + "epoch": 39.8, + "learning_rate": 2.26976540780308e-05, + "loss": 0.0623, + "step": 141570 + }, + { + "epoch": 39.81, + "learning_rate": 2.2678911692125076e-05, + "loss": 0.0625, + "step": 141600 + }, + { + "epoch": 39.82, + "learning_rate": 2.266016930621935e-05, + "loss": 0.0687, + "step": 141630 + }, + { + "epoch": 39.83, + "learning_rate": 2.2641426920313624e-05, + "loss": 0.0564, + "step": 141660 + }, + { + "epoch": 39.83, + "learning_rate": 2.2622684534407898e-05, + "loss": 0.0636, + "step": 141690 + }, + { + "epoch": 39.84, + "learning_rate": 2.2603942148502172e-05, + "loss": 0.062, + "step": 141720 + }, + { + "epoch": 39.85, + "learning_rate": 2.2585199762596447e-05, + "loss": 0.0589, + "step": 141750 + }, + { + "epoch": 39.86, + "learning_rate": 2.256645737669072e-05, + "loss": 0.0629, + "step": 141780 + }, + { + "epoch": 39.87, + "learning_rate": 2.2547714990784995e-05, + "loss": 0.0558, + "step": 141810 + }, + { + "epoch": 39.88, + "learning_rate": 2.252897260487927e-05, + "loss": 0.0612, + "step": 141840 + }, + { + "epoch": 39.88, + "learning_rate": 2.2510230218973543e-05, + "loss": 0.0627, + "step": 141870 + }, + { + "epoch": 39.89, + "learning_rate": 2.2491487833067818e-05, + "loss": 0.0566, + "step": 141900 + }, + { + "epoch": 39.9, + "learning_rate": 2.2472745447162092e-05, + "loss": 0.0665, + "step": 141930 + }, + { + "epoch": 39.91, + "learning_rate": 2.2454003061256366e-05, + "loss": 0.0547, + "step": 141960 + }, + { + "epoch": 39.92, + "learning_rate": 2.2435885421547497e-05, + "loss": 0.0638, + "step": 141990 + }, + { + "epoch": 39.93, + "learning_rate": 2.241714303564177e-05, + "loss": 0.0575, + "step": 142020 + }, + { + "epoch": 39.94, + "learning_rate": 2.2398400649736045e-05, + "loss": 0.0584, + "step": 142050 + }, + { + "epoch": 39.94, + "learning_rate": 2.237965826383032e-05, + "loss": 0.0676, + "step": 142080 + }, + { + "epoch": 39.95, + "learning_rate": 2.2360915877924594e-05, + "loss": 0.0615, + "step": 142110 + }, + { + "epoch": 39.96, + "learning_rate": 2.234217349201887e-05, + "loss": 0.0631, + "step": 142140 + }, + { + "epoch": 39.97, + "learning_rate": 2.2323431106113142e-05, + "loss": 0.0652, + "step": 142170 + }, + { + "epoch": 39.98, + "learning_rate": 2.2304688720207416e-05, + "loss": 0.0623, + "step": 142200 + }, + { + "epoch": 39.99, + "learning_rate": 2.228594633430169e-05, + "loss": 0.0696, + "step": 142230 + }, + { + "epoch": 39.99, + "learning_rate": 2.2267203948395965e-05, + "loss": 0.0587, + "step": 142260 + }, + { + "epoch": 40.0, + "eval_loss": 0.17351745069026947, + "eval_runtime": 506.6702, + "eval_samples_per_second": 31.644, + "eval_steps_per_second": 0.991, + "eval_wer": 0.1271068469968474, + "step": 142280 + }, + { + "epoch": 40.0, + "learning_rate": 2.224846156249024e-05, + "loss": 0.0646, + "step": 142290 + }, + { + "epoch": 40.01, + "learning_rate": 2.2229719176584513e-05, + "loss": 0.057, + "step": 142320 + }, + { + "epoch": 40.02, + "learning_rate": 2.221097679067879e-05, + "loss": 0.0635, + "step": 142350 + }, + { + "epoch": 40.03, + "learning_rate": 2.219223440477306e-05, + "loss": 0.0667, + "step": 142380 + }, + { + "epoch": 40.04, + "learning_rate": 2.2173492018867336e-05, + "loss": 0.0561, + "step": 142410 + }, + { + "epoch": 40.04, + "learning_rate": 2.215474963296161e-05, + "loss": 0.0643, + "step": 142440 + }, + { + "epoch": 40.05, + "learning_rate": 2.2136007247055884e-05, + "loss": 0.0562, + "step": 142470 + }, + { + "epoch": 40.06, + "learning_rate": 2.2117264861150158e-05, + "loss": 0.062, + "step": 142500 + }, + { + "epoch": 40.07, + "learning_rate": 2.2098522475244432e-05, + "loss": 0.0686, + "step": 142530 + }, + { + "epoch": 40.08, + "learning_rate": 2.207978008933871e-05, + "loss": 0.0547, + "step": 142560 + }, + { + "epoch": 40.09, + "learning_rate": 2.2061037703432984e-05, + "loss": 0.06, + "step": 142590 + }, + { + "epoch": 40.1, + "learning_rate": 2.2042295317527255e-05, + "loss": 0.0572, + "step": 142620 + }, + { + "epoch": 40.1, + "learning_rate": 2.202355293162153e-05, + "loss": 0.0626, + "step": 142650 + }, + { + "epoch": 40.11, + "learning_rate": 2.2004810545715803e-05, + "loss": 0.0668, + "step": 142680 + }, + { + "epoch": 40.12, + "learning_rate": 2.1986068159810077e-05, + "loss": 0.0525, + "step": 142710 + }, + { + "epoch": 40.13, + "learning_rate": 2.196732577390435e-05, + "loss": 0.0625, + "step": 142740 + }, + { + "epoch": 40.14, + "learning_rate": 2.1948583387998626e-05, + "loss": 0.0567, + "step": 142770 + }, + { + "epoch": 40.15, + "learning_rate": 2.1929841002092903e-05, + "loss": 0.0651, + "step": 142800 + }, + { + "epoch": 40.15, + "learning_rate": 2.1911098616187174e-05, + "loss": 0.0704, + "step": 142830 + }, + { + "epoch": 40.16, + "learning_rate": 2.189235623028145e-05, + "loss": 0.0512, + "step": 142860 + }, + { + "epoch": 40.17, + "learning_rate": 2.1873613844375723e-05, + "loss": 0.0663, + "step": 142890 + }, + { + "epoch": 40.18, + "learning_rate": 2.1854871458469997e-05, + "loss": 0.0588, + "step": 142920 + }, + { + "epoch": 40.19, + "learning_rate": 2.183612907256427e-05, + "loss": 0.0641, + "step": 142950 + }, + { + "epoch": 40.2, + "learning_rate": 2.1817386686658545e-05, + "loss": 0.0659, + "step": 142980 + }, + { + "epoch": 40.21, + "learning_rate": 2.1798644300752823e-05, + "loss": 0.0563, + "step": 143010 + }, + { + "epoch": 40.21, + "learning_rate": 2.1779901914847094e-05, + "loss": 0.0662, + "step": 143040 + }, + { + "epoch": 40.22, + "learning_rate": 2.1761159528941368e-05, + "loss": 0.0565, + "step": 143070 + }, + { + "epoch": 40.23, + "learning_rate": 2.1742417143035642e-05, + "loss": 0.0601, + "step": 143100 + }, + { + "epoch": 40.24, + "learning_rate": 2.1723674757129916e-05, + "loss": 0.0693, + "step": 143130 + }, + { + "epoch": 40.25, + "learning_rate": 2.170493237122419e-05, + "loss": 0.056, + "step": 143160 + }, + { + "epoch": 40.26, + "learning_rate": 2.1686189985318464e-05, + "loss": 0.0677, + "step": 143190 + }, + { + "epoch": 40.26, + "learning_rate": 2.1667447599412742e-05, + "loss": 0.0562, + "step": 143220 + }, + { + "epoch": 40.27, + "learning_rate": 2.1648705213507013e-05, + "loss": 0.0635, + "step": 143250 + }, + { + "epoch": 40.28, + "learning_rate": 2.1629962827601287e-05, + "loss": 0.0686, + "step": 143280 + }, + { + "epoch": 40.29, + "learning_rate": 2.161122044169556e-05, + "loss": 0.0511, + "step": 143310 + }, + { + "epoch": 40.3, + "learning_rate": 2.1592478055789835e-05, + "loss": 0.066, + "step": 143340 + }, + { + "epoch": 40.31, + "learning_rate": 2.157373566988411e-05, + "loss": 0.0583, + "step": 143370 + }, + { + "epoch": 40.31, + "learning_rate": 2.1554993283978384e-05, + "loss": 0.055, + "step": 143400 + }, + { + "epoch": 40.32, + "learning_rate": 2.153625089807266e-05, + "loss": 0.0644, + "step": 143430 + }, + { + "epoch": 40.33, + "learning_rate": 2.1517508512166936e-05, + "loss": 0.0525, + "step": 143460 + }, + { + "epoch": 40.34, + "learning_rate": 2.1498766126261206e-05, + "loss": 0.0653, + "step": 143490 + }, + { + "epoch": 40.35, + "learning_rate": 2.148002374035548e-05, + "loss": 0.0569, + "step": 143520 + }, + { + "epoch": 40.36, + "learning_rate": 2.1461281354449755e-05, + "loss": 0.0593, + "step": 143550 + }, + { + "epoch": 40.37, + "learning_rate": 2.144253896854403e-05, + "loss": 0.0691, + "step": 143580 + }, + { + "epoch": 40.37, + "learning_rate": 2.1423796582638303e-05, + "loss": 0.0546, + "step": 143610 + }, + { + "epoch": 40.38, + "learning_rate": 2.140505419673258e-05, + "loss": 0.06, + "step": 143640 + }, + { + "epoch": 40.39, + "learning_rate": 2.1386311810826855e-05, + "loss": 0.0573, + "step": 143670 + }, + { + "epoch": 40.4, + "learning_rate": 2.1367569424921126e-05, + "loss": 0.0635, + "step": 143700 + }, + { + "epoch": 40.41, + "learning_rate": 2.13488270390154e-05, + "loss": 0.0698, + "step": 143730 + }, + { + "epoch": 40.42, + "learning_rate": 2.1330084653109674e-05, + "loss": 0.0514, + "step": 143760 + }, + { + "epoch": 40.42, + "learning_rate": 2.1311342267203948e-05, + "loss": 0.0637, + "step": 143790 + }, + { + "epoch": 40.43, + "learning_rate": 2.1292599881298222e-05, + "loss": 0.0572, + "step": 143820 + }, + { + "epoch": 40.44, + "learning_rate": 2.12738574953925e-05, + "loss": 0.0603, + "step": 143850 + }, + { + "epoch": 40.45, + "learning_rate": 2.1255115109486774e-05, + "loss": 0.0636, + "step": 143880 + }, + { + "epoch": 40.46, + "learning_rate": 2.1236372723581045e-05, + "loss": 0.0547, + "step": 143910 + }, + { + "epoch": 40.47, + "learning_rate": 2.121763033767532e-05, + "loss": 0.0613, + "step": 143940 + }, + { + "epoch": 40.48, + "learning_rate": 2.1198887951769593e-05, + "loss": 0.0591, + "step": 143970 + }, + { + "epoch": 40.48, + "learning_rate": 2.1180145565863868e-05, + "loss": 0.0599, + "step": 144000 + }, + { + "epoch": 40.49, + "learning_rate": 2.1161403179958142e-05, + "loss": 0.064, + "step": 144030 + }, + { + "epoch": 40.5, + "learning_rate": 2.114266079405242e-05, + "loss": 0.0556, + "step": 144060 + }, + { + "epoch": 40.51, + "learning_rate": 2.1123918408146694e-05, + "loss": 0.0625, + "step": 144090 + }, + { + "epoch": 40.52, + "learning_rate": 2.1105176022240968e-05, + "loss": 0.0587, + "step": 144120 + }, + { + "epoch": 40.53, + "learning_rate": 2.108643363633524e-05, + "loss": 0.0641, + "step": 144150 + }, + { + "epoch": 40.53, + "learning_rate": 2.1067691250429513e-05, + "loss": 0.0702, + "step": 144180 + }, + { + "epoch": 40.54, + "learning_rate": 2.1048948864523787e-05, + "loss": 0.0522, + "step": 144210 + }, + { + "epoch": 40.55, + "learning_rate": 2.103020647861806e-05, + "loss": 0.0663, + "step": 144240 + }, + { + "epoch": 40.56, + "learning_rate": 2.101146409271234e-05, + "loss": 0.0607, + "step": 144270 + }, + { + "epoch": 40.57, + "learning_rate": 2.0992721706806613e-05, + "loss": 0.0607, + "step": 144300 + }, + { + "epoch": 40.58, + "learning_rate": 2.0973979320900887e-05, + "loss": 0.0684, + "step": 144330 + }, + { + "epoch": 40.58, + "learning_rate": 2.0955236934995158e-05, + "loss": 0.058, + "step": 144360 + }, + { + "epoch": 40.59, + "learning_rate": 2.0936494549089432e-05, + "loss": 0.0644, + "step": 144390 + }, + { + "epoch": 40.6, + "learning_rate": 2.0917752163183706e-05, + "loss": 0.0573, + "step": 144420 + }, + { + "epoch": 40.61, + "learning_rate": 2.089900977727798e-05, + "loss": 0.0609, + "step": 144450 + }, + { + "epoch": 40.62, + "learning_rate": 2.0880267391372258e-05, + "loss": 0.0652, + "step": 144480 + }, + { + "epoch": 40.63, + "learning_rate": 2.0861525005466532e-05, + "loss": 0.0529, + "step": 144510 + }, + { + "epoch": 40.64, + "learning_rate": 2.0842782619560806e-05, + "loss": 0.0618, + "step": 144540 + }, + { + "epoch": 40.64, + "learning_rate": 2.0824040233655077e-05, + "loss": 0.0558, + "step": 144570 + }, + { + "epoch": 40.65, + "learning_rate": 2.080529784774935e-05, + "loss": 0.0609, + "step": 144600 + }, + { + "epoch": 40.66, + "learning_rate": 2.0786555461843626e-05, + "loss": 0.066, + "step": 144630 + }, + { + "epoch": 40.67, + "learning_rate": 2.07678130759379e-05, + "loss": 0.055, + "step": 144660 + }, + { + "epoch": 40.68, + "learning_rate": 2.0749070690032174e-05, + "loss": 0.0647, + "step": 144690 + }, + { + "epoch": 40.69, + "learning_rate": 2.073032830412645e-05, + "loss": 0.0555, + "step": 144720 + }, + { + "epoch": 40.69, + "learning_rate": 2.0711585918220726e-05, + "loss": 0.0592, + "step": 144750 + }, + { + "epoch": 40.7, + "learning_rate": 2.0692843532315e-05, + "loss": 0.0675, + "step": 144780 + }, + { + "epoch": 40.71, + "learning_rate": 2.067410114640927e-05, + "loss": 0.0522, + "step": 144810 + }, + { + "epoch": 40.72, + "learning_rate": 2.0655358760503545e-05, + "loss": 0.0653, + "step": 144840 + }, + { + "epoch": 40.73, + "learning_rate": 2.063661637459782e-05, + "loss": 0.0554, + "step": 144870 + }, + { + "epoch": 40.74, + "learning_rate": 2.0617873988692093e-05, + "loss": 0.0629, + "step": 144900 + }, + { + "epoch": 40.74, + "learning_rate": 2.059913160278637e-05, + "loss": 0.0666, + "step": 144930 + }, + { + "epoch": 40.75, + "learning_rate": 2.0580389216880645e-05, + "loss": 0.0524, + "step": 144960 + }, + { + "epoch": 40.76, + "learning_rate": 2.056164683097492e-05, + "loss": 0.0612, + "step": 144990 + }, + { + "epoch": 40.77, + "learning_rate": 2.054290444506919e-05, + "loss": 0.0573, + "step": 145020 + }, + { + "epoch": 40.78, + "learning_rate": 2.0524162059163464e-05, + "loss": 0.0659, + "step": 145050 + }, + { + "epoch": 40.79, + "learning_rate": 2.050541967325774e-05, + "loss": 0.0641, + "step": 145080 + }, + { + "epoch": 40.8, + "learning_rate": 2.0486677287352013e-05, + "loss": 0.0565, + "step": 145110 + }, + { + "epoch": 40.8, + "learning_rate": 2.046793490144629e-05, + "loss": 0.0605, + "step": 145140 + }, + { + "epoch": 40.81, + "learning_rate": 2.0449192515540564e-05, + "loss": 0.0622, + "step": 145170 + }, + { + "epoch": 40.82, + "learning_rate": 2.043045012963484e-05, + "loss": 0.0639, + "step": 145200 + }, + { + "epoch": 40.83, + "learning_rate": 2.041170774372911e-05, + "loss": 0.0667, + "step": 145230 + }, + { + "epoch": 40.84, + "learning_rate": 2.0392965357823384e-05, + "loss": 0.056, + "step": 145260 + }, + { + "epoch": 40.85, + "learning_rate": 2.0374222971917658e-05, + "loss": 0.0647, + "step": 145290 + }, + { + "epoch": 40.85, + "learning_rate": 2.0355480586011932e-05, + "loss": 0.0572, + "step": 145320 + }, + { + "epoch": 40.86, + "learning_rate": 2.033673820010621e-05, + "loss": 0.0603, + "step": 145350 + }, + { + "epoch": 40.87, + "learning_rate": 2.0317995814200484e-05, + "loss": 0.0619, + "step": 145380 + }, + { + "epoch": 40.88, + "learning_rate": 2.0299253428294758e-05, + "loss": 0.0524, + "step": 145410 + }, + { + "epoch": 40.89, + "learning_rate": 2.028051104238903e-05, + "loss": 0.0642, + "step": 145440 + }, + { + "epoch": 40.9, + "learning_rate": 2.0261768656483303e-05, + "loss": 0.0577, + "step": 145470 + }, + { + "epoch": 40.91, + "learning_rate": 2.0243026270577577e-05, + "loss": 0.0584, + "step": 145500 + }, + { + "epoch": 40.91, + "learning_rate": 2.022428388467185e-05, + "loss": 0.0677, + "step": 145530 + }, + { + "epoch": 40.92, + "learning_rate": 2.020554149876613e-05, + "loss": 0.0515, + "step": 145560 + }, + { + "epoch": 40.93, + "learning_rate": 2.0186799112860403e-05, + "loss": 0.0625, + "step": 145590 + }, + { + "epoch": 40.94, + "learning_rate": 2.0168056726954677e-05, + "loss": 0.0558, + "step": 145620 + }, + { + "epoch": 40.95, + "learning_rate": 2.014931434104895e-05, + "loss": 0.0605, + "step": 145650 + }, + { + "epoch": 40.96, + "learning_rate": 2.0130571955143222e-05, + "loss": 0.0691, + "step": 145680 + }, + { + "epoch": 40.96, + "learning_rate": 2.0111829569237496e-05, + "loss": 0.0519, + "step": 145710 + }, + { + "epoch": 40.97, + "learning_rate": 2.009308718333177e-05, + "loss": 0.0686, + "step": 145740 + }, + { + "epoch": 40.98, + "learning_rate": 2.0074344797426048e-05, + "loss": 0.0576, + "step": 145770 + }, + { + "epoch": 40.99, + "learning_rate": 2.0055602411520322e-05, + "loss": 0.0631, + "step": 145800 + }, + { + "epoch": 41.0, + "learning_rate": 2.0036860025614597e-05, + "loss": 0.0693, + "step": 145830 + }, + { + "epoch": 41.0, + "eval_loss": 0.1780107468366623, + "eval_runtime": 506.6643, + "eval_samples_per_second": 31.644, + "eval_steps_per_second": 0.991, + "eval_wer": 0.1259945682584308, + "step": 145837 + }, + { + "epoch": 41.01, + "learning_rate": 2.001811763970887e-05, + "loss": 0.0566, + "step": 145860 + }, + { + "epoch": 41.01, + "learning_rate": 1.999937525380314e-05, + "loss": 0.0635, + "step": 145890 + }, + { + "epoch": 41.02, + "learning_rate": 1.9980632867897416e-05, + "loss": 0.0551, + "step": 145920 + }, + { + "epoch": 41.03, + "learning_rate": 1.996189048199169e-05, + "loss": 0.0635, + "step": 145950 + }, + { + "epoch": 41.04, + "learning_rate": 1.9943148096085968e-05, + "loss": 0.0601, + "step": 145980 + }, + { + "epoch": 41.05, + "learning_rate": 1.9924405710180242e-05, + "loss": 0.0547, + "step": 146010 + }, + { + "epoch": 41.06, + "learning_rate": 1.9905663324274516e-05, + "loss": 0.0628, + "step": 146040 + }, + { + "epoch": 41.07, + "learning_rate": 1.988692093836879e-05, + "loss": 0.0534, + "step": 146070 + }, + { + "epoch": 41.07, + "learning_rate": 1.986817855246306e-05, + "loss": 0.0635, + "step": 146100 + }, + { + "epoch": 41.08, + "learning_rate": 1.9849436166557335e-05, + "loss": 0.0573, + "step": 146130 + }, + { + "epoch": 41.09, + "learning_rate": 1.983069378065161e-05, + "loss": 0.0627, + "step": 146160 + }, + { + "epoch": 41.1, + "learning_rate": 1.9811951394745887e-05, + "loss": 0.0647, + "step": 146190 + }, + { + "epoch": 41.11, + "learning_rate": 1.979320900884016e-05, + "loss": 0.0539, + "step": 146220 + }, + { + "epoch": 41.12, + "learning_rate": 1.9774466622934435e-05, + "loss": 0.062, + "step": 146250 + }, + { + "epoch": 41.12, + "learning_rate": 1.975572423702871e-05, + "loss": 0.057, + "step": 146280 + }, + { + "epoch": 41.13, + "learning_rate": 1.9736981851122984e-05, + "loss": 0.061, + "step": 146310 + }, + { + "epoch": 41.14, + "learning_rate": 1.9718239465217254e-05, + "loss": 0.0651, + "step": 146340 + }, + { + "epoch": 41.15, + "learning_rate": 1.969949707931153e-05, + "loss": 0.051, + "step": 146370 + }, + { + "epoch": 41.16, + "learning_rate": 1.9680754693405803e-05, + "loss": 0.0586, + "step": 146400 + }, + { + "epoch": 41.17, + "learning_rate": 1.966201230750008e-05, + "loss": 0.0554, + "step": 146430 + }, + { + "epoch": 41.18, + "learning_rate": 1.9643269921594355e-05, + "loss": 0.0632, + "step": 146460 + }, + { + "epoch": 41.18, + "learning_rate": 1.962452753568863e-05, + "loss": 0.0656, + "step": 146490 + }, + { + "epoch": 41.19, + "learning_rate": 1.9605785149782903e-05, + "loss": 0.0501, + "step": 146520 + }, + { + "epoch": 41.2, + "learning_rate": 1.9587042763877174e-05, + "loss": 0.0619, + "step": 146550 + }, + { + "epoch": 41.21, + "learning_rate": 1.9568300377971448e-05, + "loss": 0.0565, + "step": 146580 + }, + { + "epoch": 41.22, + "learning_rate": 1.9549557992065722e-05, + "loss": 0.0596, + "step": 146610 + }, + { + "epoch": 41.23, + "learning_rate": 1.953081560616e-05, + "loss": 0.0659, + "step": 146640 + }, + { + "epoch": 41.23, + "learning_rate": 1.9512073220254274e-05, + "loss": 0.0554, + "step": 146670 + }, + { + "epoch": 41.24, + "learning_rate": 1.9493330834348548e-05, + "loss": 0.0626, + "step": 146700 + }, + { + "epoch": 41.25, + "learning_rate": 1.9474588448442822e-05, + "loss": 0.0579, + "step": 146730 + }, + { + "epoch": 41.26, + "learning_rate": 1.9455846062537093e-05, + "loss": 0.0573, + "step": 146760 + }, + { + "epoch": 41.27, + "learning_rate": 1.9437103676631367e-05, + "loss": 0.0667, + "step": 146790 + }, + { + "epoch": 41.28, + "learning_rate": 1.941836129072564e-05, + "loss": 0.0567, + "step": 146820 + }, + { + "epoch": 41.28, + "learning_rate": 1.939961890481992e-05, + "loss": 0.0638, + "step": 146850 + }, + { + "epoch": 41.29, + "learning_rate": 1.9380876518914193e-05, + "loss": 0.0557, + "step": 146880 + }, + { + "epoch": 41.3, + "learning_rate": 1.9362134133008467e-05, + "loss": 0.0563, + "step": 146910 + }, + { + "epoch": 41.31, + "learning_rate": 1.934339174710274e-05, + "loss": 0.0658, + "step": 146940 + }, + { + "epoch": 41.32, + "learning_rate": 1.9324649361197016e-05, + "loss": 0.0549, + "step": 146970 + }, + { + "epoch": 41.33, + "learning_rate": 1.9305906975291287e-05, + "loss": 0.0648, + "step": 147000 + }, + { + "epoch": 41.34, + "learning_rate": 1.928716458938556e-05, + "loss": 0.0604, + "step": 147030 + }, + { + "epoch": 41.34, + "learning_rate": 1.926842220347984e-05, + "loss": 0.0551, + "step": 147060 + }, + { + "epoch": 41.35, + "learning_rate": 1.9249679817574113e-05, + "loss": 0.0669, + "step": 147090 + }, + { + "epoch": 41.36, + "learning_rate": 1.9230937431668387e-05, + "loss": 0.0539, + "step": 147120 + }, + { + "epoch": 41.37, + "learning_rate": 1.921219504576266e-05, + "loss": 0.063, + "step": 147150 + }, + { + "epoch": 41.38, + "learning_rate": 1.9193452659856935e-05, + "loss": 0.0593, + "step": 147180 + }, + { + "epoch": 41.39, + "learning_rate": 1.9174710273951206e-05, + "loss": 0.0571, + "step": 147210 + }, + { + "epoch": 41.39, + "learning_rate": 1.915659263424234e-05, + "loss": 0.0637, + "step": 147240 + }, + { + "epoch": 41.4, + "learning_rate": 1.9137850248336614e-05, + "loss": 0.0539, + "step": 147270 + }, + { + "epoch": 41.41, + "learning_rate": 1.911910786243089e-05, + "loss": 0.06, + "step": 147300 + }, + { + "epoch": 41.42, + "learning_rate": 1.9100365476525163e-05, + "loss": 0.0584, + "step": 147330 + }, + { + "epoch": 41.43, + "learning_rate": 1.9081623090619437e-05, + "loss": 0.0589, + "step": 147360 + }, + { + "epoch": 41.44, + "learning_rate": 1.906288070471371e-05, + "loss": 0.0638, + "step": 147390 + }, + { + "epoch": 41.44, + "learning_rate": 1.9044138318807985e-05, + "loss": 0.0534, + "step": 147420 + }, + { + "epoch": 41.45, + "learning_rate": 1.902539593290226e-05, + "loss": 0.0597, + "step": 147450 + }, + { + "epoch": 41.46, + "learning_rate": 1.9006653546996534e-05, + "loss": 0.0564, + "step": 147480 + }, + { + "epoch": 41.47, + "learning_rate": 1.8987911161090808e-05, + "loss": 0.0567, + "step": 147510 + }, + { + "epoch": 41.48, + "learning_rate": 1.8969168775185082e-05, + "loss": 0.0648, + "step": 147540 + }, + { + "epoch": 41.49, + "learning_rate": 1.8950426389279356e-05, + "loss": 0.0531, + "step": 147570 + }, + { + "epoch": 41.5, + "learning_rate": 1.893168400337363e-05, + "loss": 0.0667, + "step": 147600 + }, + { + "epoch": 41.5, + "learning_rate": 1.8912941617467905e-05, + "loss": 0.0603, + "step": 147630 + }, + { + "epoch": 41.51, + "learning_rate": 1.889419923156218e-05, + "loss": 0.0593, + "step": 147660 + }, + { + "epoch": 41.52, + "learning_rate": 1.8875456845656453e-05, + "loss": 0.0606, + "step": 147690 + }, + { + "epoch": 41.53, + "learning_rate": 1.8856714459750727e-05, + "loss": 0.0559, + "step": 147720 + }, + { + "epoch": 41.54, + "learning_rate": 1.8837972073845e-05, + "loss": 0.0642, + "step": 147750 + }, + { + "epoch": 41.55, + "learning_rate": 1.8819229687939276e-05, + "loss": 0.0586, + "step": 147780 + }, + { + "epoch": 41.55, + "learning_rate": 1.880048730203355e-05, + "loss": 0.0589, + "step": 147810 + }, + { + "epoch": 41.56, + "learning_rate": 1.8781744916127824e-05, + "loss": 0.0693, + "step": 147840 + }, + { + "epoch": 41.57, + "learning_rate": 1.8763002530222098e-05, + "loss": 0.0565, + "step": 147870 + }, + { + "epoch": 41.58, + "learning_rate": 1.8744260144316372e-05, + "loss": 0.061, + "step": 147900 + }, + { + "epoch": 41.59, + "learning_rate": 1.8725517758410647e-05, + "loss": 0.0595, + "step": 147930 + }, + { + "epoch": 41.6, + "learning_rate": 1.870677537250492e-05, + "loss": 0.0585, + "step": 147960 + }, + { + "epoch": 41.61, + "learning_rate": 1.8688032986599195e-05, + "loss": 0.0627, + "step": 147990 + }, + { + "epoch": 41.61, + "learning_rate": 1.866929060069347e-05, + "loss": 0.0516, + "step": 148020 + }, + { + "epoch": 41.62, + "learning_rate": 1.8650548214787743e-05, + "loss": 0.0617, + "step": 148050 + }, + { + "epoch": 41.63, + "learning_rate": 1.8631805828882018e-05, + "loss": 0.0587, + "step": 148080 + }, + { + "epoch": 41.64, + "learning_rate": 1.8613063442976292e-05, + "loss": 0.062, + "step": 148110 + }, + { + "epoch": 41.65, + "learning_rate": 1.8594321057070566e-05, + "loss": 0.0639, + "step": 148140 + }, + { + "epoch": 41.66, + "learning_rate": 1.857557867116484e-05, + "loss": 0.0527, + "step": 148170 + }, + { + "epoch": 41.66, + "learning_rate": 1.8556836285259114e-05, + "loss": 0.0596, + "step": 148200 + }, + { + "epoch": 41.67, + "learning_rate": 1.853809389935339e-05, + "loss": 0.065, + "step": 148230 + }, + { + "epoch": 41.68, + "learning_rate": 1.8519351513447663e-05, + "loss": 0.061, + "step": 148260 + }, + { + "epoch": 41.69, + "learning_rate": 1.8500609127541937e-05, + "loss": 0.0621, + "step": 148290 + }, + { + "epoch": 41.7, + "learning_rate": 1.848186674163621e-05, + "loss": 0.0533, + "step": 148320 + }, + { + "epoch": 41.71, + "learning_rate": 1.8463124355730485e-05, + "loss": 0.0678, + "step": 148350 + }, + { + "epoch": 41.71, + "learning_rate": 1.844438196982476e-05, + "loss": 0.059, + "step": 148380 + }, + { + "epoch": 41.72, + "learning_rate": 1.8425639583919034e-05, + "loss": 0.0575, + "step": 148410 + }, + { + "epoch": 41.73, + "learning_rate": 1.8406897198013308e-05, + "loss": 0.0686, + "step": 148440 + }, + { + "epoch": 41.74, + "learning_rate": 1.8388154812107582e-05, + "loss": 0.0525, + "step": 148470 + }, + { + "epoch": 41.75, + "learning_rate": 1.8369412426201856e-05, + "loss": 0.0626, + "step": 148500 + }, + { + "epoch": 41.76, + "learning_rate": 1.835067004029613e-05, + "loss": 0.0574, + "step": 148530 + }, + { + "epoch": 41.77, + "learning_rate": 1.8331927654390405e-05, + "loss": 0.058, + "step": 148560 + }, + { + "epoch": 41.77, + "learning_rate": 1.831318526848468e-05, + "loss": 0.0654, + "step": 148590 + }, + { + "epoch": 41.78, + "learning_rate": 1.8294442882578953e-05, + "loss": 0.051, + "step": 148620 + }, + { + "epoch": 41.79, + "learning_rate": 1.8275700496673227e-05, + "loss": 0.0614, + "step": 148650 + }, + { + "epoch": 41.8, + "learning_rate": 1.82569581107675e-05, + "loss": 0.06, + "step": 148680 + }, + { + "epoch": 41.81, + "learning_rate": 1.8238215724861776e-05, + "loss": 0.0604, + "step": 148710 + }, + { + "epoch": 41.82, + "learning_rate": 1.821947333895605e-05, + "loss": 0.0686, + "step": 148740 + }, + { + "epoch": 41.82, + "learning_rate": 1.8200730953050324e-05, + "loss": 0.0546, + "step": 148770 + }, + { + "epoch": 41.83, + "learning_rate": 1.8181988567144598e-05, + "loss": 0.0612, + "step": 148800 + }, + { + "epoch": 41.84, + "learning_rate": 1.8163246181238872e-05, + "loss": 0.0577, + "step": 148830 + }, + { + "epoch": 41.85, + "learning_rate": 1.8144503795333147e-05, + "loss": 0.0598, + "step": 148860 + }, + { + "epoch": 41.86, + "learning_rate": 1.812576140942742e-05, + "loss": 0.0654, + "step": 148890 + }, + { + "epoch": 41.87, + "learning_rate": 1.8107019023521695e-05, + "loss": 0.0494, + "step": 148920 + }, + { + "epoch": 41.88, + "learning_rate": 1.808827663761597e-05, + "loss": 0.062, + "step": 148950 + }, + { + "epoch": 41.88, + "learning_rate": 1.8069534251710243e-05, + "loss": 0.0607, + "step": 148980 + }, + { + "epoch": 41.89, + "learning_rate": 1.8050791865804517e-05, + "loss": 0.0595, + "step": 149010 + }, + { + "epoch": 41.9, + "learning_rate": 1.803204947989879e-05, + "loss": 0.0628, + "step": 149040 + }, + { + "epoch": 41.91, + "learning_rate": 1.8013307093993066e-05, + "loss": 0.0518, + "step": 149070 + }, + { + "epoch": 41.92, + "learning_rate": 1.799456470808734e-05, + "loss": 0.065, + "step": 149100 + }, + { + "epoch": 41.93, + "learning_rate": 1.7975822322181614e-05, + "loss": 0.0615, + "step": 149130 + }, + { + "epoch": 41.93, + "learning_rate": 1.795707993627589e-05, + "loss": 0.0552, + "step": 149160 + }, + { + "epoch": 41.94, + "learning_rate": 1.7938337550370163e-05, + "loss": 0.063, + "step": 149190 + }, + { + "epoch": 41.95, + "learning_rate": 1.7919595164464437e-05, + "loss": 0.056, + "step": 149220 + }, + { + "epoch": 41.96, + "learning_rate": 1.790085277855871e-05, + "loss": 0.0608, + "step": 149250 + }, + { + "epoch": 41.97, + "learning_rate": 1.7882110392652985e-05, + "loss": 0.059, + "step": 149280 + }, + { + "epoch": 41.98, + "learning_rate": 1.786336800674726e-05, + "loss": 0.0579, + "step": 149310 + }, + { + "epoch": 41.98, + "learning_rate": 1.7844625620841534e-05, + "loss": 0.0664, + "step": 149340 + }, + { + "epoch": 41.99, + "learning_rate": 1.7825883234935808e-05, + "loss": 0.0532, + "step": 149370 + }, + { + "epoch": 42.0, + "eval_loss": 0.17243234813213348, + "eval_runtime": 510.6741, + "eval_samples_per_second": 31.396, + "eval_steps_per_second": 0.983, + "eval_wer": 0.12452062833513027, + "step": 149394 + }, + { + "epoch": 42.0, + "learning_rate": 1.7807140849030082e-05, + "loss": 0.065, + "step": 149400 + }, + { + "epoch": 42.01, + "learning_rate": 1.7788398463124356e-05, + "loss": 0.0509, + "step": 149430 + }, + { + "epoch": 42.02, + "learning_rate": 1.776965607721863e-05, + "loss": 0.0653, + "step": 149460 + }, + { + "epoch": 42.03, + "learning_rate": 1.7750913691312905e-05, + "loss": 0.0577, + "step": 149490 + }, + { + "epoch": 42.04, + "learning_rate": 1.773217130540718e-05, + "loss": 0.0545, + "step": 149520 + }, + { + "epoch": 42.04, + "learning_rate": 1.7713428919501453e-05, + "loss": 0.0632, + "step": 149550 + }, + { + "epoch": 42.05, + "learning_rate": 1.7695311279792584e-05, + "loss": 0.0741, + "step": 149580 + }, + { + "epoch": 42.06, + "learning_rate": 1.767656889388686e-05, + "loss": 0.0606, + "step": 149610 + }, + { + "epoch": 42.07, + "learning_rate": 1.7658451254177992e-05, + "loss": 0.0579, + "step": 149640 + }, + { + "epoch": 42.08, + "learning_rate": 1.7639708868272263e-05, + "loss": 0.0573, + "step": 149670 + }, + { + "epoch": 42.09, + "learning_rate": 1.7620966482366537e-05, + "loss": 0.0611, + "step": 149700 + }, + { + "epoch": 42.09, + "learning_rate": 1.7602224096460815e-05, + "loss": 0.0555, + "step": 149730 + }, + { + "epoch": 42.1, + "learning_rate": 1.758348171055509e-05, + "loss": 0.0646, + "step": 149760 + }, + { + "epoch": 42.11, + "learning_rate": 1.7564739324649363e-05, + "loss": 0.0568, + "step": 149790 + }, + { + "epoch": 42.12, + "learning_rate": 1.7545996938743637e-05, + "loss": 0.0569, + "step": 149820 + }, + { + "epoch": 42.13, + "learning_rate": 1.752725455283791e-05, + "loss": 0.0643, + "step": 149850 + }, + { + "epoch": 42.14, + "learning_rate": 1.7508512166932182e-05, + "loss": 0.0523, + "step": 149880 + }, + { + "epoch": 42.15, + "learning_rate": 1.7489769781026456e-05, + "loss": 0.0598, + "step": 149910 + }, + { + "epoch": 42.15, + "learning_rate": 1.7471027395120734e-05, + "loss": 0.0607, + "step": 149940 + }, + { + "epoch": 42.16, + "learning_rate": 1.7452285009215008e-05, + "loss": 0.0533, + "step": 149970 + }, + { + "epoch": 42.17, + "learning_rate": 1.7433542623309282e-05, + "loss": 0.061, + "step": 150000 + }, + { + "epoch": 42.18, + "learning_rate": 1.7414800237403557e-05, + "loss": 0.0495, + "step": 150030 + }, + { + "epoch": 42.19, + "learning_rate": 1.739605785149783e-05, + "loss": 0.0625, + "step": 150060 + }, + { + "epoch": 42.2, + "learning_rate": 1.7377315465592105e-05, + "loss": 0.0547, + "step": 150090 + }, + { + "epoch": 42.2, + "learning_rate": 1.7358573079686376e-05, + "loss": 0.0549, + "step": 150120 + }, + { + "epoch": 42.21, + "learning_rate": 1.7339830693780653e-05, + "loss": 0.0626, + "step": 150150 + }, + { + "epoch": 42.22, + "learning_rate": 1.7321088307874928e-05, + "loss": 0.0496, + "step": 150180 + }, + { + "epoch": 42.23, + "learning_rate": 1.7302345921969202e-05, + "loss": 0.0555, + "step": 150210 + }, + { + "epoch": 42.24, + "learning_rate": 1.7283603536063476e-05, + "loss": 0.0624, + "step": 150240 + }, + { + "epoch": 42.25, + "learning_rate": 1.726486115015775e-05, + "loss": 0.057, + "step": 150270 + }, + { + "epoch": 42.25, + "learning_rate": 1.7246118764252024e-05, + "loss": 0.065, + "step": 150300 + }, + { + "epoch": 42.26, + "learning_rate": 1.7227376378346295e-05, + "loss": 0.0516, + "step": 150330 + }, + { + "epoch": 42.27, + "learning_rate": 1.7208633992440573e-05, + "loss": 0.0626, + "step": 150360 + }, + { + "epoch": 42.28, + "learning_rate": 1.7189891606534847e-05, + "loss": 0.061, + "step": 150390 + }, + { + "epoch": 42.29, + "learning_rate": 1.717114922062912e-05, + "loss": 0.0561, + "step": 150420 + }, + { + "epoch": 42.3, + "learning_rate": 1.7152406834723395e-05, + "loss": 0.0657, + "step": 150450 + }, + { + "epoch": 42.31, + "learning_rate": 1.713366444881767e-05, + "loss": 0.0559, + "step": 150480 + }, + { + "epoch": 42.31, + "learning_rate": 1.7114922062911944e-05, + "loss": 0.06, + "step": 150510 + }, + { + "epoch": 42.32, + "learning_rate": 1.7096179677006214e-05, + "loss": 0.0657, + "step": 150540 + }, + { + "epoch": 42.33, + "learning_rate": 1.7077437291100492e-05, + "loss": 0.0559, + "step": 150570 + }, + { + "epoch": 42.34, + "learning_rate": 1.7059319651391623e-05, + "loss": 0.0602, + "step": 150600 + }, + { + "epoch": 42.35, + "learning_rate": 1.7040577265485897e-05, + "loss": 0.0482, + "step": 150630 + }, + { + "epoch": 42.36, + "learning_rate": 1.702183487958017e-05, + "loss": 0.06, + "step": 150660 + }, + { + "epoch": 42.36, + "learning_rate": 1.7003092493674445e-05, + "loss": 0.06, + "step": 150690 + }, + { + "epoch": 42.37, + "learning_rate": 1.698435010776872e-05, + "loss": 0.0608, + "step": 150720 + }, + { + "epoch": 42.38, + "learning_rate": 1.6965607721862994e-05, + "loss": 0.0606, + "step": 150750 + }, + { + "epoch": 42.39, + "learning_rate": 1.6946865335957268e-05, + "loss": 0.0522, + "step": 150780 + }, + { + "epoch": 42.4, + "learning_rate": 1.6928122950051542e-05, + "loss": 0.0573, + "step": 150810 + }, + { + "epoch": 42.41, + "learning_rate": 1.6909380564145816e-05, + "loss": 0.0575, + "step": 150840 + }, + { + "epoch": 42.41, + "learning_rate": 1.689063817824009e-05, + "loss": 0.0579, + "step": 150870 + }, + { + "epoch": 42.42, + "learning_rate": 1.6871895792334365e-05, + "loss": 0.0635, + "step": 150900 + }, + { + "epoch": 42.43, + "learning_rate": 1.685315340642864e-05, + "loss": 0.0533, + "step": 150930 + }, + { + "epoch": 42.44, + "learning_rate": 1.6834411020522913e-05, + "loss": 0.0555, + "step": 150960 + }, + { + "epoch": 42.45, + "learning_rate": 1.6815668634617187e-05, + "loss": 0.0541, + "step": 150990 + }, + { + "epoch": 42.46, + "learning_rate": 1.679692624871146e-05, + "loss": 0.0573, + "step": 151020 + }, + { + "epoch": 42.47, + "learning_rate": 1.6778183862805736e-05, + "loss": 0.0667, + "step": 151050 + }, + { + "epoch": 42.47, + "learning_rate": 1.675944147690001e-05, + "loss": 0.0522, + "step": 151080 + }, + { + "epoch": 42.48, + "learning_rate": 1.6740699090994284e-05, + "loss": 0.0646, + "step": 151110 + }, + { + "epoch": 42.49, + "learning_rate": 1.6721956705088558e-05, + "loss": 0.0604, + "step": 151140 + }, + { + "epoch": 42.5, + "learning_rate": 1.6703214319182832e-05, + "loss": 0.0561, + "step": 151170 + }, + { + "epoch": 42.51, + "learning_rate": 1.6684471933277107e-05, + "loss": 0.0636, + "step": 151200 + }, + { + "epoch": 42.52, + "learning_rate": 1.666572954737138e-05, + "loss": 0.0518, + "step": 151230 + }, + { + "epoch": 42.52, + "learning_rate": 1.6646987161465655e-05, + "loss": 0.0594, + "step": 151260 + }, + { + "epoch": 42.53, + "learning_rate": 1.662824477555993e-05, + "loss": 0.0559, + "step": 151290 + }, + { + "epoch": 42.54, + "learning_rate": 1.6609502389654207e-05, + "loss": 0.0547, + "step": 151320 + }, + { + "epoch": 42.55, + "learning_rate": 1.6590760003748478e-05, + "loss": 0.066, + "step": 151350 + }, + { + "epoch": 42.56, + "learning_rate": 1.6572017617842752e-05, + "loss": 0.0541, + "step": 151380 + }, + { + "epoch": 42.57, + "learning_rate": 1.6553275231937026e-05, + "loss": 0.0618, + "step": 151410 + }, + { + "epoch": 42.58, + "learning_rate": 1.65345328460313e-05, + "loss": 0.0605, + "step": 151440 + }, + { + "epoch": 42.58, + "learning_rate": 1.6515790460125574e-05, + "loss": 0.054, + "step": 151470 + }, + { + "epoch": 42.59, + "learning_rate": 1.649704807421985e-05, + "loss": 0.0649, + "step": 151500 + }, + { + "epoch": 42.6, + "learning_rate": 1.6478305688314123e-05, + "loss": 0.0532, + "step": 151530 + }, + { + "epoch": 42.61, + "learning_rate": 1.6459563302408397e-05, + "loss": 0.0598, + "step": 151560 + }, + { + "epoch": 42.62, + "learning_rate": 1.644082091650267e-05, + "loss": 0.0595, + "step": 151590 + }, + { + "epoch": 42.63, + "learning_rate": 1.6422078530596945e-05, + "loss": 0.0566, + "step": 151620 + }, + { + "epoch": 42.63, + "learning_rate": 1.640333614469122e-05, + "loss": 0.065, + "step": 151650 + }, + { + "epoch": 42.64, + "learning_rate": 1.6384593758785494e-05, + "loss": 0.0528, + "step": 151680 + }, + { + "epoch": 42.65, + "learning_rate": 1.6365851372879768e-05, + "loss": 0.0613, + "step": 151710 + }, + { + "epoch": 42.66, + "learning_rate": 1.6347108986974042e-05, + "loss": 0.0598, + "step": 151740 + }, + { + "epoch": 42.67, + "learning_rate": 1.6328366601068316e-05, + "loss": 0.0616, + "step": 151770 + }, + { + "epoch": 42.68, + "learning_rate": 1.630962421516259e-05, + "loss": 0.0597, + "step": 151800 + }, + { + "epoch": 42.68, + "learning_rate": 1.6290881829256865e-05, + "loss": 0.0538, + "step": 151830 + }, + { + "epoch": 42.69, + "learning_rate": 1.627213944335114e-05, + "loss": 0.0593, + "step": 151860 + }, + { + "epoch": 42.7, + "learning_rate": 1.6253397057445413e-05, + "loss": 0.059, + "step": 151890 + }, + { + "epoch": 42.71, + "learning_rate": 1.6234654671539687e-05, + "loss": 0.055, + "step": 151920 + }, + { + "epoch": 42.72, + "learning_rate": 1.621591228563396e-05, + "loss": 0.0632, + "step": 151950 + }, + { + "epoch": 42.73, + "learning_rate": 1.6197169899728236e-05, + "loss": 0.0557, + "step": 151980 + }, + { + "epoch": 42.74, + "learning_rate": 1.617842751382251e-05, + "loss": 0.0612, + "step": 152010 + }, + { + "epoch": 42.74, + "learning_rate": 1.6159685127916784e-05, + "loss": 0.0629, + "step": 152040 + }, + { + "epoch": 42.75, + "learning_rate": 1.6140942742011058e-05, + "loss": 0.0619, + "step": 152070 + }, + { + "epoch": 42.76, + "learning_rate": 1.6122200356105332e-05, + "loss": 0.0692, + "step": 152100 + }, + { + "epoch": 42.77, + "learning_rate": 1.6103457970199607e-05, + "loss": 0.0527, + "step": 152130 + }, + { + "epoch": 42.78, + "learning_rate": 1.608471558429388e-05, + "loss": 0.0573, + "step": 152160 + }, + { + "epoch": 42.79, + "learning_rate": 1.606597319838816e-05, + "loss": 0.0592, + "step": 152190 + }, + { + "epoch": 42.79, + "learning_rate": 1.604723081248243e-05, + "loss": 0.056, + "step": 152220 + }, + { + "epoch": 42.8, + "learning_rate": 1.6028488426576703e-05, + "loss": 0.0651, + "step": 152250 + }, + { + "epoch": 42.81, + "learning_rate": 1.6009746040670978e-05, + "loss": 0.0556, + "step": 152280 + }, + { + "epoch": 42.82, + "learning_rate": 1.5991003654765252e-05, + "loss": 0.0595, + "step": 152310 + }, + { + "epoch": 42.83, + "learning_rate": 1.5972261268859526e-05, + "loss": 0.0586, + "step": 152340 + }, + { + "epoch": 42.84, + "learning_rate": 1.59535188829538e-05, + "loss": 0.0548, + "step": 152370 + }, + { + "epoch": 42.84, + "learning_rate": 1.5934776497048078e-05, + "loss": 0.0653, + "step": 152400 + }, + { + "epoch": 42.85, + "learning_rate": 1.591603411114235e-05, + "loss": 0.0561, + "step": 152430 + }, + { + "epoch": 42.86, + "learning_rate": 1.5897291725236623e-05, + "loss": 0.0607, + "step": 152460 + }, + { + "epoch": 42.87, + "learning_rate": 1.5878549339330897e-05, + "loss": 0.0566, + "step": 152490 + }, + { + "epoch": 42.88, + "learning_rate": 1.585980695342517e-05, + "loss": 0.0568, + "step": 152520 + }, + { + "epoch": 42.89, + "learning_rate": 1.5841064567519445e-05, + "loss": 0.0603, + "step": 152550 + }, + { + "epoch": 42.9, + "learning_rate": 1.582232218161372e-05, + "loss": 0.0559, + "step": 152580 + }, + { + "epoch": 42.9, + "learning_rate": 1.5803579795707997e-05, + "loss": 0.0677, + "step": 152610 + }, + { + "epoch": 42.91, + "learning_rate": 1.5784837409802268e-05, + "loss": 0.0572, + "step": 152640 + }, + { + "epoch": 42.92, + "learning_rate": 1.5766095023896542e-05, + "loss": 0.0584, + "step": 152670 + }, + { + "epoch": 42.93, + "learning_rate": 1.5747352637990816e-05, + "loss": 0.062, + "step": 152700 + }, + { + "epoch": 42.94, + "learning_rate": 1.572861025208509e-05, + "loss": 0.0536, + "step": 152730 + }, + { + "epoch": 42.95, + "learning_rate": 1.5709867866179365e-05, + "loss": 0.0574, + "step": 152760 + }, + { + "epoch": 42.95, + "learning_rate": 1.569112548027364e-05, + "loss": 0.0591, + "step": 152790 + }, + { + "epoch": 42.96, + "learning_rate": 1.5672383094367916e-05, + "loss": 0.0591, + "step": 152820 + }, + { + "epoch": 42.97, + "learning_rate": 1.565364070846219e-05, + "loss": 0.0623, + "step": 152850 + }, + { + "epoch": 42.98, + "learning_rate": 1.563489832255646e-05, + "loss": 0.054, + "step": 152880 + }, + { + "epoch": 42.99, + "learning_rate": 1.5616155936650736e-05, + "loss": 0.0598, + "step": 152910 + }, + { + "epoch": 43.0, + "learning_rate": 1.559741355074501e-05, + "loss": 0.0594, + "step": 152940 + }, + { + "epoch": 43.0, + "eval_loss": 0.1735638976097107, + "eval_runtime": 506.7114, + "eval_samples_per_second": 31.641, + "eval_steps_per_second": 0.991, + "eval_wer": 0.12498464645913229, + "step": 152951 + }, + { + "epoch": 43.01, + "learning_rate": 1.5578671164839284e-05, + "loss": 0.058, + "step": 152970 + }, + { + "epoch": 43.01, + "learning_rate": 1.5559928778933558e-05, + "loss": 0.0646, + "step": 153000 + }, + { + "epoch": 43.02, + "learning_rate": 1.5541186393027836e-05, + "loss": 0.0515, + "step": 153030 + }, + { + "epoch": 43.03, + "learning_rate": 1.552244400712211e-05, + "loss": 0.0589, + "step": 153060 + }, + { + "epoch": 43.04, + "learning_rate": 1.550370162121638e-05, + "loss": 0.0527, + "step": 153090 + }, + { + "epoch": 43.05, + "learning_rate": 1.5484959235310655e-05, + "loss": 0.0596, + "step": 153120 + }, + { + "epoch": 43.06, + "learning_rate": 1.546621684940493e-05, + "loss": 0.058, + "step": 153150 + }, + { + "epoch": 43.06, + "learning_rate": 1.5447474463499203e-05, + "loss": 0.0518, + "step": 153180 + }, + { + "epoch": 43.07, + "learning_rate": 1.5428732077593477e-05, + "loss": 0.0603, + "step": 153210 + }, + { + "epoch": 43.08, + "learning_rate": 1.5409989691687755e-05, + "loss": 0.0545, + "step": 153240 + }, + { + "epoch": 43.09, + "learning_rate": 1.539124730578203e-05, + "loss": 0.0763, + "step": 153270 + }, + { + "epoch": 43.1, + "learning_rate": 1.53725049198763e-05, + "loss": 0.0657, + "step": 153300 + }, + { + "epoch": 43.11, + "learning_rate": 1.5353762533970574e-05, + "loss": 0.0535, + "step": 153330 + }, + { + "epoch": 43.11, + "learning_rate": 1.533502014806485e-05, + "loss": 0.0641, + "step": 153360 + }, + { + "epoch": 43.12, + "learning_rate": 1.5316277762159123e-05, + "loss": 0.0534, + "step": 153390 + }, + { + "epoch": 43.13, + "learning_rate": 1.5297535376253397e-05, + "loss": 0.0562, + "step": 153420 + }, + { + "epoch": 43.14, + "learning_rate": 1.527879299034767e-05, + "loss": 0.0569, + "step": 153450 + }, + { + "epoch": 43.15, + "learning_rate": 1.526005060444195e-05, + "loss": 0.0514, + "step": 153480 + }, + { + "epoch": 43.16, + "learning_rate": 1.5241308218536221e-05, + "loss": 0.0619, + "step": 153510 + }, + { + "epoch": 43.17, + "learning_rate": 1.5222565832630495e-05, + "loss": 0.0569, + "step": 153540 + }, + { + "epoch": 43.17, + "learning_rate": 1.520382344672477e-05, + "loss": 0.0569, + "step": 153570 + }, + { + "epoch": 43.18, + "learning_rate": 1.5185081060819042e-05, + "loss": 0.0601, + "step": 153600 + }, + { + "epoch": 43.19, + "learning_rate": 1.5166338674913316e-05, + "loss": 0.0535, + "step": 153630 + }, + { + "epoch": 43.2, + "learning_rate": 1.514759628900759e-05, + "loss": 0.063, + "step": 153660 + }, + { + "epoch": 43.21, + "learning_rate": 1.5128853903101866e-05, + "loss": 0.0532, + "step": 153690 + }, + { + "epoch": 43.22, + "learning_rate": 1.511011151719614e-05, + "loss": 0.0586, + "step": 153720 + }, + { + "epoch": 43.22, + "learning_rate": 1.5091369131290415e-05, + "loss": 0.0607, + "step": 153750 + }, + { + "epoch": 43.23, + "learning_rate": 1.5072626745384689e-05, + "loss": 0.0506, + "step": 153780 + }, + { + "epoch": 43.24, + "learning_rate": 1.5053884359478961e-05, + "loss": 0.0633, + "step": 153810 + }, + { + "epoch": 43.25, + "learning_rate": 1.5035141973573235e-05, + "loss": 0.0569, + "step": 153840 + }, + { + "epoch": 43.26, + "learning_rate": 1.501639958766751e-05, + "loss": 0.0582, + "step": 153870 + }, + { + "epoch": 43.27, + "learning_rate": 1.4997657201761786e-05, + "loss": 0.0581, + "step": 153900 + }, + { + "epoch": 43.28, + "learning_rate": 1.497891481585606e-05, + "loss": 0.0496, + "step": 153930 + }, + { + "epoch": 43.28, + "learning_rate": 1.4960172429950334e-05, + "loss": 0.0606, + "step": 153960 + }, + { + "epoch": 43.29, + "learning_rate": 1.4941430044044608e-05, + "loss": 0.0549, + "step": 153990 + }, + { + "epoch": 43.3, + "learning_rate": 1.492268765813888e-05, + "loss": 0.0587, + "step": 154020 + }, + { + "epoch": 43.31, + "learning_rate": 1.4903945272233155e-05, + "loss": 0.065, + "step": 154050 + }, + { + "epoch": 43.32, + "learning_rate": 1.4885202886327429e-05, + "loss": 0.0527, + "step": 154080 + }, + { + "epoch": 43.33, + "learning_rate": 1.4866460500421705e-05, + "loss": 0.0596, + "step": 154110 + }, + { + "epoch": 43.33, + "learning_rate": 1.4847718114515979e-05, + "loss": 0.0544, + "step": 154140 + }, + { + "epoch": 43.34, + "learning_rate": 1.4828975728610253e-05, + "loss": 0.0581, + "step": 154170 + }, + { + "epoch": 43.35, + "learning_rate": 1.4810233342704527e-05, + "loss": 0.0574, + "step": 154200 + }, + { + "epoch": 43.36, + "learning_rate": 1.4791490956798802e-05, + "loss": 0.0519, + "step": 154230 + }, + { + "epoch": 43.37, + "learning_rate": 1.4772748570893074e-05, + "loss": 0.0609, + "step": 154260 + }, + { + "epoch": 43.38, + "learning_rate": 1.4754006184987348e-05, + "loss": 0.054, + "step": 154290 + }, + { + "epoch": 43.38, + "learning_rate": 1.4735263799081626e-05, + "loss": 0.0565, + "step": 154320 + }, + { + "epoch": 43.39, + "learning_rate": 1.4716521413175898e-05, + "loss": 0.06, + "step": 154350 + }, + { + "epoch": 43.4, + "learning_rate": 1.4697779027270173e-05, + "loss": 0.0529, + "step": 154380 + }, + { + "epoch": 43.41, + "learning_rate": 1.4679036641364447e-05, + "loss": 0.0611, + "step": 154410 + }, + { + "epoch": 43.42, + "learning_rate": 1.4660294255458721e-05, + "loss": 0.0519, + "step": 154440 + }, + { + "epoch": 43.43, + "learning_rate": 1.4641551869552993e-05, + "loss": 0.0566, + "step": 154470 + }, + { + "epoch": 43.44, + "learning_rate": 1.4622809483647268e-05, + "loss": 0.0599, + "step": 154500 + }, + { + "epoch": 43.44, + "learning_rate": 1.4604067097741545e-05, + "loss": 0.0513, + "step": 154530 + }, + { + "epoch": 43.45, + "learning_rate": 1.4585324711835818e-05, + "loss": 0.0621, + "step": 154560 + }, + { + "epoch": 43.46, + "learning_rate": 1.4566582325930092e-05, + "loss": 0.0563, + "step": 154590 + }, + { + "epoch": 43.47, + "learning_rate": 1.4547839940024366e-05, + "loss": 0.0609, + "step": 154620 + }, + { + "epoch": 43.48, + "learning_rate": 1.452909755411864e-05, + "loss": 0.0577, + "step": 154650 + }, + { + "epoch": 43.49, + "learning_rate": 1.4510355168212913e-05, + "loss": 0.0541, + "step": 154680 + }, + { + "epoch": 43.49, + "learning_rate": 1.4491612782307187e-05, + "loss": 0.0621, + "step": 154710 + }, + { + "epoch": 43.5, + "learning_rate": 1.4472870396401465e-05, + "loss": 0.0534, + "step": 154740 + }, + { + "epoch": 43.51, + "learning_rate": 1.4454128010495737e-05, + "loss": 0.0585, + "step": 154770 + }, + { + "epoch": 43.52, + "learning_rate": 1.4435385624590011e-05, + "loss": 0.0571, + "step": 154800 + }, + { + "epoch": 43.53, + "learning_rate": 1.4416643238684285e-05, + "loss": 0.0563, + "step": 154830 + }, + { + "epoch": 43.54, + "learning_rate": 1.439790085277856e-05, + "loss": 0.0591, + "step": 154860 + }, + { + "epoch": 43.55, + "learning_rate": 1.4379158466872834e-05, + "loss": 0.06, + "step": 154890 + }, + { + "epoch": 43.55, + "learning_rate": 1.4360416080967106e-05, + "loss": 0.0647, + "step": 154920 + }, + { + "epoch": 43.56, + "learning_rate": 1.4341673695061384e-05, + "loss": 0.0583, + "step": 154950 + }, + { + "epoch": 43.57, + "learning_rate": 1.4322931309155656e-05, + "loss": 0.0507, + "step": 154980 + }, + { + "epoch": 43.58, + "learning_rate": 1.430418892324993e-05, + "loss": 0.063, + "step": 155010 + }, + { + "epoch": 43.59, + "learning_rate": 1.4285446537344205e-05, + "loss": 0.0525, + "step": 155040 + }, + { + "epoch": 43.6, + "learning_rate": 1.4266704151438479e-05, + "loss": 0.0562, + "step": 155070 + }, + { + "epoch": 43.6, + "learning_rate": 1.4247961765532753e-05, + "loss": 0.0595, + "step": 155100 + }, + { + "epoch": 43.61, + "learning_rate": 1.4229219379627026e-05, + "loss": 0.0555, + "step": 155130 + }, + { + "epoch": 43.62, + "learning_rate": 1.42104769937213e-05, + "loss": 0.0622, + "step": 155160 + }, + { + "epoch": 43.63, + "learning_rate": 1.4191734607815577e-05, + "loss": 0.0581, + "step": 155190 + }, + { + "epoch": 43.64, + "learning_rate": 1.417299222190985e-05, + "loss": 0.0565, + "step": 155220 + }, + { + "epoch": 43.65, + "learning_rate": 1.4154249836004124e-05, + "loss": 0.0633, + "step": 155250 + }, + { + "epoch": 43.65, + "learning_rate": 1.4135507450098398e-05, + "loss": 0.053, + "step": 155280 + }, + { + "epoch": 43.66, + "learning_rate": 1.4116765064192672e-05, + "loss": 0.0616, + "step": 155310 + }, + { + "epoch": 43.67, + "learning_rate": 1.4098022678286945e-05, + "loss": 0.0551, + "step": 155340 + }, + { + "epoch": 43.68, + "learning_rate": 1.4079280292381219e-05, + "loss": 0.0575, + "step": 155370 + }, + { + "epoch": 43.69, + "learning_rate": 1.4060537906475497e-05, + "loss": 0.0622, + "step": 155400 + }, + { + "epoch": 43.7, + "learning_rate": 1.404179552056977e-05, + "loss": 0.0535, + "step": 155430 + }, + { + "epoch": 43.71, + "learning_rate": 1.4023053134664043e-05, + "loss": 0.0651, + "step": 155460 + }, + { + "epoch": 43.71, + "learning_rate": 1.4004310748758318e-05, + "loss": 0.0561, + "step": 155490 + }, + { + "epoch": 43.72, + "learning_rate": 1.3985568362852592e-05, + "loss": 0.056, + "step": 155520 + }, + { + "epoch": 43.73, + "learning_rate": 1.3966825976946864e-05, + "loss": 0.0572, + "step": 155550 + }, + { + "epoch": 43.74, + "learning_rate": 1.3948083591041138e-05, + "loss": 0.0556, + "step": 155580 + }, + { + "epoch": 43.75, + "learning_rate": 1.3929341205135416e-05, + "loss": 0.0617, + "step": 155610 + }, + { + "epoch": 43.76, + "learning_rate": 1.3910598819229689e-05, + "loss": 0.0533, + "step": 155640 + }, + { + "epoch": 43.76, + "learning_rate": 1.3891856433323963e-05, + "loss": 0.0672, + "step": 155670 + }, + { + "epoch": 43.77, + "learning_rate": 1.3873114047418237e-05, + "loss": 0.0613, + "step": 155700 + }, + { + "epoch": 43.78, + "learning_rate": 1.3854371661512511e-05, + "loss": 0.055, + "step": 155730 + }, + { + "epoch": 43.79, + "learning_rate": 1.3835629275606785e-05, + "loss": 0.0598, + "step": 155760 + }, + { + "epoch": 43.8, + "learning_rate": 1.3816886889701058e-05, + "loss": 0.0558, + "step": 155790 + }, + { + "epoch": 43.81, + "learning_rate": 1.3798144503795335e-05, + "loss": 0.0637, + "step": 155820 + }, + { + "epoch": 43.81, + "learning_rate": 1.377940211788961e-05, + "loss": 0.0619, + "step": 155850 + }, + { + "epoch": 43.82, + "learning_rate": 1.3760659731983882e-05, + "loss": 0.0494, + "step": 155880 + }, + { + "epoch": 43.83, + "learning_rate": 1.3741917346078156e-05, + "loss": 0.0653, + "step": 155910 + }, + { + "epoch": 43.84, + "learning_rate": 1.372317496017243e-05, + "loss": 0.0554, + "step": 155940 + }, + { + "epoch": 43.85, + "learning_rate": 1.3704432574266705e-05, + "loss": 0.0629, + "step": 155970 + }, + { + "epoch": 43.86, + "learning_rate": 1.3685690188360977e-05, + "loss": 0.0594, + "step": 156000 + }, + { + "epoch": 43.87, + "learning_rate": 1.3666947802455255e-05, + "loss": 0.0552, + "step": 156030 + }, + { + "epoch": 43.87, + "learning_rate": 1.3648205416549529e-05, + "loss": 0.0632, + "step": 156060 + }, + { + "epoch": 43.88, + "learning_rate": 1.3629463030643801e-05, + "loss": 0.0565, + "step": 156090 + }, + { + "epoch": 43.89, + "learning_rate": 1.3610720644738076e-05, + "loss": 0.0563, + "step": 156120 + }, + { + "epoch": 43.9, + "learning_rate": 1.359197825883235e-05, + "loss": 0.0622, + "step": 156150 + }, + { + "epoch": 43.91, + "learning_rate": 1.3573235872926624e-05, + "loss": 0.0528, + "step": 156180 + }, + { + "epoch": 43.92, + "learning_rate": 1.3554493487020896e-05, + "loss": 0.0609, + "step": 156210 + }, + { + "epoch": 43.92, + "learning_rate": 1.353637584731203e-05, + "loss": 0.0729, + "step": 156240 + }, + { + "epoch": 43.93, + "learning_rate": 1.3517633461406303e-05, + "loss": 0.0566, + "step": 156270 + }, + { + "epoch": 43.94, + "learning_rate": 1.3498891075500577e-05, + "loss": 0.0588, + "step": 156300 + }, + { + "epoch": 43.95, + "learning_rate": 1.3480148689594852e-05, + "loss": 0.052, + "step": 156330 + }, + { + "epoch": 43.96, + "learning_rate": 1.3461406303689127e-05, + "loss": 0.0612, + "step": 156360 + }, + { + "epoch": 43.97, + "learning_rate": 1.3442663917783402e-05, + "loss": 0.0516, + "step": 156390 + }, + { + "epoch": 43.98, + "learning_rate": 1.3423921531877676e-05, + "loss": 0.058, + "step": 156420 + }, + { + "epoch": 43.98, + "learning_rate": 1.340517914597195e-05, + "loss": 0.058, + "step": 156450 + }, + { + "epoch": 43.99, + "learning_rate": 1.3386436760066223e-05, + "loss": 0.0544, + "step": 156480 + }, + { + "epoch": 44.0, + "eval_loss": 0.17437909543514252, + "eval_runtime": 509.2768, + "eval_samples_per_second": 31.482, + "eval_steps_per_second": 0.986, + "eval_wer": 0.1237768345775388, + "step": 156508 + }, + { + "epoch": 44.0, + "learning_rate": 1.3367694374160497e-05, + "loss": 0.0637, + "step": 156510 + }, + { + "epoch": 44.01, + "learning_rate": 1.3348951988254771e-05, + "loss": 0.049, + "step": 156540 + }, + { + "epoch": 44.02, + "learning_rate": 1.3330209602349047e-05, + "loss": 0.0665, + "step": 156570 + }, + { + "epoch": 44.03, + "learning_rate": 1.3311467216443321e-05, + "loss": 0.058, + "step": 156600 + }, + { + "epoch": 44.03, + "learning_rate": 1.3292724830537595e-05, + "loss": 0.0575, + "step": 156630 + }, + { + "epoch": 44.04, + "learning_rate": 1.327398244463187e-05, + "loss": 0.0585, + "step": 156660 + }, + { + "epoch": 44.05, + "learning_rate": 1.3255240058726144e-05, + "loss": 0.0499, + "step": 156690 + }, + { + "epoch": 44.06, + "learning_rate": 1.3236497672820416e-05, + "loss": 0.0607, + "step": 156720 + }, + { + "epoch": 44.07, + "learning_rate": 1.321775528691469e-05, + "loss": 0.0541, + "step": 156750 + }, + { + "epoch": 44.08, + "learning_rate": 1.3199012901008966e-05, + "loss": 0.0554, + "step": 156780 + }, + { + "epoch": 44.08, + "learning_rate": 1.318027051510324e-05, + "loss": 0.0599, + "step": 156810 + }, + { + "epoch": 44.09, + "learning_rate": 1.3161528129197515e-05, + "loss": 0.0511, + "step": 156840 + }, + { + "epoch": 44.1, + "learning_rate": 1.3142785743291789e-05, + "loss": 0.0618, + "step": 156870 + }, + { + "epoch": 44.11, + "learning_rate": 1.3124043357386063e-05, + "loss": 0.0551, + "step": 156900 + }, + { + "epoch": 44.12, + "learning_rate": 1.3105300971480335e-05, + "loss": 0.051, + "step": 156930 + }, + { + "epoch": 44.13, + "learning_rate": 1.308655858557461e-05, + "loss": 0.0605, + "step": 156960 + }, + { + "epoch": 44.14, + "learning_rate": 1.3067816199668887e-05, + "loss": 0.055, + "step": 156990 + }, + { + "epoch": 44.14, + "learning_rate": 1.304907381376316e-05, + "loss": 0.0584, + "step": 157020 + }, + { + "epoch": 44.15, + "learning_rate": 1.3030331427857434e-05, + "loss": 0.0567, + "step": 157050 + }, + { + "epoch": 44.16, + "learning_rate": 1.3011589041951708e-05, + "loss": 0.0541, + "step": 157080 + }, + { + "epoch": 44.17, + "learning_rate": 1.2992846656045982e-05, + "loss": 0.0606, + "step": 157110 + }, + { + "epoch": 44.18, + "learning_rate": 1.2974104270140255e-05, + "loss": 0.0478, + "step": 157140 + }, + { + "epoch": 44.19, + "learning_rate": 1.2955361884234529e-05, + "loss": 0.0612, + "step": 157170 + }, + { + "epoch": 44.19, + "learning_rate": 1.2936619498328806e-05, + "loss": 0.0552, + "step": 157200 + }, + { + "epoch": 44.2, + "learning_rate": 1.2917877112423079e-05, + "loss": 0.0547, + "step": 157230 + }, + { + "epoch": 44.21, + "learning_rate": 1.2899134726517353e-05, + "loss": 0.0606, + "step": 157260 + }, + { + "epoch": 44.22, + "learning_rate": 1.2880392340611627e-05, + "loss": 0.0454, + "step": 157290 + }, + { + "epoch": 44.23, + "learning_rate": 1.2861649954705902e-05, + "loss": 0.0611, + "step": 157320 + }, + { + "epoch": 44.24, + "learning_rate": 1.2842907568800174e-05, + "loss": 0.0572, + "step": 157350 + }, + { + "epoch": 44.25, + "learning_rate": 1.2824165182894448e-05, + "loss": 0.0582, + "step": 157380 + }, + { + "epoch": 44.25, + "learning_rate": 1.2805422796988726e-05, + "loss": 0.0657, + "step": 157410 + }, + { + "epoch": 44.26, + "learning_rate": 1.2786680411082998e-05, + "loss": 0.0498, + "step": 157440 + }, + { + "epoch": 44.27, + "learning_rate": 1.2767938025177273e-05, + "loss": 0.0617, + "step": 157470 + }, + { + "epoch": 44.28, + "learning_rate": 1.2749195639271547e-05, + "loss": 0.0553, + "step": 157500 + }, + { + "epoch": 44.29, + "learning_rate": 1.2730453253365821e-05, + "loss": 0.0577, + "step": 157530 + }, + { + "epoch": 44.3, + "learning_rate": 1.2711710867460095e-05, + "loss": 0.0607, + "step": 157560 + }, + { + "epoch": 44.3, + "learning_rate": 1.2692968481554368e-05, + "loss": 0.0551, + "step": 157590 + }, + { + "epoch": 44.31, + "learning_rate": 1.2674226095648645e-05, + "loss": 0.0598, + "step": 157620 + }, + { + "epoch": 44.32, + "learning_rate": 1.265548370974292e-05, + "loss": 0.0538, + "step": 157650 + }, + { + "epoch": 44.33, + "learning_rate": 1.2636741323837192e-05, + "loss": 0.0581, + "step": 157680 + }, + { + "epoch": 44.34, + "learning_rate": 1.2617998937931466e-05, + "loss": 0.0622, + "step": 157710 + }, + { + "epoch": 44.35, + "learning_rate": 1.259925655202574e-05, + "loss": 0.0542, + "step": 157740 + }, + { + "epoch": 44.35, + "learning_rate": 1.2580514166120014e-05, + "loss": 0.0617, + "step": 157770 + }, + { + "epoch": 44.36, + "learning_rate": 1.2561771780214287e-05, + "loss": 0.0519, + "step": 157800 + }, + { + "epoch": 44.37, + "learning_rate": 1.2543029394308561e-05, + "loss": 0.0595, + "step": 157830 + }, + { + "epoch": 44.38, + "learning_rate": 1.2524287008402839e-05, + "loss": 0.0653, + "step": 157860 + }, + { + "epoch": 44.39, + "learning_rate": 1.2505544622497111e-05, + "loss": 0.0531, + "step": 157890 + }, + { + "epoch": 44.4, + "learning_rate": 1.2486802236591385e-05, + "loss": 0.0593, + "step": 157920 + }, + { + "epoch": 44.41, + "learning_rate": 1.246805985068566e-05, + "loss": 0.0545, + "step": 157950 + }, + { + "epoch": 44.41, + "learning_rate": 1.2449317464779934e-05, + "loss": 0.0569, + "step": 157980 + }, + { + "epoch": 44.42, + "learning_rate": 1.2430575078874208e-05, + "loss": 0.0627, + "step": 158010 + }, + { + "epoch": 44.43, + "learning_rate": 1.2411832692968482e-05, + "loss": 0.054, + "step": 158040 + }, + { + "epoch": 44.44, + "learning_rate": 1.2393090307062756e-05, + "loss": 0.0552, + "step": 158070 + }, + { + "epoch": 44.45, + "learning_rate": 1.237434792115703e-05, + "loss": 0.0522, + "step": 158100 + }, + { + "epoch": 44.46, + "learning_rate": 1.2355605535251305e-05, + "loss": 0.0571, + "step": 158130 + }, + { + "epoch": 44.46, + "learning_rate": 1.2336863149345579e-05, + "loss": 0.0617, + "step": 158160 + }, + { + "epoch": 44.47, + "learning_rate": 1.2318120763439853e-05, + "loss": 0.054, + "step": 158190 + }, + { + "epoch": 44.48, + "learning_rate": 1.2299378377534127e-05, + "loss": 0.0623, + "step": 158220 + }, + { + "epoch": 44.49, + "learning_rate": 1.2280635991628401e-05, + "loss": 0.0538, + "step": 158250 + }, + { + "epoch": 44.5, + "learning_rate": 1.2261893605722676e-05, + "loss": 0.0541, + "step": 158280 + }, + { + "epoch": 44.51, + "learning_rate": 1.224315121981695e-05, + "loss": 0.0589, + "step": 158310 + }, + { + "epoch": 44.51, + "learning_rate": 1.2224408833911224e-05, + "loss": 0.0503, + "step": 158340 + }, + { + "epoch": 44.52, + "learning_rate": 1.2205666448005498e-05, + "loss": 0.0572, + "step": 158370 + }, + { + "epoch": 44.53, + "learning_rate": 1.2186924062099772e-05, + "loss": 0.0564, + "step": 158400 + }, + { + "epoch": 44.54, + "learning_rate": 1.2168181676194047e-05, + "loss": 0.0558, + "step": 158430 + }, + { + "epoch": 44.55, + "learning_rate": 1.214943929028832e-05, + "loss": 0.0608, + "step": 158460 + }, + { + "epoch": 44.56, + "learning_rate": 1.2130696904382595e-05, + "loss": 0.0498, + "step": 158490 + }, + { + "epoch": 44.57, + "learning_rate": 1.211195451847687e-05, + "loss": 0.0609, + "step": 158520 + }, + { + "epoch": 44.57, + "learning_rate": 1.2093212132571143e-05, + "loss": 0.0531, + "step": 158550 + }, + { + "epoch": 44.58, + "learning_rate": 1.2074469746665418e-05, + "loss": 0.0563, + "step": 158580 + }, + { + "epoch": 44.59, + "learning_rate": 1.2055727360759692e-05, + "loss": 0.0602, + "step": 158610 + }, + { + "epoch": 44.6, + "learning_rate": 1.2036984974853966e-05, + "loss": 0.0506, + "step": 158640 + }, + { + "epoch": 44.61, + "learning_rate": 1.201824258894824e-05, + "loss": 0.0606, + "step": 158670 + }, + { + "epoch": 44.62, + "learning_rate": 1.1999500203042514e-05, + "loss": 0.0543, + "step": 158700 + }, + { + "epoch": 44.62, + "learning_rate": 1.1980757817136789e-05, + "loss": 0.0563, + "step": 158730 + }, + { + "epoch": 44.63, + "learning_rate": 1.1962015431231063e-05, + "loss": 0.066, + "step": 158760 + }, + { + "epoch": 44.64, + "learning_rate": 1.1943273045325337e-05, + "loss": 0.0493, + "step": 158790 + }, + { + "epoch": 44.65, + "learning_rate": 1.1924530659419611e-05, + "loss": 0.0626, + "step": 158820 + }, + { + "epoch": 44.66, + "learning_rate": 1.1905788273513887e-05, + "loss": 0.0517, + "step": 158850 + }, + { + "epoch": 44.67, + "learning_rate": 1.188704588760816e-05, + "loss": 0.0547, + "step": 158880 + }, + { + "epoch": 44.68, + "learning_rate": 1.1868303501702434e-05, + "loss": 0.0585, + "step": 158910 + }, + { + "epoch": 44.68, + "learning_rate": 1.1849561115796708e-05, + "loss": 0.0493, + "step": 158940 + }, + { + "epoch": 44.69, + "learning_rate": 1.1830818729890982e-05, + "loss": 0.0568, + "step": 158970 + }, + { + "epoch": 44.7, + "learning_rate": 1.1812076343985256e-05, + "loss": 0.0549, + "step": 159000 + }, + { + "epoch": 44.71, + "learning_rate": 1.179333395807953e-05, + "loss": 0.0556, + "step": 159030 + }, + { + "epoch": 44.72, + "learning_rate": 1.1774591572173805e-05, + "loss": 0.0627, + "step": 159060 + }, + { + "epoch": 44.73, + "learning_rate": 1.1755849186268079e-05, + "loss": 0.0494, + "step": 159090 + }, + { + "epoch": 44.73, + "learning_rate": 1.1737106800362353e-05, + "loss": 0.0618, + "step": 159120 + }, + { + "epoch": 44.74, + "learning_rate": 1.1718364414456627e-05, + "loss": 0.0573, + "step": 159150 + }, + { + "epoch": 44.75, + "learning_rate": 1.1699622028550903e-05, + "loss": 0.0555, + "step": 159180 + }, + { + "epoch": 44.76, + "learning_rate": 1.1680879642645176e-05, + "loss": 0.0565, + "step": 159210 + }, + { + "epoch": 44.77, + "learning_rate": 1.166213725673945e-05, + "loss": 0.0532, + "step": 159240 + }, + { + "epoch": 44.78, + "learning_rate": 1.1643394870833724e-05, + "loss": 0.0633, + "step": 159270 + }, + { + "epoch": 44.78, + "learning_rate": 1.1624652484927998e-05, + "loss": 0.0493, + "step": 159300 + }, + { + "epoch": 44.79, + "learning_rate": 1.1605910099022272e-05, + "loss": 0.0591, + "step": 159330 + }, + { + "epoch": 44.8, + "learning_rate": 1.1587167713116547e-05, + "loss": 0.0632, + "step": 159360 + }, + { + "epoch": 44.81, + "learning_rate": 1.1568425327210822e-05, + "loss": 0.049, + "step": 159390 + }, + { + "epoch": 44.82, + "learning_rate": 1.1549682941305095e-05, + "loss": 0.0626, + "step": 159420 + }, + { + "epoch": 44.83, + "learning_rate": 1.1530940555399369e-05, + "loss": 0.0528, + "step": 159450 + }, + { + "epoch": 44.84, + "learning_rate": 1.1512198169493643e-05, + "loss": 0.0589, + "step": 159480 + }, + { + "epoch": 44.84, + "learning_rate": 1.149345578358792e-05, + "loss": 0.0589, + "step": 159510 + }, + { + "epoch": 44.85, + "learning_rate": 1.1474713397682192e-05, + "loss": 0.0497, + "step": 159540 + }, + { + "epoch": 44.86, + "learning_rate": 1.1455971011776466e-05, + "loss": 0.0609, + "step": 159570 + }, + { + "epoch": 44.87, + "learning_rate": 1.1437228625870742e-05, + "loss": 0.0542, + "step": 159600 + }, + { + "epoch": 44.88, + "learning_rate": 1.1418486239965014e-05, + "loss": 0.0564, + "step": 159630 + }, + { + "epoch": 44.89, + "learning_rate": 1.1399743854059288e-05, + "loss": 0.0622, + "step": 159660 + }, + { + "epoch": 44.89, + "learning_rate": 1.1381001468153563e-05, + "loss": 0.05, + "step": 159690 + }, + { + "epoch": 44.9, + "learning_rate": 1.1362259082247839e-05, + "loss": 0.059, + "step": 159720 + }, + { + "epoch": 44.91, + "learning_rate": 1.1343516696342111e-05, + "loss": 0.0544, + "step": 159750 + }, + { + "epoch": 44.92, + "learning_rate": 1.1324774310436385e-05, + "loss": 0.0565, + "step": 159780 + }, + { + "epoch": 44.93, + "learning_rate": 1.1306031924530661e-05, + "loss": 0.0603, + "step": 159810 + }, + { + "epoch": 44.94, + "learning_rate": 1.1287289538624935e-05, + "loss": 0.0492, + "step": 159840 + }, + { + "epoch": 44.95, + "learning_rate": 1.1268547152719208e-05, + "loss": 0.0571, + "step": 159870 + }, + { + "epoch": 44.95, + "learning_rate": 1.1249804766813482e-05, + "loss": 0.0561, + "step": 159900 + }, + { + "epoch": 44.96, + "learning_rate": 1.1231062380907758e-05, + "loss": 0.0554, + "step": 159930 + }, + { + "epoch": 44.97, + "learning_rate": 1.121231999500203e-05, + "loss": 0.0617, + "step": 159960 + }, + { + "epoch": 44.98, + "learning_rate": 1.1193577609096305e-05, + "loss": 0.0534, + "step": 159990 + }, + { + "epoch": 44.99, + "learning_rate": 1.1174835223190579e-05, + "loss": 0.0629, + "step": 160020 + }, + { + "epoch": 45.0, + "learning_rate": 1.1156092837284855e-05, + "loss": 0.0559, + "step": 160050 + }, + { + "epoch": 45.0, + "eval_loss": 0.1769741326570511, + "eval_runtime": 534.7373, + "eval_samples_per_second": 29.983, + "eval_steps_per_second": 0.939, + "eval_wer": 0.1232309309022423, + "step": 160065 + }, + { + "epoch": 45.0, + "learning_rate": 1.1137350451379127e-05, + "loss": 0.058, + "step": 160080 + }, + { + "epoch": 45.01, + "learning_rate": 1.1118608065473401e-05, + "loss": 0.0529, + "step": 160110 + }, + { + "epoch": 45.02, + "learning_rate": 1.1099865679567677e-05, + "loss": 0.0541, + "step": 160140 + }, + { + "epoch": 45.03, + "learning_rate": 1.108112329366195e-05, + "loss": 0.0572, + "step": 160170 + }, + { + "epoch": 45.04, + "learning_rate": 1.1062380907756224e-05, + "loss": 0.0506, + "step": 160200 + }, + { + "epoch": 45.05, + "learning_rate": 1.1043638521850498e-05, + "loss": 0.057, + "step": 160230 + }, + { + "epoch": 45.05, + "learning_rate": 1.1024896135944774e-05, + "loss": 0.0572, + "step": 160260 + }, + { + "epoch": 45.06, + "learning_rate": 1.1006153750039046e-05, + "loss": 0.0508, + "step": 160290 + }, + { + "epoch": 45.07, + "learning_rate": 1.098741136413332e-05, + "loss": 0.0617, + "step": 160320 + }, + { + "epoch": 45.08, + "learning_rate": 1.0968668978227597e-05, + "loss": 0.0488, + "step": 160350 + }, + { + "epoch": 45.09, + "learning_rate": 1.094992659232187e-05, + "loss": 0.0569, + "step": 160380 + }, + { + "epoch": 45.1, + "learning_rate": 1.0931184206416143e-05, + "loss": 0.0547, + "step": 160410 + }, + { + "epoch": 45.11, + "learning_rate": 1.0912441820510417e-05, + "loss": 0.0544, + "step": 160440 + }, + { + "epoch": 45.11, + "learning_rate": 1.0893699434604693e-05, + "loss": 0.0601, + "step": 160470 + }, + { + "epoch": 45.12, + "learning_rate": 1.0874957048698966e-05, + "loss": 0.0528, + "step": 160500 + }, + { + "epoch": 45.13, + "learning_rate": 1.085621466279324e-05, + "loss": 0.0533, + "step": 160530 + }, + { + "epoch": 45.14, + "learning_rate": 1.0838097023084372e-05, + "loss": 0.0542, + "step": 160560 + }, + { + "epoch": 45.15, + "learning_rate": 1.0819354637178647e-05, + "loss": 0.0509, + "step": 160590 + }, + { + "epoch": 45.16, + "learning_rate": 1.0800612251272921e-05, + "loss": 0.0604, + "step": 160620 + }, + { + "epoch": 45.16, + "learning_rate": 1.0781869865367195e-05, + "loss": 0.0529, + "step": 160650 + }, + { + "epoch": 45.17, + "learning_rate": 1.0763752225658328e-05, + "loss": 0.0732, + "step": 160680 + }, + { + "epoch": 45.18, + "learning_rate": 1.0745009839752602e-05, + "loss": 0.0576, + "step": 160710 + }, + { + "epoch": 45.19, + "learning_rate": 1.0726267453846874e-05, + "loss": 0.0511, + "step": 160740 + }, + { + "epoch": 45.2, + "learning_rate": 1.0707525067941148e-05, + "loss": 0.0603, + "step": 160770 + }, + { + "epoch": 45.21, + "learning_rate": 1.0688782682035424e-05, + "loss": 0.0513, + "step": 160800 + }, + { + "epoch": 45.22, + "learning_rate": 1.0670040296129699e-05, + "loss": 0.0604, + "step": 160830 + }, + { + "epoch": 45.22, + "learning_rate": 1.0651297910223971e-05, + "loss": 0.0523, + "step": 160860 + }, + { + "epoch": 45.23, + "learning_rate": 1.0632555524318247e-05, + "loss": 0.0555, + "step": 160890 + }, + { + "epoch": 45.24, + "learning_rate": 1.0613813138412521e-05, + "loss": 0.0621, + "step": 160920 + }, + { + "epoch": 45.25, + "learning_rate": 1.0595070752506794e-05, + "loss": 0.0495, + "step": 160950 + }, + { + "epoch": 45.26, + "learning_rate": 1.0576328366601068e-05, + "loss": 0.0579, + "step": 160980 + }, + { + "epoch": 45.27, + "learning_rate": 1.0557585980695344e-05, + "loss": 0.0576, + "step": 161010 + }, + { + "epoch": 45.27, + "learning_rate": 1.0538843594789618e-05, + "loss": 0.054, + "step": 161040 + }, + { + "epoch": 45.28, + "learning_rate": 1.052010120888389e-05, + "loss": 0.0584, + "step": 161070 + }, + { + "epoch": 45.29, + "learning_rate": 1.0501358822978166e-05, + "loss": 0.0493, + "step": 161100 + }, + { + "epoch": 45.3, + "learning_rate": 1.048261643707244e-05, + "loss": 0.0602, + "step": 161130 + }, + { + "epoch": 45.31, + "learning_rate": 1.0463874051166715e-05, + "loss": 0.0564, + "step": 161160 + }, + { + "epoch": 45.32, + "learning_rate": 1.0445131665260987e-05, + "loss": 0.0517, + "step": 161190 + }, + { + "epoch": 45.32, + "learning_rate": 1.0426389279355263e-05, + "loss": 0.0614, + "step": 161220 + }, + { + "epoch": 45.33, + "learning_rate": 1.0407646893449537e-05, + "loss": 0.0488, + "step": 161250 + }, + { + "epoch": 45.34, + "learning_rate": 1.038890450754381e-05, + "loss": 0.0553, + "step": 161280 + }, + { + "epoch": 45.35, + "learning_rate": 1.0370162121638086e-05, + "loss": 0.058, + "step": 161310 + }, + { + "epoch": 45.36, + "learning_rate": 1.035141973573236e-05, + "loss": 0.0557, + "step": 161340 + }, + { + "epoch": 45.37, + "learning_rate": 1.0332677349826634e-05, + "loss": 0.061, + "step": 161370 + }, + { + "epoch": 45.38, + "learning_rate": 1.0313934963920906e-05, + "loss": 0.0514, + "step": 161400 + }, + { + "epoch": 45.38, + "learning_rate": 1.029581732421204e-05, + "loss": 0.0803, + "step": 161430 + }, + { + "epoch": 45.39, + "learning_rate": 1.0277074938306313e-05, + "loss": 0.0538, + "step": 161460 + }, + { + "epoch": 45.4, + "learning_rate": 1.0258332552400587e-05, + "loss": 0.0548, + "step": 161490 + }, + { + "epoch": 45.41, + "learning_rate": 1.0239590166494863e-05, + "loss": 0.0611, + "step": 161520 + }, + { + "epoch": 45.42, + "learning_rate": 1.0220847780589136e-05, + "loss": 0.0488, + "step": 161550 + }, + { + "epoch": 45.43, + "learning_rate": 1.020210539468341e-05, + "loss": 0.0586, + "step": 161580 + }, + { + "epoch": 45.43, + "learning_rate": 1.0183363008777684e-05, + "loss": 0.0536, + "step": 161610 + }, + { + "epoch": 45.44, + "learning_rate": 1.016462062287196e-05, + "loss": 0.0543, + "step": 161640 + }, + { + "epoch": 45.45, + "learning_rate": 1.0145878236966232e-05, + "loss": 0.0645, + "step": 161670 + }, + { + "epoch": 45.46, + "learning_rate": 1.0127135851060507e-05, + "loss": 0.0513, + "step": 161700 + }, + { + "epoch": 45.47, + "learning_rate": 1.010839346515478e-05, + "loss": 0.0576, + "step": 161730 + }, + { + "epoch": 45.48, + "learning_rate": 1.0089651079249057e-05, + "loss": 0.0545, + "step": 161760 + }, + { + "epoch": 45.48, + "learning_rate": 1.007090869334333e-05, + "loss": 0.0539, + "step": 161790 + }, + { + "epoch": 45.49, + "learning_rate": 1.0052166307437603e-05, + "loss": 0.0629, + "step": 161820 + }, + { + "epoch": 45.5, + "learning_rate": 1.003342392153188e-05, + "loss": 0.0551, + "step": 161850 + }, + { + "epoch": 45.51, + "learning_rate": 1.0014681535626152e-05, + "loss": 0.0568, + "step": 161880 + }, + { + "epoch": 45.52, + "learning_rate": 9.995939149720426e-06, + "loss": 0.0542, + "step": 161910 + }, + { + "epoch": 45.53, + "learning_rate": 9.9771967638147e-06, + "loss": 0.0511, + "step": 161940 + }, + { + "epoch": 45.54, + "learning_rate": 9.958454377908976e-06, + "loss": 0.0594, + "step": 161970 + }, + { + "epoch": 45.54, + "learning_rate": 9.939711992003249e-06, + "loss": 0.0499, + "step": 162000 + }, + { + "epoch": 45.55, + "learning_rate": 9.920969606097523e-06, + "loss": 0.0568, + "step": 162030 + }, + { + "epoch": 45.56, + "learning_rate": 9.902227220191799e-06, + "loss": 0.0549, + "step": 162060 + }, + { + "epoch": 45.57, + "learning_rate": 9.883484834286071e-06, + "loss": 0.0536, + "step": 162090 + }, + { + "epoch": 45.58, + "learning_rate": 9.864742448380345e-06, + "loss": 0.0638, + "step": 162120 + }, + { + "epoch": 45.59, + "learning_rate": 9.84600006247462e-06, + "loss": 0.0486, + "step": 162150 + }, + { + "epoch": 45.59, + "learning_rate": 9.827257676568895e-06, + "loss": 0.058, + "step": 162180 + }, + { + "epoch": 45.6, + "learning_rate": 9.808515290663168e-06, + "loss": 0.0561, + "step": 162210 + }, + { + "epoch": 45.61, + "learning_rate": 9.789772904757442e-06, + "loss": 0.0528, + "step": 162240 + }, + { + "epoch": 45.62, + "learning_rate": 9.771030518851718e-06, + "loss": 0.0583, + "step": 162270 + }, + { + "epoch": 45.63, + "learning_rate": 9.752288132945992e-06, + "loss": 0.0503, + "step": 162300 + }, + { + "epoch": 45.64, + "learning_rate": 9.733545747040265e-06, + "loss": 0.0634, + "step": 162330 + }, + { + "epoch": 45.65, + "learning_rate": 9.714803361134539e-06, + "loss": 0.0523, + "step": 162360 + }, + { + "epoch": 45.65, + "learning_rate": 9.696060975228815e-06, + "loss": 0.057, + "step": 162390 + }, + { + "epoch": 45.66, + "learning_rate": 9.677318589323087e-06, + "loss": 0.0641, + "step": 162420 + }, + { + "epoch": 45.67, + "learning_rate": 9.658576203417361e-06, + "loss": 0.0489, + "step": 162450 + }, + { + "epoch": 45.68, + "learning_rate": 9.639833817511636e-06, + "loss": 0.0546, + "step": 162480 + }, + { + "epoch": 45.69, + "learning_rate": 9.621091431605911e-06, + "loss": 0.0549, + "step": 162510 + }, + { + "epoch": 45.7, + "learning_rate": 9.602349045700184e-06, + "loss": 0.0508, + "step": 162540 + }, + { + "epoch": 45.7, + "learning_rate": 9.583606659794458e-06, + "loss": 0.0595, + "step": 162570 + }, + { + "epoch": 45.71, + "learning_rate": 9.564864273888734e-06, + "loss": 0.0511, + "step": 162600 + }, + { + "epoch": 45.72, + "learning_rate": 9.546121887983008e-06, + "loss": 0.0605, + "step": 162630 + }, + { + "epoch": 45.73, + "learning_rate": 9.52737950207728e-06, + "loss": 0.0532, + "step": 162660 + }, + { + "epoch": 45.74, + "learning_rate": 9.508637116171555e-06, + "loss": 0.0575, + "step": 162690 + }, + { + "epoch": 45.75, + "learning_rate": 9.48989473026583e-06, + "loss": 0.066, + "step": 162720 + }, + { + "epoch": 45.75, + "learning_rate": 9.471152344360103e-06, + "loss": 0.0477, + "step": 162750 + }, + { + "epoch": 45.76, + "learning_rate": 9.452409958454378e-06, + "loss": 0.0579, + "step": 162780 + }, + { + "epoch": 45.77, + "learning_rate": 9.433667572548653e-06, + "loss": 0.058, + "step": 162810 + }, + { + "epoch": 45.78, + "learning_rate": 9.414925186642928e-06, + "loss": 0.0591, + "step": 162840 + }, + { + "epoch": 45.79, + "learning_rate": 9.3961828007372e-06, + "loss": 0.0565, + "step": 162870 + }, + { + "epoch": 45.8, + "learning_rate": 9.377440414831474e-06, + "loss": 0.048, + "step": 162900 + }, + { + "epoch": 45.81, + "learning_rate": 9.35869802892575e-06, + "loss": 0.0537, + "step": 162930 + }, + { + "epoch": 45.81, + "learning_rate": 9.339955643020024e-06, + "loss": 0.0558, + "step": 162960 + }, + { + "epoch": 45.82, + "learning_rate": 9.321213257114297e-06, + "loss": 0.057, + "step": 162990 + }, + { + "epoch": 45.83, + "learning_rate": 9.302470871208573e-06, + "loss": 0.0584, + "step": 163020 + }, + { + "epoch": 45.84, + "learning_rate": 9.283728485302847e-06, + "loss": 0.0501, + "step": 163050 + }, + { + "epoch": 45.85, + "learning_rate": 9.26498609939712e-06, + "loss": 0.0561, + "step": 163080 + }, + { + "epoch": 45.86, + "learning_rate": 9.246243713491394e-06, + "loss": 0.0555, + "step": 163110 + }, + { + "epoch": 45.86, + "learning_rate": 9.22750132758567e-06, + "loss": 0.053, + "step": 163140 + }, + { + "epoch": 45.87, + "learning_rate": 9.208758941679944e-06, + "loss": 0.0616, + "step": 163170 + }, + { + "epoch": 45.88, + "learning_rate": 9.190016555774216e-06, + "loss": 0.0491, + "step": 163200 + }, + { + "epoch": 45.89, + "learning_rate": 9.171274169868492e-06, + "loss": 0.0592, + "step": 163230 + }, + { + "epoch": 45.9, + "learning_rate": 9.152531783962766e-06, + "loss": 0.0538, + "step": 163260 + }, + { + "epoch": 45.91, + "learning_rate": 9.13378939805704e-06, + "loss": 0.0526, + "step": 163290 + }, + { + "epoch": 45.91, + "learning_rate": 9.115047012151313e-06, + "loss": 0.0579, + "step": 163320 + }, + { + "epoch": 45.92, + "learning_rate": 9.096304626245589e-06, + "loss": 0.0513, + "step": 163350 + }, + { + "epoch": 45.93, + "learning_rate": 9.077562240339863e-06, + "loss": 0.0617, + "step": 163380 + }, + { + "epoch": 45.94, + "learning_rate": 9.058819854434136e-06, + "loss": 0.0545, + "step": 163410 + }, + { + "epoch": 45.95, + "learning_rate": 9.04007746852841e-06, + "loss": 0.0522, + "step": 163440 + }, + { + "epoch": 45.96, + "learning_rate": 9.021335082622686e-06, + "loss": 0.063, + "step": 163470 + }, + { + "epoch": 45.97, + "learning_rate": 9.00259269671696e-06, + "loss": 0.0515, + "step": 163500 + }, + { + "epoch": 45.97, + "learning_rate": 8.983850310811232e-06, + "loss": 0.0603, + "step": 163530 + }, + { + "epoch": 45.98, + "learning_rate": 8.965107924905508e-06, + "loss": 0.052, + "step": 163560 + }, + { + "epoch": 45.99, + "learning_rate": 8.946365538999782e-06, + "loss": 0.0519, + "step": 163590 + }, + { + "epoch": 46.0, + "learning_rate": 8.927623153094057e-06, + "loss": 0.0557, + "step": 163620 + }, + { + "epoch": 46.0, + "eval_loss": 0.1765855848789215, + "eval_runtime": 511.5794, + "eval_samples_per_second": 31.34, + "eval_steps_per_second": 0.981, + "eval_wer": 0.12310127877935938, + "step": 163622 + }, + { + "epoch": 46.01, + "learning_rate": 8.908880767188329e-06, + "loss": 0.0524, + "step": 163650 + }, + { + "epoch": 46.02, + "learning_rate": 8.890138381282605e-06, + "loss": 0.0607, + "step": 163680 + }, + { + "epoch": 46.02, + "learning_rate": 8.871395995376879e-06, + "loss": 0.0514, + "step": 163710 + }, + { + "epoch": 46.03, + "learning_rate": 8.852653609471152e-06, + "loss": 0.0511, + "step": 163740 + }, + { + "epoch": 46.04, + "learning_rate": 8.833911223565428e-06, + "loss": 0.0576, + "step": 163770 + }, + { + "epoch": 46.05, + "learning_rate": 8.815168837659702e-06, + "loss": 0.0529, + "step": 163800 + }, + { + "epoch": 46.06, + "learning_rate": 8.796426451753976e-06, + "loss": 0.0597, + "step": 163830 + }, + { + "epoch": 46.07, + "learning_rate": 8.777684065848248e-06, + "loss": 0.0501, + "step": 163860 + }, + { + "epoch": 46.08, + "learning_rate": 8.758941679942524e-06, + "loss": 0.0592, + "step": 163890 + }, + { + "epoch": 46.08, + "learning_rate": 8.740199294036798e-06, + "loss": 0.0547, + "step": 163920 + }, + { + "epoch": 46.09, + "learning_rate": 8.721456908131071e-06, + "loss": 0.0494, + "step": 163950 + }, + { + "epoch": 46.1, + "learning_rate": 8.702714522225347e-06, + "loss": 0.0599, + "step": 163980 + }, + { + "epoch": 46.11, + "learning_rate": 8.683972136319621e-06, + "loss": 0.0494, + "step": 164010 + }, + { + "epoch": 46.12, + "learning_rate": 8.665229750413895e-06, + "loss": 0.0565, + "step": 164040 + }, + { + "epoch": 46.13, + "learning_rate": 8.646487364508168e-06, + "loss": 0.057, + "step": 164070 + }, + { + "epoch": 46.13, + "learning_rate": 8.627744978602444e-06, + "loss": 0.0481, + "step": 164100 + }, + { + "epoch": 46.14, + "learning_rate": 8.609002592696718e-06, + "loss": 0.0621, + "step": 164130 + }, + { + "epoch": 46.15, + "learning_rate": 8.590260206790992e-06, + "loss": 0.0558, + "step": 164160 + }, + { + "epoch": 46.16, + "learning_rate": 8.571517820885266e-06, + "loss": 0.0536, + "step": 164190 + }, + { + "epoch": 46.17, + "learning_rate": 8.55277543497954e-06, + "loss": 0.0584, + "step": 164220 + }, + { + "epoch": 46.18, + "learning_rate": 8.534033049073815e-06, + "loss": 0.0535, + "step": 164250 + }, + { + "epoch": 46.18, + "learning_rate": 8.515290663168087e-06, + "loss": 0.0599, + "step": 164280 + }, + { + "epoch": 46.19, + "learning_rate": 8.496548277262363e-06, + "loss": 0.0533, + "step": 164310 + }, + { + "epoch": 46.2, + "learning_rate": 8.477805891356637e-06, + "loss": 0.0561, + "step": 164340 + }, + { + "epoch": 46.21, + "learning_rate": 8.459063505450911e-06, + "loss": 0.0579, + "step": 164370 + }, + { + "epoch": 46.22, + "learning_rate": 8.440321119545184e-06, + "loss": 0.0515, + "step": 164400 + }, + { + "epoch": 46.23, + "learning_rate": 8.42157873363946e-06, + "loss": 0.0577, + "step": 164430 + }, + { + "epoch": 46.24, + "learning_rate": 8.402836347733734e-06, + "loss": 0.0515, + "step": 164460 + }, + { + "epoch": 46.24, + "learning_rate": 8.384093961828008e-06, + "loss": 0.0561, + "step": 164490 + }, + { + "epoch": 46.25, + "learning_rate": 8.365351575922282e-06, + "loss": 0.058, + "step": 164520 + }, + { + "epoch": 46.26, + "learning_rate": 8.346609190016556e-06, + "loss": 0.0565, + "step": 164550 + }, + { + "epoch": 46.27, + "learning_rate": 8.32786680411083e-06, + "loss": 0.0569, + "step": 164580 + }, + { + "epoch": 46.28, + "learning_rate": 8.309124418205103e-06, + "loss": 0.0501, + "step": 164610 + }, + { + "epoch": 46.29, + "learning_rate": 8.290382032299379e-06, + "loss": 0.0552, + "step": 164640 + }, + { + "epoch": 46.29, + "learning_rate": 8.271639646393653e-06, + "loss": 0.0579, + "step": 164670 + }, + { + "epoch": 46.3, + "learning_rate": 8.252897260487927e-06, + "loss": 0.053, + "step": 164700 + }, + { + "epoch": 46.31, + "learning_rate": 8.234154874582202e-06, + "loss": 0.0593, + "step": 164730 + }, + { + "epoch": 46.32, + "learning_rate": 8.215412488676476e-06, + "loss": 0.0569, + "step": 164760 + }, + { + "epoch": 46.33, + "learning_rate": 8.19667010277075e-06, + "loss": 0.0564, + "step": 164790 + }, + { + "epoch": 46.34, + "learning_rate": 8.177927716865024e-06, + "loss": 0.0555, + "step": 164820 + }, + { + "epoch": 46.35, + "learning_rate": 8.159185330959298e-06, + "loss": 0.0488, + "step": 164850 + }, + { + "epoch": 46.35, + "learning_rate": 8.140442945053573e-06, + "loss": 0.0574, + "step": 164880 + }, + { + "epoch": 46.36, + "learning_rate": 8.121700559147847e-06, + "loss": 0.0524, + "step": 164910 + }, + { + "epoch": 46.37, + "learning_rate": 8.102958173242121e-06, + "loss": 0.0555, + "step": 164940 + }, + { + "epoch": 46.38, + "learning_rate": 8.084215787336395e-06, + "loss": 0.057, + "step": 164970 + }, + { + "epoch": 46.39, + "learning_rate": 8.06547340143067e-06, + "loss": 0.0489, + "step": 165000 + }, + { + "epoch": 46.4, + "learning_rate": 8.046731015524944e-06, + "loss": 0.0597, + "step": 165030 + }, + { + "epoch": 46.4, + "learning_rate": 8.027988629619218e-06, + "loss": 0.0496, + "step": 165060 + }, + { + "epoch": 46.41, + "learning_rate": 8.009246243713492e-06, + "loss": 0.0549, + "step": 165090 + }, + { + "epoch": 46.42, + "learning_rate": 7.990503857807766e-06, + "loss": 0.0574, + "step": 165120 + }, + { + "epoch": 46.43, + "learning_rate": 7.97176147190204e-06, + "loss": 0.0487, + "step": 165150 + }, + { + "epoch": 46.44, + "learning_rate": 7.953019085996314e-06, + "loss": 0.0583, + "step": 165180 + }, + { + "epoch": 46.45, + "learning_rate": 7.934276700090589e-06, + "loss": 0.0495, + "step": 165210 + }, + { + "epoch": 46.45, + "learning_rate": 7.915534314184863e-06, + "loss": 0.0556, + "step": 165240 + }, + { + "epoch": 46.46, + "learning_rate": 7.896791928279137e-06, + "loss": 0.0554, + "step": 165270 + }, + { + "epoch": 46.47, + "learning_rate": 7.878049542373411e-06, + "loss": 0.0541, + "step": 165300 + }, + { + "epoch": 46.48, + "learning_rate": 7.859307156467685e-06, + "loss": 0.0556, + "step": 165330 + }, + { + "epoch": 46.49, + "learning_rate": 7.84056477056196e-06, + "loss": 0.055, + "step": 165360 + }, + { + "epoch": 46.5, + "learning_rate": 7.821822384656234e-06, + "loss": 0.058, + "step": 165390 + }, + { + "epoch": 46.51, + "learning_rate": 7.803079998750508e-06, + "loss": 0.055, + "step": 165420 + }, + { + "epoch": 46.51, + "learning_rate": 7.784337612844782e-06, + "loss": 0.0521, + "step": 165450 + }, + { + "epoch": 46.52, + "learning_rate": 7.765595226939056e-06, + "loss": 0.0582, + "step": 165480 + }, + { + "epoch": 46.53, + "learning_rate": 7.74685284103333e-06, + "loss": 0.0499, + "step": 165510 + }, + { + "epoch": 46.54, + "learning_rate": 7.728110455127605e-06, + "loss": 0.0502, + "step": 165540 + }, + { + "epoch": 46.55, + "learning_rate": 7.709368069221879e-06, + "loss": 0.0574, + "step": 165570 + }, + { + "epoch": 46.56, + "learning_rate": 7.690625683316153e-06, + "loss": 0.0521, + "step": 165600 + }, + { + "epoch": 46.56, + "learning_rate": 7.671883297410427e-06, + "loss": 0.0585, + "step": 165630 + }, + { + "epoch": 46.57, + "learning_rate": 7.653140911504702e-06, + "loss": 0.0479, + "step": 165660 + }, + { + "epoch": 46.58, + "learning_rate": 7.634398525598976e-06, + "loss": 0.0542, + "step": 165690 + }, + { + "epoch": 46.59, + "learning_rate": 7.61565613969325e-06, + "loss": 0.0586, + "step": 165720 + }, + { + "epoch": 46.6, + "learning_rate": 7.596913753787524e-06, + "loss": 0.0526, + "step": 165750 + }, + { + "epoch": 46.61, + "learning_rate": 7.5781713678817974e-06, + "loss": 0.0595, + "step": 165780 + }, + { + "epoch": 46.62, + "learning_rate": 7.559428981976073e-06, + "loss": 0.0525, + "step": 165810 + }, + { + "epoch": 46.62, + "learning_rate": 7.540686596070347e-06, + "loss": 0.0523, + "step": 165840 + }, + { + "epoch": 46.63, + "learning_rate": 7.521944210164621e-06, + "loss": 0.0541, + "step": 165870 + }, + { + "epoch": 46.64, + "learning_rate": 7.503201824258896e-06, + "loss": 0.0512, + "step": 165900 + }, + { + "epoch": 46.65, + "learning_rate": 7.484459438353169e-06, + "loss": 0.0587, + "step": 165930 + }, + { + "epoch": 46.66, + "learning_rate": 7.4657170524474434e-06, + "loss": 0.0512, + "step": 165960 + }, + { + "epoch": 46.67, + "learning_rate": 7.446974666541718e-06, + "loss": 0.0546, + "step": 165990 + }, + { + "epoch": 46.67, + "learning_rate": 7.428232280635993e-06, + "loss": 0.0558, + "step": 166020 + }, + { + "epoch": 46.68, + "learning_rate": 7.409489894730266e-06, + "loss": 0.0516, + "step": 166050 + }, + { + "epoch": 46.69, + "learning_rate": 7.39074750882454e-06, + "loss": 0.0595, + "step": 166080 + }, + { + "epoch": 46.7, + "learning_rate": 7.3720051229188135e-06, + "loss": 0.0517, + "step": 166110 + }, + { + "epoch": 46.71, + "learning_rate": 7.353262737013089e-06, + "loss": 0.0557, + "step": 166140 + }, + { + "epoch": 46.72, + "learning_rate": 7.334520351107363e-06, + "loss": 0.0584, + "step": 166170 + }, + { + "epoch": 46.72, + "learning_rate": 7.315777965201637e-06, + "loss": 0.0535, + "step": 166200 + }, + { + "epoch": 46.73, + "learning_rate": 7.297035579295912e-06, + "loss": 0.0629, + "step": 166230 + }, + { + "epoch": 46.74, + "learning_rate": 7.278293193390185e-06, + "loss": 0.0497, + "step": 166260 + }, + { + "epoch": 46.75, + "learning_rate": 7.2595508074844595e-06, + "loss": 0.0563, + "step": 166290 + }, + { + "epoch": 46.76, + "learning_rate": 7.240808421578734e-06, + "loss": 0.059, + "step": 166320 + }, + { + "epoch": 46.77, + "learning_rate": 7.222066035673009e-06, + "loss": 0.0484, + "step": 166350 + }, + { + "epoch": 46.78, + "learning_rate": 7.203323649767282e-06, + "loss": 0.0602, + "step": 166380 + }, + { + "epoch": 46.78, + "learning_rate": 7.184581263861556e-06, + "loss": 0.0503, + "step": 166410 + }, + { + "epoch": 46.79, + "learning_rate": 7.165838877955831e-06, + "loss": 0.0563, + "step": 166440 + }, + { + "epoch": 46.8, + "learning_rate": 7.1470964920501055e-06, + "loss": 0.0559, + "step": 166470 + }, + { + "epoch": 46.81, + "learning_rate": 7.128354106144379e-06, + "loss": 0.0509, + "step": 166500 + }, + { + "epoch": 46.82, + "learning_rate": 7.109611720238653e-06, + "loss": 0.0609, + "step": 166530 + }, + { + "epoch": 46.83, + "learning_rate": 7.090869334332928e-06, + "loss": 0.0539, + "step": 166560 + }, + { + "epoch": 46.83, + "learning_rate": 7.0721269484272014e-06, + "loss": 0.0547, + "step": 166590 + }, + { + "epoch": 46.84, + "learning_rate": 7.053384562521476e-06, + "loss": 0.0566, + "step": 166620 + }, + { + "epoch": 46.85, + "learning_rate": 7.034642176615751e-06, + "loss": 0.0474, + "step": 166650 + }, + { + "epoch": 46.86, + "learning_rate": 7.015899790710025e-06, + "loss": 0.0596, + "step": 166680 + }, + { + "epoch": 46.87, + "learning_rate": 6.997157404804298e-06, + "loss": 0.0503, + "step": 166710 + }, + { + "epoch": 46.88, + "learning_rate": 6.978415018898572e-06, + "loss": 0.0583, + "step": 166740 + }, + { + "epoch": 46.88, + "learning_rate": 6.959672632992847e-06, + "loss": 0.0577, + "step": 166770 + }, + { + "epoch": 46.89, + "learning_rate": 6.940930247087122e-06, + "loss": 0.0511, + "step": 166800 + }, + { + "epoch": 46.9, + "learning_rate": 6.922187861181395e-06, + "loss": 0.0559, + "step": 166830 + }, + { + "epoch": 46.91, + "learning_rate": 6.90344547527567e-06, + "loss": 0.0507, + "step": 166860 + }, + { + "epoch": 46.92, + "learning_rate": 6.884703089369944e-06, + "loss": 0.0565, + "step": 166890 + }, + { + "epoch": 46.93, + "learning_rate": 6.8659607034642175e-06, + "loss": 0.0549, + "step": 166920 + }, + { + "epoch": 46.94, + "learning_rate": 6.847218317558492e-06, + "loss": 0.0536, + "step": 166950 + }, + { + "epoch": 46.94, + "learning_rate": 6.828475931652767e-06, + "loss": 0.0589, + "step": 166980 + }, + { + "epoch": 46.95, + "learning_rate": 6.809733545747041e-06, + "loss": 0.0529, + "step": 167010 + }, + { + "epoch": 46.96, + "learning_rate": 6.790991159841314e-06, + "loss": 0.055, + "step": 167040 + }, + { + "epoch": 46.97, + "learning_rate": 6.7722487739355885e-06, + "loss": 0.0593, + "step": 167070 + }, + { + "epoch": 46.98, + "learning_rate": 6.7535063880298635e-06, + "loss": 0.0528, + "step": 167100 + }, + { + "epoch": 46.99, + "learning_rate": 6.734764002124138e-06, + "loss": 0.0577, + "step": 167130 + }, + { + "epoch": 46.99, + "learning_rate": 6.716021616218411e-06, + "loss": 0.0521, + "step": 167160 + }, + { + "epoch": 47.0, + "eval_loss": 0.17507979273796082, + "eval_runtime": 537.6874, + "eval_samples_per_second": 29.818, + "eval_steps_per_second": 0.934, + "eval_wer": 0.12198900004094278, + "step": 167179 + }, + { + "epoch": 47.0, + "learning_rate": 6.697279230312686e-06, + "loss": 0.0557, + "step": 167190 + }, + { + "epoch": 47.01, + "learning_rate": 6.67853684440696e-06, + "loss": 0.0514, + "step": 167220 + }, + { + "epoch": 47.02, + "learning_rate": 6.659794458501234e-06, + "loss": 0.0556, + "step": 167250 + }, + { + "epoch": 47.03, + "learning_rate": 6.641052072595508e-06, + "loss": 0.0593, + "step": 167280 + }, + { + "epoch": 47.04, + "learning_rate": 6.622309686689783e-06, + "loss": 0.0473, + "step": 167310 + }, + { + "epoch": 47.05, + "learning_rate": 6.603567300784057e-06, + "loss": 0.0545, + "step": 167340 + }, + { + "epoch": 47.05, + "learning_rate": 6.58482491487833e-06, + "loss": 0.0525, + "step": 167370 + }, + { + "epoch": 47.06, + "learning_rate": 6.5660825289726054e-06, + "loss": 0.0552, + "step": 167400 + }, + { + "epoch": 47.07, + "learning_rate": 6.54734014306688e-06, + "loss": 0.0604, + "step": 167430 + }, + { + "epoch": 47.08, + "learning_rate": 6.528597757161154e-06, + "loss": 0.0467, + "step": 167460 + }, + { + "epoch": 47.09, + "learning_rate": 6.509855371255427e-06, + "loss": 0.0604, + "step": 167490 + }, + { + "epoch": 47.1, + "learning_rate": 6.491112985349702e-06, + "loss": 0.0526, + "step": 167520 + }, + { + "epoch": 47.1, + "learning_rate": 6.472995345640834e-06, + "loss": 0.0562, + "step": 167550 + }, + { + "epoch": 47.11, + "learning_rate": 6.454252959735107e-06, + "loss": 0.0605, + "step": 167580 + }, + { + "epoch": 47.12, + "learning_rate": 6.435510573829383e-06, + "loss": 0.049, + "step": 167610 + }, + { + "epoch": 47.13, + "learning_rate": 6.416768187923656e-06, + "loss": 0.0584, + "step": 167640 + }, + { + "epoch": 47.14, + "learning_rate": 6.398025802017931e-06, + "loss": 0.0491, + "step": 167670 + }, + { + "epoch": 47.15, + "learning_rate": 6.379283416112204e-06, + "loss": 0.058, + "step": 167700 + }, + { + "epoch": 47.15, + "learning_rate": 6.360541030206479e-06, + "loss": 0.0603, + "step": 167730 + }, + { + "epoch": 47.16, + "learning_rate": 6.341798644300753e-06, + "loss": 0.0488, + "step": 167760 + }, + { + "epoch": 47.17, + "learning_rate": 6.323056258395027e-06, + "loss": 0.0544, + "step": 167790 + }, + { + "epoch": 47.18, + "learning_rate": 6.304313872489301e-06, + "loss": 0.0517, + "step": 167820 + }, + { + "epoch": 47.19, + "learning_rate": 6.285571486583576e-06, + "loss": 0.0545, + "step": 167850 + }, + { + "epoch": 47.2, + "learning_rate": 6.267453846874707e-06, + "loss": 0.0571, + "step": 167880 + }, + { + "epoch": 47.21, + "learning_rate": 6.248711460968982e-06, + "loss": 0.0485, + "step": 167910 + }, + { + "epoch": 47.21, + "learning_rate": 6.229969075063256e-06, + "loss": 0.0601, + "step": 167940 + }, + { + "epoch": 47.22, + "learning_rate": 6.21122668915753e-06, + "loss": 0.052, + "step": 167970 + }, + { + "epoch": 47.23, + "learning_rate": 6.192484303251804e-06, + "loss": 0.0539, + "step": 168000 + }, + { + "epoch": 47.24, + "learning_rate": 6.173741917346078e-06, + "loss": 0.0597, + "step": 168030 + }, + { + "epoch": 47.25, + "learning_rate": 6.1549995314403526e-06, + "loss": 0.0451, + "step": 168060 + }, + { + "epoch": 47.26, + "learning_rate": 6.136257145534627e-06, + "loss": 0.0548, + "step": 168090 + }, + { + "epoch": 47.26, + "learning_rate": 6.117514759628901e-06, + "loss": 0.0492, + "step": 168120 + }, + { + "epoch": 47.27, + "learning_rate": 6.098772373723175e-06, + "loss": 0.0506, + "step": 168150 + }, + { + "epoch": 47.28, + "learning_rate": 6.080029987817449e-06, + "loss": 0.0577, + "step": 168180 + }, + { + "epoch": 47.29, + "learning_rate": 6.0612876019117235e-06, + "loss": 0.0476, + "step": 168210 + }, + { + "epoch": 47.3, + "learning_rate": 6.042545216005998e-06, + "loss": 0.0573, + "step": 168240 + }, + { + "epoch": 47.31, + "learning_rate": 6.023802830100272e-06, + "loss": 0.05, + "step": 168270 + }, + { + "epoch": 47.32, + "learning_rate": 6.005060444194546e-06, + "loss": 0.0559, + "step": 168300 + }, + { + "epoch": 47.32, + "learning_rate": 5.986318058288821e-06, + "loss": 0.058, + "step": 168330 + }, + { + "epoch": 47.33, + "learning_rate": 5.9675756723830945e-06, + "loss": 0.0469, + "step": 168360 + }, + { + "epoch": 47.34, + "learning_rate": 5.9488332864773695e-06, + "loss": 0.0583, + "step": 168390 + }, + { + "epoch": 47.35, + "learning_rate": 5.930090900571643e-06, + "loss": 0.0507, + "step": 168420 + }, + { + "epoch": 47.36, + "learning_rate": 5.911348514665917e-06, + "loss": 0.0551, + "step": 168450 + }, + { + "epoch": 47.37, + "learning_rate": 5.892606128760191e-06, + "loss": 0.0633, + "step": 168480 + }, + { + "epoch": 47.37, + "learning_rate": 5.873863742854465e-06, + "loss": 0.0474, + "step": 168510 + }, + { + "epoch": 47.38, + "learning_rate": 5.85512135694874e-06, + "loss": 0.0554, + "step": 168540 + }, + { + "epoch": 47.39, + "learning_rate": 5.836378971043014e-06, + "loss": 0.0541, + "step": 168570 + }, + { + "epoch": 47.4, + "learning_rate": 5.817636585137289e-06, + "loss": 0.0513, + "step": 168600 + }, + { + "epoch": 47.41, + "learning_rate": 5.798894199231562e-06, + "loss": 0.0595, + "step": 168630 + }, + { + "epoch": 47.42, + "learning_rate": 5.780151813325837e-06, + "loss": 0.0474, + "step": 168660 + }, + { + "epoch": 47.42, + "learning_rate": 5.7614094274201106e-06, + "loss": 0.0535, + "step": 168690 + }, + { + "epoch": 47.43, + "learning_rate": 5.742667041514385e-06, + "loss": 0.052, + "step": 168720 + }, + { + "epoch": 47.44, + "learning_rate": 5.723924655608659e-06, + "loss": 0.0532, + "step": 168750 + }, + { + "epoch": 47.45, + "learning_rate": 5.705182269702933e-06, + "loss": 0.0568, + "step": 168780 + }, + { + "epoch": 47.46, + "learning_rate": 5.686439883797208e-06, + "loss": 0.0495, + "step": 168810 + }, + { + "epoch": 47.47, + "learning_rate": 5.6676974978914815e-06, + "loss": 0.0593, + "step": 168840 + }, + { + "epoch": 47.48, + "learning_rate": 5.6489551119857566e-06, + "loss": 0.0527, + "step": 168870 + }, + { + "epoch": 47.48, + "learning_rate": 5.63021272608003e-06, + "loss": 0.0544, + "step": 168900 + }, + { + "epoch": 47.49, + "learning_rate": 5.611470340174305e-06, + "loss": 0.061, + "step": 168930 + }, + { + "epoch": 47.5, + "learning_rate": 5.592727954268578e-06, + "loss": 0.0474, + "step": 168960 + }, + { + "epoch": 47.51, + "learning_rate": 5.573985568362853e-06, + "loss": 0.0632, + "step": 168990 + }, + { + "epoch": 47.52, + "learning_rate": 5.555243182457127e-06, + "loss": 0.0534, + "step": 169020 + }, + { + "epoch": 47.53, + "learning_rate": 5.536500796551401e-06, + "loss": 0.0547, + "step": 169050 + }, + { + "epoch": 47.53, + "learning_rate": 5.517758410645676e-06, + "loss": 0.0556, + "step": 169080 + }, + { + "epoch": 47.54, + "learning_rate": 5.499016024739949e-06, + "loss": 0.0489, + "step": 169110 + }, + { + "epoch": 47.55, + "learning_rate": 5.480273638834224e-06, + "loss": 0.0583, + "step": 169140 + }, + { + "epoch": 47.56, + "learning_rate": 5.461531252928498e-06, + "loss": 0.0521, + "step": 169170 + }, + { + "epoch": 47.57, + "learning_rate": 5.442788867022773e-06, + "loss": 0.0528, + "step": 169200 + }, + { + "epoch": 47.58, + "learning_rate": 5.424046481117046e-06, + "loss": 0.0625, + "step": 169230 + }, + { + "epoch": 47.58, + "learning_rate": 5.405304095211321e-06, + "loss": 0.0453, + "step": 169260 + }, + { + "epoch": 47.59, + "learning_rate": 5.386561709305595e-06, + "loss": 0.0594, + "step": 169290 + }, + { + "epoch": 47.6, + "learning_rate": 5.367819323399869e-06, + "loss": 0.0507, + "step": 169320 + }, + { + "epoch": 47.61, + "learning_rate": 5.349076937494144e-06, + "loss": 0.0533, + "step": 169350 + }, + { + "epoch": 47.62, + "learning_rate": 5.330334551588417e-06, + "loss": 0.0618, + "step": 169380 + }, + { + "epoch": 47.63, + "learning_rate": 5.311592165682692e-06, + "loss": 0.0491, + "step": 169410 + }, + { + "epoch": 47.64, + "learning_rate": 5.292849779776965e-06, + "loss": 0.0605, + "step": 169440 + }, + { + "epoch": 47.64, + "learning_rate": 5.27410739387124e-06, + "loss": 0.0532, + "step": 169470 + }, + { + "epoch": 47.65, + "learning_rate": 5.255365007965514e-06, + "loss": 0.0561, + "step": 169500 + }, + { + "epoch": 47.66, + "learning_rate": 5.236622622059789e-06, + "loss": 0.0609, + "step": 169530 + }, + { + "epoch": 47.67, + "learning_rate": 5.217880236154063e-06, + "loss": 0.0497, + "step": 169560 + }, + { + "epoch": 47.68, + "learning_rate": 5.199137850248337e-06, + "loss": 0.0589, + "step": 169590 + }, + { + "epoch": 47.69, + "learning_rate": 5.180395464342611e-06, + "loss": 0.0533, + "step": 169620 + }, + { + "epoch": 47.69, + "learning_rate": 5.161653078436885e-06, + "loss": 0.0546, + "step": 169650 + }, + { + "epoch": 47.7, + "learning_rate": 5.14291069253116e-06, + "loss": 0.0598, + "step": 169680 + }, + { + "epoch": 47.71, + "learning_rate": 5.124168306625433e-06, + "loss": 0.0486, + "step": 169710 + }, + { + "epoch": 47.72, + "learning_rate": 5.105425920719708e-06, + "loss": 0.0598, + "step": 169740 + }, + { + "epoch": 47.73, + "learning_rate": 5.086683534813982e-06, + "loss": 0.0545, + "step": 169770 + }, + { + "epoch": 47.74, + "learning_rate": 5.0679411489082565e-06, + "loss": 0.0564, + "step": 169800 + }, + { + "epoch": 47.75, + "learning_rate": 5.049198763002531e-06, + "loss": 0.0578, + "step": 169830 + }, + { + "epoch": 47.75, + "learning_rate": 5.030456377096805e-06, + "loss": 0.0471, + "step": 169860 + }, + { + "epoch": 47.76, + "learning_rate": 5.011713991191079e-06, + "loss": 0.0535, + "step": 169890 + }, + { + "epoch": 47.77, + "learning_rate": 4.992971605285353e-06, + "loss": 0.0474, + "step": 169920 + }, + { + "epoch": 47.78, + "learning_rate": 4.974229219379627e-06, + "loss": 0.0525, + "step": 169950 + }, + { + "epoch": 47.79, + "learning_rate": 4.955486833473901e-06, + "loss": 0.0583, + "step": 169980 + }, + { + "epoch": 47.8, + "learning_rate": 4.936744447568176e-06, + "loss": 0.0493, + "step": 170010 + }, + { + "epoch": 47.8, + "learning_rate": 4.91800206166245e-06, + "loss": 0.0604, + "step": 170040 + }, + { + "epoch": 47.81, + "learning_rate": 4.899259675756724e-06, + "loss": 0.0514, + "step": 170070 + }, + { + "epoch": 47.82, + "learning_rate": 4.880517289850998e-06, + "loss": 0.0532, + "step": 170100 + }, + { + "epoch": 47.83, + "learning_rate": 4.8617749039452726e-06, + "loss": 0.0637, + "step": 170130 + }, + { + "epoch": 47.84, + "learning_rate": 4.843032518039547e-06, + "loss": 0.0481, + "step": 170160 + }, + { + "epoch": 47.85, + "learning_rate": 4.824290132133821e-06, + "loss": 0.0545, + "step": 170190 + }, + { + "epoch": 47.85, + "learning_rate": 4.805547746228095e-06, + "loss": 0.0503, + "step": 170220 + }, + { + "epoch": 47.86, + "learning_rate": 4.786805360322369e-06, + "loss": 0.0542, + "step": 170250 + }, + { + "epoch": 47.87, + "learning_rate": 4.7680629744166435e-06, + "loss": 0.0575, + "step": 170280 + }, + { + "epoch": 47.88, + "learning_rate": 4.749320588510918e-06, + "loss": 0.0445, + "step": 170310 + }, + { + "epoch": 47.89, + "learning_rate": 4.730578202605192e-06, + "loss": 0.0553, + "step": 170340 + }, + { + "epoch": 47.9, + "learning_rate": 4.711835816699466e-06, + "loss": 0.0514, + "step": 170370 + }, + { + "epoch": 47.91, + "learning_rate": 4.69309343079374e-06, + "loss": 0.0547, + "step": 170400 + }, + { + "epoch": 47.91, + "learning_rate": 4.6743510448880145e-06, + "loss": 0.057, + "step": 170430 + }, + { + "epoch": 47.92, + "learning_rate": 4.655608658982289e-06, + "loss": 0.0547, + "step": 170460 + }, + { + "epoch": 47.93, + "learning_rate": 4.636866273076563e-06, + "loss": 0.0579, + "step": 170490 + }, + { + "epoch": 47.94, + "learning_rate": 4.618123887170837e-06, + "loss": 0.0515, + "step": 170520 + }, + { + "epoch": 47.95, + "learning_rate": 4.599381501265111e-06, + "loss": 0.0546, + "step": 170550 + }, + { + "epoch": 47.96, + "learning_rate": 4.5806391153593854e-06, + "loss": 0.059, + "step": 170580 + }, + { + "epoch": 47.96, + "learning_rate": 4.56189672945366e-06, + "loss": 0.0451, + "step": 170610 + }, + { + "epoch": 47.97, + "learning_rate": 4.543154343547934e-06, + "loss": 0.0563, + "step": 170640 + }, + { + "epoch": 47.98, + "learning_rate": 4.524411957642208e-06, + "loss": 0.0526, + "step": 170670 + }, + { + "epoch": 47.99, + "learning_rate": 4.505669571736482e-06, + "loss": 0.0515, + "step": 170700 + }, + { + "epoch": 48.0, + "learning_rate": 4.486927185830756e-06, + "loss": 0.0591, + "step": 170730 + }, + { + "epoch": 48.0, + "eval_loss": 0.17236961424350739, + "eval_runtime": 503.3181, + "eval_samples_per_second": 31.855, + "eval_steps_per_second": 0.997, + "eval_wer": 0.12165463403982367, + "step": 170736 + }, + { + "epoch": 48.01, + "learning_rate": 4.4681847999250306e-06, + "loss": 0.0496, + "step": 170760 + }, + { + "epoch": 48.02, + "learning_rate": 4.449442414019305e-06, + "loss": 0.0607, + "step": 170790 + }, + { + "epoch": 48.02, + "learning_rate": 4.430700028113579e-06, + "loss": 0.0494, + "step": 170820 + }, + { + "epoch": 48.03, + "learning_rate": 4.411957642207853e-06, + "loss": 0.0559, + "step": 170850 + }, + { + "epoch": 48.04, + "learning_rate": 4.393215256302127e-06, + "loss": 0.0481, + "step": 170880 + }, + { + "epoch": 48.05, + "learning_rate": 4.3744728703964015e-06, + "loss": 0.0554, + "step": 170910 + }, + { + "epoch": 48.06, + "learning_rate": 4.355730484490676e-06, + "loss": 0.0554, + "step": 170940 + }, + { + "epoch": 48.07, + "learning_rate": 4.33698809858495e-06, + "loss": 0.0499, + "step": 170970 + }, + { + "epoch": 48.07, + "learning_rate": 4.318245712679225e-06, + "loss": 0.0571, + "step": 171000 + }, + { + "epoch": 48.08, + "learning_rate": 4.299503326773498e-06, + "loss": 0.0554, + "step": 171030 + }, + { + "epoch": 48.09, + "learning_rate": 4.280760940867773e-06, + "loss": 0.0551, + "step": 171060 + }, + { + "epoch": 48.1, + "learning_rate": 4.262018554962047e-06, + "loss": 0.0568, + "step": 171090 + }, + { + "epoch": 48.11, + "learning_rate": 4.243276169056321e-06, + "loss": 0.0496, + "step": 171120 + }, + { + "epoch": 48.12, + "learning_rate": 4.224533783150595e-06, + "loss": 0.0542, + "step": 171150 + }, + { + "epoch": 48.12, + "learning_rate": 4.205791397244869e-06, + "loss": 0.0545, + "step": 171180 + }, + { + "epoch": 48.13, + "learning_rate": 4.1870490113391434e-06, + "loss": 0.0484, + "step": 171210 + }, + { + "epoch": 48.14, + "learning_rate": 4.168306625433418e-06, + "loss": 0.0591, + "step": 171240 + }, + { + "epoch": 48.15, + "learning_rate": 4.149564239527693e-06, + "loss": 0.0471, + "step": 171270 + }, + { + "epoch": 48.16, + "learning_rate": 4.130821853621966e-06, + "loss": 0.0557, + "step": 171300 + }, + { + "epoch": 48.17, + "learning_rate": 4.112079467716241e-06, + "loss": 0.0512, + "step": 171330 + }, + { + "epoch": 48.18, + "learning_rate": 4.093337081810514e-06, + "loss": 0.0523, + "step": 171360 + }, + { + "epoch": 48.18, + "learning_rate": 4.0745946959047886e-06, + "loss": 0.0574, + "step": 171390 + }, + { + "epoch": 48.19, + "learning_rate": 4.055852309999063e-06, + "loss": 0.0466, + "step": 171420 + }, + { + "epoch": 48.2, + "learning_rate": 4.037109924093337e-06, + "loss": 0.0569, + "step": 171450 + }, + { + "epoch": 48.21, + "learning_rate": 4.018367538187612e-06, + "loss": 0.0528, + "step": 171480 + }, + { + "epoch": 48.22, + "learning_rate": 3.999625152281885e-06, + "loss": 0.0541, + "step": 171510 + }, + { + "epoch": 48.23, + "learning_rate": 3.98088276637616e-06, + "loss": 0.0615, + "step": 171540 + }, + { + "epoch": 48.23, + "learning_rate": 3.962140380470434e-06, + "loss": 0.0504, + "step": 171570 + }, + { + "epoch": 48.24, + "learning_rate": 3.943397994564709e-06, + "loss": 0.0546, + "step": 171600 + }, + { + "epoch": 48.25, + "learning_rate": 3.924655608658982e-06, + "loss": 0.054, + "step": 171630 + }, + { + "epoch": 48.26, + "learning_rate": 3.905913222753257e-06, + "loss": 0.0488, + "step": 171660 + }, + { + "epoch": 48.27, + "learning_rate": 3.8871708368475305e-06, + "loss": 0.0552, + "step": 171690 + }, + { + "epoch": 48.28, + "learning_rate": 3.868428450941805e-06, + "loss": 0.0496, + "step": 171720 + }, + { + "epoch": 48.29, + "learning_rate": 3.84968606503608e-06, + "loss": 0.059, + "step": 171750 + }, + { + "epoch": 48.29, + "learning_rate": 3.830943679130353e-06, + "loss": 0.0544, + "step": 171780 + }, + { + "epoch": 48.3, + "learning_rate": 3.812201293224628e-06, + "loss": 0.0524, + "step": 171810 + }, + { + "epoch": 48.31, + "learning_rate": 3.793458907318902e-06, + "loss": 0.0593, + "step": 171840 + }, + { + "epoch": 48.32, + "learning_rate": 3.774716521413176e-06, + "loss": 0.0489, + "step": 171870 + }, + { + "epoch": 48.33, + "learning_rate": 3.7565988817043077e-06, + "loss": 0.0531, + "step": 171900 + }, + { + "epoch": 48.34, + "learning_rate": 3.737856495798582e-06, + "loss": 0.0596, + "step": 171930 + }, + { + "epoch": 48.34, + "learning_rate": 3.7191141098928565e-06, + "loss": 0.0526, + "step": 171960 + }, + { + "epoch": 48.35, + "learning_rate": 3.7009964701839878e-06, + "loss": 0.0604, + "step": 171990 + }, + { + "epoch": 48.36, + "learning_rate": 3.6822540842782624e-06, + "loss": 0.0494, + "step": 172020 + }, + { + "epoch": 48.37, + "learning_rate": 3.663511698372536e-06, + "loss": 0.0575, + "step": 172050 + }, + { + "epoch": 48.38, + "learning_rate": 3.6447693124668107e-06, + "loss": 0.052, + "step": 172080 + }, + { + "epoch": 48.39, + "learning_rate": 3.6260269265610845e-06, + "loss": 0.0528, + "step": 172110 + }, + { + "epoch": 48.39, + "learning_rate": 3.607284540655359e-06, + "loss": 0.0599, + "step": 172140 + }, + { + "epoch": 48.4, + "learning_rate": 3.588542154749633e-06, + "loss": 0.0498, + "step": 172170 + }, + { + "epoch": 48.41, + "learning_rate": 3.5697997688439075e-06, + "loss": 0.0517, + "step": 172200 + }, + { + "epoch": 48.42, + "learning_rate": 3.5510573829381817e-06, + "loss": 0.05, + "step": 172230 + }, + { + "epoch": 48.43, + "learning_rate": 3.5323149970324555e-06, + "loss": 0.0558, + "step": 172260 + }, + { + "epoch": 48.44, + "learning_rate": 3.51357261112673e-06, + "loss": 0.0572, + "step": 172290 + }, + { + "epoch": 48.45, + "learning_rate": 3.494830225221004e-06, + "loss": 0.0478, + "step": 172320 + }, + { + "epoch": 48.45, + "learning_rate": 3.4760878393152785e-06, + "loss": 0.0563, + "step": 172350 + }, + { + "epoch": 48.46, + "learning_rate": 3.4573454534095522e-06, + "loss": 0.053, + "step": 172380 + }, + { + "epoch": 48.47, + "learning_rate": 3.438603067503827e-06, + "loss": 0.0552, + "step": 172410 + }, + { + "epoch": 48.48, + "learning_rate": 3.4198606815981006e-06, + "loss": 0.0563, + "step": 172440 + }, + { + "epoch": 48.49, + "learning_rate": 3.4011182956923752e-06, + "loss": 0.046, + "step": 172470 + }, + { + "epoch": 48.5, + "learning_rate": 3.3823759097866494e-06, + "loss": 0.0548, + "step": 172500 + }, + { + "epoch": 48.5, + "learning_rate": 3.3636335238809236e-06, + "loss": 0.052, + "step": 172530 + }, + { + "epoch": 48.51, + "learning_rate": 3.344891137975198e-06, + "loss": 0.0545, + "step": 172560 + }, + { + "epoch": 48.52, + "learning_rate": 3.3261487520694716e-06, + "loss": 0.0577, + "step": 172590 + }, + { + "epoch": 48.53, + "learning_rate": 3.307406366163746e-06, + "loss": 0.0479, + "step": 172620 + }, + { + "epoch": 48.54, + "learning_rate": 3.28866398025802e-06, + "loss": 0.0529, + "step": 172650 + }, + { + "epoch": 48.55, + "learning_rate": 3.2699215943522946e-06, + "loss": 0.0545, + "step": 172680 + }, + { + "epoch": 48.55, + "learning_rate": 3.251179208446569e-06, + "loss": 0.0522, + "step": 172710 + }, + { + "epoch": 48.56, + "learning_rate": 3.232436822540843e-06, + "loss": 0.0598, + "step": 172740 + }, + { + "epoch": 48.57, + "learning_rate": 3.2136944366351176e-06, + "loss": 0.0462, + "step": 172770 + }, + { + "epoch": 48.58, + "learning_rate": 3.1949520507293913e-06, + "loss": 0.0521, + "step": 172800 + }, + { + "epoch": 48.59, + "learning_rate": 3.1762096648236655e-06, + "loss": 0.0532, + "step": 172830 + }, + { + "epoch": 48.6, + "learning_rate": 3.1574672789179397e-06, + "loss": 0.0518, + "step": 172860 + }, + { + "epoch": 48.61, + "learning_rate": 3.138724893012214e-06, + "loss": 0.0619, + "step": 172890 + }, + { + "epoch": 48.61, + "learning_rate": 3.119982507106488e-06, + "loss": 0.0485, + "step": 172920 + }, + { + "epoch": 48.62, + "learning_rate": 3.1012401212007623e-06, + "loss": 0.0556, + "step": 172950 + }, + { + "epoch": 48.63, + "learning_rate": 3.0824977352950365e-06, + "loss": 0.0496, + "step": 172980 + }, + { + "epoch": 48.64, + "learning_rate": 3.0637553493893107e-06, + "loss": 0.0494, + "step": 173010 + }, + { + "epoch": 48.65, + "learning_rate": 3.045012963483585e-06, + "loss": 0.0602, + "step": 173040 + }, + { + "epoch": 48.66, + "learning_rate": 3.0262705775778595e-06, + "loss": 0.0502, + "step": 173070 + }, + { + "epoch": 48.66, + "learning_rate": 3.0075281916721337e-06, + "loss": 0.0546, + "step": 173100 + }, + { + "epoch": 48.67, + "learning_rate": 2.9887858057664074e-06, + "loss": 0.0525, + "step": 173130 + }, + { + "epoch": 48.68, + "learning_rate": 2.9700434198606816e-06, + "loss": 0.0543, + "step": 173160 + }, + { + "epoch": 48.69, + "learning_rate": 2.951301033954956e-06, + "loss": 0.0594, + "step": 173190 + }, + { + "epoch": 48.7, + "learning_rate": 2.93255864804923e-06, + "loss": 0.0473, + "step": 173220 + }, + { + "epoch": 48.71, + "learning_rate": 2.913816262143504e-06, + "loss": 0.0531, + "step": 173250 + }, + { + "epoch": 48.72, + "learning_rate": 2.8950738762377784e-06, + "loss": 0.0539, + "step": 173280 + }, + { + "epoch": 48.72, + "learning_rate": 2.876331490332053e-06, + "loss": 0.0522, + "step": 173310 + }, + { + "epoch": 48.73, + "learning_rate": 2.857589104426327e-06, + "loss": 0.0575, + "step": 173340 + }, + { + "epoch": 48.74, + "learning_rate": 2.8388467185206014e-06, + "loss": 0.0487, + "step": 173370 + }, + { + "epoch": 48.75, + "learning_rate": 2.8201043326148756e-06, + "loss": 0.0583, + "step": 173400 + }, + { + "epoch": 48.76, + "learning_rate": 2.8013619467091493e-06, + "loss": 0.0527, + "step": 173430 + }, + { + "epoch": 48.77, + "learning_rate": 2.7826195608034235e-06, + "loss": 0.0557, + "step": 173460 + }, + { + "epoch": 48.77, + "learning_rate": 2.7638771748976977e-06, + "loss": 0.059, + "step": 173490 + }, + { + "epoch": 48.78, + "learning_rate": 2.745134788991972e-06, + "loss": 0.0476, + "step": 173520 + }, + { + "epoch": 48.79, + "learning_rate": 2.7263924030862465e-06, + "loss": 0.0529, + "step": 173550 + }, + { + "epoch": 48.8, + "learning_rate": 2.7076500171805207e-06, + "loss": 0.0501, + "step": 173580 + }, + { + "epoch": 48.81, + "learning_rate": 2.688907631274795e-06, + "loss": 0.0546, + "step": 173610 + }, + { + "epoch": 48.82, + "learning_rate": 2.670165245369069e-06, + "loss": 0.059, + "step": 173640 + }, + { + "epoch": 48.82, + "learning_rate": 2.6514228594633433e-06, + "loss": 0.0502, + "step": 173670 + }, + { + "epoch": 48.83, + "learning_rate": 2.6326804735576175e-06, + "loss": 0.0598, + "step": 173700 + }, + { + "epoch": 48.84, + "learning_rate": 2.6139380876518917e-06, + "loss": 0.0528, + "step": 173730 + }, + { + "epoch": 48.85, + "learning_rate": 2.5951957017461654e-06, + "loss": 0.0519, + "step": 173760 + }, + { + "epoch": 48.86, + "learning_rate": 2.57645331584044e-06, + "loss": 0.057, + "step": 173790 + }, + { + "epoch": 48.87, + "learning_rate": 2.5577109299347142e-06, + "loss": 0.0445, + "step": 173820 + }, + { + "epoch": 48.88, + "learning_rate": 2.5389685440289884e-06, + "loss": 0.0532, + "step": 173850 + }, + { + "epoch": 48.88, + "learning_rate": 2.5202261581232626e-06, + "loss": 0.0501, + "step": 173880 + }, + { + "epoch": 48.89, + "learning_rate": 2.501483772217537e-06, + "loss": 0.0557, + "step": 173910 + }, + { + "epoch": 48.9, + "learning_rate": 2.482741386311811e-06, + "loss": 0.0579, + "step": 173940 + }, + { + "epoch": 48.91, + "learning_rate": 2.463999000406085e-06, + "loss": 0.0465, + "step": 173970 + }, + { + "epoch": 48.92, + "learning_rate": 2.4452566145003594e-06, + "loss": 0.055, + "step": 174000 + }, + { + "epoch": 48.93, + "learning_rate": 2.4265142285946336e-06, + "loss": 0.0534, + "step": 174030 + }, + { + "epoch": 48.93, + "learning_rate": 2.4077718426889078e-06, + "loss": 0.0498, + "step": 174060 + }, + { + "epoch": 48.94, + "learning_rate": 2.389029456783182e-06, + "loss": 0.0587, + "step": 174090 + }, + { + "epoch": 48.95, + "learning_rate": 2.370287070877456e-06, + "loss": 0.0475, + "step": 174120 + }, + { + "epoch": 48.96, + "learning_rate": 2.3515446849717303e-06, + "loss": 0.0592, + "step": 174150 + }, + { + "epoch": 48.97, + "learning_rate": 2.3328022990660045e-06, + "loss": 0.0507, + "step": 174180 + }, + { + "epoch": 48.98, + "learning_rate": 2.3140599131602787e-06, + "loss": 0.0554, + "step": 174210 + }, + { + "epoch": 48.98, + "learning_rate": 2.295317527254553e-06, + "loss": 0.0582, + "step": 174240 + }, + { + "epoch": 48.99, + "learning_rate": 2.276575141348827e-06, + "loss": 0.0507, + "step": 174270 + }, + { + "epoch": 49.0, + "eval_loss": 0.1752515286207199, + "eval_runtime": 501.7816, + "eval_samples_per_second": 31.952, + "eval_steps_per_second": 1.0, + "eval_wer": 0.12116332073205682, + "step": 174293 + }, + { + "epoch": 49.0, + "learning_rate": 2.2578327554431013e-06, + "loss": 0.0557, + "step": 174300 + }, + { + "epoch": 49.01, + "learning_rate": 2.2390903695373755e-06, + "loss": 0.047, + "step": 174330 + }, + { + "epoch": 49.02, + "learning_rate": 2.2203479836316497e-06, + "loss": 0.0596, + "step": 174360 + }, + { + "epoch": 49.03, + "learning_rate": 2.201605597725924e-06, + "loss": 0.0517, + "step": 174390 + }, + { + "epoch": 49.04, + "learning_rate": 2.182863211820198e-06, + "loss": 0.049, + "step": 174420 + }, + { + "epoch": 49.04, + "learning_rate": 2.1641208259144722e-06, + "loss": 0.0616, + "step": 174450 + }, + { + "epoch": 49.05, + "learning_rate": 2.1453784400087464e-06, + "loss": 0.0516, + "step": 174480 + }, + { + "epoch": 49.06, + "learning_rate": 2.127260800299878e-06, + "loss": 0.0727, + "step": 174510 + }, + { + "epoch": 49.07, + "learning_rate": 2.1085184143941527e-06, + "loss": 0.0534, + "step": 174540 + }, + { + "epoch": 49.08, + "learning_rate": 2.089776028488427e-06, + "loss": 0.0548, + "step": 174570 + }, + { + "epoch": 49.09, + "learning_rate": 2.071033642582701e-06, + "loss": 0.0605, + "step": 174600 + }, + { + "epoch": 49.09, + "learning_rate": 2.0522912566769753e-06, + "loss": 0.0444, + "step": 174630 + }, + { + "epoch": 49.1, + "learning_rate": 2.0335488707712495e-06, + "loss": 0.0542, + "step": 174660 + }, + { + "epoch": 49.11, + "learning_rate": 2.0148064848655232e-06, + "loss": 0.0583, + "step": 174690 + }, + { + "epoch": 49.12, + "learning_rate": 1.9960640989597974e-06, + "loss": 0.0491, + "step": 174720 + }, + { + "epoch": 49.13, + "learning_rate": 1.9773217130540716e-06, + "loss": 0.0561, + "step": 174750 + }, + { + "epoch": 49.14, + "learning_rate": 1.9585793271483462e-06, + "loss": 0.0487, + "step": 174780 + }, + { + "epoch": 49.15, + "learning_rate": 1.9398369412426204e-06, + "loss": 0.0557, + "step": 174810 + }, + { + "epoch": 49.15, + "learning_rate": 1.9210945553368946e-06, + "loss": 0.0518, + "step": 174840 + }, + { + "epoch": 49.16, + "learning_rate": 1.9023521694311688e-06, + "loss": 0.0501, + "step": 174870 + }, + { + "epoch": 49.17, + "learning_rate": 1.8836097835254428e-06, + "loss": 0.0557, + "step": 174900 + }, + { + "epoch": 49.18, + "learning_rate": 1.864867397619717e-06, + "loss": 0.0483, + "step": 174930 + }, + { + "epoch": 49.19, + "learning_rate": 1.8461250117139912e-06, + "loss": 0.0521, + "step": 174960 + }, + { + "epoch": 49.2, + "learning_rate": 1.8273826258082653e-06, + "loss": 0.0543, + "step": 174990 + }, + { + "epoch": 49.2, + "learning_rate": 1.8086402399025398e-06, + "loss": 0.0483, + "step": 175020 + }, + { + "epoch": 49.21, + "learning_rate": 1.789897853996814e-06, + "loss": 0.0589, + "step": 175050 + }, + { + "epoch": 49.22, + "learning_rate": 1.7711554680910881e-06, + "loss": 0.0513, + "step": 175080 + }, + { + "epoch": 49.23, + "learning_rate": 1.7524130821853623e-06, + "loss": 0.052, + "step": 175110 + }, + { + "epoch": 49.24, + "learning_rate": 1.7336706962796365e-06, + "loss": 0.0544, + "step": 175140 + }, + { + "epoch": 49.25, + "learning_rate": 1.7149283103739107e-06, + "loss": 0.0525, + "step": 175170 + }, + { + "epoch": 49.25, + "learning_rate": 1.6961859244681847e-06, + "loss": 0.0579, + "step": 175200 + }, + { + "epoch": 49.26, + "learning_rate": 1.6774435385624589e-06, + "loss": 0.0489, + "step": 175230 + }, + { + "epoch": 49.27, + "learning_rate": 1.6587011526567335e-06, + "loss": 0.0567, + "step": 175260 + }, + { + "epoch": 49.28, + "learning_rate": 1.6399587667510077e-06, + "loss": 0.0503, + "step": 175290 + }, + { + "epoch": 49.29, + "learning_rate": 1.6212163808452817e-06, + "loss": 0.0498, + "step": 175320 + }, + { + "epoch": 49.3, + "learning_rate": 1.6024739949395558e-06, + "loss": 0.0578, + "step": 175350 + }, + { + "epoch": 49.31, + "learning_rate": 1.58373160903383e-06, + "loss": 0.0477, + "step": 175380 + }, + { + "epoch": 49.31, + "learning_rate": 1.5649892231281042e-06, + "loss": 0.0539, + "step": 175410 + }, + { + "epoch": 49.32, + "learning_rate": 1.5462468372223786e-06, + "loss": 0.059, + "step": 175440 + }, + { + "epoch": 49.33, + "learning_rate": 1.5275044513166526e-06, + "loss": 0.055, + "step": 175470 + }, + { + "epoch": 49.34, + "learning_rate": 1.5087620654109268e-06, + "loss": 0.0548, + "step": 175500 + }, + { + "epoch": 49.35, + "learning_rate": 1.490019679505201e-06, + "loss": 0.0494, + "step": 175530 + }, + { + "epoch": 49.36, + "learning_rate": 1.4712772935994754e-06, + "loss": 0.0526, + "step": 175560 + }, + { + "epoch": 49.36, + "learning_rate": 1.4525349076937496e-06, + "loss": 0.0554, + "step": 175590 + }, + { + "epoch": 49.37, + "learning_rate": 1.4337925217880238e-06, + "loss": 0.048, + "step": 175620 + }, + { + "epoch": 49.38, + "learning_rate": 1.4150501358822978e-06, + "loss": 0.057, + "step": 175650 + }, + { + "epoch": 49.39, + "learning_rate": 1.3963077499765722e-06, + "loss": 0.0498, + "step": 175680 + }, + { + "epoch": 49.4, + "learning_rate": 1.3775653640708463e-06, + "loss": 0.0549, + "step": 175710 + }, + { + "epoch": 49.41, + "learning_rate": 1.3588229781651205e-06, + "loss": 0.0579, + "step": 175740 + }, + { + "epoch": 49.42, + "learning_rate": 1.3400805922593947e-06, + "loss": 0.0468, + "step": 175770 + }, + { + "epoch": 49.42, + "learning_rate": 1.321338206353669e-06, + "loss": 0.0585, + "step": 175800 + }, + { + "epoch": 49.43, + "learning_rate": 1.3025958204479431e-06, + "loss": 0.0475, + "step": 175830 + }, + { + "epoch": 49.44, + "learning_rate": 1.2838534345422173e-06, + "loss": 0.0553, + "step": 175860 + }, + { + "epoch": 49.45, + "learning_rate": 1.2651110486364915e-06, + "loss": 0.053, + "step": 175890 + }, + { + "epoch": 49.46, + "learning_rate": 1.2463686627307657e-06, + "loss": 0.0531, + "step": 175920 + }, + { + "epoch": 49.47, + "learning_rate": 1.2276262768250399e-06, + "loss": 0.0588, + "step": 175950 + }, + { + "epoch": 49.47, + "learning_rate": 1.208883890919314e-06, + "loss": 0.0482, + "step": 175980 + }, + { + "epoch": 49.48, + "learning_rate": 1.1901415050135883e-06, + "loss": 0.0512, + "step": 176010 + }, + { + "epoch": 49.49, + "learning_rate": 1.1713991191078627e-06, + "loss": 0.0531, + "step": 176040 + }, + { + "epoch": 49.5, + "learning_rate": 1.1526567332021366e-06, + "loss": 0.0494, + "step": 176070 + }, + { + "epoch": 49.51, + "learning_rate": 1.1339143472964108e-06, + "loss": 0.059, + "step": 176100 + }, + { + "epoch": 49.52, + "learning_rate": 1.115171961390685e-06, + "loss": 0.0451, + "step": 176130 + }, + { + "epoch": 49.52, + "learning_rate": 1.0964295754849594e-06, + "loss": 0.0564, + "step": 176160 + }, + { + "epoch": 49.53, + "learning_rate": 1.0776871895792336e-06, + "loss": 0.0512, + "step": 176190 + }, + { + "epoch": 49.54, + "learning_rate": 1.0589448036735076e-06, + "loss": 0.0482, + "step": 176220 + }, + { + "epoch": 49.55, + "learning_rate": 1.0402024177677818e-06, + "loss": 0.0549, + "step": 176250 + }, + { + "epoch": 49.56, + "learning_rate": 1.0214600318620562e-06, + "loss": 0.0501, + "step": 176280 + }, + { + "epoch": 49.57, + "learning_rate": 1.0027176459563304e-06, + "loss": 0.0544, + "step": 176310 + }, + { + "epoch": 49.58, + "learning_rate": 9.839752600506046e-07, + "loss": 0.0524, + "step": 176340 + }, + { + "epoch": 49.58, + "learning_rate": 9.652328741448785e-07, + "loss": 0.047, + "step": 176370 + }, + { + "epoch": 49.59, + "learning_rate": 9.464904882391528e-07, + "loss": 0.0544, + "step": 176400 + }, + { + "epoch": 49.6, + "learning_rate": 9.277481023334271e-07, + "loss": 0.048, + "step": 176430 + }, + { + "epoch": 49.61, + "learning_rate": 9.090057164277013e-07, + "loss": 0.0566, + "step": 176460 + }, + { + "epoch": 49.62, + "learning_rate": 8.902633305219754e-07, + "loss": 0.053, + "step": 176490 + }, + { + "epoch": 49.63, + "learning_rate": 8.715209446162496e-07, + "loss": 0.049, + "step": 176520 + }, + { + "epoch": 49.63, + "learning_rate": 8.527785587105239e-07, + "loss": 0.058, + "step": 176550 + }, + { + "epoch": 49.64, + "learning_rate": 8.340361728047981e-07, + "loss": 0.0511, + "step": 176580 + }, + { + "epoch": 49.65, + "learning_rate": 8.152937868990723e-07, + "loss": 0.0571, + "step": 176610 + }, + { + "epoch": 49.66, + "learning_rate": 7.965514009933464e-07, + "loss": 0.0534, + "step": 176640 + }, + { + "epoch": 49.67, + "learning_rate": 7.778090150876207e-07, + "loss": 0.0514, + "step": 176670 + }, + { + "epoch": 49.68, + "learning_rate": 7.590666291818949e-07, + "loss": 0.0587, + "step": 176700 + }, + { + "epoch": 49.69, + "learning_rate": 7.40324243276169e-07, + "loss": 0.0506, + "step": 176730 + }, + { + "epoch": 49.69, + "learning_rate": 7.215818573704433e-07, + "loss": 0.0516, + "step": 176760 + }, + { + "epoch": 49.7, + "learning_rate": 7.028394714647174e-07, + "loss": 0.0537, + "step": 176790 + }, + { + "epoch": 49.71, + "learning_rate": 6.847218317558492e-07, + "loss": 0.0545, + "step": 176820 + }, + { + "epoch": 49.72, + "learning_rate": 6.659794458501234e-07, + "loss": 0.0559, + "step": 176850 + }, + { + "epoch": 49.73, + "learning_rate": 6.472370599443977e-07, + "loss": 0.0464, + "step": 176880 + }, + { + "epoch": 49.74, + "learning_rate": 6.284946740386718e-07, + "loss": 0.0533, + "step": 176910 + }, + { + "epoch": 49.74, + "learning_rate": 6.097522881329461e-07, + "loss": 0.0526, + "step": 176940 + }, + { + "epoch": 49.75, + "learning_rate": 5.910099022272201e-07, + "loss": 0.0481, + "step": 176970 + }, + { + "epoch": 49.76, + "learning_rate": 5.722675163214944e-07, + "loss": 0.06, + "step": 177000 + }, + { + "epoch": 49.77, + "learning_rate": 5.535251304157686e-07, + "loss": 0.0481, + "step": 177030 + }, + { + "epoch": 49.78, + "learning_rate": 5.347827445100428e-07, + "loss": 0.0515, + "step": 177060 + }, + { + "epoch": 49.79, + "learning_rate": 5.16040358604317e-07, + "loss": 0.0556, + "step": 177090 + }, + { + "epoch": 49.79, + "learning_rate": 4.972979726985912e-07, + "loss": 0.049, + "step": 177120 + }, + { + "epoch": 49.8, + "learning_rate": 4.785555867928654e-07, + "loss": 0.0578, + "step": 177150 + }, + { + "epoch": 49.81, + "learning_rate": 4.5981320088713964e-07, + "loss": 0.0505, + "step": 177180 + }, + { + "epoch": 49.82, + "learning_rate": 4.410708149814138e-07, + "loss": 0.0534, + "step": 177210 + }, + { + "epoch": 49.83, + "learning_rate": 4.22328429075688e-07, + "loss": 0.0532, + "step": 177240 + }, + { + "epoch": 49.84, + "learning_rate": 4.035860431699622e-07, + "loss": 0.0508, + "step": 177270 + }, + { + "epoch": 49.85, + "learning_rate": 3.848436572642364e-07, + "loss": 0.0569, + "step": 177300 + }, + { + "epoch": 49.85, + "learning_rate": 3.661012713585106e-07, + "loss": 0.0508, + "step": 177330 + }, + { + "epoch": 49.86, + "learning_rate": 3.473588854527848e-07, + "loss": 0.0516, + "step": 177360 + }, + { + "epoch": 49.87, + "learning_rate": 3.2861649954705903e-07, + "loss": 0.0528, + "step": 177390 + }, + { + "epoch": 49.88, + "learning_rate": 3.098741136413332e-07, + "loss": 0.0497, + "step": 177420 + }, + { + "epoch": 49.89, + "learning_rate": 2.911317277356074e-07, + "loss": 0.0543, + "step": 177450 + }, + { + "epoch": 49.9, + "learning_rate": 2.723893418298816e-07, + "loss": 0.0496, + "step": 177480 + }, + { + "epoch": 49.9, + "learning_rate": 2.536469559241558e-07, + "loss": 0.0525, + "step": 177510 + }, + { + "epoch": 49.91, + "learning_rate": 2.3490457001843e-07, + "loss": 0.0556, + "step": 177540 + }, + { + "epoch": 49.92, + "learning_rate": 2.161621841127042e-07, + "loss": 0.0506, + "step": 177570 + }, + { + "epoch": 49.93, + "learning_rate": 1.9741979820697842e-07, + "loss": 0.0552, + "step": 177600 + }, + { + "epoch": 49.94, + "learning_rate": 1.7867741230125263e-07, + "loss": 0.0478, + "step": 177630 + }, + { + "epoch": 49.95, + "learning_rate": 1.5993502639552682e-07, + "loss": 0.0597, + "step": 177660 + }, + { + "epoch": 49.95, + "learning_rate": 1.4119264048980104e-07, + "loss": 0.0508, + "step": 177690 + }, + { + "epoch": 49.96, + "learning_rate": 1.2245025458407523e-07, + "loss": 0.0461, + "step": 177720 + }, + { + "epoch": 49.97, + "learning_rate": 1.0370786867834943e-07, + "loss": 0.0566, + "step": 177750 + }, + { + "epoch": 49.98, + "learning_rate": 8.496548277262363e-08, + "loss": 0.0489, + "step": 177780 + }, + { + "epoch": 49.99, + "learning_rate": 6.622309686689783e-08, + "loss": 0.0531, + "step": 177810 + }, + { + "epoch": 50.0, + "learning_rate": 4.748071096117203e-08, + "loss": 0.0577, + "step": 177840 + }, + { + "epoch": 50.0, + "eval_loss": 0.1741643100976944, + "eval_runtime": 533.0988, + "eval_samples_per_second": 30.075, + "eval_steps_per_second": 0.942, + "eval_wer": 0.12089719269034979, + "step": 177850 + }, + { + "epoch": 50.0, + "step": 177850, + "total_flos": 1.1784689236730266e+21, + "train_loss": 0.042193543246732794, + "train_runtime": 659833.0285, + "train_samples_per_second": 34.505, + "train_steps_per_second": 0.27 + } + ], + "max_steps": 177850, + "num_train_epochs": 50, + "total_flos": 1.1784689236730266e+21, + "trial_name": null, + "trial_params": null +}